-
Notifications
You must be signed in to change notification settings - Fork 2
/
lexer.hh
105 lines (86 loc) · 3.13 KB
/
lexer.hh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
// Copyright (c) 2019 ASMlover. All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions
// are met:
//
// * Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//
// * Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in
// the documentation and/or other materials provided with the
// distribution.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
// FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
// COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
// INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
// BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
// LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
// LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
// ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
#pragma once
#include <cctype>
#include "common.hh"
#include "token.hh"
namespace loxcc {
// Scanner over a source string that produces one Token per call to
// next_token().
//
// The lexer does NOT own the text it scans: it stores a reference to the
// string handed to the constructor, so that string must stay alive (and
// should not be a temporary) for as long as the Lexer is used.
class Lexer final : private UnCopyable {
  const str_t& source_bytes_; // text being scanned (borrowed, never copied)
  sz_t begpos_{};             // start offset of the lexeme built by make_token()
  sz_t curpos_{};             // offset of the next unread character
  int lineno_{1};             // line number stamped on every produced token

  // Character classification helpers.
  //
  // The <cctype> functions have undefined behaviour when their argument is
  // neither EOF nor representable as `unsigned char`. A plain `char` holding
  // a byte >= 0x80 is negative on platforms where `char` is signed, so every
  // call converts through `unsigned char` first.

  // True for a letter or '_' (accepted as an identifier character here).
  inline bool isalpha(char c) const noexcept {
    return std::isalpha(static_cast<unsigned char>(c)) != 0 || c == '_';
  }

  // True for a letter, a decimal digit or '_'.
  inline bool isalnum(char c) const noexcept {
    return std::isalnum(static_cast<unsigned char>(c)) != 0 || c == '_';
  }

  // True for a decimal digit.
  inline bool isdigit(char c) const noexcept {
    return std::isdigit(static_cast<unsigned char>(c)) != 0;
  }

  // Returns a copy of the half-open source range [begpos, endpos).
  // NOTE(review): this builds a new string inside a `noexcept` function, so
  // an allocation failure (or begpos past the end of the source) would call
  // std::terminate instead of propagating - confirm that is intended.
  inline str_t gen_literal(sz_t begpos, sz_t endpos) const noexcept {
    return source_bytes_.substr(begpos, endpos - begpos);
  }

  // True once every character of the source has been consumed.
  inline bool is_end(void) const noexcept {
    return curpos_ >= source_bytes_.size();
  }

  // Returns the character at the cursor and moves the cursor past it.
  // No bounds check is made here; callers presumably test is_end() first.
  inline char advance(void) noexcept {
    return source_bytes_[curpos_++];
  }

  // Consumes the next character only if it equals `expected`.
  // Returns true when a character was consumed, false otherwise (including
  // when the input is exhausted).
  inline bool match(char expected) noexcept {
    if (is_end() || source_bytes_[curpos_] != expected)
      return false;

    advance();
    return true;
  }

  // Returns the character at the cursor without consuming it, or '\0' when
  // the input is exhausted.
  inline char peek(void) const noexcept {
    return is_end() ? '\0' : source_bytes_[curpos_];
  }

  // Returns the character one past the cursor without consuming anything,
  // or '\0' when there is no such character.
  inline char peek_next(void) const noexcept {
    return curpos_ + 1 >= source_bytes_.size()
        ? '\0' : source_bytes_[curpos_ + 1];
  }

  // Builds a token of `kind` whose literal is the source text in
  // [begpos_, curpos_), tagged with the current line number.
  inline Token make_token(TokenKind kind) const noexcept {
    return Token(kind, gen_literal(begpos_, curpos_), lineno_);
  }

  // Builds a token of `kind` carrying an explicitly supplied literal, tagged
  // with the current line number.
  inline Token make_token(TokenKind kind, const str_t& literal) const noexcept {
    return Token(kind, literal, lineno_);
  }

  // Builds a TokenKind::TK_ERR token whose literal is the diagnostic
  // `message`, tagged with the current line number.
  inline Token make_error(const str_t& message) const noexcept {
    return Token(TokenKind::TK_ERR, message, lineno_);
  }

  // Defined out of line (not visible in this header); the descriptions are
  // inferred from the names only - verify against the implementation file.
  void skip_whitespace(void);   // presumably skips blanks before a token
  Token make_identifier(void);  // presumably scans an identifier or keyword
  Token make_numeric(void);     // presumably scans a numeric literal
  Token make_string(void);      // presumably scans a string literal
public:
  // Binds the lexer to `source_bytes`. Only a reference is stored, so the
  // argument must outlive this object; passing a temporary leaves the lexer
  // with a dangling reference.
  explicit Lexer(const str_t& source_bytes) noexcept
    : source_bytes_(source_bytes) {
  }

  // Returns the next token of the source (defined out of line).
  Token next_token(void);
};
}