blob: d2a61eda8da0997b0ecf341ce92a9bcdbaa6fa38 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
|
#pragma once
#include <AK/StringView.h>
#include <AK/Vector.h>
// X-macro list of every token type. Each entry expands to __TOKEN(name);
// a user defines __TOKEN immediately before expanding this list and #undefs
// it afterwards. CppToken::Type and CppToken::to_string() are both generated
// from this list, so the order of entries here is the order of the enumerators.
#define FOR_EACH_TOKEN_TYPE \
__TOKEN(Unknown) \
__TOKEN(Whitespace) \
__TOKEN(PreprocessorStatement) \
__TOKEN(LeftParen) \
__TOKEN(RightParen) \
__TOKEN(LeftCurly) \
__TOKEN(RightCurly) \
__TOKEN(LeftBracket) \
__TOKEN(RightBracket) \
__TOKEN(Comma) \
__TOKEN(Asterisk) \
__TOKEN(Semicolon) \
__TOKEN(DoubleQuotedString) \
__TOKEN(SingleQuotedString) \
__TOKEN(Comment) \
__TOKEN(Number) \
__TOKEN(Keyword) \
__TOKEN(KnownType) \
__TOKEN(Identifier)
// A (line, column) pair. Both fields default to -1 when no value is supplied.
struct CppPosition {
    int line = -1;
    int column = -1;
};
// A token record: a type tag plus a start and an end position.
struct CppToken {
    // One enumerator per entry of FOR_EACH_TOKEN_TYPE, in list order.
    enum class Type {
#define __TOKEN(x) x,
        FOR_EACH_TOKEN_TYPE
#undef __TOKEN
    };

    // Returns the enumerator name of m_type as a string literal,
    // e.g. "Identifier" for Type::Identifier.
    const char* to_string() const
    {
        switch (m_type) {
#define __TOKEN(x) case Type::x: return #x;
            FOR_EACH_TOKEN_TYPE
#undef __TOKEN
        }
        // Only reached if m_type holds a value that is not in the list above.
        ASSERT_NOT_REACHED();
    }

    Type m_type = Type::Unknown;
    // NOTE(review): presumably the first and last position of the token in the
    // input; whether m_end is inclusive is decided by the lexer implementation,
    // which is not visible here.
    CppPosition m_start;
    CppPosition m_end;
};
// Lexer interface over a StringView, producing a Vector of CppToken.
// Only declarations live here; the member functions are defined elsewhere.
class CppLexer {
public:
    CppLexer(const StringView&);

    // Returns the tokens produced for the input.
    Vector<CppToken> lex();

private:
    // NOTE(review): presumably peek() looks at the character `offset` places
    // from m_index without advancing, and consume() returns the current
    // character and advances; confirm against the implementation.
    char peek(int offset = 0) const;
    char consume();

    StringView m_input;
    int m_index = 0;
    // Both positions start at line 0, column 0.
    CppPosition m_previous_position = { 0, 0 };
    CppPosition m_position = { 0, 0 };
};
|