forked from google/jsonnet
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathlexer.h
154 lines (130 loc) · 3.89 KB
/
lexer.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
/*
Copyright 2015 Google Inc. All rights reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
#ifndef LEXER_H
#define LEXER_H
#include <cstdlib>
#include <iostream>
#include <string>
#include <list>
#include <sstream>
#include "static_error.h"
struct Token {
enum Kind {
// Symbols
BRACE_L,
BRACE_R,
BRACKET_L,
BRACKET_R,
COLON,
COMMA,
DOLLAR,
DOT,
PAREN_L,
PAREN_R,
SEMICOLON,
// Arbitrary length lexemes
IDENTIFIER,
NUMBER,
OPERATOR,
STRING,
// Keywords
ELSE,
ERROR,
FALSE,
FOR,
FUNCTION,
IF,
IMPORT,
IMPORTSTR,
IN,
LOCAL,
NULL_LIT,
TAILCALL,
THEN,
SELF,
SUPER,
TRUE,
// A special token that holds line/column information about the end of the file.
END_OF_FILE
} kind;
std::string data;
LocationRange location;
Token(Kind kind, const std::string &data, const LocationRange &location)
: kind(kind), data(data), location(location)
{ }
Token(Kind kind, const std::string &data="") : kind(kind), data(data) { }
static const char *toString(Kind v)
{
switch (v) {
case BRACE_L: return "\"{\"";
case BRACE_R: return "\"}\"";
case BRACKET_L: return "\"[\"";
case BRACKET_R: return "\"]\"";
case COLON: return "\":\"";
case COMMA: return "\",\"";
case DOLLAR: return "\"$\"";
case DOT: return "\".\"";
case PAREN_L: return "\"(\"";
case PAREN_R: return "\")\"";
case SEMICOLON: return "\";\"";
case IDENTIFIER: return "IDENTIFIER";
case NUMBER: return "NUMBER";
case OPERATOR: return "OPERATOR";
case STRING: return "STRING";
case ELSE: return "else";
case ERROR: return "error";
case FALSE: return "false";
case FOR: return "for";
case FUNCTION: return "function";
case IF: return "if";
case IMPORT: return "import";
case IMPORTSTR: return "importstr";
case IN: return "in";
case LOCAL: return "local";
case NULL_LIT: return "null";
case SELF: return "self";
case SUPER: return "super";
case TAILCALL: return "tailcall";
case THEN: return "then";
case TRUE: return "true";
case END_OF_FILE: return "end of file";
default:
std::cerr << "INTERNAL ERROR: Unknown token kind: " << v << std::endl;
std::abort();
}
}
};
static inline bool operator==(const Token &a, const Token &b)
{
if (a.kind != b.kind) return false;
if (a.data != b.data) return false;
return true;
}
static inline std::ostream &operator<<(std::ostream &o, Token::Kind v)
{
o << Token::toString(v);
return o;
}
static inline std::ostream &operator<<(std::ostream &o, const Token &v)
{
if (v.data == "") {
o << Token::toString(v.kind);
} else if (v.kind == Token::OPERATOR) {
o << "\"" << v.data << "\"";
} else {
o << "(" << Token::toString(v.kind) << ", \"" << v.data << "\")";
}
return o;
}
std::list<Token> jsonnet_lex(const std::string &filename, const char *input);
#endif