]>
Commit | Line | Data |
---|---|---|
1 | /* Cycript - Optimizing JavaScript Compiler/Runtime | |
2 | * Copyright (C) 2009-2015 Jay Freeman (saurik) | |
3 | */ | |
4 | ||
5 | /* GNU Affero General Public License, Version 3 {{{ */ | |
6 | /* | |
7 | * This program is free software: you can redistribute it and/or modify | |
8 | * it under the terms of the GNU Affero General Public License as published by | |
9 | * the Free Software Foundation, either version 3 of the License, or | |
10 | * (at your option) any later version. | |
11 | ||
12 | * This program is distributed in the hope that it will be useful, | |
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
15 | * GNU Affero General Public License for more details. | |
16 | ||
17 | * You should have received a copy of the GNU Affero General Public License | |
18 | * along with this program. If not, see <http://www.gnu.org/licenses/>. | |
19 | **/ | |
20 | /* }}} */ | |
21 | ||
22 | /* XXX: supposedly I will be screwed on very very long multi-line comments and need to replace these with a manual lexer. http://websrv.cs.fsu.edu/~engelen/courses/COP5621/Pr2.pdf */ | |
23 | ||
24 | %top{ | |
25 | #if defined(__clang__) | |
26 | #pragma clang diagnostic push | |
27 | #pragma clang diagnostic ignored "-Wunused-variable" | |
28 | #pragma clang diagnostic ignored "-Wdeprecated-register" | |
29 | #else | |
30 | #pragma GCC diagnostic push | |
31 | #pragma GCC diagnostic ignored "-Wsign-compare" | |
32 | #pragma GCC diagnostic ignored "-Wunused-function" | |
33 | #pragma GCC diagnostic ignored "-Wunused-variable" | |
34 | #endif | |
35 | } | |
36 | ||
37 | %{ | |
38 | ||
39 | #define YYLTYPE CYLocation | |
40 | #include "Cycript.tab.hh" | |
41 | typedef cy::parser::token tk; | |
42 | ||
43 | #include "Highlight.hpp" | |
44 | ||
45 | #define YY_EXTRA_TYPE CYDriver * | |
46 | ||
47 | // do /not/ fold token to the return: this is a macro and the ordering is dependent | |
48 | #define F(value, highlight) do { \ | |
49 | int token(value); \ | |
50 | @begin ObjectiveC | |
51 | yyextra->no_.AtImplementation = false; \ | |
52 | @end | |
53 | yyextra->no_.Function = false; \ | |
54 | yyextra->no_.NewLine = false; \ | |
55 | yyextra->no_.OpenBrace = false; \ | |
56 | yylval->highlight_ = highlight; \ | |
57 | return token; \ | |
58 | } while (false) | |
59 | ||
60 | #define P yyextra->pool_ | |
61 | #define A new(P) | |
62 | #define Y P.strmemdup(yytext, yyleng) | |
63 | ||
64 | #define I(type, Type, value, highlight) do { \ | |
65 | yylval->semantic_.type ## _ = A CY ## Type; \ | |
66 | F(value, highlight); \ | |
67 | } while (false) | |
68 | ||
69 | #define C \ | |
70 | yyextra->newline_ = yyextra->last_; \ | |
71 | yyextra->last_ = false; \ | |
72 | BEGIN(Div); | |
73 | ||
74 | #define N \ | |
75 | yyextra->last_ = true; \ | |
76 | if (yyextra->no_.NewLine) \ | |
77 | F(tk::NewLine, hi::Nothing); | |
78 | ||
79 | #define V(more) { \ | |
80 | if (const char *nl = reinterpret_cast<const char *>(memchr(yytext, '\n', yyleng))) { \ | |
81 | unsigned lines(0); \ | |
82 | size_t left; \ | |
83 | do { \ | |
84 | ++lines; \ | |
85 | left = yyleng - (nl - yytext) - 1; \ | |
86 | nl = reinterpret_cast<const char *>(memchr(nl + 1, '\n', left)); \ | |
87 | } while (nl != NULL); \ | |
88 | yylloc->step(); \ | |
89 | yylloc->end.lines(lines); \ | |
90 | yylloc->end.columns(left); \ | |
91 | more \ | |
92 | } else L \ | |
93 | } | |
94 | ||
95 | #define L { \ | |
96 | yylloc->step(); \ | |
97 | yylloc->end.columns(yyleng); \ | |
98 | } | |
99 | ||
100 | #define M { \ | |
101 | if (yyextra->commented_) { \ | |
102 | I(comment, Comment(Y), tk::Comment, hi::Comment); \ | |
103 | } \ | |
104 | } | |
105 | ||
106 | #define E(message) { \ | |
107 | CYDriver::Error error; \ | |
108 | error.location_ = *yylloc; \ | |
109 | error.message_ = "syntax error, " message; \ | |
110 | yyextra->errors_.push_back(error); \ | |
111 | yyterminate(); \ | |
112 | } | |
113 | ||
// Value of a single ASCII hexadecimal digit: 0-9 for '0'-'9' and 10-15 for
// 'a'-'f' or 'A'-'F'. Any other character yields -1.
int H(char c) {
    switch (c) {
        case '0': case '1': case '2': case '3': case '4':
        case '5': case '6': case '7': case '8': case '9':
            return c - '0';

        case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
            return 10 + (c - 'a');

        case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
            return 10 + (c - 'A');

        default:
            return -1;
    }
}
123 | ||
124 | static void U(char *&local, unsigned point) { | |
125 | if (false) { | |
126 | } else if (point < 0x000080) { | |
127 | *local++ = point; | |
128 | } else if (point < 0x000800) { | |
129 | *local++ = 0xc0 | point >> 0x06 & 0x1f; | |
130 | goto one; | |
131 | } else if (point < 0x010000) { | |
132 | *local++ = 0xe0 | point >> 0x0c & 0x0f; | |
133 | goto two; | |
134 | } else if (point < 0x110000) { | |
135 | *local++ = 0xf0 | point >> 0x12 & 0x07; | |
136 | *local++ = 0x80 | point >> 0x0c & 0x3f; | |
137 | two: | |
138 | *local++ = 0x80 | point >> 0x06 & 0x3f; | |
139 | one: | |
140 | *local++ = 0x80 | point >> 0x00 & 0x3f; | |
141 | } else _assert(false); | |
142 | } | |
143 | ||
144 | static void U(char *&local, const char *text, yy_size_t &i) { | |
145 | unsigned point; | |
146 | ||
147 | char next(text[++i]); | |
148 | if (next != '{') { | |
149 | point = H(text[i + 0]) << 12 | H(text[i + 1]) << 8 | H(text[i + 2]) << 4 | H(text[i + 3]); | |
150 | i += 3; | |
151 | } else { | |
152 | point = 0; | |
153 | for (;;) { | |
154 | next = text[++i]; | |
155 | if (next == '}') | |
156 | break; | |
157 | point = (point << 4) | H(next); | |
158 | } | |
159 | } | |
160 | ||
161 | U(local, point); | |
162 | } | |
163 | ||
164 | #define YY_INPUT(data, value, size) { \ | |
165 | if (yyextra->data_.eof()) \ | |
166 | value = YY_NULL; \ | |
167 | else { \ | |
168 | yyextra->data_.read(data, size); \ | |
169 | size_t copy(yyextra->data_.gcount()); \ | |
170 | value = copy == 0 ? YY_NULL : copy; \ | |
171 | } \ | |
172 | } | |
173 | ||
174 | %} | |
175 | ||
176 | %option prefix="cy" | |
177 | %option bison-bridge | |
178 | %option bison-locations | |
179 | %option nodefault | |
180 | %option noyywrap | |
181 | %option noyylineno | |
182 | %option nounput | |
183 | %option nounistd | |
184 | %option 8bit | |
185 | %option backup | |
186 | %option batch | |
187 | %option never-interactive | |
188 | %option pointer | |
189 | %option reentrant | |
190 | %option stack | |
191 | ||
192 | %option full | |
193 | %option ecs | |
194 | ||
195 | U1 [\x00-\x7f] | |
196 | U0 [\x80-\xbf] | |
197 | U2 [\xc2-\xdf] | |
198 | U3 [\xe0-\xef] | |
199 | U4 [\xf0-\xf4] | |
200 | ||
201 | HexDigit [0-9a-fA-F] | |
202 | LineTerminatorSequence \r?\n|\r|\xe2\x80[\xa8\xa9] | |
203 | WhiteSpace [\x09\x0b\x0c\x20]|\xc2\xa0|\xef\xbb\xbf | |
204 | UnicodeEscape \\u({HexDigit}{4}|\{{HexDigit}+\}) | |
205 | ||
206 | OctalEscape \\[1-7]|\\[4-7][0-7]|\\[0-3][0-7][0-7]? | |
207 | StringEscape \\['"\\bfnrtv]|\\0|{OctalEscape}|\\x{HexDigit}{2}|{UnicodeEscape} | |
208 | StringExtra {StringEscape}|\\{LineTerminatorSequence} | |
209 | SingleString ([^'\\\n]|{StringExtra})* | |
210 | DoubleString ([^"\\\n]|{StringExtra})* | |
211 | StringPrefix '{SingleString}|\"{DoubleString} | |
212 | ||
213 | @include UnicodeIDStart.l | |
214 | @include UnicodeIDContinue.l | |
215 | ||
216 | IdentifierMore [$_] | |
217 | ||
218 | UnicodeStart {IdentifierMore}|{UnicodeIDStart} | |
219 | UnicodePart {IdentifierMore}|\xe2\x80[\x8c\x8d]|{UnicodeIDContinue} | |
220 | UnicodeFail {U2}|{U3}|{U3}{U0}|{U4}|{U4}{U0}|{U4}{U0}{U0} | |
221 | UnicodeScrap {UnicodePart}*{UnicodeFail}? | |
222 | ||
223 | IdentifierStart {UnicodeStart}|{UnicodeEscape} | |
224 | IdentifierPart {UnicodePart}|{UnicodeEscape} | |
225 | IdentifierFail {UnicodeFail}|\\(u({HexDigit}{0,3}|\{{HexDigit}*))? | |
226 | IdentifierScrap {IdentifierPart}*{IdentifierFail}? | |
227 | ||
228 | NonTerminator [^\n] | |
229 | BackslashSequence \\{NonTerminator} | |
230 | RegularExpressionFirstChar [^\n*\\/]|{BackslashSequence} | |
231 | RegularExpressionChar [^\n\\/]|{BackslashSequence} | |
232 | RegularExpressionFlags {UnicodePart}* | |
233 | RegularExpressionChars {RegularExpressionChar}* | |
234 | RegularExpressionBody {RegularExpressionFirstChar}{RegularExpressionChars} | |
235 | ||
236 | @begin E4X | |
237 | XMLNameStart [a-zA-Z_:] | |
238 | XMLNamePart [a-zA-Z0-9.-_:] | |
239 | XMLName {XMLNameStart}{XMLNamePart}* | |
240 | @end | |
241 | ||
242 | %s Div | |
243 | %s RegExp | |
244 | ||
245 | @begin E4X | |
246 | %x XMLContent | |
247 | %x XMLTag | |
248 | @end | |
249 | ||
250 | %% | |
251 | ||
252 | /* RegEx {{{ */ | |
253 | <RegExp>\/{RegularExpressionBody}\/{RegularExpressionFlags} L C I(literal, RegEx(Y), tk::RegularExpressionLiteral, hi::Constant); | |
254 | <RegExp>\/{RegularExpressionBody}\/{RegularExpressionFlags}{UnicodeFail} L E("invalid flags") | |
255 | <RegExp>\/{RegularExpressionBody}?\\? L E("unterminated regex") | |
256 | /* }}} */ | |
257 | /* Comment {{{ */ | |
258 | #![^\n]* L M | |
259 | \/\/[^\n]* L M | |
260 | ||
261 | /* http://ostermiller.org/findcomment.html */ | |
262 | /* XXX: unify these two rules using !? */ | |
263 | \/\*!([^*]|[\r\n]|(\*+([^*/]|[\r\n])))*\*+\/ V() C I(comment, Comment(Y), tk::Comment, hi::Comment); | |
264 | \/\*([^*]|[\r\n]|(\*+([^*/]|[\r\n])))*\*+\/ V(N) M | |
265 | \/\*([^*]|[\r\n]|(\*+([^*/]|[\r\n])))*\** V() E("invalid comment") | |
266 | /* }}} */ | |
267 | /* Element {{{ */ | |
268 | @begin E4X | |
269 | <RegExp>"<>" L F(tk::LeftRight, hi::Structure); | |
270 | <XMLContent>"</>" L F(tk::LeftSlashRight, hi::Structure); | |
271 | ||
272 | <RegExp,XMLContent>\<!\[CDATA\[(\n|[^[]|\[[^[]|\[\[[^>])*]]> V() F(tk::XMLCDATA, hi::Constant); | |
273 | <RegExp,XMLContent>\<!--(\n|[^-]|-[^-])*--> V() F(tk::XMLComment, hi::Comment); | |
274 | <RegExp,XMLContent>\<?(\n|[^?]|\?[^>])*?> V() F(tk::XMLPI, hi::Meta); | |
275 | ||
276 | <XMLTag>"=" L F(tk::Equal, hi::Structure); | |
277 | <XMLTag>">" L F(tk::Right, hi::Structure); | |
278 | <XMLTag>"/>" L F(tk::SlashRight, hi::Structure); | |
279 | <XMLTag>"{" L F(tk::OpenBrace, hi::Structure); | |
280 | ||
281 | <XMLTag>\"(\n|[^"])*\"|'(\n|[^'])*' V() F(tk::XMLAttributeValue, hi::Constant); | |
282 | <XMLTag>{XMLName} L F(tk::XMLName, hi::Identifier); | |
283 | <XMLTag>[ \t\r\n] V() F(tk::XMLWhitespace, hi::Nothing); | |
284 | ||
285 | <XMLContent>"{" L F(tk::OpenBrace, hi::Structure); | |
286 | <XMLContent>"<" L F(tk::Left, hi::Structure); | |
287 | <XMLContent>"</" L F(tk::LeftSlash, hi::Structure); | |
288 | @end | |
289 | /* }}} */ | |
290 | /* Operator {{{ */ | |
291 | "..." L C F(tk::PeriodPeriodPeriod, hi::Meta); | |
292 | ".." L E("invalid operator") | |
293 | ||
294 | @begin E4X | |
295 | "::" L C F(tk::ColonColon, hi::Operator); | |
296 | ".." L C F(tk::PeriodPeriod, hi::Operator); | |
297 | @end | |
298 | ||
299 | @begin E4X ObjectiveC | |
300 | "@" L C F(tk::At, hi::Operator); | |
301 | "#" L C F(tk::Pound, hi::Operator); | |
302 | @end | |
303 | ||
304 | "&" L C F(tk::Ampersand, hi::Operator); | |
305 | "&&" L C F(tk::AmpersandAmpersand, hi::Operator); | |
306 | "&=" L C F(tk::AmpersandEqual, hi::Operator); | |
307 | "^" L C F(tk::Carrot, hi::Operator); | |
308 | "^=" L C F(tk::CarrotEqual, hi::Operator); | |
309 | "=" L C F(tk::Equal, hi::Operator); | |
310 | "==" L C F(tk::EqualEqual, hi::Operator); | |
311 | "===" L C F(tk::EqualEqualEqual, hi::Operator); | |
312 | "=>" L C F(yyextra->newline_ ? tk::EqualRight_ : tk::EqualRight, hi::Operator); | |
313 | "!" L C F(tk::Exclamation, hi::Operator); | |
314 | "!=" L C F(tk::ExclamationEqual, hi::Operator); | |
315 | "!==" L C F(tk::ExclamationEqualEqual, hi::Operator); | |
316 | "-" L C F(tk::Hyphen, hi::Operator); | |
317 | "-=" L C F(tk::HyphenEqual, hi::Operator); | |
318 | "--" L C F(yyextra->newline_ ? tk::HyphenHyphen_ : tk::HyphenHyphen, hi::Operator); | |
319 | "->" L C F(tk::HyphenRight, hi::Operator); | |
320 | "<" L C F(tk::Left, hi::Operator); | |
321 | "<=" L C F(tk::LeftEqual, hi::Operator); | |
322 | "<<" L C F(tk::LeftLeft, hi::Operator); | |
323 | "<<=" L C F(tk::LeftLeftEqual, hi::Operator); | |
324 | "%" L C F(tk::Percent, hi::Operator); | |
325 | "%=" L C F(tk::PercentEqual, hi::Operator); | |
326 | "." L C F(tk::Period, hi::Operator); | |
327 | "|" L C F(tk::Pipe, hi::Operator); | |
328 | "|=" L C F(tk::PipeEqual, hi::Operator); | |
329 | "||" L C F(tk::PipePipe, hi::Operator); | |
330 | "+" L C F(tk::Plus, hi::Operator); | |
331 | "+=" L C F(tk::PlusEqual, hi::Operator); | |
332 | "++" L C F(yyextra->newline_ ? tk::PlusPlus_ : tk::PlusPlus, hi::Operator); | |
333 | ">" L C F(tk::Right, hi::Operator); | |
334 | ">=" L C F(tk::RightEqual, hi::Operator); | |
335 | ">>" L C F(tk::RightRight, hi::Operator); | |
336 | ">>=" L C F(tk::RightRightEqual, hi::Operator); | |
337 | ">>>" L C F(tk::RightRightRight, hi::Operator); | |
338 | ">>>=" L C F(tk::RightRightRightEqual, hi::Operator); | |
339 | "*" L C F(tk::Star, hi::Operator); | |
340 | "*=" L C F(tk::StarEqual, hi::Operator); | |
341 | "~" L C F(tk::Tilde, hi::Operator); | |
342 | ||
343 | <Div>"/" L C F(tk::Slash, hi::Operator); | |
344 | <Div>"/=" L C F(tk::SlashEqual, hi::Operator); | |
345 | ||
346 | ":" L C F(tk::Colon, hi::Structure); | |
347 | "," L C F(tk::Comma, hi::Structure); | |
348 | "?" L C F(tk::Question, hi::Structure); | |
349 | ";" L C F(tk::SemiColon, hi::Structure); | |
350 | ||
351 | "(" L C F(tk::OpenParen, hi::Structure); | |
352 | ")" L C F(tk::CloseParen, hi::Structure); | |
353 | ||
354 | "{" L C F(yyextra->no_.OpenBrace ? tk::OpenBrace__ : yyextra->newline_ ? tk::OpenBrace_ : tk::OpenBrace, hi::Structure); | |
355 | "}" L C F(tk::CloseBrace, hi::Structure); | |
356 | ||
357 | "[" L C F(tk::OpenBracket, hi::Structure); | |
358 | "]" L C F(tk::CloseBracket, hi::Structure); | |
359 | /* }}} */ | |
360 | /* Keyword {{{ */ | |
361 | "@error" L C F(tk::At_error_, hi::Error); | |
362 | ||
363 | @begin Java | |
364 | "@class" L C F(tk::At_class_, hi::Meta); | |
365 | @end | |
366 | ||
367 | @begin C | |
368 | "@encode" L C F(tk::At_encode_, hi::Meta); | |
369 | @end | |
370 | ||
371 | @begin ObjectiveC | |
372 | "@end" L C F(tk::At_end_, hi::Meta); | |
373 | "@false" L C F(tk::At_false_, hi::Constant); | |
374 | "@implementation" L C F(yyextra->no_.AtImplementation ? tk::At_implementation__ : tk::At_implementation_, hi::Meta); | |
375 | "@import" L C F(tk::At_import_, hi::Special); | |
376 | "@NO" L C F(tk::At_NO_, hi::Constant); | |
377 | "@null" L C F(tk::At_null_, hi::Constant); | |
378 | "@selector" L C F(tk::At_selector_, hi::Meta); | |
379 | "@true" L C F(tk::At_true_, hi::Constant); | |
380 | "@YES" L C F(tk::At_YES_, hi::Constant); | |
381 | @end | |
382 | ||
383 | @({UnicodeStart}{UnicodeScrap}|{UnicodeFail}) L E("invalid keyword") | |
384 | /* }}} */ | |
385 | /* Highlight {{{ */ | |
386 | "undefined" L C F(tk::_undefined_, hi::Operator); | |
387 | ||
388 | @begin ObjectiveC | |
389 | "bool" L C F(tk::_bool_, hi::Type); | |
390 | "BOOL" L C F(tk::_BOOL_, hi::Type); | |
391 | "id" L C F(tk::_id_, hi::Type); | |
392 | "nil" L C F(tk::_nil_, hi::Constant); | |
393 | "NULL" L C F(tk::_NULL_, hi::Constant); | |
394 | "SEL" L C F(tk::_SEL_, hi::Type); | |
395 | @end | |
396 | /* }}} */ | |
397 | /* Reserved {{{ */ | |
398 | "abstract" L C /*FII*/ F(tk::_abstract_, hi::Meta); | |
399 | "await" L C /*II?*/ F(tk::_await_, hi::Meta); | |
400 | "boolean" L C /*FII*/ F(tk::_boolean_, hi::Type); | |
401 | "break" L C /*KKK*/ F(tk::_break_, hi::Control); | |
402 | "byte" L C /*FII*/ F(tk::_byte_, hi::Type); | |
403 | "case" L C /*KKK*/ F(tk::_case_, hi::Control); | |
404 | "catch" L C /*KKK*/ F(tk::_catch_, hi::Control); | |
405 | "char" L C /*FII*/ F(tk::_char_, hi::Type); | |
406 | "class" L C /*FFK*/ F(tk::_class_, hi::Meta); | |
407 | "const" L C /*FFK*/ F(tk::_const_, hi::Meta); | |
408 | "continue" L C /*KKK*/ F(tk::_continue_, hi::Control); | |
409 | "debugger" L C /*FKK*/ F(tk::_debugger_, hi::Meta); | |
410 | "default" L C /*KKK*/ F(tk::_default_, hi::Control); | |
411 | "delete" L C /*KKK*/ F(tk::_delete_, hi::Operator); | |
412 | "do" L C /*KKK*/ F(tk::_do_, hi::Control); | |
413 | "double" L C /*FII*/ F(tk::_double_, hi::Type); | |
414 | "else" L C /*KKK*/ F(tk::_else_, hi::Control); | |
415 | "enum" L C /*FFF*/ F(tk::_enum_, hi::Meta); | |
416 | "export" L C /*FFK*/ F(tk::_export_, hi::Meta); | |
417 | "extends" L C /*FFK*/ F(tk::_extends_, hi::Meta); | |
418 | "false" L C /*LLL*/ F(tk::_false_, hi::Constant); | |
419 | "final" L C /*FII*/ F(tk::_final_, hi::Meta); | |
420 | "finally" L C /*KKK*/ F(tk::_finally_, hi::Control); | |
421 | "float" L C /*FII*/ F(tk::_float_, hi::Type); | |
422 | "for" L C /*KKK*/ F(tk::_for_, hi::Control); | |
423 | "function" L C /*KKK*/ F(yyextra->no_.Function ? tk::_function__ : tk::_function_, hi::Meta); | |
424 | "goto" L C /*FII*/ F(tk::_goto_, hi::Control); | |
425 | "if" L C /*KKK*/ F(tk::_if_, hi::Control); | |
426 | "implements" L C /*FSS*/ F(tk::_implements_, hi::Meta); | |
427 | "import" L C /*FFK*/ F(tk::_import_, hi::Meta); | |
428 | "in" L C /*KKK*/ F(yyextra->in_.top() ? tk::_in__ : tk::_in_, hi::Operator); | |
429 | "instanceof" L C /*KKK*/ F(tk::_instanceof_, hi::Operator); | |
430 | "int" L C /*FII*/ F(tk::_int_, hi::Type); | |
431 | "interface" L C /*FSS*/ F(tk::_interface_, hi::Meta); | |
432 | "let" L C /*IS?*/ F(tk::_let_, hi::Meta); | |
433 | "long" L C /*FII*/ F(tk::_long_, hi::Type); | |
434 | "native" L C /*FII*/ F(tk::_native_, hi::Meta); | |
435 | "new" L C /*KKK*/ F(tk::_new_, hi::Operator); | |
436 | "null" L C /*LLL*/ F(tk::_null_, hi::Constant); | |
437 | "package" L C /*FSS*/ F(tk::_package_, hi::Meta); | |
438 | "private" L C /*FSS*/ F(tk::_private_, hi::Meta); | |
439 | "protected" L C /*FSS*/ F(tk::_protected_, hi::Meta); | |
440 | "public" L C /*FSS*/ F(tk::_public_, hi::Meta); | |
441 | "return" L C /*KKK*/ F(tk::_return_, hi::Control); | |
442 | "short" L C /*FII*/ F(tk::_short_, hi::Type); | |
443 | "static" L C /*FS?*/ F(tk::_static_, hi::Meta); | |
444 | "super" L C /*FFK*/ F(tk::_super_, hi::Constant); | |
445 | "switch" L C /*KKK*/ F(tk::_switch_, hi::Control); | |
446 | "synchronized" L C /*FII*/ F(tk::_synchronized_, hi::Meta); | |
447 | "this" L C /*KKK*/ F(tk::_this_, hi::Constant); | |
448 | "throw" L C /*KKK*/ F(tk::_throw_, hi::Control); | |
449 | "throws" L C /*FII*/ F(tk::_throws_, hi::Meta); | |
450 | "transient" L C /*FII*/ F(tk::_transient_, hi::Meta); | |
451 | "true" L C /*LLL*/ F(tk::_true_, hi::Constant); | |
452 | "try" L C /*KKK*/ F(tk::_try_, hi::Control); | |
453 | "typeof" L C /*KKK*/ F(tk::_typeof_, hi::Operator); | |
454 | "var" L C /*KKK*/ F(tk::_var_, hi::Meta); | |
455 | "void" L C /*KKK*/ F(tk::_void_, hi::Operator); | |
456 | "volatile" L C /*FII*/ F(tk::_volatile_, hi::Meta); | |
457 | "while" L C /*KKK*/ F(tk::_while_, hi::Control); | |
458 | "with" L C /*KKK*/ F(tk::_with_, hi::Control); | |
459 | "yield" L C /*IS?*/ F(tk::_yield_, hi::Control); | |
460 | ||
461 | "auto" L C F(tk::_auto_, hi::Meta); | |
462 | "each" L C F(tk::_each_, hi::Control); | |
463 | "of" L C F(tk::_of_, hi::Operator); | |
464 | ||
465 | @begin C | |
466 | "extern" L C F(tk::_extern_, hi::Type); | |
467 | "signed" L C F(tk::_signed_, hi::Type); | |
468 | "typedef" L C F(tk::_typedef_, hi::Meta); | |
469 | "unsigned" L C F(tk::_unsigned_, hi::Type); | |
470 | @end | |
471 | ||
472 | @begin ObjectiveC | |
473 | "NO" L C F(tk::_NO_, hi::Constant); | |
474 | "YES" L C F(tk::_YES_, hi::Constant); | |
475 | @end | |
476 | ||
477 | @begin E4X | |
478 | "namespace" L C F(tk::_namespace_, hi::Meta); | |
479 | "xml" L C F(tk::_xml_, hi::Meta); | |
480 | @end | |
481 | /* }}} */ | |
482 | /* Identifier {{{ */ | |
483 | {UnicodeStart}{UnicodePart}* L C I(identifier, Identifier(Y), tk::Identifier_, hi::Identifier); | |
484 | ||
485 | {IdentifierStart}{IdentifierPart}* L C { | |
486 | char *value(A char[yyleng + 1]); | |
487 | char *local(value); | |
488 | ||
489 | for (yy_size_t i(0), e(yyleng); i != e; ++i) { | |
490 | char next(yytext[i]); | |
491 | if (next != '\\') | |
492 | *local++ = next; | |
493 | else | |
494 | U(local, yytext, ++i); | |
495 | } | |
496 | ||
497 | *local = '\0'; | |
498 | I(identifier, Identifier(value), tk::Identifier_, hi::Identifier); | |
499 | } | |
500 | ||
501 | ({IdentifierStart}{IdentifierPart}*)?{IdentifierFail} L E("invalid identifier") | |
502 | /* }}} */ | |
503 | /* Number {{{ */ | |
504 | 0[0-7]+ L C I(number, Number(strtoull(yytext + 1, NULL, 8)), tk::NumericLiteral, hi::Constant); | |
505 | 0[0-9]+ L C I(number, Number(strtoull(yytext + 1, NULL, 10)), tk::NumericLiteral, hi::Constant); | |
506 | ||
507 | 0[xX][0-9a-fA-F]+ L C I(number, Number(strtoull(yytext + 2, NULL, 16)), tk::NumericLiteral, hi::Constant); | |
508 | 0[oO][0-7]+ L C I(number, Number(strtoull(yytext + 2, NULL, 8)), tk::NumericLiteral, hi::Constant); | |
509 | 0[bB][0-1]+ L C I(number, Number(strtoull(yytext + 2, NULL, 2)), tk::NumericLiteral, hi::Constant); | |
510 | ||
511 | (\.[0-9]+|(0|[1-9][0-9]*)(\.[0-9]*)?)([eE][+-]?[0-9]+)? L C I(number, Number(strtod(yytext, NULL)), tk::NumericLiteral, hi::Constant); | |
512 | (\.[0-9]+|(0|[1-9][0-9]*)(\.[0-9]*)?)[eE][+-]?{IdentifierScrap} L E("invalid exponent") | |
513 | (\.?[0-9]|(0|[1-9][0-9]*)\.){IdentifierScrap} L E("invalid number") | |
514 | /* }}} */ | |
515 | /* String {{{ */ | |
'{SingleString}'|\"{DoubleString}\" L C {
    // Decode the quoted literal (quotes excluded) into a pool buffer. Every
    // escape produces no more bytes than its source text occupies, so yyleng
    // bytes is enough for the payload plus the terminating NUL.
    char *value(A char[yyleng]);
    char *local(value);

    for (yy_size_t i(1), e(yyleng - 1); i != e; ++i) {
        char next(yytext[i]);

        if (next == '\\')
            switch (next = yytext[++i]) {
                case '\n':
                    // XXX: support more line continuation characters
                    yylloc->end.lines(1);
                    yylloc->end.columns(yyleng - i);
                    // a line continuation contributes no characters to the value
                    continue;

                case '\\': next = '\\'; break;
                case '\'': next = '\''; break;
                case '"': next = '"'; break;
                case 'b': next = '\b'; break;
                case 'f': next = '\f'; break;
                case 'n': next = '\n'; break;
                case 'r': next = '\r'; break;
                case 't': next = '\t'; break;
                case 'v': next = '\v'; break;

                case '0': case '1': case '2': case '3':
                case '4': case '5': case '6': case '7': {
                    // a leading 0-3 may be followed by two more octal digits, a leading 4-7 by one
                    unsigned point(H(next));
                    for (unsigned more(next < '4' ? 2 : 1); more != 0 && yytext[i + 1] >= '0' && yytext[i + 1] <= '7'; --more)
                        point = point << 3 | H(yytext[++i]);
                    // encode the same way as \x, so values of 0x80 and above become UTF-8 instead of a lone byte
                    U(local, point);
                } continue;

                case 'x':
                    U(local, H(yytext[i + 1]) << 4 | H(yytext[i + 2]));
                    i += 2;
                    continue;

                case 'u':
                    U(local, yytext, i);
                    continue;
            }

        *local++ = next;
    }

    *local = '\0';
    I(string, String(value, local - value), tk::StringLiteral, hi::Constant);
}
573 | ||
574 | {StringPrefix}\\(x.{0,2}|u([^{].{0,3}|\{[^}]*)?|{UnicodeFail})? L E("invalid escape") | |
575 | {StringPrefix} L E("invalid string") | |
576 | /* }}} */ | |
577 | ||
578 | {LineTerminatorSequence} yylloc->step(); yylloc->end.lines(); N | |
579 | {WhiteSpace} L | |
580 | ||
581 | <<EOF>> if (yyextra->auto_) { yyextra->auto_ = false; F(tk::AutoComplete, hi::Nothing); } L yyterminate(); | |
582 | ||
583 | . L E("invalid character") | |
584 | ||
585 | %% | |
586 | ||
// Create the scanner instance in scanner_ and register this driver as its
// "extra" pointer (YY_EXTRA_TYPE is CYDriver *; the rule actions read it as
// yyextra). The status returned by cylex_init is not checked.
void CYDriver::ScannerInit() {
    cylex_init(&scanner_);
    cyset_extra(this, scanner_);
}
591 | ||
// Hand scanner_ to cylex_destroy, the counterpart of the cylex_init call made
// in ScannerInit.
void CYDriver::ScannerDestroy() {
    cylex_destroy(scanner_);
}
595 | ||
596 | CYDriver::Condition CYDriver::GetCondition() { | |
597 | switch (yy_top_state(scanner_)) { | |
598 | case RegExp: | |
599 | return RegExpCondition; | |
600 | @begin E4X | |
601 | case XMLContent: | |
602 | return XMLContentCondition; | |
603 | case XMLTag: | |
604 | return XMLTagCondition; | |
605 | @end | |
606 | default: | |
607 | _assert(false); | |
608 | } | |
609 | } | |
610 | ||
611 | void CYDriver::SetCondition(Condition condition) { | |
612 | struct yyguts_t *yyg(reinterpret_cast<struct yyguts_t *>(scanner_)); | |
613 | ||
614 | switch (condition) { | |
615 | case RegExpCondition: | |
616 | BEGIN(RegExp); | |
617 | break; | |
618 | @begin E4X | |
619 | case XMLContentCondition: | |
620 | BEGIN(XMLContent); | |
621 | break; | |
622 | case XMLTagCondition: | |
623 | BEGIN(XMLTag); | |
624 | break; | |
625 | @end | |
626 | default: | |
627 | _assert(false); | |
628 | } | |
629 | } | |
630 | ||
631 | void CYDriver::PushCondition(Condition condition) { | |
632 | switch (condition) { | |
633 | case RegExpCondition: | |
634 | yy_push_state(RegExp, scanner_); | |
635 | break; | |
636 | @begin E4X | |
637 | case XMLContentCondition: | |
638 | yy_push_state(XMLContent, scanner_); | |
639 | break; | |
640 | case XMLTagCondition: | |
641 | yy_push_state(XMLTag, scanner_); | |
642 | break; | |
643 | @end | |
644 | default: | |
645 | _assert(false); | |
646 | } | |
647 | } | |
648 | ||
// Undo the most recent PushCondition by calling yy_pop_state() on the scanner.
void CYDriver::PopCondition() {
    yy_pop_state(scanner_);
}
652 | ||
653 | #if defined(__clang__) | |
654 | #pragma clang diagnostic pop | |
655 | #else | |
656 | // must not pop -Wunused-function | |
657 | //#pragma GCC diagnostic pop | |
658 | #endif |