X-Git-Url: https://git.saurik.com/cycript.git/blobdiff_plain/e7ed5354ae029d47ace1bc152aa5686f495e5737..62014ea9ffc6c31f053863a89d783475a3937d74:/Cycript.l diff --git a/Cycript.l b/Cycript.l index eb0c692..4a54403 100644 --- a/Cycript.l +++ b/Cycript.l @@ -8,7 +8,31 @@ typedef cy::parser::token tk; #define T yylval->newline_ = yyextra->state_ == CYNewLine; #define C T yyextra->state_ = CYClear; #define R T yyextra->state_ = CYRestricted; -#define N if (yyextra->state_ != CYNewLine) { bool restricted(yyextra->state_ == CYRestricted); if (restricted) { yyextra->state_ = CYClear; return tk::NewLine; } else yyextra->state_ = CYNewLine; } + +#define N \ + if (yyextra->state_ != CYNewLine) { \ + bool restricted(yyextra->state_ == CYRestricted); \ + if (restricted) { \ + yyextra->state_ = CYClear; \ + return tk::NewLine; \ + } else \ + yyextra->state_ = CYNewLine; \ + } + +#define L { \ + yylloc->step(); \ + yylloc->columns(yyleng); \ +} + +int H(char c) { + if (c >= '0' && c <= '9') + return c - '0'; + if (c >= 'a' && c <= 'f') + return c - 'a' + 10; + if (c >= 'A' && c <= 'F') + return c - 'A' + 10; + return -1; +} #define YY_INPUT(data, value, size) { \ if (yyextra->size_ == 0) \ @@ -34,111 +58,152 @@ typedef cy::parser::token tk; %option reentrant Exponent [eE][+-]?[0-9]+ -Escape \\['"\\bfnrtv]|\\0|\\x[0-9a-fA-F]{2}|\\u[0-9a-fA-F]{4} +Escape \\[\\'"bfnrtv]|\\0|\\x[0-9a-fA-F]{2}|\\u[0-9a-fA-F]{4} %% \/\/[^\n]* ; \/\*(\n|[^\*]|\*[^/])\*\/ if (memchr(yytext, '\n', yyleng) != NULL) N // XXX: supposedly I will be screwed on very very long multi-line comments and need to replace this with a manual lexer. http://websrv.cs.fsu.edu/~engelen/courses/COP5621/Pr2.pdf ; XXX: this rule doesn't work anyway, fucking A :( -"&" C return tk::Ampersand; -"&&" C return tk::AmpersandAmpersand; -"&=" C return tk::AmpersandEqual; -"^" C return tk::Carrot; -"^=" C return tk::CarrotEqual; -"=" C return tk::Equal; -"==" C return tk::EqualEqual; -"===" C return tk::EqualEqualEqual; -"!" C return tk::Exclamation; -"!=" C return tk::ExclamationEqual; -"!==" C return tk::ExclamationEqualEqual; -"-" C return tk::Hyphen; -"-=" C return tk::HyphenEqual; -"--" C return yylval->newline_ ? tk::HyphenHyphen_ : tk::HyphenHyphen; -"->" C return tk::HyphenRight; -"<" C return tk::Left; -"<=" C return tk::LeftEqual; -"<<" C return tk::LeftLeft; -"<<=" C return tk::LeftLeftEqual; -"%" C return tk::Percent; -"%=" C return tk::PercentEqual; -"." C return tk::Period; -"|" C return tk::Pipe; -"|=" C return tk::PipeEqual; -"||" C return tk::PipePipe; -"+" C return tk::Plus; -"+=" C return tk::PlusEqual; -"++" C return yylval->newline_ ? tk::PlusPlus_ : tk::PlusPlus; -">" C return tk::Right; -">=" C return tk::RightEqual; -">>" C return tk::RightRight; -">>=" C return tk::RightRightEqual; -">>>" C return tk::RightRightRight; -">>>=" C return tk::RightRightRightEqual; -"/" C return tk::Slash; -"/=" C return tk::SlashEqual; -"*" C return tk::Star; -"*=" C return tk::StarEqual; -"~" C return tk::Tilde; - -":" C return tk::Colon; -"," C return tk::Comma; -"?" C return tk::Question; -";" C return tk::SemiColon; - -"(" C return tk::OpenParen; -")" C return tk::CloseParen; - -"{" C return tk::OpenBrace; -"}" C return tk::CloseBrace; - -"[" C return tk::OpenBracket; -"]" C return tk::CloseBracket; - -"@selector" C return tk::AtSelector; - -"break" R yylval->word_ = new CYWord("break"); return tk::Break; -"case" C yylval->word_ = new CYWord("case"); return tk::Case; -"catch" C yylval->word_ = new CYWord("catch"); return tk::Catch; -"continue" R yylval->word_ = new CYWord("continue"); return tk::Continue; -"default" C yylval->word_ = new CYWord("default"); return tk::Default; -"delete" C yylval->word_ = new CYWord("delete"); return tk::Delete; -"do" C yylval->word_ = new CYWord("do"); return tk::Do; -"else" C yylval->word_ = new CYWord("else"); return tk::Else; -"false" C yylval->false_ = new CYFalse(); return tk::False; -"finally" C yylval->word_ = new CYWord("finally"); return tk::Finally; -"for" C yylval->word_ = new CYWord("for"); return tk::For; -"function" C yylval->word_ = new CYWord("function"); return tk::Function; -"if" C yylval->word_ = new CYWord("if"); return tk::If; -"in" C yylval->word_ = new CYWord("in"); return tk::In; -"instanceof" C yylval->word_ = new CYWord("instanceof"); return tk::InstanceOf; -"new" C yylval->word_ = new CYWord("new"); return tk::New; -"null" C yylval->null_ = new CYNull(); return tk::Null; -"return" R yylval->word_ = new CYWord("return"); return tk::Return; -"switch" C yylval->word_ = new CYWord("switch"); return tk::Switch; -"this" C yylval->this_ = new CYThis(); return tk::This; -"throw" R yylval->word_ = new CYWord("throw"); return tk::Throw; -"true" C yylval->true_ = new CYTrue(); return tk::True; -"try" C yylval->word_ = new CYWord("try"); return tk::Try; -"typeof" C yylval->word_ = new CYWord("typeof"); return tk::TypeOf; -"var" C yylval->word_ = new CYWord("var"); return tk::Var; -"void" C yylval->word_ = new CYWord("void"); return tk::Void; -"while" C yylval->word_ = new CYWord("while"); return tk::While; -"with" C yylval->word_ = new CYWord("with"); return tk::With; - -[a-zA-Z$_][a-zA-Z$_0-9]* yylval->identifier_ = new CYIdentifier(apr_pstrmemdup(yyextra->pool_, yytext, yyleng)); C return tk::Identifier; - -(\.[0-9]+|(0|[1-9][0-9]*)(\.[0-9]*)?){Exponent}? yylval->number_ = new CYNumber(strtod(yytext, NULL)); C return tk::NumericLiteral; - -0[xX][0-9a-fA-F]+ C yylval->number_ = new CYNumber(strtoull(yytext + 2, NULL, 16)); return tk::NumericLiteral; - -0[bB][0-1]+ C yylval->number_ = new CYNumber(strtoull(yytext + 2, NULL, 2)); return tk::NumericLiteral; - -\"([^"\\\n]|{Escape})*\" C return tk::StringLiteral; -'([^'\\\n]|{Escape})*' C return tk::StringLiteral; - -\n N -[ \t] ; +"&" L C return tk::Ampersand; +"&&" L C return tk::AmpersandAmpersand; +"&=" L C return tk::AmpersandEqual; +"^" L C return tk::Carrot; +"^=" L C return tk::CarrotEqual; +"=" L C return tk::Equal; +"==" L C return tk::EqualEqual; +"===" L C return tk::EqualEqualEqual; +"!" L C return tk::Exclamation; +"!=" L C return tk::ExclamationEqual; +"!==" L C return tk::ExclamationEqualEqual; +"-" L C return tk::Hyphen; +"-=" L C return tk::HyphenEqual; +"--" L C return yylval->newline_ ? tk::HyphenHyphen_ : tk::HyphenHyphen; +"->" L C return tk::HyphenRight; +"<" L C return tk::Left; +"<=" L C return tk::LeftEqual; +"<<" L C return tk::LeftLeft; +"<<=" L C return tk::LeftLeftEqual; +"%" L C return tk::Percent; +"%=" L C return tk::PercentEqual; +"." L C return tk::Period; +"|" L C return tk::Pipe; +"|=" L C return tk::PipeEqual; +"||" L C return tk::PipePipe; +"+" L C return tk::Plus; +"+=" L C return tk::PlusEqual; +"++" L C return yylval->newline_ ? tk::PlusPlus_ : tk::PlusPlus; +">" L C return tk::Right; +">=" L C return tk::RightEqual; +">>" L C return tk::RightRight; +">>=" L C return tk::RightRightEqual; +">>>" L C return tk::RightRightRight; +">>>=" L C return tk::RightRightRightEqual; +"/" L C return tk::Slash; +"/=" L C return tk::SlashEqual; +"*" L C return tk::Star; +"*=" L C return tk::StarEqual; +"~" L C return tk::Tilde; + +":" L C return tk::Colon; +"," L C return tk::Comma; +"?" L C return tk::Question; +";" L C return tk::SemiColon; + +"(" L C return tk::OpenParen; +")" L C return tk::CloseParen; + +"{" L C return tk::OpenBrace; +"}" L C return tk::CloseBrace; + +"[" L C return tk::OpenBracket; +"]" L C return tk::CloseBracket; + +"@selector" L C return tk::AtSelector; + +"break" L R yylval->word_ = new CYWord("break"); return tk::Break; +"case" L C yylval->word_ = new CYWord("case"); return tk::Case; +"catch" L C yylval->word_ = new CYWord("catch"); return tk::Catch; +"continue" L R yylval->word_ = new CYWord("continue"); return tk::Continue; +"default" L C yylval->word_ = new CYWord("default"); return tk::Default; +"delete" L C yylval->word_ = new CYWord("delete"); return tk::Delete; +"do" L C yylval->word_ = new CYWord("do"); return tk::Do; +"else" L C yylval->word_ = new CYWord("else"); return tk::Else; +"false" L C yylval->false_ = new CYFalse(); return tk::False; +"finally" L C yylval->word_ = new CYWord("finally"); return tk::Finally; +"for" L C yylval->word_ = new CYWord("for"); return tk::For; +"function" L C yylval->word_ = new CYWord("function"); return tk::Function; +"if" L C yylval->word_ = new CYWord("if"); return tk::If; +"in" L C yylval->word_ = new CYWord("in"); return tk::In; +"instanceof" L C yylval->word_ = new CYWord("instanceof"); return tk::InstanceOf; +"new" L C yylval->word_ = new CYWord("new"); return tk::New; +"null" L C yylval->null_ = new CYNull(); return tk::Null; +"return" L R yylval->word_ = new CYWord("return"); return tk::Return; +"switch" L C yylval->word_ = new CYWord("switch"); return tk::Switch; +"this" L C yylval->this_ = new CYThis(); return tk::This; +"throw" L R yylval->word_ = new CYWord("throw"); return tk::Throw; +"true" L C yylval->true_ = new CYTrue(); return tk::True; +"try" L C yylval->word_ = new CYWord("try"); return tk::Try; +"typeof" L C yylval->word_ = new CYWord("typeof"); return tk::TypeOf; +"var" L C yylval->word_ = new CYWord("var"); return tk::Var; +"void" L C yylval->word_ = new CYWord("void"); return tk::Void; +"while" L C yylval->word_ = new CYWord("while"); return tk::While; +"with" L C yylval->word_ = new CYWord("with"); return tk::With; + +[a-zA-Z$_][a-zA-Z$_0-9]* yylval->identifier_ = new CYIdentifier(apr_pstrmemdup(yyextra->pool_, yytext, yyleng)); L C return tk::Identifier; + +(\.[0-9]+|(0|[1-9][0-9]*)(\.[0-9]*)?){Exponent}? yylval->number_ = new CYNumber(strtod(yytext, NULL)); L C return tk::NumericLiteral; + +0[xX][0-9a-fA-F]+ L C yylval->number_ = new CYNumber(strtoull(yytext + 2, NULL, 16)); return tk::NumericLiteral; + +0[bB][0-1]+ L C yylval->number_ = new CYNumber(strtoull(yytext + 2, NULL, 2)); return tk::NumericLiteral; + +\"([^"\\\n]|{Escape})*\"|'([^'\\\n]|{Escape})*' L C { + char *value(reinterpret_cast(apr_palloc(yyextra->pool_, yyleng))); + char *local(value); + + for (int i(1); i != yyleng - 1; ++i) { + char next(yytext[i]); + + if (yytext[i] == '\\') + switch (next = yytext[++i]) { + case '\\': next = '\\'; break; + case '\'': next = '\''; break; + case '"': next = '"'; break; + case 'b': next = '\b'; break; + case 'f': next = '\f'; break; + case 'n': next = '\n'; break; + case 'r': next = '\r'; break; + case 't': next = '\t'; break; + case 'v': next = '\v'; break; + case '0': next = '\0'; break; + + case 'x': + next = H(yytext[i + 1]) << 4 | H(yytext[i + 2]); + i += 2; + break; + } + + *local++ = next; + } + + *local = '\0'; + yylval->string_ = new CYString(value, local - value); + return tk::StringLiteral; +} + +\n yylloc->end.lines(); yylloc->step(); N + +[ \t] L +<> L yyterminate(); + +. { + CYDriver::Error error; + error.location_ = *yylloc; + error.message_ = "syntax error, unknown token"; + yyextra->errors_.push_back(error); + yyterminate(); +} %%