1 # Bison Regressions. -*- Autotest -*-
3 # Copyright (C) 2001-2013 Free Software Foundation, Inc.
5 # This program is free software: you can redistribute it and/or modify
6 # it under the terms of the GNU General Public License as published by
7 # the Free Software Foundation, either version 3 of the License, or
8 # (at your option) any later version.
10 # This program is distributed in the hope that it will be useful,
11 # but WITHOUT ANY WARRANTY; without even the implied warranty of
12 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 # GNU General Public License for more details.
15 # You should have received a copy of the GNU General Public License
16 # along with this program. If not, see <http://www.gnu.org/licenses/>.
18 AT_BANNER([[Regression tests.]])
21 ## ------------------ ##
22 ## Trivial grammars. ##
23 ## ------------------ ##
25 AT_SETUP([Trivial grammars])
27 AT_BISON_OPTION_PUSHDEFS
28 AT_DATA_GRAMMAR([input.y],
30 ]AT_YYERROR_DECLARE_EXTERN[
31 ]AT_YYLEX_DECLARE_EXTERN[
41 AT_BISON_OPTION_POPDEFS
43 AT_BISON_CHECK([-o input.c input.y])
45 AT_COMPILE([input.o], [-DYYDEBUG -c input.c])
51 ## ----------------- ##
52 ## YYSTYPE typedef. ##
53 ## ----------------- ##
55 AT_SETUP([YYSTYPE typedef])
57 AT_BISON_OPTION_PUSHDEFS
58 AT_DATA_GRAMMAR([input.y],
60 ]AT_YYERROR_DECLARE_EXTERN[
61 ]AT_YYLEX_DECLARE_EXTERN[
62 typedef union { char const *val; } YYSTYPE;
69 program: { $$ = ""; };
71 AT_BISON_OPTION_POPDEFS
73 AT_BISON_CHECK([-o input.c input.y])
80 ## ------------------------------------- ##
81 ## Early token definitions with --yacc. ##
82 ## ------------------------------------- ##
85 AT_SETUP([Early token definitions with --yacc])
87 # Found in GCJ: they expect the tokens to be defined before the user
88 # prologue, so that they can use the token definitions in it.
90 AT_BISON_OPTION_PUSHDEFS
91 AT_DATA_GRAMMAR([input.y],
93 ]AT_YYERROR_DECLARE_EXTERN[
94 ]AT_YYLEX_DECLARE_EXTERN[
103 # error "MY_TOKEN not defined."
111 AT_BISON_OPTION_POPDEFS
113 AT_BISON_CHECK([-y -o input.c input.y])
114 AT_COMPILE([input.o])
120 ## ---------------------------------------- ##
121 ## Early token definitions without --yacc. ##
122 ## ---------------------------------------- ##
125 AT_SETUP([Early token definitions without --yacc])
127 # Found in GCJ: they expect the tokens to be defined before the user
128 # prologue, so that they can use the token definitions in it.
130 AT_BISON_OPTION_PUSHDEFS
131 AT_DATA_GRAMMAR([input.y],
133 ]AT_YYERROR_DECLARE_EXTERN[
134 ]AT_YYLEX_DECLARE_EXTERN[
135 void print_my_token (void);
145 print_my_token (void)
147 enum yytokentype my_token = MY_TOKEN;
148 printf ("%d\n", my_token);
156 AT_BISON_OPTION_POPDEFS
158 AT_BISON_CHECK([-o input.c input.y])
159 AT_COMPILE([input.o])
165 ## ---------------- ##
166 ## Braces parsing. ##
167 ## ---------------- ##
170 AT_SETUP([Braces parsing])
172 AT_BISON_OPTION_PUSHDEFS
174 [[/* Bison used to swallow the character after '}'. */
177 exp: { tests = {{{{{{{{{{}}}}}}}}}}; };
180 AT_BISON_OPTION_POPDEFS
182 AT_BISON_CHECK([-v -o input.c input.y])
184 AT_CHECK([grep 'tests = {{{{{{{{{{}}}}}}}}}};' input.c], 0, [ignore])
189 ## ------------------ ##
190 ## Duplicate string. ##
191 ## ------------------ ##
194 AT_SETUP([Duplicate string])
196 AT_BISON_OPTION_PUSHDEFS
198 [[/* 'Bison -v' used to dump core when two tokens are defined with the same
199 string, as LE and GE below. */
206 exp: '(' exp ')' | NUM ;
209 AT_BISON_OPTION_POPDEFS
211 AT_BISON_CHECK([-v -o input.c input.y], 0, [],
212 [[input.y:6.8-14: warning: symbol "<=" used more than once as a literal string [-Wother]
218 ## ------------------- ##
219 ## Rule Line Numbers. ##
220 ## ------------------- ##
222 AT_SETUP([Rule Line Numbers])
224 AT_KEYWORDS([report])
226 AT_BISON_OPTION_PUSHDEFS
256 AT_BISON_OPTION_POPDEFS
258 AT_BISON_CHECK([-o input.c -v input.y])
260 # Check the contents of the report.
261 AT_CHECK([cat input.output], [],
275 Terminals, with rules where they appear
284 Nonterminals, with rules where they appear
289 on left: 2 4, on right: 0
291 on left: 1, on right: 2
293 on left: 3, on right: 4
298 0 $accept: . expr $end
300 'a' shift, and go to state 1
302 $default reduce using rule 3 ($@2)
310 2 expr: 'a' . $@1 'b'
312 $default reduce using rule 1 ($@1)
319 0 $accept: expr . $end
321 $end shift, and go to state 5
328 'c' shift, and go to state 6
333 2 expr: 'a' $@1 . 'b'
335 'b' shift, and go to state 7
340 0 $accept: expr $end .
349 $default reduce using rule 4 (expr)
354 2 expr: 'a' $@1 'b' .
356 $default reduce using rule 2 (expr)
363 ## ---------------------- ##
364 ## Mixing %token styles. ##
365 ## ---------------------- ##
368 AT_SETUP([Mixing %token styles])
370 # Taken from the documentation.
372 [[%token <operator> OR "||"
373 %token <operator> LE 134 "<="
380 AT_BISON_CHECK([-v -Wall -o input.c input.y], 0, [],
381 [[input.y:3.1-5: warning: useless precedence and associativity for "||" [-Wprecedence]
382 input.y:3.1-5: warning: useless precedence and associativity for "<=" [-Wprecedence]
389 ## ---------------- ##
390 ## Invalid inputs. ##
391 ## ---------------- ##
394 AT_SETUP([Invalid inputs])
406 AT_BISON_CHECK([input.y], [1], [],
407 [[input.y:2.1: error: invalid character: '?'
408 input.y:3.14: error: invalid character: '}'
409 input.y:4.1: error: invalid character: '%'
410 input.y:4.2: error: invalid character: '&'
411 input.y:5.1-17: error: invalid directive: '%a-does-not-exist'
412 input.y:6.1: error: invalid character: '%'
413 input.y:6.2: error: invalid character: '-'
414 input.y:7.1-8.0: error: missing '%}' at end of file
415 input.y:7.1-8.0: error: syntax error, unexpected %{...%}
421 AT_SETUP([Invalid inputs with {}])
433 AT_BISON_CHECK([input.y], [1], [],
434 [[input.y:3.1-15: error: syntax error, unexpected %initial-action, expecting {...}
441 ## ------------------- ##
442 ## Token definitions. ##
443 ## ------------------- ##
446 AT_SETUP([Token definitions])
448 AT_BISON_OPTION_PUSHDEFS
449 # Bison managed, when fed with '%token 'f' "f"' to #define 'f'!
450 AT_DATA_GRAMMAR([input.y],
456 %token MYEOF 0 "end of file"
461 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
462 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
464 exp: "a" "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!";
467 ]AT_YYLEX_DEFINE([{ SPECIAL }])[
470 AT_BISON_OPTION_POPDEFS
472 # Checking the warning message guarantees that the trigraph "??!" isn't
473 # unnecessarily escaped here even though it would need to be if encoded in a
474 # C-string literal. Also notice that unnecessary escaping, such as "\?", from
475 # the user specification is eliminated.
476 AT_BISON_CHECK([-o input.c input.y], [[0]], [[]],
477 [[input.y:22.8-14: warning: symbol SPECIAL redeclared [-Wother]
478 input.y:22.8-63: warning: symbol "\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!" used more than once as a literal string [-Wother]
480 AT_BISON_CHECK([-fcaret -o input.c input.y], [[0]], [[]],
481 [[input.y:22.8-14: warning: symbol SPECIAL redeclared [-Wother]
482 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
484 input.y:22.8-63: warning: symbol "\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!" used more than once as a literal string [-Wother]
485 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
486 ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
490 # Checking the error message here guarantees that yytname, which does contain
491 # C-string literals, does have the trigraph escaped correctly. Thus, the
492 # symbol name reported by the parser is exactly the same as that reported by
495 [[syntax error, unexpected "\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!", expecting a
497 AT_PARSER_CHECK([./input], 1, [], [experr])
502 ## -------------------- ##
503 ## Characters Escapes. ##
504 ## -------------------- ##
507 AT_SETUP([Characters Escapes])
509 AT_BISON_OPTION_PUSHDEFS
510 AT_DATA_GRAMMAR([input.y],
512 ]AT_YYERROR_DECLARE_EXTERN[
513 ]AT_YYLEX_DECLARE_EXTERN[
519 | '"' "'" /* Pacify font-lock-mode: ". */
523 AT_BISON_OPTION_POPDEFS
525 AT_BISON_CHECK([-o input.c input.y])
526 AT_COMPILE([input.o])
535 # The generation of the reduction was once wrong in Bison, and made it
536 # miss some reductions. In the following test case, the reduction on
537 # 'undef_id_tok' in state 1 was missing. This is stripped down from
538 # the actual web2c.y.
540 AT_SETUP([Web2c Report])
542 AT_KEYWORDS([report])
545 [[%token undef_id_tok const_id_tok
547 %start CONST_DEC_PART
556 | CONST_DEC_LIST CONST_DEC
560 { } undef_id_tok '=' const_id_tok ';'
565 AT_BISON_CHECK([-v input.y])
566 AT_CHECK([cat input.output], 0,
569 0 $accept: CONST_DEC_PART $end
571 1 CONST_DEC_PART: CONST_DEC_LIST
573 2 CONST_DEC_LIST: CONST_DEC
574 3 | CONST_DEC_LIST CONST_DEC
578 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';'
581 Terminals, with rules where they appear
591 Nonterminals, with rules where they appear
596 on left: 1, on right: 0
598 on left: 2 3, on right: 1 3
600 on left: 5, on right: 2 3
602 on left: 4, on right: 5
607 0 $accept: . CONST_DEC_PART $end
609 $default reduce using rule 4 ($@1)
611 CONST_DEC_PART go to state 1
612 CONST_DEC_LIST go to state 2
613 CONST_DEC go to state 3
619 0 $accept: CONST_DEC_PART . $end
621 $end shift, and go to state 5
626 1 CONST_DEC_PART: CONST_DEC_LIST .
627 3 CONST_DEC_LIST: CONST_DEC_LIST . CONST_DEC
629 undef_id_tok reduce using rule 4 ($@1)
630 $default reduce using rule 1 (CONST_DEC_PART)
632 CONST_DEC go to state 6
638 2 CONST_DEC_LIST: CONST_DEC .
640 $default reduce using rule 2 (CONST_DEC_LIST)
645 5 CONST_DEC: $@1 . undef_id_tok '=' const_id_tok ';'
647 undef_id_tok shift, and go to state 7
652 0 $accept: CONST_DEC_PART $end .
659 3 CONST_DEC_LIST: CONST_DEC_LIST CONST_DEC .
661 $default reduce using rule 3 (CONST_DEC_LIST)
666 5 CONST_DEC: $@1 undef_id_tok . '=' const_id_tok ';'
668 '=' shift, and go to state 8
673 5 CONST_DEC: $@1 undef_id_tok '=' . const_id_tok ';'
675 const_id_tok shift, and go to state 9
680 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok . ';'
682 ';' shift, and go to state 10
687 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';' .
689 $default reduce using rule 5 (CONST_DEC)
695 ## --------------- ##
697 ## --------------- ##
699 # The generation of the mapping 'state -> action' was once wrong in
700 # extremely specific situations. web2c.y exhibits this situation.
701 # Below is a stripped version of the grammar. It looks like one can
702 # simplify it further, but just don't: it is tuned to exhibit a bug,
703 # which disappears when applying sane grammar transformations.
705 # It used to be wrong on yydefact only:
707 # static const yytype_uint8 yydefact[] =
709 # - 2, 0, 1, 0, 0, 2, 3, 2, 5, 4,
710 # + 2, 0, 1, 0, 0, 0, 3, 2, 5, 4,
714 # but let's check all the tables.
717 AT_SETUP([Web2c Actions])
719 AT_KEYWORDS([report])
723 statement: struct_stat;
724 struct_stat: %empty | if else;
725 if: "if" "const" "then" statement;
726 else: "else" statement;
730 AT_BISON_CHECK([-v -o input.c input.y])
732 # Check only the tables.
733 [sed -n 's/ *$//;/^static const.*\[\] =/,/^}/p' input.c >tables.c]
735 AT_CHECK([[cat tables.c]], 0,
736 [[static const yytype_uint8 yytranslate[] =
738 0, 2, 2, 2, 2, 2, 2, 2, 2, 2,
739 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
740 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
741 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
742 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
743 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
744 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
745 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
746 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
747 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
748 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
749 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
750 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
751 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
752 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
753 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
754 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
755 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
756 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
757 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
758 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
759 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
760 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
761 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
762 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
763 2, 2, 2, 2, 2, 2, 1, 2, 3, 4,
766 static const yytype_uint8 yyrline[] =
770 static const char *const yytname[] =
772 "$end", "error", "$undefined", "\"if\"", "\"const\"", "\"then\"",
773 "\"else\"", "$accept", "statement", "struct_stat", "if", "else", YY_NULL
775 static const yytype_uint16 yytoknum[] =
777 0, 256, 257, 258, 259, 260, 261
779 static const yytype_int8 yypact[] =
781 -2, -1, 4, -8, 0, 2, -8, -2, -8, -2,
784 static const yytype_uint8 yydefact[] =
786 3, 0, 0, 2, 0, 0, 1, 3, 4, 3,
789 static const yytype_int8 yypgoto[] =
793 static const yytype_int8 yydefgoto[] =
797 static const yytype_uint8 yytable[] =
799 10, 1, 11, 5, 6, 0, 7, 9
801 static const yytype_int8 yycheck[] =
803 7, 3, 9, 4, 0, -1, 6, 5
805 static const yytype_uint8 yystos[] =
807 0, 3, 8, 9, 10, 4, 0, 6, 11, 5,
810 static const yytype_uint8 yyr1[] =
812 0, 7, 8, 9, 9, 10, 11
814 static const yytype_uint8 yyr2[] =
823 ## ------------------------- ##
824 ## yycheck Bound Violation. ##
825 ## ------------------------- ##
828 # _AT_DATA_DANCER_Y(BISON-OPTIONS)
829 # --------------------------------
830 # The following grammar, taken from Andrew Suffield's GPL'd implementation
831 # of DGMTP, the Dancer Generic Message Transport Protocol, used to violate
832 # yycheck's bounds when issuing a verbose error message. Keep this test
833 # so that bounds-checking compilers can check all the skeletons.
834 m4_define([_AT_DATA_DANCER_Y],
835 [AT_DATA_GRAMMAR([dancer.y],
842 %token ARROW INVALID NUMBER STRING DATA
845 /* Grammar follows */
850 header: '<' from ARROW to '>' type ':'
851 | '<' ARROW to '>' type ':'
885 ]AT_YYLEX_DEFINE([":"])[
888 ])# _AT_DATA_DANCER_Y
891 # AT_CHECK_DANCER(BISON-OPTIONS)
892 # ------------------------------
893 # Generate the grammar, compile it, run it.
894 m4_define([AT_CHECK_DANCER],
895 [AT_SETUP([Dancer $1])
896 AT_BISON_OPTION_PUSHDEFS([$1])
897 _AT_DATA_DANCER_Y([$1])
898 AT_FULL_COMPILE([dancer])
899 AT_PARSER_CHECK([./dancer], 1, [],
900 [syntax error, unexpected ':'
902 AT_BISON_OPTION_POPDEFS
907 AT_CHECK_DANCER([%glr-parser])
908 AT_CHECK_DANCER([%skeleton "lalr1.cc"])
911 ## ------------------------------------------ ##
912 ## Diagnostic that expects two alternatives. ##
913 ## ------------------------------------------ ##
916 # _AT_DATA_EXPECT2_Y(BISON-OPTIONS)
917 # --------------------------------
918 m4_define([_AT_DATA_EXPECT2_Y],
919 [AT_DATA_GRAMMAR([expect2.y],
921 static int yylex (AT_LALR1_CC_IF([int *], [void]));
922 AT_LALR1_CC_IF([[#include <cstdlib>]],
924 ]AT_YYERROR_DECLARE])[
946 return parser.parse ();
952 yylex (]AT_LALR1_CC_IF([int *lval], [void])[)
954 static int const tokens[] =
958 static size_t toknum;
959 ]AT_LALR1_CC_IF([*lval = 0; /* Pacify GCC. */])[
960 assert (toknum < sizeof tokens / sizeof *tokens);
961 return tokens[toknum++];
965 ])# _AT_DATA_EXPECT2_Y
968 # AT_CHECK_EXPECT2(BISON-OPTIONS)
969 # -------------------------------
970 # Generate the grammar, compile it, run it.
971 m4_define([AT_CHECK_EXPECT2],
972 [AT_SETUP([Expecting two tokens $1])
973 AT_BISON_OPTION_PUSHDEFS([$1])
974 _AT_DATA_EXPECT2_Y([$1])
975 AT_FULL_COMPILE([expect2])
976 AT_PARSER_CHECK([./expect2], 1, [],
977 [syntax error, unexpected '+', expecting A or B
979 AT_BISON_OPTION_POPDEFS
984 AT_CHECK_EXPECT2([%glr-parser])
985 AT_CHECK_EXPECT2([%skeleton "lalr1.cc"])
989 ## --------------------------------------------- ##
990 ## Braced code in declaration in rules section. ##
991 ## --------------------------------------------- ##
993 AT_SETUP([Braced code in declaration in rules section])
995 # Bison once mistook braced code in a declaration in the rules section to be a
997 AT_BISON_OPTION_PUSHDEFS([%debug])
998 AT_DATA_GRAMMAR([input.y],
1000 ]AT_YYERROR_DECLARE[
1009 printf ("Bison would once convert this action to a midrule because of the"
1010 " subsequent braced code.\n");
1014 %destructor { fprintf (stderr, "DESTRUCTOR\n"); } 'a';
1015 %printer { fprintf (yyoutput, "PRINTER"); } 'a';
1019 ]AT_YYLEX_DEFINE(["a"])[
1022 AT_BISON_OPTION_POPDEFS
1024 AT_BISON_CHECK([-o input.c input.y])
1026 AT_PARSER_CHECK([./input --debug], 1,
1027 [[Bison would once convert this action to a midrule because of the subsequent braced code.
1031 Reducing stack by rule 1 (line 20):
1032 -> $$ = nterm start ()
1035 Reading a token: Next token is token 'a' (PRINTER)
1036 syntax error, unexpected 'a', expecting $end
1037 Error: popping nterm start ()
1039 Cleanup: discarding lookahead token 'a' (PRINTER)
1048 ## --------------------------------- ##
1049 ## String alias declared after use. ##
1050 ## --------------------------------- ##
1052 AT_SETUP([String alias declared after use])
1054 # Bison once incorrectly asserted that the symbol number for either a token or
1055 # its alias was the highest symbol number so far at the point of the alias
1056 # declaration. That was true unless the declaration appeared after their first
1057 # uses and other tokens appeared in between.
1065 AT_BISON_CHECK([-o input.c input.y])
1071 ## -------------------------------- ##
1072 ## Extra lookahead sets in report. ##
1073 ## -------------------------------- ##
1075 AT_SETUP([[Extra lookahead sets in report]])
1077 # Bison prints each reduction's lookahead set only next to the associated
1078 # state's one item that (1) is associated with the same rule as the reduction
1079 # and (2) has its dot at the end of its RHS. Previously, Bison also
1080 # erroneously printed the lookahead set next to all of the state's other items
1081 # associated with the same rule. This bug affected only the '.output' file and
1082 # not the generated parser source code.
1084 AT_DATA([[input.y]],
1086 start: a | 'a' a 'a' ;
1090 AT_BISON_CHECK([[--report=all input.y]])
1091 AT_CHECK([[sed -n '/^State 1$/,/^State 2$/p' input.output]], [[0]],
1094 2 start: 'a' . a 'a'
1098 'a' shift, and go to state 4
1100 $default reduce using rule 3 (a)
1112 ## ---------------------------------------- ##
1113 ## Token number in precedence declaration. ##
1114 ## ---------------------------------------- ##
1116 AT_SETUP([[Token number in precedence declaration]])
1118 # POSIX says token numbers can be declared in %left, %right, and %nonassoc, but
1119 # we lost this in Bison 1.50.
1120 AT_BISON_OPTION_PUSHDEFS
1121 AT_DATA_GRAMMAR([input.y],
1123 ]AT_YYERROR_DECLARE[
1129 %left TK1 1 TK2 2 "tok alias" 3
1134 TK1 sr_conflict "tok alias"
1145 ]AT_YYLEX_DEFINE([{ 1, 2, 3, 0 }])[
1149 AT_BISON_CHECK([[-Wall -o input.c input.y]], [[0]],,
1150 [[input.y:24.5-19: warning: rule useless in parser due to conflicts [-Wother]
1151 input.y:28.5-19: warning: rule useless in parser due to conflicts [-Wother]
1152 input.y:18.1-5: warning: useless precedence and associativity for TK1 [-Wprecedence]
1154 AT_COMPILE([[input]])
1155 AT_PARSER_CHECK([[./input]])
1156 AT_BISON_OPTION_POPDEFS
1162 ## --------------------------- ##
1163 ## parse-gram.y: LALR = IELR. ##
1164 ## --------------------------- ##
1166 # If parse-gram.y's LALR and IELR parser tables ever begin to differ, we
1167 # need to fix parse-gram.y or start using IELR.
1169 AT_SETUP([[parse-gram.y: LALR = IELR]])
1171 # Avoid tests/bison's dark magic by processing a local copy of the
1172 # grammar. Avoid differences in synclines by telling bison that the
1173 # output files have the same name.
1174 [cp $abs_top_srcdir/src/parse-gram.y input.y]
1175 AT_BISON_CHECK([[-o input.c -Dlr.type=lalr input.y]])
1177 AT_CAPTURE_FILE([lalr.c])
1178 AT_BISON_CHECK([[-o input.c -Dlr.type=ielr input.y]])
1180 AT_CAPTURE_FILE([ielr.c])
1181 AT_CHECK([[diff lalr.c ielr.c]], [[0]])
1187 ## -------------------------------------------- ##
1188 ## parse.error=verbose and YYSTACK_USE_ALLOCA. ##
1189 ## -------------------------------------------- ##
1191 AT_SETUP([[parse.error=verbose and YYSTACK_USE_ALLOCA]])
1193 AT_BISON_OPTION_PUSHDEFS
1194 AT_DATA_GRAMMAR([input.y],
1196 ]AT_YYERROR_DECLARE[
1198 #define YYSTACK_USE_ALLOCA 1
1201 %define parse.error verbose
1205 start: check syntax_error syntax_error ;
1209 if (128 < sizeof yymsgbuf)
1212 "The initial size of yymsgbuf in yyparse has increased\n"
1213 "since this test group was last updated. As a result,\n"
1214 "this test group may no longer manage to induce a\n"
1215 "reallocation of the syntax error message buffer.\n"
1216 "This test group must be adjusted to produce a longer\n"
1217 "error message.\n");
1223 // Induce a syntax error message whose total length is more than
1224 // sizeof yymsgbuf in yyparse. Each token here is 64 bytes.
1226 "123456789112345678921234567893123456789412345678951234567896123A"
1227 | "123456789112345678921234567893123456789412345678951234567896123B"
1234 /* Induce two syntax error messages (which requires full error
1235 recovery by shifting 3 tokens) in order to detect any loss of the
1236 reallocated buffer. */
1237 ]AT_YYLEX_DEFINE(["abc"])[
1240 AT_BISON_OPTION_POPDEFS
1242 AT_BISON_CHECK([[-o input.c input.y]])
1243 AT_COMPILE([[input]])
1244 AT_PARSER_CHECK([[./input]], [[1]], [],
1245 [[syntax error, unexpected 'a', expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B
1246 syntax error, unexpected $end, expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B
1253 ## ------------------------------ ##
1254 ## parse.error=verbose overflow. ##
1255 ## ------------------------------ ##
1257 # Imagine the case where YYSTACK_ALLOC_MAXIMUM = YYSIZE_MAXIMUM and an
1258 # invocation of yysyntax_error has caused yymsg_alloc to grow to exactly
1259 # YYSTACK_ALLOC_MAXIMUM (perhaps because the normal doubling of size had
1260 # to be clipped to YYSTACK_ALLOC_MAXIMUM). In an old version of yacc.c,
1261 # a subsequent invocation of yysyntax_error that overflows during its
1262 # size calculation would return YYSIZE_MAXIMUM to yyparse. Then,
1263 # yyparse would invoke yyerror using the old contents of yymsg.
1265 AT_SETUP([[parse.error=verbose overflow]])
1267 AT_BISON_OPTION_PUSHDEFS
1268 AT_DATA_GRAMMAR([input.y],
1270 ]AT_YYERROR_DECLARE[
1273 /* This prevents this test case from having to induce error messages
1274 large enough to overflow size_t. */
1275 #define YYSIZE_T unsigned char
1277 /* Bring in malloc and set EXIT_SUCCESS so yacc.c doesn't try to
1278 provide a malloc prototype using our YYSIZE_T. */
1280 #ifndef EXIT_SUCCESS
1281 # define EXIT_SUCCESS 0
1284 /* Max depth is usually much smaller than YYSTACK_ALLOC_MAXIMUM, and
1285 we don't want gcc to warn everywhere this constant would be too big
1286 to make sense for our YYSIZE_T. */
1287 #define YYMAXDEPTH 100
1290 %define parse.error verbose
1294 start: syntax_error1 check syntax_error2 ;
1296 // Induce a syntax error message whose total length causes yymsg in
1297 // yyparse to be reallocated to size YYSTACK_ALLOC_MAXIMUM, which
1298 // should be 255. Each token here is 64 bytes.
1300 "123456789112345678921234567893123456789412345678951234567896123A"
1301 | "123456789112345678921234567893123456789412345678951234567896123B"
1302 | "123456789112345678921234567893123456789412345678951234567896123C"
1308 if (yymsg_alloc != YYSTACK_ALLOC_MAXIMUM
1309 || YYSTACK_ALLOC_MAXIMUM != YYSIZE_MAXIMUM
1310 || YYSIZE_MAXIMUM != 255)
1313 "The assumptions of this test group are no longer\n"
1314 "valid, so it may no longer catch the error it was\n"
1315 "designed to catch. Specifically, the following\n"
1316 "values should all be 255:\n\n");
1317 fprintf (stderr, " yymsg_alloc = %d\n", yymsg_alloc);
1318 fprintf (stderr, " YYSTACK_ALLOC_MAXIMUM = %d\n",
1319 YYSTACK_ALLOC_MAXIMUM);
1320 fprintf (stderr, " YYSIZE_MAXIMUM = %d\n", YYSIZE_MAXIMUM);
1328 "123456789112345678921234567893123456789412345678951234567896123A"
1329 | "123456789112345678921234567893123456789412345678951234567896123B"
1330 | "123456789112345678921234567893123456789412345678951234567896123C"
1331 | "123456789112345678921234567893123456789412345678951234567896123D"
1332 | "123456789112345678921234567893123456789412345678951234567896123E"
1338 /* Induce two syntax error messages (which requires full error
1339 recovery by shifting 3 tokens). */
1340 ]AT_YYLEX_DEFINE(["abc"])[
1344 /* Push parsers throw away the message buffer between tokens, so skip
1345 this test under maintainer-push-check. */
1352 AT_BISON_CHECK([[-o input.c input.y]])
1354 # gcc warns about tautologies and fallacies involving comparisons for
1355 # unsigned char. However, it doesn't produce these same warnings for
1356 # size_t and many other types when the warnings would seem to make just
1357 # as much sense. We ignore the warnings.
1358 [CFLAGS="$NO_WERROR_CFLAGS"]
1359 AT_COMPILE([[input]])
1361 AT_PARSER_CHECK([[./input]], [[2]], [],
1362 [[syntax error, unexpected 'a', expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B or 123456789112345678921234567893123456789412345678951234567896123C
1366 AT_BISON_OPTION_POPDEFS
1371 ## ------------------------ ##
1372 ## LAC: Exploratory stack. ##
1373 ## ------------------------ ##
1375 AT_SETUP([[LAC: Exploratory stack]])
1377 m4_pushdef([AT_LAC_CHECK], [
1379 AT_BISON_OPTION_PUSHDEFS([%debug $1])
1381 AT_DATA_GRAMMAR([input.y],
1383 ]AT_YYERROR_DECLARE[
1384 int yylex (]AT_PURE_IF([[YYSTYPE *]], [[void]])[);
1388 %define parse.error verbose
1393 // default reductions in inconsistent states
1394 // v v v v v v v v v v v v v v
1395 S: A B A A B A A A A B A A A A A A A B C C A A A A A A A A A A A A B ;
1399 A: 'a' | /*empty*/ { printf ("inconsistent default reduction\n"); } ;
1401 C: /*empty*/ { printf ("consistent default reduction\n"); } ;
1406 yylex (]AT_PURE_IF([[YYSTYPE *v]], [[void]])[)
1408 static char const *input = "bbbbc";]AT_PURE_IF([[
1416 AT_BISON_CHECK([[-Dparse.lac=full -Dparse.lac.es-capacity-initial=1 \
1417 -Dparse.lac.memory-trace=full \
1418 -o input.c input.y]], [[0]], [],
1419 [[input.y: warning: 21 shift/reduce conflicts [-Wconflicts-sr]
1421 AT_COMPILE([[input]])
1422 AT_PARSER_CHECK([[./input --debug > stdout.txt 2> stderr.txt]], [[1]])
1424 # Make sure syntax error doesn't forget that 'a' is expected. It would
1425 # be forgotten without lookahead correction.
1426 AT_CHECK([[grep 'syntax error,' stderr.txt]], [[0]],
1427 [[syntax error, unexpected 'c', expecting 'a' or 'b'
1430 # Check number of default reductions in inconsistent states to be sure
1431 # syntax error is detected before unnecessary reductions are performed.
1432 AT_CHECK([[$PERL -0777 -ne 'print s/inconsistent default reduction//g;' \
1433 < stdout.txt || exit 77]], [[0]], [[14]])
1435 # Check number of default reductions in consistent states to be sure
1436 # they are performed before the syntax error is detected.
1437 AT_CHECK([[$PERL -0777 -ne 'print s/\bconsistent default reduction//g;' \
1438 < stdout.txt || exit 77]], [[0]], [[2]])
1440 # Check number of reallocs to be sure reallocated memory isn't somehow
1441 # lost between LAC invocations.
1442 AT_CHECK([[$PERL -0777 -ne 'print s/\(realloc//g;' < stderr.txt \
1443 || exit 77]], [[0]], [[3]])
1445 AT_BISON_OPTION_POPDEFS
1448 AT_LAC_CHECK([[%define api.push-pull pull]])
1449 AT_LAC_CHECK([[%define api.push-pull pull %define api.pure]])
1450 AT_LAC_CHECK([[%define api.push-pull both]])
1451 AT_LAC_CHECK([[%define api.push-pull both %define api.pure]])
1453 m4_popdef([AT_LAC_CHECK])
1459 ## ------------------------ ##
1460 ## LAC: Memory exhaustion. ##
1461 ## ------------------------ ##
1463 AT_SETUP([[LAC: Memory exhaustion]])
1465 m4_pushdef([AT_LAC_CHECK],
1466 [AT_BISON_OPTION_PUSHDEFS([%debug])
1467 AT_DATA_GRAMMAR([input.y],
1469 ]AT_YYERROR_DECLARE[
1471 #define YYMAXDEPTH 8
1478 S: A A A A A A A A A ;
1479 A: /*empty*/ | 'a' ;
1483 ]AT_YYLEX_DEFINE(["$1"])[
1487 AT_BISON_CHECK([[-Dparse.lac=full -Dparse.lac.es-capacity-initial=1 \
1488 -o input.c input.y]], [[0]], [],
1489 [[input.y: warning: 8 shift/reduce conflicts [-Wconflicts-sr]
1491 AT_COMPILE([[input]])
1492 AT_BISON_OPTION_POPDEFS
1495 # Check for memory exhaustion during parsing.
1497 AT_PARSER_CHECK([[./input --debug]], [[2]], [],
1500 Reading a token: Now at end of input.
1501 LAC: initial context established for $end
1502 LAC: checking lookahead $end: R2 G3 R2 G5 R2 G6 R2 G7 R2 G8 R2 G9 R2 G10 R2 G11 R2 (max size exceeded)
1504 Cleanup: discarding lookahead token $end ()
1508 # Induce an immediate syntax error with an undefined token, and check
1509 # for memory exhaustion while building syntax error message.
1510 AT_LAC_CHECK([z], [[0]])
1511 AT_PARSER_CHECK([[./input --debug]], [[2]], [],
1514 Reading a token: Next token is token $undefined ()
1515 LAC: initial context established for $undefined
1516 LAC: checking lookahead $undefined: Always Err
1517 Constructing syntax error message
1518 LAC: checking lookahead $end: R2 G3 R2 G5 R2 G6 R2 G7 R2 G8 R2 G9 R2 G10 R2 G11 R2 (max size exceeded)
1521 Cleanup: discarding lookahead token $undefined ()
1525 m4_popdef([AT_LAC_CHECK])
1530 ## ---------------------- ##
1531 ## Lex and parse params. ##
1532 ## ---------------------- ##
1536 # Check that the identifier of the params is properly fetched
1537 # even when there are trailing blanks.
1539 m4_pushdef([AT_TEST],
1540 [AT_SETUP([[Lex and parse params: $1]])
1542 ## FIXME: Improve parsing of parse-param.
1543 AT_BISON_OPTION_PUSHDEFS([%locations %skeleton "$1" %parse-param { int x } %parse-param { int y }])
1545 AT_DATA_GRAMMAR([input.y],
1548 %union { int ival; }
1549 %parse-param { int x }
1550 // Spaces, tabs, and new lines.
1558 ]AT_YYERROR_DECLARE[
1563 exp: 'a' { fprintf (stdout, "x: %d, y: %d\n", x, y); };
1566 ]AT_YYLEX_DEFINE(["a"])[
1570 yyparse (int x, int y)
1572 yy::parser parser(x, y);
1573 return parser.parse ();
1580 return yyparse(1, 2);
1584 AT_FULL_COMPILE([input])
1585 AT_PARSER_CHECK([./input], 0, [[x: 1, y: 2
1587 AT_BISON_OPTION_POPDEFS
1592 ## FIXME: test Java, and iterate over skeletons.
1598 m4_popdef([AT_TEST])
1601 ## ----------------------- ##
1602 ## stdio.h is not needed. ##
1603 ## ----------------------- ##
1605 # At some point, by accident, yy_location_print_ was using fprintf and
1606 # FILE which are from stdio.h, which we do not require.
1607 AT_SETUP([[stdio.h is not needed]])
1609 AT_BISON_OPTION_PUSHDEFS
1611 AT_DATA_GRAMMAR([input.y],
1615 static int yylex (void) { return 0; }
1616 static void yyerror (const char* msg) { (void) msg; }
1624 AT_FULL_COMPILE([input])
1626 AT_BISON_OPTION_POPDEFS