1 # Bison Regressions. -*- Autotest -*-
3 # Copyright (C) 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009,
4 # 2010 Free Software Foundation, Inc.
6 # This program is free software: you can redistribute it and/or modify
7 # it under the terms of the GNU General Public License as published by
8 # the Free Software Foundation, either version 3 of the License, or
9 # (at your option) any later version.
11 # This program is distributed in the hope that it will be useful,
12 # but WITHOUT ANY WARRANTY; without even the implied warranty of
13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 # GNU General Public License for more details.
16 # You should have received a copy of the GNU General Public License
17 # along with this program. If not, see <http://www.gnu.org/licenses/>.
19 AT_BANNER([[Regression tests.]])
22 ## ------------------ ##
23 ## Trivial grammars. ##
24 ## ------------------ ##
26 AT_SETUP([Trivial grammars])
28 AT_DATA_GRAMMAR([input.y],
30 void yyerror (char const *);
42 AT_BISON_CHECK([-o input.c input.y])
43 AT_COMPILE([input.o], [-c input.c])
44 AT_COMPILE([input.o], [-DYYDEBUG -c input.c])
50 ## ----------------- ##
51 ## YYSTYPE typedef. ##
52 ## ----------------- ##
54 AT_SETUP([YYSTYPE typedef])
56 AT_DATA_GRAMMAR([input.y],
58 void yyerror (char const *);
60 typedef union { char const *val; } YYSTYPE;
67 program: { $$ = ""; };
70 AT_BISON_CHECK([-o input.c input.y])
71 AT_COMPILE([input.o], [-c input.c])
77 ## ------------------------------------- ##
78 ## Early token definitions with --yacc. ##
79 ## ------------------------------------- ##
82 AT_SETUP([Early token definitions with --yacc])
84 # Found in GCJ: they expect the tokens to be defined before the user
85 # prologue, so that they can use the token definitions in it.
87 AT_DATA_GRAMMAR([input.y],
89 void yyerror (const char *s);
99 # error "MY_TOKEN not defined."
108 AT_BISON_CHECK([-y -o input.c input.y])
109 AT_COMPILE([input.o], [-c input.c])
115 ## ---------------------------------------- ##
116 ## Early token definitions without --yacc. ##
117 ## ---------------------------------------- ##
120 AT_SETUP([Early token definitions without --yacc])
122 # Found in GCJ: they expect the tokens to be defined before the user
123 # prologue, so that they can use the token definitions in it.
125 AT_DATA_GRAMMAR([input.y],
128 void yyerror (const char *s);
130 void print_my_token (void);
139 print_my_token (void)
141 enum yytokentype my_token = MY_TOKEN;
142 printf ("%d\n", my_token);
151 AT_BISON_CHECK([-o input.c input.y])
152 AT_COMPILE([input.o], [-c input.c])
158 ## ---------------- ##
159 ## Braces parsing. ##
160 ## ---------------- ##
163 AT_SETUP([Braces parsing])
166 [[/* Bison used to swallow the character after `}'. */
169 exp: { tests = {{{{{{{{{{}}}}}}}}}}; };
173 AT_BISON_CHECK([-v -o input.c input.y])
175 AT_CHECK([grep 'tests = {{{{{{{{{{}}}}}}}}}};' input.c], 0, [ignore])
180 ## ------------------ ##
181 ## Duplicate string. ##
182 ## ------------------ ##
185 AT_SETUP([Duplicate string])
188 [[/* `Bison -v' used to dump core when two tokens are defined with the same
189 string, as LE and GE below. */
196 exp: '(' exp ')' | NUM ;
200 AT_BISON_CHECK([-v -o input.c input.y], 0, [],
201 [[input.y:6.8-14: warning: symbol `"<="' used more than once as a literal string
207 ## ------------------- ##
208 ## Rule Line Numbers. ##
209 ## ------------------- ##
211 AT_SETUP([Rule Line Numbers])
213 AT_KEYWORDS([report])
245 AT_BISON_CHECK([-o input.c -v input.y])
247 # Check the contents of the report.
248 AT_CHECK([cat input.output], [],
262 Terminals, with rules where they appear
271 Nonterminals, with rules where they appear
276 on left: 2 4, on right: 0
278 on left: 1, on right: 2
280 on left: 3, on right: 4
285 0 $accept: . expr $end
287 'a' shift, and go to state 1
289 $default reduce using rule 3 ($@2)
297 2 expr: 'a' . $@1 'b'
299 $default reduce using rule 1 ($@1)
306 0 $accept: expr . $end
308 $end shift, and go to state 5
315 'c' shift, and go to state 6
320 2 expr: 'a' $@1 . 'b'
322 'b' shift, and go to state 7
327 0 $accept: expr $end .
336 $default reduce using rule 4 (expr)
341 2 expr: 'a' $@1 'b' .
343 $default reduce using rule 2 (expr)
350 ## ---------------------- ##
351 ## Mixing %token styles. ##
352 ## ---------------------- ##
355 AT_SETUP([Mixing %token styles])
357 # Taken from the documentation.
359 [[%token <operator> OR "||"
360 %token <operator> LE 134 "<="
367 AT_BISON_CHECK([-v -o input.c input.y])
373 ## ---------------- ##
374 ## Invalid inputs. ##
375 ## ---------------- ##
378 AT_SETUP([Invalid inputs])
390 AT_BISON_CHECK([input.y], [1], [],
391 [[input.y:2.1: invalid character: `?'
392 input.y:3.14: invalid character: `}'
393 input.y:4.1: invalid character: `%'
394 input.y:4.2: invalid character: `&'
395 input.y:5.1-17: invalid directive: `%a-does-not-exist'
396 input.y:6.1-2: invalid directive: `%-'
397 input.y:7.1-8.0: missing `%}' at end of file
398 input.y:7.1-8.0: syntax error, unexpected %{...%}
404 AT_SETUP([Invalid inputs with {}])
416 AT_BISON_CHECK([input.y], [1], [],
417 [[input.y:3.1-15: syntax error, unexpected %initial-action, expecting {...}
424 ## ------------------- ##
425 ## Token definitions. ##
426 ## ------------------- ##
429 AT_SETUP([Token definitions])
431 # Bison managed, when fed with `%token 'f' "f"' to #define 'f'!
432 AT_DATA_GRAMMAR([input.y],
436 void yyerror (const char *s);
440 %token MYEOF 0 "end of file"
445 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
446 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
448 exp: "a" "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!";
451 yyerror (char const *s)
453 fprintf (stderr, "%s\n", s);
472 # Checking the warning message guarantees that the trigraph "??!" isn't
473 # unnecessarily escaped here even though it would need to be if encoded in a
474 # C-string literal. Also notice that unnecessary escaping, such as "\?", from
475 # the user specification is eliminated.
476 AT_BISON_CHECK([-o input.c input.y], [[0]], [[]],
477 [[input.y:22.8-14: warning: symbol SPECIAL redeclared
478 input.y:22.8-63: warning: symbol `"\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!"' used more than once as a literal string
482 # Checking the error message here guarantees that yytname, which does contain
483 # C-string literals, does have the trigraph escaped correctly. Thus, the
484 # symbol name reported by the parser is exactly the same as that reported by
487 [[syntax error, unexpected "\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!", expecting a
489 AT_PARSER_CHECK([./input], 1, [], [experr])
494 ## -------------------- ##
495 ## Characters Escapes. ##
496 ## -------------------- ##
499 AT_SETUP([Characters Escapes])
501 AT_DATA_GRAMMAR([input.y],
503 void yyerror (const char *s);
513 # Pacify font-lock-mode: "
515 AT_BISON_CHECK([-o input.c input.y])
516 AT_COMPILE([input.o], [-c input.c])
525 # The generation of the reduction was once wrong in Bison, and made it
526 # miss some reductions. In the following test case, the reduction on
527 # `undef_id_tok' in state 1 was missing. This is stripped down from
528 # the actual web2c.y.
530 AT_SETUP([Web2c Report])
532 AT_KEYWORDS([report])
535 [[%token undef_id_tok const_id_tok
537 %start CONST_DEC_PART
546 | CONST_DEC_LIST CONST_DEC
550 { } undef_id_tok '=' const_id_tok ';'
555 AT_BISON_CHECK([-v input.y])
556 AT_CHECK([cat input.output], 0,
559 0 $accept: CONST_DEC_PART $end
561 1 CONST_DEC_PART: CONST_DEC_LIST
563 2 CONST_DEC_LIST: CONST_DEC
564 3 | CONST_DEC_LIST CONST_DEC
568 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';'
571 Terminals, with rules where they appear
581 Nonterminals, with rules where they appear
586 on left: 1, on right: 0
588 on left: 2 3, on right: 1 3
590 on left: 5, on right: 2 3
592 on left: 4, on right: 5
597 0 $accept: . CONST_DEC_PART $end
599 $default reduce using rule 4 ($@1)
601 CONST_DEC_PART go to state 1
602 CONST_DEC_LIST go to state 2
603 CONST_DEC go to state 3
609 0 $accept: CONST_DEC_PART . $end
611 $end shift, and go to state 5
616 1 CONST_DEC_PART: CONST_DEC_LIST .
617 3 CONST_DEC_LIST: CONST_DEC_LIST . CONST_DEC
619 undef_id_tok reduce using rule 4 ($@1)
620 $default reduce using rule 1 (CONST_DEC_PART)
622 CONST_DEC go to state 6
628 2 CONST_DEC_LIST: CONST_DEC .
630 $default reduce using rule 2 (CONST_DEC_LIST)
635 5 CONST_DEC: $@1 . undef_id_tok '=' const_id_tok ';'
637 undef_id_tok shift, and go to state 7
642 0 $accept: CONST_DEC_PART $end .
649 3 CONST_DEC_LIST: CONST_DEC_LIST CONST_DEC .
651 $default reduce using rule 3 (CONST_DEC_LIST)
656 5 CONST_DEC: $@1 undef_id_tok . '=' const_id_tok ';'
658 '=' shift, and go to state 8
663 5 CONST_DEC: $@1 undef_id_tok '=' . const_id_tok ';'
665 const_id_tok shift, and go to state 9
670 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok . ';'
672 ';' shift, and go to state 10
677 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';' .
679 $default reduce using rule 5 (CONST_DEC)
685 ## --------------- ##
687 ## --------------- ##
689 # The generation of the mapping `state -> action' was once wrong in
690 # extremely specific situations. web2c.y exhibits this situation.
691 # Below is a stripped version of the grammar. It looks like one can
692 # simplify it further, but just don't: it is tuned to exhibit a bug,
693 # which disappears when applying sane grammar transformations.
695 # It used to be wrong on yydefact only:
697 # static const yytype_uint8 yydefact[] =
699 # - 2, 0, 1, 0, 0, 2, 3, 2, 5, 4,
700 # + 2, 0, 1, 0, 0, 0, 3, 2, 5, 4,
704 # but let's check all the tables.
707 AT_SETUP([Web2c Actions])
709 AT_KEYWORDS([report])
713 statement: struct_stat;
714 struct_stat: /* empty. */ | if else;
715 if: "if" "const" "then" statement;
716 else: "else" statement;
720 AT_BISON_CHECK([-v -o input.c input.y])
722 # Check only the tables.
723 [sed -n 's/ *$//;/^static const.*\[\] =/,/^}/p' input.c >tables.c]
725 AT_CHECK([[cat tables.c]], 0,
726 [[static const yytype_uint8 yytranslate[] =
728 0, 2, 2, 2, 2, 2, 2, 2, 2, 2,
729 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
730 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
731 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
732 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
733 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
734 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
735 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
736 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
737 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
738 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
739 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
740 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
741 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
742 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
743 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
744 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
745 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
746 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
747 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
748 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
749 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
750 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
751 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
752 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
753 2, 2, 2, 2, 2, 2, 1, 2, 3, 4,
756 static const yytype_uint8 yyrline[] =
760 static const char *const yytname[] =
762 "$end", "error", "$undefined", "\"if\"", "\"const\"", "\"then\"",
763 "\"else\"", "$accept", "statement", "struct_stat", "if", "else", 0
765 static const yytype_uint16 yytoknum[] =
767 0, 256, 257, 258, 259, 260, 261
769 static const yytype_int8 yypact[] =
771 -2, -1, 4, -8, 0, 2, -8, -2, -8, -2,
774 static const yytype_uint8 yydefact[] =
776 3, 0, 0, 2, 0, 0, 1, 3, 4, 3,
779 static const yytype_int8 yypgoto[] =
783 static const yytype_int8 yydefgoto[] =
787 static const yytype_uint8 yytable[] =
789 10, 1, 11, 5, 6, 0, 7, 9
791 static const yytype_int8 yycheck[] =
793 7, 3, 9, 4, 0, -1, 6, 5
795 static const yytype_uint8 yystos[] =
797 0, 3, 8, 9, 10, 4, 0, 6, 11, 5,
800 static const yytype_uint8 yyr1[] =
802 0, 7, 8, 9, 9, 10, 11
804 static const yytype_uint8 yyr2[] =
813 ## ------------------------- ##
814 ## yycheck Bound Violation. ##
815 ## ------------------------- ##
818 # _AT_DATA_DANCER_Y(BISON-OPTIONS)
819 # --------------------------------
820 # The following grammar, taken from Andrew Suffield's GPL'd implementation
821 # of DGMTP, the Dancer Generic Message Transport Protocol, used to violate
822 # yycheck's bounds when issuing a verbose error message. Keep this test
823 # so that any bounds-checking compilers can check all the skeletons.
824 m4_define([_AT_DATA_DANCER_Y],
825 [AT_DATA_GRAMMAR([dancer.y],
827 static int yylex (AT_LALR1_CC_IF([int *], [void]));
828 AT_LALR1_CC_IF([#include <cstdlib>],
831 static void yyerror (const char *);])
834 %token ARROW INVALID NUMBER STRING DATA
838 /* Grammar follows */
843 header: '<' from ARROW to '>' type ':'
844 | '<' ARROW to '>' type ':'
878 [/* A C++ error reporting function. */
880 yy::parser::error (const std::string& m)
882 std::cerr << m << std::endl;
890 parser.set_debug_level (YYDEBUG);
892 return parser.parse ();
896 yyerror (const char *s)
898 fprintf (stderr, "%s\n", s);
902 yylex (AT_LALR1_CC_IF([int *lval], [void]))
904 static int const tokens[] =
908 static size_t toknum;
909 ]AT_LALR1_CC_IF([*lval = 0; /* Pacify GCC. */])[
910 if (! (toknum < sizeof tokens / sizeof *tokens))
912 return tokens[toknum++];
921 ])# _AT_DATA_DANCER_Y
924 # AT_CHECK_DANCER(BISON-OPTIONS)
925 # ------------------------------
926 # Generate the grammar, compile it, run it.
927 m4_define([AT_CHECK_DANCER],
928 [AT_SETUP([Dancer $1])
929 AT_BISON_OPTION_PUSHDEFS([$1])
930 _AT_DATA_DANCER_Y([$1])
931 AT_BISON_CHECK([-o dancer.c dancer.y])
932 AT_FULL_COMPILE([dancer])
933 AT_PARSER_CHECK([./dancer], 1, [],
934 [syntax error, unexpected ':'
936 AT_BISON_OPTION_POPDEFS
941 AT_CHECK_DANCER([%glr-parser])
942 AT_CHECK_DANCER([%skeleton "lalr1.cc"])
945 ## ------------------------------------------ ##
946 ## Diagnostic that expects two alternatives. ##
947 ## ------------------------------------------ ##
950 # _AT_DATA_EXPECT2_Y(BISON-OPTIONS)
951 # ---------------------------------
952 m4_define([_AT_DATA_EXPECT2_Y],
953 [AT_DATA_GRAMMAR([expect2.y],
955 static int yylex (AT_LALR1_CC_IF([int *], [void]));
956 AT_LALR1_CC_IF([#include <cstdlib>],
959 static void yyerror (const char *);])
977 [/* A C++ error reporting function. */
979 yy::parser::error (const std::string& m)
981 std::cerr << m << std::endl;
988 return parser.parse ();
992 yyerror (const char *s)
994 fprintf (stderr, "%s\n", s);
998 yylex (AT_LALR1_CC_IF([int *lval], [void]))
1000 static int const tokens[] =
1004 static size_t toknum;
1005 ]AT_LALR1_CC_IF([*lval = 0; /* Pacify GCC. */])[
1006 if (! (toknum < sizeof tokens / sizeof *tokens))
1008 return tokens[toknum++];
1017 ])# _AT_DATA_EXPECT2_Y
1020 # AT_CHECK_EXPECT2(BISON-OPTIONS)
1021 # -------------------------------
1022 # Generate the grammar, compile it, run it.
1023 m4_define([AT_CHECK_EXPECT2],
1024 [AT_SETUP([Expecting two tokens $1])
1025 AT_BISON_OPTION_PUSHDEFS([$1])
1026 _AT_DATA_EXPECT2_Y([$1])
1027 AT_BISON_CHECK([-o expect2.c expect2.y])
1028 AT_FULL_COMPILE([expect2])
1029 AT_PARSER_CHECK([./expect2], 1, [],
1030 [syntax error, unexpected '+', expecting A or B
1032 AT_BISON_OPTION_POPDEFS
1037 AT_CHECK_EXPECT2([%glr-parser])
1038 AT_CHECK_EXPECT2([%skeleton "lalr1.cc"])
1042 ## --------------------------------------------- ##
1043 ## Braced code in declaration in rules section. ##
1044 ## --------------------------------------------- ##
1046 AT_SETUP([Braced code in declaration in rules section])
1048 # Bison once mistook braced code in a declaration in the rules section to be a
1051 AT_DATA_GRAMMAR([input.y],
1054 static void yyerror (char const *msg);
1055 static int yylex (void);
1064 printf ("Bison would once convert this action to a midrule because of the"
1065 " subsequent braced code.\n");
1069 %destructor { fprintf (stderr, "DESTRUCTOR\n"); } 'a';
1070 %printer { fprintf (yyoutput, "PRINTER"); } 'a';
1075 yyerror (char const *msg)
1077 fprintf (stderr, "%s\n", msg);
1094 AT_BISON_CHECK([-t -o input.c input.y])
1096 AT_PARSER_CHECK([./input], 0,
1097 [[Bison would once convert this action to a midrule because of the subsequent braced code.
1101 Reducing stack by rule 1 (line 20):
1102 -> $$ = nterm start ()
1105 Reading a token: Next token is token 'a' (PRINTER)
1106 syntax error, unexpected 'a', expecting $end
1107 Error: popping nterm start ()
1109 Cleanup: discarding lookahead token 'a' (PRINTER)
1118 ## --------------------------------- ##
1119 ## String alias declared after use. ##
1120 ## --------------------------------- ##
1122 AT_SETUP([String alias declared after use])
1124 # Bison once incorrectly asserted that the symbol number for either a token or
1125 # its alias was the highest symbol number so far at the point of the alias
1126 # declaration. That was true unless the declaration appeared after their first
1127 # uses and other tokens appeared in between.
1135 AT_BISON_CHECK([-t -o input.c input.y])
1141 ## -------------------------------- ##
1142 ## Extra lookahead sets in report. ##
1143 ## -------------------------------- ##
1145 AT_SETUP([[Extra lookahead sets in report]])
1147 # Bison prints each reduction's lookahead set only next to the associated
1148 # state's one item that (1) is associated with the same rule as the reduction
1149 # and (2) has its dot at the end of its RHS. Previously, Bison also
1150 # erroneously printed the lookahead set next to all of the state's other items
1151 # associated with the same rule. This bug affected only the `.output' file and
1152 # not the generated parser source code.
1154 AT_DATA([[input.y]],
1156 start: a | 'a' a 'a' ;
1160 AT_BISON_CHECK([[--report=all input.y]])
1161 AT_CHECK([[sed -n '/^state 1$/,/^state 2$/p' input.output]], [[0]],
1164 2 start: 'a' . a 'a'
1168 'a' shift, and go to state 4
1170 $default reduce using rule 3 (a)
1182 ## ---------------------------------------- ##
1183 ## Token number in precedence declaration. ##
1184 ## ---------------------------------------- ##
1186 AT_SETUP([[Token number in precedence declaration]])
1188 # POSIX says token numbers can be declared in %left, %right, and %nonassoc, but
1189 # we lost this in Bison 1.50.
1191 AT_DATA_GRAMMAR([input.y],
1194 void yyerror (char const *);
1199 %left TK1 1 TK2 2 "tok alias" 3
1203 start: TK1 sr_conflict "tok alias" ;
1213 yyerror (char const *msg)
1215 fprintf (stderr, "%s\n", msg);
1221 static int const input[] = { 1, 2, 3, 0 };
1222 static int const *inputp = input;
1233 AT_BISON_CHECK([[-o input.c input.y]], [[0]],,
1234 [[input.y:24.5-19: warning: rule useless in parser due to conflicts: sr_conflict: TK2 "tok alias"
1236 AT_COMPILE([[input]])
1237 AT_PARSER_CHECK([[./input]])
1243 ## --------------------------- ##
1244 ## parse-gram.y: LALR = IELR. ##
1245 ## --------------------------- ##
1247 # If parse-gram.y's LALR and IELR parser tables ever begin to differ, we
1248 # need to fix parse-gram.y or start using IELR.
1250 AT_SETUP([[parse-gram.y: LALR = IELR]])
1252 # Avoid tests/bison's dark magic by processing a local copy of the
1253 # grammar. Avoid differences in synclines by telling bison that the
1254 # output files have the same name.
1255 [cp $abs_top_srcdir/src/parse-gram.y input.y]
1256 AT_BISON_CHECK([[-o input.c -Dlr.type=lalr input.y]])
1258 AT_BISON_CHECK([[-o input.c -Dlr.type=ielr input.y]])
1260 AT_CHECK([[diff -u lalr.c ielr.c]])
1266 ## -------------------------------------------- ##
1267 ## parse.error=verbose and YYSTACK_USE_ALLOCA. ##
1268 ## -------------------------------------------- ##
1270 AT_SETUP([[parse.error=verbose and YYSTACK_USE_ALLOCA]])
1272 AT_DATA_GRAMMAR([input.y],
1275 void yyerror (char const *);
1277 #define YYSTACK_USE_ALLOCA 1
1280 %define parse.error verbose
1284 start: check syntax_error syntax_error ;
1288 if (128 < sizeof yymsgbuf)
1291 "The initial size of yymsgbuf in yyparse has increased\n"
1292 "since this test group was last updated. As a result,\n"
1293 "this test group may no longer manage to induce a\n"
1294 "reallocation of the syntax error message buffer.\n"
1295 "This test group must be adjusted to produce a longer\n"
1296 "error message.\n");
1302 // Induce a syntax error message whose total length is more than
1303 // sizeof yymsgbuf in yyparse. Each token here is 64 bytes.
1305 "123456789112345678921234567893123456789412345678951234567896123A"
1306 | "123456789112345678921234567893123456789412345678951234567896123B"
1313 yyerror (char const *msg)
1315 fprintf (stderr, "%s\n", msg);
1321 /* Induce two syntax error messages (which requires full error
1322 recovery by shifting 3 tokens) in order to detect any loss of the
1323 reallocated buffer. */
1324 static char const *input = "abc";
1335 AT_BISON_CHECK([[-o input.c input.y]])
1336 AT_COMPILE([[input]])
1337 AT_PARSER_CHECK([[./input]], [[1]], [],
1338 [[syntax error, unexpected 'a', expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B
1339 syntax error, unexpected $end, expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B
1346 ## ------------------------------ ##
1347 ## parse.error=verbose overflow. ##
1348 ## ------------------------------ ##
1350 # Imagine the case where YYSTACK_ALLOC_MAXIMUM = YYSIZE_MAXIMUM and an
1351 # invocation of yysyntax_error has caused yymsg_alloc to grow to exactly
1352 # YYSTACK_ALLOC_MAXIMUM (perhaps because the normal doubling of size had
1353 # to be clipped to YYSTACK_ALLOC_MAXIMUM). In an old version of yacc.c,
1354 # a subsequent invocation of yysyntax_error that overflows during its
1355 # size calculation would return YYSIZE_MAXIMUM to yyparse. Then,
1356 # yyparse would invoke yyerror using the old contents of yymsg.
1358 AT_SETUP([[parse.error=verbose overflow]])
1360 AT_DATA_GRAMMAR([input.y],
1363 void yyerror (char const *);
1366 /* This prevents this test case from having to induce error messages
1367 large enough to overflow size_t. */
1368 #define YYSIZE_T unsigned char
1370 /* Bring in malloc and set EXIT_SUCCESS so yacc.c doesn't try to
1371 provide a malloc prototype using our YYSIZE_T. */
1373 #ifndef EXIT_SUCCESS
1374 # define EXIT_SUCCESS 0
1377 /* Max depth is usually much smaller than YYSTACK_ALLOC_MAXIMUM, and
1378 we don't want gcc to warn everywhere this constant would be too big
1379 to make sense for our YYSIZE_T. */
1380 #define YYMAXDEPTH 100
1383 %define parse.error verbose
1387 start: syntax_error1 check syntax_error2 ;
1389 // Induce a syntax error message whose total length causes yymsg in
1390 // yyparse to be reallocated to size YYSTACK_ALLOC_MAXIMUM, which
1391 // should be 255. Each token here is 64 bytes.
1393 "123456789112345678921234567893123456789412345678951234567896123A"
1394 | "123456789112345678921234567893123456789412345678951234567896123B"
1395 | "123456789112345678921234567893123456789412345678951234567896123C"
1401 if (yymsg_alloc != YYSTACK_ALLOC_MAXIMUM
1402 || YYSTACK_ALLOC_MAXIMUM != YYSIZE_MAXIMUM
1403 || YYSIZE_MAXIMUM != 255)
1406 "The assumptions of this test group are no longer\n"
1407 "valid, so it may no longer catch the error it was\n"
1408 "designed to catch. Specifically, the following\n"
1409 "values should all be 255:\n\n");
1410 fprintf (stderr, " yymsg_alloc = %d\n", yymsg_alloc);
1411 fprintf (stderr, " YYSTACK_ALLOC_MAXIMUM = %d\n",
1412 YYSTACK_ALLOC_MAXIMUM);
1413 fprintf (stderr, " YYSIZE_MAXIMUM = %d\n", YYSIZE_MAXIMUM);
1421 "123456789112345678921234567893123456789412345678951234567896123A"
1422 | "123456789112345678921234567893123456789412345678951234567896123B"
1423 | "123456789112345678921234567893123456789412345678951234567896123C"
1424 | "123456789112345678921234567893123456789412345678951234567896123D"
1425 | "123456789112345678921234567893123456789412345678951234567896123E"
1431 yyerror (char const *msg)
1433 fprintf (stderr, "%s\n", msg);
1439 /* Induce two syntax error messages (which requires full error
1440 recovery by shifting 3 tokens). */
1441 static char const *input = "abc";
1448 /* Push parsers throw away the message buffer between tokens, so skip
1449 this test under maintainer-push-check. */
1456 AT_BISON_CHECK([[-o input.c input.y]])
1458 # gcc warns about tautologies and fallacies involving comparisons for
1459 # unsigned char. However, it doesn't produce these same warnings for
1460 # size_t and many other types when the warnings would seem to make just
1461 # as much sense. We ignore the warnings.
1462 [CFLAGS="$NO_WERROR_CFLAGS"]
1463 AT_COMPILE([[input]])
1465 AT_PARSER_CHECK([[./input]], [[2]], [],
1466 [[syntax error, unexpected 'a', expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B or 123456789112345678921234567893123456789412345678951234567896123C
1475 ## ------------------------ ##
1476 ## LAC: Exploratory stack. ##
1477 ## ------------------------ ##
1479 AT_SETUP([[LAC: Exploratory stack]])
1481 m4_pushdef([AT_LAC_CHECK], [
1483 AT_BISON_OPTION_PUSHDEFS([$1])
1485 AT_DATA_GRAMMAR([input.y],
1488 void yyerror (char const *);
1489 int yylex (]AT_PURE_IF([[YYSTYPE *]], [[void]])[);
1493 %define parse.error verbose
1498 // default reductions in inconsistent states
1499 // v v v v v v v v v v v v v v
1500 S: A B A A B A A A A B A A A A A A A B C C A A A A A A A A A A A A B ;
1504 A: 'a' | /*empty*/ { printf ("inconsistent default reduction\n"); } ;
1506 C: /*empty*/ { printf ("consistent default reduction\n"); } ;
1511 yyerror (char const *msg)
1513 fprintf (stderr, "%s\n", msg);
1517 yylex (]AT_PURE_IF([[YYSTYPE *v]], [[void]])[)
1519 static char const *input = "bbbbc";]AT_PURE_IF([[
1532 AT_BISON_CHECK([[-Dparse.lac=full -Dparse.lac.es-capacity-initial=1 \
1533 -Dparse.lac.memory-trace=full \
1534 -t -o input.c input.y]], [[0]], [],
1535 [[input.y: conflicts: 21 shift/reduce
1537 AT_COMPILE([[input]])
1538 AT_PARSER_CHECK([[./input > stdout.txt 2> stderr.txt]], [[1]])
1540 # Make sure syntax error doesn't forget that 'a' is expected. It would
1541 # be forgotten without lookahead correction.
1542 AT_CHECK([[grep 'syntax error,' stderr.txt]], [[0]],
1543 [[syntax error, unexpected 'c', expecting 'a' or 'b'
1546 # Check number of default reductions in inconsistent states to be sure
1547 # syntax error is detected before unnecessary reductions are performed.
1548 AT_CHECK([[perl -0777 -ne 'print s/inconsistent default reduction//g;' \
1549 < stdout.txt || exit 77]], [[0]], [[14]])
1551 # Check number of default reductions in consistent states to be sure
1552 # they are performed before the syntax error is detected.
1553 AT_CHECK([[perl -0777 -ne 'print s/\bconsistent default reduction//g;' \
1554 < stdout.txt || exit 77]], [[0]], [[2]])
1556 # Check number of reallocs to be sure reallocated memory isn't somehow
1557 # lost between LAC invocations.
1558 AT_CHECK([[perl -0777 -ne 'print s/\(realloc//g;' < stderr.txt \
1559 || exit 77]], [[0]], [[3]])
1561 AT_BISON_OPTION_POPDEFS
1564 AT_LAC_CHECK([[%define api.push-pull pull]])
1565 AT_LAC_CHECK([[%define api.push-pull pull %define api.pure]])
1566 AT_LAC_CHECK([[%define api.push-pull both]])
1567 AT_LAC_CHECK([[%define api.push-pull both %define api.pure]])
1569 m4_popdef([AT_LAC_CHECK])
1575 ## ------------------------ ##
1576 ## LAC: Memory exhaustion. ##
1577 ## ------------------------ ##
1579 AT_SETUP([[LAC: Memory exhaustion]])
1581 m4_pushdef([AT_LAC_CHECK], [
1583 AT_DATA_GRAMMAR([input.y],
1586 void yyerror (char const *);
1588 #define YYMAXDEPTH 8
1595 S: A A A A A A A A A ;
1596 A: /*empty*/ | 'a' ;
1601 yyerror (char const *msg)
1603 fprintf (stderr, "%s\n", msg);
1609 static char const *input = "]$1[";
1621 AT_BISON_CHECK([[-Dparse.lac=full -Dparse.lac.es-capacity-initial=1 \
1622 -t -o input.c input.y]], [[0]], [],
1623 [[input.y: conflicts: 8 shift/reduce
1625 AT_COMPILE([[input]])
1629 # Check for memory exhaustion during parsing.
1631 AT_PARSER_CHECK([[./input]], [[2]], [[]],
1634 Reading a token: Now at end of input.
1635 LAC: initial context established for $end
1636 LAC: checking lookahead $end: R2 G3 R2 G5 R2 G6 R2 G7 R2 G8 R2 G9 R2 G10 R2 G11 R2 (max size exceeded)
1638 Cleanup: discarding lookahead token $end ()
1642 # Induce an immediate syntax error with an undefined token, and check
1643 # for memory exhaustion while building syntax error message.
1644 AT_LAC_CHECK([[z]], [[0]])
1645 AT_PARSER_CHECK([[./input]], [[2]], [[]],
1648 Reading a token: Next token is token $undefined ()
1649 LAC: initial context established for $undefined
1650 LAC: checking lookahead $undefined: Always Err
1651 Constructing syntax error message
1652 LAC: checking lookahead $end: R2 G3 R2 G5 R2 G6 R2 G7 R2 G8 R2 G9 R2 G10 R2 G11 R2 (max size exceeded)
1655 Cleanup: discarding lookahead token $undefined ()
1659 m4_popdef([AT_LAC_CHECK])