]>
Commit | Line | Data |
---|---|---|
342b8b6e | 1 | # Bison Regressions. -*- Autotest -*- |
d42cf844 | 2 | |
6e30ede8 PE |
3 | # Copyright (C) 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, |
4 | # 2010 Free Software Foundation, Inc. | |
c95f2d78 | 5 | |
f16b0819 | 6 | # This program is free software: you can redistribute it and/or modify |
342b8b6e | 7 | # it under the terms of the GNU General Public License as published by |
f16b0819 PE |
8 | # the Free Software Foundation, either version 3 of the License, or |
9 | # (at your option) any later version. | |
10 | # | |
342b8b6e AD |
11 | # This program is distributed in the hope that it will be useful, |
12 | # but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 | # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
14 | # GNU General Public License for more details. | |
f16b0819 | 15 | # |
342b8b6e | 16 | # You should have received a copy of the GNU General Public License |
f16b0819 | 17 | # along with this program. If not, see <http://www.gnu.org/licenses/>. |
c95f2d78 | 18 | |
342b8b6e | 19 | AT_BANNER([[Regression tests.]]) |
c95f2d78 | 20 | |
2b25d624 | 21 | |
276f48df PE |
22 | ## ------------------ ## |
23 | ## Trivial grammars. ## | |
24 | ## ------------------ ## | |
25 | ||
26 | AT_SETUP([Trivial grammars]) | |
27 | ||
28 | AT_DATA_GRAMMAR([input.y], | |
29 | [[%{ | |
30 | void yyerror (char const *); | |
31 | int yylex (void); | |
50cce58e | 32 | #define YYSTYPE int * |
276f48df PE |
33 | %} |
34 | ||
35 | %error-verbose | |
36 | ||
37 | %% | |
38 | ||
39 | program: 'x'; | |
40 | ]]) | |
41 | ||
da730230 | 42 | AT_BISON_CHECK([-o input.c input.y]) |
276f48df | 43 | AT_COMPILE([input.o], [-c input.c]) |
50cce58e | 44 | AT_COMPILE([input.o], [-DYYDEBUG -c input.c]) |
276f48df PE |
45 | |
46 | AT_CLEANUP | |
47 | ||
48 | ||
49 | ||
ddc8ede1 PE |
50 | ## ----------------- ## |
51 | ## YYSTYPE typedef. ## | |
52 | ## ----------------- ## | |
53 | ||
54 | AT_SETUP([YYSTYPE typedef]) | |
55 | ||
56 | AT_DATA_GRAMMAR([input.y], | |
57 | [[%{ | |
58 | void yyerror (char const *); | |
59 | int yylex (void); | |
60 | typedef union { char const *val; } YYSTYPE; | |
61 | %} | |
62 | ||
63 | %type <val> program | |
64 | ||
65 | %% | |
66 | ||
67 | program: { $$ = ""; }; | |
68 | ]]) | |
69 | ||
da730230 | 70 | AT_BISON_CHECK([-o input.c input.y]) |
ddc8ede1 PE |
71 | AT_COMPILE([input.o], [-c input.c]) |
72 | ||
73 | AT_CLEANUP | |
74 | ||
75 | ||
76 | ||
b931235e JD |
77 | ## ------------------------------------- ## |
78 | ## Early token definitions with --yacc. ## | |
79 | ## ------------------------------------- ## | |
69078d4b AD |
80 | |
81 | ||
b931235e | 82 | AT_SETUP([Early token definitions with --yacc]) |
69078d4b AD |
83 | |
84 | # Found in GCJ: they expect the tokens to be defined before the user | |
85 | # prologue, so that they can use the token definitions in it. | |
86 | ||
9501dc6e | 87 | AT_DATA_GRAMMAR([input.y], |
69078d4b AD |
88 | [[%{ |
89 | void yyerror (const char *s); | |
90 | int yylex (void); | |
91 | %} | |
92 | ||
93 | %union | |
94 | { | |
95 | int val; | |
96 | }; | |
9bc0dd67 JD |
97 | %{ |
98 | #ifndef MY_TOKEN | |
99 | # error "MY_TOKEN not defined." | |
100 | #endif | |
101 | %} | |
b931235e JD |
102 | %token MY_TOKEN |
103 | %% | |
104 | exp: MY_TOKEN; | |
105 | %% | |
106 | ]]) | |
107 | ||
da730230 | 108 | AT_BISON_CHECK([-y -o input.c input.y]) |
b931235e JD |
109 | AT_COMPILE([input.o], [-c input.c]) |
110 | ||
111 | AT_CLEANUP | |
112 | ||
113 | ||
114 | ||
115 | ## ---------------------------------------- ## | |
116 | ## Early token definitions without --yacc. ## | |
117 | ## ---------------------------------------- ## | |
118 | ||
119 | ||
120 | AT_SETUP([Early token definitions without --yacc]) | |
121 | ||
122 | # Found in GCJ: they expect the tokens to be defined before the user | |
123 | # prologue, so that they can use the token definitions in it. | |
124 | ||
125 | AT_DATA_GRAMMAR([input.y], | |
126 | [[%{ | |
127 | #include <stdio.h> | |
128 | void yyerror (const char *s); | |
129 | int yylex (void); | |
130 | void print_my_token (void); | |
9bc0dd67 JD |
131 | %} |
132 | ||
133 | %union | |
134 | { | |
135 | int val; | |
136 | }; | |
137 | %{ | |
b931235e JD |
138 | void |
139 | print_my_token (void) | |
140 | { | |
141 | enum yytokentype my_token = MY_TOKEN; | |
142 | printf ("%d\n", my_token); | |
143 | } | |
69078d4b AD |
144 | %} |
145 | %token MY_TOKEN | |
146 | %% | |
147 | exp: MY_TOKEN; | |
148 | %% | |
149 | ]]) | |
150 | ||
da730230 | 151 | AT_BISON_CHECK([-o input.c input.y]) |
002b9b7d | 152 | AT_COMPILE([input.o], [-c input.c]) |
69078d4b AD |
153 | |
154 | AT_CLEANUP | |
155 | ||
156 | ||
157 | ||
2b25d624 AD |
158 | ## ---------------- ## |
159 | ## Braces parsing. ## | |
160 | ## ---------------- ## | |
161 | ||
162 | ||
69078d4b | 163 | AT_SETUP([Braces parsing]) |
2b25d624 AD |
164 | |
165 | AT_DATA([input.y], | |
166 | [[/* Bison used to swallow the character after `}'. */ | |
167 | ||
168 | %% | |
bfcf1f3a | 169 | exp: { tests = {{{{{{{{{{}}}}}}}}}}; }; |
2b25d624 AD |
170 | %% |
171 | ]]) | |
172 | ||
da730230 | 173 | AT_BISON_CHECK([-v -o input.c input.y]) |
2b25d624 | 174 | |
a4bf0390 | 175 | AT_CHECK([grep 'tests = {{{{{{{{{{}}}}}}}}}};' input.c], 0, [ignore]) |
2b25d624 AD |
176 | |
177 | AT_CLEANUP | |
178 | ||
179 | ||
c95f2d78 AD |
180 | ## ------------------ ## |
181 | ## Duplicate string. ## | |
182 | ## ------------------ ## | |
183 | ||
184 | ||
185 | AT_SETUP([Duplicate string]) | |
186 | ||
f499b062 | 187 | AT_DATA([input.y], |
c95f2d78 AD |
188 | [[/* `Bison -v' used to dump core when two tokens are defined with the same |
189 | string, as LE and GE below. */ | |
190 | ||
191 | %token NUM | |
192 | %token LE "<=" | |
193 | %token GE "<=" | |
194 | ||
195 | %% | |
196 | exp: '(' exp ')' | NUM ; | |
197 | %% | |
198 | ]]) | |
199 | ||
da730230 | 200 | AT_BISON_CHECK([-v -o input.c input.y], 0, [], |
a5d50994 | 201 | [[input.y:6.8-14: warning: symbol `"<="' used more than once as a literal string |
69078d4b | 202 | ]]) |
c95f2d78 | 203 | |
d803322e | 204 | AT_CLEANUP |
c95f2d78 AD |
205 | |
206 | ||
2ca209c1 AD |
207 | ## ------------------- ## |
208 | ## Rule Line Numbers. ## | |
209 | ## ------------------- ## | |
210 | ||
211 | AT_SETUP([Rule Line Numbers]) | |
212 | ||
6b98e4b5 AD |
213 | AT_KEYWORDS([report]) |
214 | ||
2ca209c1 AD |
215 | AT_DATA([input.y], |
216 | [[%% | |
217 | expr: | |
218 | 'a' | |
219 | ||
220 | { | |
221 | ||
222 | } | |
223 | ||
224 | 'b' | |
225 | ||
226 | { | |
227 | ||
228 | } | |
229 | ||
230 | | | |
231 | ||
232 | ||
233 | { | |
234 | ||
235 | ||
236 | } | |
237 | ||
238 | 'c' | |
239 | ||
240 | { | |
241 | ||
bfcf1f3a | 242 | }; |
2ca209c1 AD |
243 | ]]) |
244 | ||
da730230 | 245 | AT_BISON_CHECK([-o input.c -v input.y]) |
2ca209c1 AD |
246 | |
247 | # Check the contents of the report. | |
248 | AT_CHECK([cat input.output], [], | |
d2d1b42b | 249 | [[Grammar |
2ca209c1 | 250 | |
88bce5a2 | 251 | 0 $accept: expr $end |
6b98e4b5 | 252 | |
f91b1629 | 253 | 1 $@1: /* empty */ |
6b98e4b5 | 254 | |
f91b1629 | 255 | 2 expr: 'a' $@1 'b' |
6b98e4b5 | 256 | |
f91b1629 | 257 | 3 $@2: /* empty */ |
6b98e4b5 | 258 | |
f91b1629 | 259 | 4 expr: $@2 'c' |
2ca209c1 | 260 | |
d2d1b42b | 261 | |
2ca209c1 AD |
262 | Terminals, with rules where they appear |
263 | ||
88bce5a2 | 264 | $end (0) 0 |
2ca209c1 AD |
265 | 'a' (97) 2 |
266 | 'b' (98) 2 | |
267 | 'c' (99) 4 | |
268 | error (256) | |
269 | ||
d2d1b42b | 270 | |
2ca209c1 AD |
271 | Nonterminals, with rules where they appear |
272 | ||
88bce5a2 | 273 | $accept (6) |
b365aa05 AD |
274 | on left: 0 |
275 | expr (7) | |
276 | on left: 2 4, on right: 0 | |
f91b1629 | 277 | $@1 (8) |
2ca209c1 | 278 | on left: 1, on right: 2 |
f91b1629 | 279 | $@2 (9) |
2ca209c1 AD |
280 | on left: 3, on right: 4 |
281 | ||
282 | ||
283 | state 0 | |
284 | ||
88bce5a2 | 285 | 0 $accept: . expr $end |
643a5994 | 286 | |
87675353 | 287 | 'a' shift, and go to state 1 |
2ca209c1 | 288 | |
f91b1629 | 289 | $default reduce using rule 3 ($@2) |
2ca209c1 | 290 | |
87675353 | 291 | expr go to state 2 |
f91b1629 | 292 | $@2 go to state 3 |
2ca209c1 AD |
293 | |
294 | ||
295 | state 1 | |
296 | ||
f91b1629 | 297 | 2 expr: 'a' . $@1 'b' |
2ca209c1 | 298 | |
f91b1629 | 299 | $default reduce using rule 1 ($@1) |
2ca209c1 | 300 | |
f91b1629 | 301 | $@1 go to state 4 |
2ca209c1 AD |
302 | |
303 | ||
304 | state 2 | |
305 | ||
88bce5a2 | 306 | 0 $accept: expr . $end |
2ca209c1 | 307 | |
88bce5a2 | 308 | $end shift, and go to state 5 |
2ca209c1 AD |
309 | |
310 | ||
311 | state 3 | |
312 | ||
f91b1629 | 313 | 4 expr: $@2 . 'c' |
2ca209c1 | 314 | |
87675353 | 315 | 'c' shift, and go to state 6 |
2ca209c1 AD |
316 | |
317 | ||
318 | state 4 | |
319 | ||
f91b1629 | 320 | 2 expr: 'a' $@1 . 'b' |
2ca209c1 | 321 | |
87675353 | 322 | 'b' shift, and go to state 7 |
2ca209c1 AD |
323 | |
324 | ||
325 | state 5 | |
326 | ||
88bce5a2 | 327 | 0 $accept: expr $end . |
2ca209c1 | 328 | |
e8832397 | 329 | $default accept |
2ca209c1 AD |
330 | |
331 | ||
332 | state 6 | |
333 | ||
f91b1629 | 334 | 4 expr: $@2 'c' . |
b365aa05 | 335 | |
87675353 | 336 | $default reduce using rule 4 (expr) |
2ca209c1 AD |
337 | |
338 | ||
339 | state 7 | |
340 | ||
f91b1629 | 341 | 2 expr: 'a' $@1 'b' . |
b365aa05 | 342 | |
87675353 | 343 | $default reduce using rule 2 (expr) |
2ca209c1 AD |
344 | ]]) |
345 | ||
346 | AT_CLEANUP | |
347 | ||
348 | ||
349 | ||
cd5aafcf AD |
350 | ## ---------------------- ## |
351 | ## Mixing %token styles. ## | |
352 | ## ---------------------- ## | |
353 | ||
354 | ||
355 | AT_SETUP([Mixing %token styles]) | |
356 | ||
357 | # Taken from the documentation. | |
358 | AT_DATA([input.y], | |
359 | [[%token <operator> OR "||" | |
360 | %token <operator> LE 134 "<=" | |
361 | %left OR "<=" | |
362 | %% | |
363 | exp: ; | |
364 | %% | |
365 | ]]) | |
366 | ||
da730230 | 367 | AT_BISON_CHECK([-v -o input.c input.y]) |
cd5aafcf | 368 | |
d803322e | 369 | AT_CLEANUP |
cd5aafcf AD |
370 | |
371 | ||
372 | ||
29ae55f1 AD |
373 | ## ---------------- ## |
374 | ## Invalid inputs. ## | |
375 | ## ---------------- ## | |
561f9a30 AD |
376 | |
377 | ||
29ae55f1 | 378 | AT_SETUP([Invalid inputs]) |
561f9a30 AD |
379 | |
380 | AT_DATA([input.y], | |
381 | [[%% | |
382 | ? | |
561f9a30 | 383 | default: 'a' } |
29ae55f1 | 384 | %& |
2dfbfc12 | 385 | %a-does-not-exist |
29ae55f1 | 386 | %- |
e9955c83 | 387 | %{ |
561f9a30 AD |
388 | ]]) |
389 | ||
da730230 | 390 | AT_BISON_CHECK([input.y], [1], [], |
e9955c83 AD |
391 | [[input.y:2.1: invalid character: `?' |
392 | input.y:3.14: invalid character: `}' | |
393 | input.y:4.1: invalid character: `%' | |
394 | input.y:4.2: invalid character: `&' | |
2dfbfc12 | 395 | input.y:5.1-17: invalid directive: `%a-does-not-exist' |
c046698e | 396 | input.y:6.1-2: invalid directive: `%-' |
2115939b | 397 | input.y:7.1-8.0: missing `%}' at end of file |
47aee066 | 398 | input.y:7.1-8.0: syntax error, unexpected %{...%} |
e0c40012 | 399 | ]]) |
561f9a30 AD |
400 | |
401 | AT_CLEANUP | |
402 | ||
403 | ||
fc01665e PE |
404 | AT_SETUP([Invalid inputs with {}]) |
405 | ||
406 | AT_DATA([input.y], | |
407 | [[ | |
408 | %destructor | |
409 | %initial-action | |
410 | %lex-param | |
411 | %parse-param | |
412 | %printer | |
413 | %union | |
414 | ]]) | |
415 | ||
da730230 | 416 | AT_BISON_CHECK([input.y], [1], [], |
e9071366 | 417 | [[input.y:3.1-15: syntax error, unexpected %initial-action, expecting {...} |
fc01665e PE |
418 | ]]) |
419 | ||
420 | AT_CLEANUP | |
421 | ||
422 | ||
270a173c | 423 | |
b87f8b21 AD |
424 | ## ------------------- ## |
425 | ## Token definitions. ## | |
426 | ## ------------------- ## | |
427 | ||
428 | ||
429 | AT_SETUP([Token definitions]) | |
430 | ||
431 | # Bison managed, when fed with `%token 'f' "f"' to #define 'f'! | |
9501dc6e | 432 | AT_DATA_GRAMMAR([input.y], |
db7c8e9a | 433 | [%{ |
cf806753 | 434 | #include <stdlib.h> |
ca407bdf | 435 | #include <stdio.h> |
db7c8e9a AD |
436 | void yyerror (const char *s); |
437 | int yylex (void); | |
438 | %} | |
ca407bdf PE |
439 | [%error-verbose |
440 | %token MYEOF 0 "end of file" | |
b87f8b21 | 441 | %token 'a' "a" |
4f136612 PE |
442 | %token B_TOKEN "b" |
443 | %token C_TOKEN 'c' | |
444 | %token 'd' D_TOKEN | |
3d54b576 | 445 | %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!" |
1cfe6375 | 446 | %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!" |
b87f8b21 | 447 | %% |
3d54b576 | 448 | exp: "a" "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"; |
ca407bdf PE |
449 | %% |
450 | void | |
451 | yyerror (char const *s) | |
452 | { | |
453 | fprintf (stderr, "%s\n", s); | |
454 | } | |
455 | ||
456 | int | |
457 | yylex (void) | |
458 | { | |
cf806753 PE |
459 | static int called; |
460 | if (called++) | |
461 | abort (); | |
ca407bdf PE |
462 | return SPECIAL; |
463 | } | |
464 | ||
465 | int | |
466 | main (void) | |
467 | { | |
468 | return yyparse (); | |
469 | } | |
b87f8b21 AD |
470 | ]]) |
471 | ||
1cfe6375 JD |
472 | # Checking the warning message guarantees that the trigraph "??!" isn't |
473 | # unnecessarily escaped here even though it would need to be if encoded in a | |
474 | # C-string literal. Also notice that unnecessary escaping, such as "\?", from | |
475 | # the user specification is eliminated. | |
476 | AT_BISON_CHECK([-o input.c input.y], [[0]], [[]], | |
477 | [[input.y:22.8-14: warning: symbol SPECIAL redeclared | |
478 | input.y:22.8-63: warning: symbol `"\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!"' used more than once as a literal string | |
479 | ]]) | |
ca407bdf | 480 | AT_COMPILE([input]) |
1cfe6375 JD |
481 | |
482 | # Checking the error message here guarantees that yytname, which does contain | |
483 | # C-string literals, does have the trigraph escaped correctly. Thus, the | |
484 | # symbol name reported by the parser is exactly the same as that reported by | |
485 | # Bison itself. | |
3d54b576 | 486 | AT_DATA([experr], |
1cfe6375 | 487 | [[syntax error, unexpected "\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!", expecting a |
3d54b576 PE |
488 | ]]) |
489 | AT_PARSER_CHECK([./input], 1, [], [experr]) | |
b87f8b21 AD |
490 | AT_CLEANUP |
491 | ||
492 | ||
493 | ||
eb714592 AD |
494 | ## -------------------- ## |
495 | ## Characters Escapes. ## | |
496 | ## -------------------- ## | |
497 | ||
498 | ||
499 | AT_SETUP([Characters Escapes]) | |
500 | ||
9501dc6e | 501 | AT_DATA_GRAMMAR([input.y], |
eb714592 AD |
502 | [%{ |
503 | void yyerror (const char *s); | |
504 | int yylex (void); | |
505 | %} | |
6d0ef4ec | 506 | [%% |
eb714592 AD |
507 | exp: |
508 | '\'' "\'" | |
509 | | '\"' "\"" | |
510 | | '"' "'" | |
511 | ; | |
512 | ]]) | |
9501dc6e | 513 | # Pacify font-lock-mode: " |
eb714592 | 514 | |
da730230 | 515 | AT_BISON_CHECK([-o input.c input.y]) |
eb714592 AD |
516 | AT_COMPILE([input.o], [-c input.c]) |
517 | AT_CLEANUP | |
518 | ||
519 | ||
520 | ||
b9752825 AD |
521 | ## -------------- ## |
522 | ## Web2c Report. ## | |
523 | ## -------------- ## | |
776209d6 AD |
524 | |
525 | # The generation of the reduction was once wrong in Bison, and made it | |
526 | # miss some reductions. In the following test case, the reduction on | |
527 | # `undef_id_tok' in state 1 was missing. This is stripped down from | |
528 | # the actual web2c.y. | |
529 | ||
b9752825 | 530 | AT_SETUP([Web2c Report]) |
776209d6 | 531 | |
6b98e4b5 AD |
532 | AT_KEYWORDS([report]) |
533 | ||
776209d6 AD |
534 | AT_DATA([input.y], |
535 | [[%token undef_id_tok const_id_tok | |
536 | ||
537 | %start CONST_DEC_PART | |
538 | \f | |
539 | %% | |
540 | CONST_DEC_PART: | |
541 | CONST_DEC_LIST | |
542 | ; | |
543 | ||
544 | CONST_DEC_LIST: | |
545 | CONST_DEC | |
546 | | CONST_DEC_LIST CONST_DEC | |
547 | ; | |
548 | ||
549 | CONST_DEC: | |
550 | { } undef_id_tok '=' const_id_tok ';' | |
551 | ; | |
552 | %% | |
776209d6 AD |
553 | ]]) |
554 | ||
da730230 | 555 | AT_BISON_CHECK([-v input.y]) |
87675353 | 556 | AT_CHECK([cat input.output], 0, |
776209d6 | 557 | [[Grammar |
87675353 | 558 | |
88bce5a2 | 559 | 0 $accept: CONST_DEC_PART $end |
87675353 | 560 | |
6b98e4b5 | 561 | 1 CONST_DEC_PART: CONST_DEC_LIST |
87675353 | 562 | |
6b98e4b5 AD |
563 | 2 CONST_DEC_LIST: CONST_DEC |
564 | 3 | CONST_DEC_LIST CONST_DEC | |
87675353 | 565 | |
f91b1629 | 566 | 4 $@1: /* empty */ |
87675353 | 567 | |
f91b1629 | 568 | 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';' |
87675353 AD |
569 | |
570 | ||
776209d6 | 571 | Terminals, with rules where they appear |
87675353 | 572 | |
88bce5a2 | 573 | $end (0) 0 |
776209d6 AD |
574 | ';' (59) 5 |
575 | '=' (61) 5 | |
576 | error (256) | |
007a50a4 AD |
577 | undef_id_tok (258) 5 |
578 | const_id_tok (259) 5 | |
87675353 AD |
579 | |
580 | ||
776209d6 | 581 | Nonterminals, with rules where they appear |
87675353 | 582 | |
88bce5a2 | 583 | $accept (7) |
78d5bae9 AD |
584 | on left: 0 |
585 | CONST_DEC_PART (8) | |
586 | on left: 1, on right: 0 | |
587 | CONST_DEC_LIST (9) | |
776209d6 | 588 | on left: 2 3, on right: 1 3 |
78d5bae9 | 589 | CONST_DEC (10) |
776209d6 | 590 | on left: 5, on right: 2 3 |
f91b1629 | 591 | $@1 (11) |
776209d6 | 592 | on left: 4, on right: 5 |
87675353 AD |
593 | |
594 | ||
776209d6 | 595 | state 0 |
87675353 | 596 | |
88bce5a2 | 597 | 0 $accept: . CONST_DEC_PART $end |
87675353 | 598 | |
f91b1629 | 599 | $default reduce using rule 4 ($@1) |
87675353 AD |
600 | |
601 | CONST_DEC_PART go to state 1 | |
602 | CONST_DEC_LIST go to state 2 | |
603 | CONST_DEC go to state 3 | |
f91b1629 | 604 | $@1 go to state 4 |
87675353 AD |
605 | |
606 | ||
776209d6 | 607 | state 1 |
87675353 | 608 | |
88bce5a2 | 609 | 0 $accept: CONST_DEC_PART . $end |
87675353 | 610 | |
88bce5a2 | 611 | $end shift, and go to state 5 |
87675353 AD |
612 | |
613 | ||
78d5bae9 | 614 | state 2 |
87675353 | 615 | |
ce4ccb4b AD |
616 | 1 CONST_DEC_PART: CONST_DEC_LIST . |
617 | 3 CONST_DEC_LIST: CONST_DEC_LIST . CONST_DEC | |
87675353 | 618 | |
f91b1629 | 619 | undef_id_tok reduce using rule 4 ($@1) |
87675353 AD |
620 | $default reduce using rule 1 (CONST_DEC_PART) |
621 | ||
622 | CONST_DEC go to state 6 | |
f91b1629 | 623 | $@1 go to state 4 |
87675353 AD |
624 | |
625 | ||
78d5bae9 | 626 | state 3 |
87675353 | 627 | |
ce4ccb4b | 628 | 2 CONST_DEC_LIST: CONST_DEC . |
87675353 AD |
629 | |
630 | $default reduce using rule 2 (CONST_DEC_LIST) | |
631 | ||
632 | ||
776209d6 | 633 | state 4 |
87675353 | 634 | |
f91b1629 | 635 | 5 CONST_DEC: $@1 . undef_id_tok '=' const_id_tok ';' |
87675353 AD |
636 | |
637 | undef_id_tok shift, and go to state 7 | |
638 | ||
639 | ||
78d5bae9 | 640 | state 5 |
87675353 | 641 | |
88bce5a2 | 642 | 0 $accept: CONST_DEC_PART $end . |
87675353 | 643 | |
e8832397 | 644 | $default accept |
87675353 AD |
645 | |
646 | ||
78d5bae9 | 647 | state 6 |
87675353 | 648 | |
ce4ccb4b | 649 | 3 CONST_DEC_LIST: CONST_DEC_LIST CONST_DEC . |
87675353 AD |
650 | |
651 | $default reduce using rule 3 (CONST_DEC_LIST) | |
652 | ||
653 | ||
78d5bae9 | 654 | state 7 |
87675353 | 655 | |
f91b1629 | 656 | 5 CONST_DEC: $@1 undef_id_tok . '=' const_id_tok ';' |
87675353 AD |
657 | |
658 | '=' shift, and go to state 8 | |
659 | ||
660 | ||
78d5bae9 | 661 | state 8 |
87675353 | 662 | |
f91b1629 | 663 | 5 CONST_DEC: $@1 undef_id_tok '=' . const_id_tok ';' |
87675353 AD |
664 | |
665 | const_id_tok shift, and go to state 9 | |
666 | ||
667 | ||
78d5bae9 | 668 | state 9 |
87675353 | 669 | |
f91b1629 | 670 | 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok . ';' |
87675353 AD |
671 | |
672 | ';' shift, and go to state 10 | |
673 | ||
674 | ||
78d5bae9 | 675 | state 10 |
87675353 | 676 | |
f91b1629 | 677 | 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';' . |
87675353 AD |
678 | |
679 | $default reduce using rule 5 (CONST_DEC) | |
776209d6 AD |
680 | ]]) |
681 | ||
682 | AT_CLEANUP | |
b9752825 AD |
683 | |
684 | ||
685 | ## --------------- ## | |
686 | ## Web2c Actions. ## | |
687 | ## --------------- ## | |
688 | ||
689 | # The generation of the mapping `state -> action' was once wrong in | |
690 | # extremely specific situations. web2c.y exhibits this situation. | |
691 | # Below is a stripped version of the grammar. It looks like one can | |
692 | # simplify it further, but just don't: it is tuned to exhibit a bug, | |
693 | # which disappears when applying sane grammar transformations. | |
694 | # | |
695 | # It used to be wrong on yydefact only: | |
696 | # | |
d42cf844 | 697 | # static const yytype_uint8 yydefact[] = |
b9752825 AD |
698 | # { |
699 | # - 2, 0, 1, 0, 0, 2, 3, 2, 5, 4, | |
700 | # + 2, 0, 1, 0, 0, 0, 3, 2, 5, 4, | |
701 | # 0, 0 | |
702 | # }; | |
703 | # | |
704 | # but let's check all the tables. | |
705 | ||
706 | ||
707 | AT_SETUP([Web2c Actions]) | |
708 | ||
6b98e4b5 AD |
709 | AT_KEYWORDS([report]) |
710 | ||
b9752825 AD |
711 | AT_DATA([input.y], |
712 | [[%% | |
713 | statement: struct_stat; | |
714 | struct_stat: /* empty. */ | if else; | |
715 | if: "if" "const" "then" statement; | |
716 | else: "else" statement; | |
717 | %% | |
718 | ]]) | |
719 | ||
da730230 | 720 | AT_BISON_CHECK([-v -o input.c input.y]) |
b9752825 | 721 | |
728c4be2 | 722 | # Check only the tables. |
ce4ccb4b AD |
723 | [sed -n 's/ *$//;/^static const.*\[\] =/,/^}/p' input.c >tables.c] |
724 | ||
725 | AT_CHECK([[cat tables.c]], 0, | |
d42cf844 | 726 | [[static const yytype_uint8 yytranslate[] = |
b9752825 AD |
727 | { |
728 | 0, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
729 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
730 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
731 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
732 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
733 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
734 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
735 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
736 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
737 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
738 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
739 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
740 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
741 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
742 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
743 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
744 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
745 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
746 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
747 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
748 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
749 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
750 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
751 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
752 | 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, | |
007a50a4 AD |
753 | 2, 2, 2, 2, 2, 2, 1, 2, 3, 4, |
754 | 5, 6 | |
b9752825 | 755 | }; |
d42cf844 | 756 | static const yytype_uint8 yyprhs[] = |
b9752825 | 757 | { |
e7b8bef1 | 758 | 0, 0, 3, 5, 6, 9, 14 |
b9752825 | 759 | }; |
d42cf844 | 760 | static const yytype_int8 yyrhs[] = |
b9752825 | 761 | { |
e7b8bef1 AD |
762 | 8, 0, -1, 9, -1, -1, 10, 11, -1, 3, |
763 | 4, 5, 8, -1, 6, 8, -1 | |
b9752825 | 764 | }; |
d42cf844 | 765 | static const yytype_uint8 yyrline[] = |
b9752825 | 766 | { |
e7b8bef1 | 767 | 0, 2, 2, 3, 3, 4, 5 |
b9752825 AD |
768 | }; |
769 | static const char *const yytname[] = | |
770 | { | |
9e0876fb PE |
771 | "$end", "error", "$undefined", "\"if\"", "\"const\"", "\"then\"", |
772 | "\"else\"", "$accept", "statement", "struct_stat", "if", "else", 0 | |
b9752825 | 773 | }; |
d42cf844 | 774 | static const yytype_uint16 yytoknum[] = |
b9752825 | 775 | { |
3650b4b8 | 776 | 0, 256, 257, 258, 259, 260, 261 |
b9752825 | 777 | }; |
d42cf844 | 778 | static const yytype_uint8 yyr1[] = |
b9752825 | 779 | { |
e7b8bef1 | 780 | 0, 7, 8, 9, 9, 10, 11 |
b9752825 | 781 | }; |
d42cf844 | 782 | static const yytype_uint8 yyr2[] = |
b9752825 | 783 | { |
e7b8bef1 | 784 | 0, 2, 1, 0, 2, 4, 2 |
b9752825 | 785 | }; |
d42cf844 | 786 | static const yytype_uint8 yydefact[] = |
b9752825 | 787 | { |
e8832397 | 788 | 3, 0, 0, 2, 0, 0, 1, 3, 4, 3, |
e7b8bef1 | 789 | 6, 5 |
b9752825 | 790 | }; |
d42cf844 | 791 | static const yytype_int8 yydefgoto[] = |
b9752825 | 792 | { |
e7b8bef1 | 793 | -1, 2, 3, 4, 8 |
b9752825 | 794 | }; |
d42cf844 | 795 | static const yytype_int8 yypact[] = |
b9752825 | 796 | { |
12b0043a AD |
797 | -2, -1, 4, -8, 0, 2, -8, -2, -8, -2, |
798 | -8, -8 | |
b9752825 | 799 | }; |
d42cf844 | 800 | static const yytype_int8 yypgoto[] = |
b9752825 | 801 | { |
12b0043a | 802 | -8, -7, -8, -8, -8 |
b9752825 | 803 | }; |
d42cf844 | 804 | static const yytype_uint8 yytable[] = |
b9752825 | 805 | { |
e7b8bef1 | 806 | 10, 1, 11, 5, 6, 0, 7, 9 |
b9752825 | 807 | }; |
d42cf844 | 808 | static const yytype_int8 yycheck[] = |
b9752825 | 809 | { |
e7b8bef1 | 810 | 7, 3, 9, 4, 0, -1, 6, 5 |
b9752825 | 811 | }; |
d42cf844 | 812 | static const yytype_uint8 yystos[] = |
5504898e AD |
813 | { |
814 | 0, 3, 8, 9, 10, 4, 0, 6, 11, 5, | |
815 | 8, 8 | |
816 | }; | |
b9752825 AD |
817 | ]]) |
818 | ||
819 | AT_CLEANUP | |
22e304a6 AD |
820 | |
821 | ||
822 | ## ------------------------- ## | |
823 | ## yycheck Bound Violation. ## | |
824 | ## ------------------------- ## | |
825 | ||
826 | ||
827 | # _AT_DATA_DANCER_Y(BISON-OPTIONS) | |
828 | # -------------------------------- | |
829 | # The following grammar, taken from Andrew Suffield's GPL'd implementation | |
830 | # of DGMTP, the Dancer Generic Message Transport Protocol, used to violate | |
831 | # yycheck's bounds when issuing a verbose error message. Keep this test | |
832 | # so that bounds-checking compilers can check all the skeletons. | |
833 | m4_define([_AT_DATA_DANCER_Y], | |
834 | [AT_DATA_GRAMMAR([dancer.y], | |
835 | [%{ | |
848dc439 PE |
836 | static int yylex (AT_LALR1_CC_IF([int *], [void])); |
837 | AT_LALR1_CC_IF([], | |
cf806753 PE |
838 | [#include <stdlib.h> |
839 | #include <stdio.h> | |
848dc439 | 840 | static void yyerror (const char *);]) |
22e304a6 AD |
841 | %} |
842 | $1 | |
843 | %token ARROW INVALID NUMBER STRING DATA | |
844 | %defines | |
845 | %verbose | |
846 | %error-verbose | |
847 | /* Grammar follows */ | |
848 | %% | |
849 | line: header body | |
850 | ; | |
851 | ||
852 | header: '<' from ARROW to '>' type ':' | |
853 | | '<' ARROW to '>' type ':' | |
854 | | ARROW to type ':' | |
855 | | type ':' | |
856 | | '<' '>' | |
857 | ; | |
858 | ||
859 | from: DATA | |
860 | | STRING | |
861 | | INVALID | |
862 | ; | |
863 | ||
864 | to: DATA | |
865 | | STRING | |
866 | | INVALID | |
867 | ; | |
868 | ||
869 | type: DATA | |
870 | | STRING | |
871 | | INVALID | |
872 | ; | |
873 | ||
874 | body: /* empty */ | |
875 | | body member | |
876 | ; | |
877 | ||
878 | member: STRING | |
879 | | DATA | |
880 | | '+' NUMBER | |
881 | | '-' NUMBER | |
882 | | NUMBER | |
883 | | INVALID | |
884 | ; | |
885 | %% | |
886 | AT_LALR1_CC_IF( | |
68e11668 | 887 | [/* A C++ error reporting function. */ |
22e304a6 | 888 | void |
99880de5 | 889 | yy::parser::error (const location&, const std::string& m) |
22e304a6 | 890 | { |
efeed023 | 891 | std::cerr << m << std::endl; |
22e304a6 AD |
892 | } |
893 | ||
894 | int | |
99880de5 | 895 | yyparse () |
22e304a6 | 896 | { |
99880de5 | 897 | yy::parser parser; |
fa7b79c0 PE |
898 | #if YYDEBUG |
899 | parser.set_debug_level (YYDEBUG); | |
900 | #endif | |
22e304a6 AD |
901 | return parser.parse (); |
902 | } | |
903 | ], | |
904 | [static void | |
905 | yyerror (const char *s) | |
906 | { | |
907 | fprintf (stderr, "%s\n", s); | |
908 | }]) | |
909 | ||
910 | static int | |
848dc439 | 911 | yylex (AT_LALR1_CC_IF([int *lval], [void])) |
22e304a6 | 912 | [{ |
cf806753 | 913 | static int const tokens[] = |
22e304a6 AD |
914 | { |
915 | ':', -1 | |
916 | }; | |
cf806753 | 917 | static size_t toknum; |
848dc439 | 918 | ]AT_LALR1_CC_IF([*lval = 0; /* Pacify GCC. */])[ |
cf806753 PE |
919 | if (! (toknum < sizeof tokens / sizeof *tokens)) |
920 | abort (); | |
22e304a6 AD |
921 | return tokens[toknum++]; |
922 | }] | |
923 | ||
924 | int | |
925 | main (void) | |
926 | { | |
927 | return yyparse (); | |
928 | } | |
929 | ]) | |
930 | ])# _AT_DATA_DANCER_Y | |
931 | ||
932 | ||
933 | # AT_CHECK_DANCER(BISON-OPTIONS) | |
934 | # ------------------------------ | |
935 | # Generate the grammar, compile it, run it. | |
936 | m4_define([AT_CHECK_DANCER], | |
937 | [AT_SETUP([Dancer $1]) | |
938 | AT_BISON_OPTION_PUSHDEFS([$1]) | |
939 | _AT_DATA_DANCER_Y([$1]) | |
da730230 | 940 | AT_BISON_CHECK([-o dancer.c dancer.y]) |
11c4e57d | 941 | AT_FULL_COMPILE([dancer]) |
22e304a6 | 942 | AT_PARSER_CHECK([./dancer], 1, [], |
d5286af1 | 943 | [syntax error, unexpected ':' |
22e304a6 AD |
944 | ]) |
945 | AT_BISON_OPTION_POPDEFS | |
946 | AT_CLEANUP | |
947 | ]) | |
948 | ||
949 | AT_CHECK_DANCER() | |
950 | AT_CHECK_DANCER([%glr-parser]) | |
951 | AT_CHECK_DANCER([%skeleton "lalr1.cc"]) | |
d6645148 PE |
952 | |
953 | ||
954 | ## ------------------------------------------ ## | |
955 | ## Diagnostic that expects two alternatives. ## | |
956 | ## ------------------------------------------ ## | |
957 | ||
958 | ||
959 | # _AT_DATA_EXPECT2_Y(BISON-OPTIONS) | |
960 | # --------------------------------- | |
961 | m4_define([_AT_DATA_EXPECT2_Y], | |
962 | [AT_DATA_GRAMMAR([expect2.y], | |
963 | [%{ | |
964 | static int yylex (AT_LALR1_CC_IF([int *], [void])); | |
965 | AT_LALR1_CC_IF([], | |
966 | [#include <stdio.h> | |
c4bd5bf7 | 967 | #include <stdlib.h> |
d6645148 PE |
968 | static void yyerror (const char *);]) |
969 | %} | |
970 | $1 | |
971 | %defines | |
972 | %error-verbose | |
973 | %token A 1000 | |
974 | %token B | |
975 | ||
976 | %% | |
977 | program: /* empty */ | |
978 | | program e ';' | |
979 | | program error ';'; | |
980 | ||
981 | e: e '+' t | t; | |
982 | t: A | B; | |
983 | ||
984 | %% | |
985 | AT_LALR1_CC_IF( | |
986 | [/* A C++ error reporting function. */ | |
987 | void | |
988 | yy::parser::error (const location&, const std::string& m) | |
989 | { | |
990 | std::cerr << m << std::endl; | |
991 | } | |
992 | ||
993 | int | |
994 | yyparse () | |
995 | { | |
996 | yy::parser parser; | |
997 | return parser.parse (); | |
998 | } | |
999 | ], | |
1000 | [static void | |
1001 | yyerror (const char *s) | |
1002 | { | |
1003 | fprintf (stderr, "%s\n", s); | |
1004 | }]) | |
1005 | ||
1006 | static int | |
1007 | yylex (AT_LALR1_CC_IF([int *lval], [void])) | |
1008 | [{ | |
cf806753 | 1009 | static int const tokens[] = |
d6645148 PE |
1010 | { |
1011 | 1000, '+', '+', -1 | |
1012 | }; | |
cf806753 | 1013 | static size_t toknum; |
d6645148 | 1014 | ]AT_LALR1_CC_IF([*lval = 0; /* Pacify GCC. */])[ |
cf806753 PE |
1015 | if (! (toknum < sizeof tokens / sizeof *tokens)) |
1016 | abort (); | |
d6645148 PE |
1017 | return tokens[toknum++]; |
1018 | }] | |
1019 | ||
1020 | int | |
1021 | main (void) | |
1022 | { | |
1023 | return yyparse (); | |
1024 | } | |
1025 | ]) | |
1026 | ])# _AT_DATA_EXPECT2_Y | |
1027 | ||
1028 | ||
1029 | # AT_CHECK_EXPECT2(BISON-OPTIONS) | |
1030 | # ------------------------------- | |
1031 | # Generate the grammar, compile it, run it. | |
1032 | m4_define([AT_CHECK_EXPECT2], | |
1033 | [AT_SETUP([Expecting two tokens $1]) | |
1034 | AT_BISON_OPTION_PUSHDEFS([$1]) | |
1035 | _AT_DATA_EXPECT2_Y([$1]) | |
da730230 | 1036 | AT_BISON_CHECK([-o expect2.c expect2.y]) |
11c4e57d | 1037 | AT_FULL_COMPILE([expect2]) |
d6645148 PE |
1038 | AT_PARSER_CHECK([./expect2], 1, [], |
1039 | [syntax error, unexpected '+', expecting A or B | |
1040 | ]) | |
1041 | AT_BISON_OPTION_POPDEFS | |
1042 | AT_CLEANUP | |
1043 | ]) | |
1044 | ||
1045 | AT_CHECK_EXPECT2() | |
1046 | AT_CHECK_EXPECT2([%glr-parser]) | |
1047 | AT_CHECK_EXPECT2([%skeleton "lalr1.cc"]) | |
4210cd0b JD |
1048 | |
1049 | ||
1050 | ||
1051 | ## --------------------------------------------- ## | |
1052 | ## Braced code in declaration in rules section. ## | |
1053 | ## --------------------------------------------- ## | |
1054 | ||
1055 | AT_SETUP([Braced code in declaration in rules section]) | |
1056 | ||
1057 | # Bison once mistook braced code in a declaration in the rules section for a | |
1058 | # rule action. | |
1059 | ||
1060 | AT_DATA_GRAMMAR([input.y], | |
1061 | [[%{ | |
1062 | #include <stdio.h> | |
381ecb06 JD |
1063 | static void yyerror (char const *msg); |
1064 | static int yylex (void); | |
4210cd0b JD |
1065 | %} |
1066 | ||
1067 | %error-verbose | |
1068 | ||
1069 | %% | |
1070 | ||
1071 | start: | |
1072 | { | |
1073 | printf ("Bison would once convert this action to a midrule because of the" | |
1074 | " subsequent braced code.\n"); | |
1075 | } | |
1076 | ; | |
1077 | ||
1078 | %destructor { fprintf (stderr, "DESTRUCTOR\n"); } 'a'; | |
1079 | %printer { fprintf (yyoutput, "PRINTER"); } 'a'; | |
1080 | ||
1081 | %% | |
1082 | ||
381ecb06 | 1083 | static void |
4210cd0b JD |
1084 | yyerror (char const *msg) |
1085 | { | |
1086 | fprintf (stderr, "%s\n", msg); | |
1087 | } | |
1088 | ||
381ecb06 | 1089 | static int |
4210cd0b JD |
1090 | yylex (void) |
1091 | { | |
1092 | return 'a'; | |
1093 | } | |
1094 | ||
1095 | int | |
1096 | main (void) | |
1097 | { | |
1098 | yydebug = 1; | |
1099 | return !yyparse (); | |
1100 | } | |
1101 | ]]) | |
1102 | ||
da730230 | 1103 | AT_BISON_CHECK([-t -o input.c input.y]) |
4210cd0b JD |
1104 | AT_COMPILE([input]) |
1105 | AT_PARSER_CHECK([./input], 0, | |
1106 | [[Bison would once convert this action to a midrule because of the subsequent braced code. | |
1107 | ]], | |
1108 | [[Starting parse | |
1109 | Entering state 0 | |
231ed89a | 1110 | Reducing stack by rule 1 (line 20): |
4210cd0b JD |
1111 | -> $$ = nterm start () |
1112 | Stack now 0 | |
1113 | Entering state 1 | |
1114 | Reading a token: Next token is token 'a' (PRINTER) | |
1115 | syntax error, unexpected 'a', expecting $end | |
1116 | Error: popping nterm start () | |
1117 | Stack now 0 | |
1118 | Cleanup: discarding lookahead token 'a' (PRINTER) | |
1119 | DESTRUCTOR | |
1120 | Stack now 0 | |
1121 | ]]) | |
1122 | ||
1123 | AT_CLEANUP | |
965537bc JD |
1124 | |
1125 | ||
1126 | ||
1127 | ## --------------------------------- ## | |
1128 | ## String alias declared after use. ## | |
1129 | ## --------------------------------- ## | |
1130 | ||
1131 | AT_SETUP([String alias declared after use]) | |
1132 | ||
1133 | # Bison once incorrectly asserted that the symbol number for either a token or | |
1134 | # its alias was the highest symbol number so far at the point of the alias | |
1135 | # declaration. That was true unless the declaration appeared after their first | |
6d0ef4ec | 1136 | # uses and other tokens appeared in between. |
965537bc JD |
1137 | |
1138 | AT_DATA([input.y], | |
1139 | [[%% | |
1140 | start: 'a' "A" 'b'; | |
1141 | %token 'a' "A"; | |
1142 | ]]) | |
1143 | ||
da730230 | 1144 | AT_BISON_CHECK([-t -o input.c input.y]) |
965537bc JD |
1145 | |
1146 | AT_CLEANUP | |
a0de5091 JD |
1147 | |
1148 | ||
1149 | ||
1150 | ## -------------------------------- ## | |
1151 | ## Extra lookahead sets in report. ## | |
1152 | ## -------------------------------- ## | |
1153 | ||
1154 | AT_SETUP([[Extra lookahead sets in report]]) | |
1155 | ||
88c78747 JD |
1156 | # Bison prints each reduction's lookahead set only next to the associated |
1157 | # state's one item that (1) is associated with the same rule as the reduction | |
1158 | # and (2) has its dot at the end of its RHS. Previously, Bison also | |
1159 | # erroneously printed the lookahead set next to all of the state's other items | |
1160 | # associated with the same rule. This bug affected only the `.output' file and | |
1161 | # not the generated parser source code. | |
a0de5091 JD |
1162 | |
1163 | AT_DATA([[input.y]], | |
1164 | [[%% | |
1165 | start: a | 'a' a 'a' ; | |
1166 | a: 'a' ; | |
1167 | ]]) | |
1168 | ||
da730230 | 1169 | AT_BISON_CHECK([[--report=all input.y]]) |
a0de5091 JD |
1170 | AT_CHECK([[sed -n '/^state 1$/,/^state 2$/p' input.output]], [[0]], |
1171 | [[state 1 | |
1172 | ||
1173 | 2 start: 'a' . a 'a' | |
1174 | 3 a: . 'a' | |
1175 | 3 | 'a' . [$end] | |
1176 | ||
1177 | 'a' shift, and go to state 4 | |
1178 | ||
1179 | $default reduce using rule 3 (a) | |
1180 | ||
1181 | a go to state 5 | |
1182 | ||
1183 | ||
1184 | state 2 | |
1185 | ]]) | |
1186 | ||
1187 | AT_CLEANUP | |
ab7f29f8 JD |
1188 | |
1189 | ||
1190 | ||
1191 | ## ---------------------------------------- ## | |
1192 | ## Token number in precedence declaration. ## | |
1193 | ## ---------------------------------------- ## | |
1194 | ||
14da0cdd | 1195 | AT_SETUP([[Token number in precedence declaration]]) |
ab7f29f8 JD |
1196 | |
1197 | # POSIX says token numbers can be declared in %left, %right, and %nonassoc, but | |
1198 | # we lost this in Bison 1.50. | |
1199 | ||
1200 | AT_DATA_GRAMMAR([input.y], | |
1201 | [[%{ | |
1202 | #include <stdio.h> | |
1203 | void yyerror (char const *); | |
1204 | int yylex (void); | |
1205 | %} | |
1206 | ||
1207 | %error-verbose | |
1208 | %left TK1 1 TK2 2 "tok alias" 3 | |
1209 | ||
1210 | %% | |
1211 | ||
1212 | start: TK1 sr_conflict "tok alias" ; | |
1213 | ||
1214 | sr_conflict: | |
1215 | TK2 | |
1216 | | TK2 "tok alias" | |
1217 | ; | |
1218 | ||
1219 | %% | |
1220 | ||
1221 | void | |
1222 | yyerror (char const *msg) | |
1223 | { | |
1224 | fprintf (stderr, "%s\n", msg); | |
1225 | } | |
1226 | ||
1227 | int | |
1228 | yylex (void) | |
1229 | { | |
1230 | static int const input[] = { 1, 2, 3, 0 }; | |
1231 | static int const *inputp = input; | |
1232 | return *inputp++; | |
1233 | } | |
1234 | ||
1235 | int | |
1236 | main (void) | |
1237 | { | |
1238 | return yyparse (); | |
1239 | } | |
1240 | ]]) | |
1241 | ||
1242 | AT_BISON_CHECK([[-o input.c input.y]], [[0]],, | |
1243 | [[input.y:24.5-19: warning: rule useless in parser due to conflicts: sr_conflict: TK2 "tok alias" | |
1244 | ]]) | |
1245 | AT_COMPILE([[input]]) | |
1246 | AT_PARSER_CHECK([[./input]]) | |
1247 | ||
1248 | AT_CLEANUP | |
873ac263 JD |
1249 | |
1250 | ||
1251 | ||
1252 | ## --------------------------- ## | |
1253 | ## parse-gram.y: LALR = IELR. ## | |
1254 | ## --------------------------- ## | |
1255 | ||
1256 | # If parse-gram.y's LALR and IELR parser tables ever begin to differ, we | |
1257 | # need to fix parse-gram.y or start using IELR. | |
1258 | ||
1259 | AT_SETUP([[parse-gram.y: LALR = IELR]]) | |
1260 | ||
1261 | # Avoid differences in synclines by having bison write both parsers to the | |
1262 | # same output file name (input.c) and renaming each one before the diff. | |
4b7a4c1b JD |
1263 | [cp $abs_top_srcdir/src/parse-gram.y input.y] |
1264 | AT_BISON_CHECK([[-o input.c -Dlr.type=lalr input.y]]) | |
1265 | [mv input.c lalr.c] | |
1266 | AT_BISON_CHECK([[-o input.c -Dlr.type=ielr input.y]]) | |
1267 | [mv input.c ielr.c] | |
873ac263 JD |
1268 | AT_CHECK([[diff -u lalr.c ielr.c]]) |
1269 | ||
1270 | AT_CLEANUP | |
d88cf117 JD |
1271 | |
1272 | ||
1273 | ||
1274 | ## --------------------------------------- ## | |
1275 | ## %error-verbose and YYSTACK_USE_ALLOCA. ## | |
1276 | ## --------------------------------------- ## | |
1277 | ||
1278 | AT_SETUP([[%error-verbose and YYSTACK_USE_ALLOCA]]) | |
1279 | ||
1280 | AT_DATA_GRAMMAR([input.y], | |
1281 | [[%code { | |
1282 | #include <stdio.h> | |
1283 | void yyerror (char const *); | |
1284 | int yylex (void); | |
1285 | #define YYSTACK_USE_ALLOCA 1 | |
1286 | } | |
1287 | ||
1288 | %error-verbose | |
1289 | ||
1290 | %% | |
1291 | ||
1292 | start: check syntax_error syntax_error ; | |
1293 | ||
1294 | check: | |
1295 | { | |
1296 | if (128 < sizeof yymsgbuf) | |
1297 | { | |
1298 | fprintf (stderr, | |
1299 | "The initial size of yymsgbuf in yyparse has increased\n" | |
1300 | "since this test group was last updated. As a result,\n" | |
1301 | "this test group may no longer manage to induce a\n" | |
1302 | "reallocation of the syntax error message buffer.\n" | |
1303 | "This test group must be adjusted to produce a longer\n" | |
1304 | "error message.\n"); | |
1305 | YYABORT; | |
1306 | } | |
1307 | } | |
1308 | ; | |
1309 | ||
1310 | // Induce a syntax error message whose total length is more than | |
1311 | // sizeof yymsgbuf in yyparse. Each token here is 64 bytes. | |
1312 | syntax_error: | |
1313 | "123456789112345678921234567893123456789412345678951234567896123A" | |
1314 | | "123456789112345678921234567893123456789412345678951234567896123B" | |
1315 | | error 'a' 'b' 'c' | |
1316 | ; | |
1317 | ||
1318 | %% | |
1319 | ||
1320 | void | |
1321 | yyerror (char const *msg) | |
1322 | { | |
1323 | fprintf (stderr, "%s\n", msg); | |
1324 | } | |
1325 | ||
1326 | int | |
1327 | yylex (void) | |
1328 | { | |
1329 | /* Induce two syntax error messages (which requires full error | |
1330 | recovery by shifting 3 tokens) in order to detect any loss of the | |
1331 | reallocated buffer. */ | |
1332 | static char const *input = "abc"; | |
1333 | return *input++; | |
1334 | } | |
1335 | ||
1336 | int | |
1337 | main (void) | |
1338 | { | |
1339 | return yyparse (); | |
1340 | } | |
1341 | ]]) | |
1342 | ||
1343 | AT_BISON_CHECK([[-o input.c input.y]]) | |
1344 | AT_COMPILE([[input]]) | |
1345 | AT_PARSER_CHECK([[./input]], [[1]], [], | |
1346 | [[syntax error, unexpected 'a', expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B | |
1347 | syntax error, unexpected $end, expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B | |
1348 | ]]) | |
1349 | ||
1350 | AT_CLEANUP | |
1351 | ||
1352 | ||
1353 | ||
1354 | ## ------------------------- ## | |
1355 | ## %error-verbose overflow. ## | |
1356 | ## ------------------------- ## | |
1357 | ||
1358 | # Imagine the case where YYSTACK_ALLOC_MAXIMUM = YYSIZE_MAXIMUM and an | |
1359 | # invocation of yysyntax_error has caused yymsg_alloc to grow to exactly | |
1360 | # YYSTACK_ALLOC_MAXIMUM (perhaps because the normal doubling of size had | |
69a2ab11 JD |
1361 | # to be clipped to YYSTACK_ALLOC_MAXIMUM). In an old version of yacc.c, |
1362 | # a subsequent invocation of yysyntax_error that overflows during its | |
1363 | # size calculation would return YYSIZE_MAXIMUM to yyparse. Then, | |
1364 | # yyparse would invoke yyerror using the old contents of yymsg. | |
d88cf117 JD |
1365 | |
1366 | AT_SETUP([[%error-verbose overflow]]) | |
1367 | ||
d88cf117 JD |
1368 | AT_DATA_GRAMMAR([input.y], |
1369 | [[%code { | |
1370 | #include <stdio.h> | |
1371 | void yyerror (char const *); | |
1372 | int yylex (void); | |
1373 | ||
1374 | /* This prevents this test case from having to induce error messages | |
1375 | large enough to overflow size_t. */ | |
1376 | #define YYSIZE_T unsigned char | |
1377 | ||
ea6046b9 | 1378 | /* Bring in malloc and set EXIT_SUCCESS so yacc.c doesn't try to |
23761f42 | 1379 | provide a malloc prototype using our YYSIZE_T. */ |
d88cf117 | 1380 | #include <stdlib.h> |
ea6046b9 PE |
1381 | #ifndef EXIT_SUCCESS |
1382 | # define EXIT_SUCCESS 0 | |
23761f42 | 1383 | #endif |
d88cf117 JD |
1384 | |
1385 | /* Max depth is usually much smaller than YYSTACK_ALLOC_MAXIMUM, and | |
1386 | we don't want gcc to warn everywhere this constant would be too big | |
1387 | to make sense for our YYSIZE_T. */ | |
1388 | #define YYMAXDEPTH 100 | |
1389 | } | |
1390 | ||
1391 | %error-verbose | |
1392 | ||
1393 | %% | |
1394 | ||
1395 | start: syntax_error1 check syntax_error2 ; | |
1396 | ||
1397 | // Induce a syntax error message whose total length causes yymsg in | |
1398 | // yyparse to be reallocated to size YYSTACK_ALLOC_MAXIMUM, which | |
1399 | // should be 255. Each token here is 64 bytes. | |
1400 | syntax_error1: | |
1401 | "123456789112345678921234567893123456789412345678951234567896123A" | |
1402 | | "123456789112345678921234567893123456789412345678951234567896123B" | |
1403 | | "123456789112345678921234567893123456789412345678951234567896123C" | |
1404 | | error 'a' 'b' 'c' | |
1405 | ; | |
1406 | ||
1407 | check: | |
1408 | { | |
1409 | if (yymsg_alloc != YYSTACK_ALLOC_MAXIMUM | |
1410 | || YYSTACK_ALLOC_MAXIMUM != YYSIZE_MAXIMUM | |
1411 | || YYSIZE_MAXIMUM != 255) | |
1412 | { | |
1413 | fprintf (stderr, | |
1414 | "The assumptions of this test group are no longer\n" | |
1415 | "valid, so it may no longer catch the error it was\n" | |
1416 | "designed to catch. Specifically, the following\n" | |
1417 | "values should all be 255:\n\n"); | |
1418 | fprintf (stderr, " yymsg_alloc = %d\n", yymsg_alloc); | |
1419 | fprintf (stderr, " YYSTACK_ALLOC_MAXIMUM = %d\n", | |
1420 | YYSTACK_ALLOC_MAXIMUM); | |
1421 | fprintf (stderr, " YYSIZE_MAXIMUM = %d\n", YYSIZE_MAXIMUM); | |
1422 | YYABORT; | |
1423 | } | |
1424 | } | |
1425 | ; | |
1426 | ||
1427 | // Now overflow. | |
1428 | syntax_error2: | |
1429 | "123456789112345678921234567893123456789412345678951234567896123A" | |
1430 | | "123456789112345678921234567893123456789412345678951234567896123B" | |
1431 | | "123456789112345678921234567893123456789412345678951234567896123C" | |
1432 | | "123456789112345678921234567893123456789412345678951234567896123D" | |
1433 | | "123456789112345678921234567893123456789412345678951234567896123E" | |
1434 | ; | |
1435 | ||
1436 | %% | |
1437 | ||
1438 | void | |
1439 | yyerror (char const *msg) | |
1440 | { | |
1441 | fprintf (stderr, "%s\n", msg); | |
1442 | } | |
1443 | ||
1444 | int | |
1445 | yylex (void) | |
1446 | { | |
1447 | /* Induce two syntax error messages (which requires full error | |
1448 | recovery by shifting 3 tokens). */ | |
1449 | static char const *input = "abc"; | |
1450 | return *input++; | |
1451 | } | |
1452 | ||
1453 | int | |
1454 | main (void) | |
1455 | { | |
1456 | /* Push parsers throw away the message buffer between tokens, so skip | |
1457 | this test under maintainer-push-check. */ | |
1458 | if (YYPUSH) | |
1459 | return 77; | |
1460 | return yyparse (); | |
1461 | } | |
1462 | ]]) | |
1463 | ||
1464 | AT_BISON_CHECK([[-o input.c input.y]]) | |
1465 | ||
1466 | # gcc warns about tautologies and fallacies involving comparisons for | |
1467 | # unsigned char. However, it doesn't produce these same warnings for | |
1468 | # size_t and many other types when the warnings would seem to make just | |
1469 | # as much sense. We ignore the warnings. | |
1470 | [CFLAGS="$NO_WERROR_CFLAGS"] | |
1471 | AT_COMPILE([[input]]) | |
1472 | ||
1473 | AT_PARSER_CHECK([[./input]], [[2]], [], | |
1474 | [[syntax error, unexpected 'a', expecting 123456789112345678921234567893123456789412345678951234567896123A or 123456789112345678921234567893123456789412345678951234567896123B or 123456789112345678921234567893123456789412345678951234567896123C | |
1475 | syntax error | |
1476 | memory exhausted | |
1477 | ]]) | |
1478 | ||
1479 | AT_CLEANUP | |
ea13bea8 JD |
1480 | |
1481 | ||
1482 | ||
1483 | ## ------------------------ ## | |
1484 | ## LAC: Exploratory stack. ## | |
1485 | ## ------------------------ ## | |
1486 | ||
1487 | AT_SETUP([[LAC: Exploratory stack]]) | |
1488 | ||
1489 | m4_pushdef([AT_LAC_CHECK], [ | |
1490 | ||
1491 | AT_BISON_OPTION_PUSHDEFS([$1]) | |
1492 | ||
1493 | AT_DATA_GRAMMAR([input.y], | |
1494 | [[%code { | |
1495 | #include <stdio.h> | |
1496 | void yyerror (char const *); | |
1497 | int yylex (]AT_PURE_IF([[YYSTYPE *]], [[void]])[); | |
1498 | } | |
1499 | ||
1500 | ]$1[ | |
1501 | %error-verbose | |
1502 | %token 'c' | |
1503 | ||
1504 | %% | |
1505 | ||
1506 | // default reductions in inconsistent states | |
1507 | // v v v v v v v v v v v v v v | |
1508 | S: A B A A B A A A A B A A A A A A A B C C A A A A A A A A A A A A B ; | |
1509 | ||
1510 | A: 'a' | /*empty*/ { printf ("inconsistent default reduction\n"); } ; | |
1511 | B: 'b' ; | |
1512 | C: /*empty*/ { printf ("consistent default reduction\n"); } ; | |
1513 | ||
1514 | %% | |
1515 | ||
1516 | void | |
1517 | yyerror (char const *msg) | |
1518 | { | |
1519 | fprintf (stderr, "%s\n", msg); | |
1520 | } | |
1521 | ||
1522 | int | |
1523 | yylex (]AT_PURE_IF([[YYSTYPE *v]], [[void]])[) | |
1524 | { | |
1525 | static char const *input = "bbbbc";]AT_PURE_IF([[ | |
1526 | *v = 0;]])[ | |
1527 | return *input++; | |
1528 | } | |
1529 | ||
1530 | int | |
1531 | main (void) | |
1532 | { | |
1533 | yydebug = 1; | |
1534 | return yyparse (); | |
1535 | } | |
1536 | ]]) | |
1537 | ||
1538 | # Give exactly the right amount of memory to be sure there's no | |
1539 | # off-by-one error, for example. | |
1540 | AT_BISON_CHECK([[-Dparse.lac=full -Dparse.lac.es-capacity=12 \ | |
1541 | -t -o input.c input.y]], [[0]], [], | |
1542 | [[input.y: conflicts: 21 shift/reduce | |
1543 | ]]) | |
1544 | AT_COMPILE([[input]]) | |
1545 | AT_PARSER_CHECK([[./input > stdout.txt 2> stderr.txt]], [[1]]) | |
1546 | ||
1547 | # Make sure syntax error doesn't forget that 'a' is expected. It would | |
1548 | # be forgotten without lookahead correction. | |
1549 | AT_CHECK([[grep 'syntax error,' stderr.txt]], [[0]], | |
1550 | [[syntax error, unexpected 'c', expecting 'a' or 'b' | |
1551 | ]]) | |
1552 | ||
1553 | # Check number of default reductions in inconsistent states to be sure | |
1554 | # syntax error is detected before unnecessary reductions are performed. | |
1555 | AT_CHECK([[perl -0777 -ne 'print s/inconsistent default reduction//g;' \ | |
1556 | < stdout.txt || exit 77]], [[0]], [[14]]) | |
1557 | ||
1558 | # Check number of default reductions in consistent states to be sure | |
1559 | # they are performed before the syntax error is detected. | |
1560 | AT_CHECK([[perl -0777 -ne 'print s/\bconsistent default reduction//g;' \ | |
1561 | < stdout.txt || exit 77]], [[0]], [[2]]) | |
1562 | ||
1563 | AT_BISON_OPTION_POPDEFS | |
1564 | ]) | |
1565 | ||
1566 | AT_LAC_CHECK([[%define api.push-pull pull]]) | |
1567 | AT_LAC_CHECK([[%define api.push-pull pull %define api.pure]]) | |
1568 | AT_LAC_CHECK([[%define api.push-pull both]]) | |
1569 | AT_LAC_CHECK([[%define api.push-pull both %define api.pure]]) | |
1570 | ||
1571 | m4_popdef([AT_LAC_CHECK]) | |
1572 | ||
1573 | AT_CLEANUP | |
1574 | ||
1575 | ||
1576 | ||
1577 | ## ------------------------ ## | |
1578 | ## LAC: Memory exhaustion. ## | |
1579 | ## ------------------------ ## | |
1580 | ||
1581 | AT_SETUP([[LAC: Memory exhaustion]]) | |
1582 | ||
1583 | m4_pushdef([AT_LAC_CHECK], [ | |
1584 | ||
1585 | AT_DATA_GRAMMAR([input.y], | |
1586 | [[%code { | |
1587 | #include <stdio.h> | |
1588 | void yyerror (char const *); | |
1589 | int yylex (void); | |
1590 | } | |
1591 | ||
1592 | %error-verbose | |
1593 | ||
1594 | %% | |
1595 | ||
1596 | S: A A A A A A A A A ; | |
1597 | A: /*empty*/ | 'a' ; | |
1598 | ||
1599 | %% | |
1600 | ||
1601 | void | |
1602 | yyerror (char const *msg) | |
1603 | { | |
1604 | fprintf (stderr, "%s\n", msg); | |
1605 | } | |
1606 | ||
1607 | int | |
1608 | yylex (void) | |
1609 | { | |
1610 | static char const *input = "]$1["; | |
1611 | return *input++; | |
1612 | } | |
1613 | ||
1614 | int | |
1615 | main (void) | |
1616 | { | |
1617 | yydebug = 1; | |
1618 | return yyparse (); | |
1619 | } | |
1620 | ]]) | |
1621 | ||
1622 | AT_BISON_CHECK([[-Dparse.lac=full -Dparse.lac.es-capacity=8 \ | |
1623 | -t -o input.c input.y]], [[0]], [], | |
1624 | [[input.y: conflicts: 8 shift/reduce | |
1625 | ]]) | |
1626 | AT_COMPILE([[input]]) | |
1627 | ||
1628 | ]) | |
1629 | ||
1630 | # Check for memory exhaustion during parsing. | |
1631 | AT_LAC_CHECK([[]]) | |
1632 | AT_PARSER_CHECK([[./input]], [[2]], [[]], | |
1633 | [[Starting parse | |
1634 | Entering state 0 | |
1635 | Reading a token: Now at end of input. | |
1636 | LAC: initial context established for $end | |
1637 | LAC: checking lookahead $end: R2 G3 R2 G5 R2 G6 R2 G7 R2 G8 R2 G9 R2 G10 R2 G11 R2 (max stack size exceeded) | |
1638 | memory exhausted | |
1639 | Cleanup: discarding lookahead token $end () | |
1640 | Stack now 0 | |
1641 | ]]) | |
1642 | ||
1643 | # Induce an immediate syntax error with an undefined token, and check | |
1644 | # for memory exhaustion while building the syntax error message. | |
1645 | AT_LAC_CHECK([[z]]) | |
1646 | AT_PARSER_CHECK([[./input]], [[2]], [[]], | |
1647 | [[Starting parse | |
1648 | Entering state 0 | |
1649 | Reading a token: Next token is token $undefined () | |
1650 | LAC: initial context established for $undefined | |
1651 | LAC: checking lookahead $undefined: Always Err | |
1652 | Constructing syntax error message | |
1653 | LAC: checking lookahead $end: R2 G3 R2 G5 R2 G6 R2 G7 R2 G8 R2 G9 R2 G10 R2 G11 R2 (max stack size exceeded) | |
1654 | syntax error | |
1655 | memory exhausted | |
1656 | Cleanup: discarding lookahead token $undefined () | |
1657 | Stack now 0 | |
1658 | ]]) | |
1659 | ||
1660 | m4_popdef([AT_LAC_CHECK]) | |
1661 | ||
1662 | AT_CLEANUP |