]> git.saurik.com Git - bison.git/blob - tests/regression.at
fa2278a8f7ed6aaec8268a9da5c5b7a1cbcfe0d1
[bison.git] / tests / regression.at
1 # Bison Regressions. -*- Autotest -*-
2
3 # Copyright (C) 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008 Free Software
4 # Foundation, Inc.
5
6 # This program is free software: you can redistribute it and/or modify
7 # it under the terms of the GNU General Public License as published by
8 # the Free Software Foundation, either version 3 of the License, or
9 # (at your option) any later version.
10 #
11 # This program is distributed in the hope that it will be useful,
12 # but WITHOUT ANY WARRANTY; without even the implied warranty of
13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 # GNU General Public License for more details.
15 #
16 # You should have received a copy of the GNU General Public License
17 # along with this program. If not, see <http://www.gnu.org/licenses/>.
18
19 AT_BANNER([[Regression tests.]])
20
21
22 ## ------------------ ##
23 ## Trivial grammars. ##
24 ## ------------------ ##
25
26 AT_SETUP([Trivial grammars])
27
28 AT_DATA_GRAMMAR([input.y],
29 [[%{
30 void yyerror (char const *);
31 int yylex (void);
32 #define YYSTYPE int *
33 %}
34
35 %error-verbose
36
37 %%
38
39 program: 'x';
40 ]])
41
42 AT_BISON_CHECK([-o input.c input.y])
43 AT_COMPILE([input.o], [-c input.c])
44 AT_COMPILE([input.o], [-DYYDEBUG -c input.c])
45
46 AT_CLEANUP
47
48
49
50 ## ----------------- ##
51 ## YYSTYPE typedef. ##
52 ## ----------------- ##
53
54 AT_SETUP([YYSTYPE typedef])
55
56 AT_DATA_GRAMMAR([input.y],
57 [[%{
58 void yyerror (char const *);
59 int yylex (void);
60 typedef union { char const *val; } YYSTYPE;
61 %}
62
63 %type <val> program
64
65 %%
66
67 program: { $$ = ""; };
68 ]])
69
70 AT_BISON_CHECK([-o input.c input.y])
71 AT_COMPILE([input.o], [-c input.c])
72
73 AT_CLEANUP
74
75
76
77 ## ------------------------------------- ##
78 ## Early token definitions with --yacc. ##
79 ## ------------------------------------- ##
80
81
82 AT_SETUP([Early token definitions with --yacc])
83
84 # Found in GCJ: they expect the tokens to be defined before the user
85 # prologue, so that they can use the token definitions in it.
86
87 AT_DATA_GRAMMAR([input.y],
88 [[%{
89 void yyerror (const char *s);
90 int yylex (void);
91 %}
92
93 %union
94 {
95 int val;
96 };
97 %{
98 #ifndef MY_TOKEN
99 # error "MY_TOKEN not defined."
100 #endif
101 %}
102 %token MY_TOKEN
103 %%
104 exp: MY_TOKEN;
105 %%
106 ]])
107
108 AT_BISON_CHECK([-y -o input.c input.y])
109 AT_COMPILE([input.o], [-c input.c])
110
111 AT_CLEANUP
112
113
114
115 ## ---------------------------------------- ##
116 ## Early token definitions without --yacc. ##
117 ## ---------------------------------------- ##
118
119
120 AT_SETUP([Early token definitions without --yacc])
121
122 # Found in GCJ: they expect the tokens to be defined before the user
123 # prologue, so that they can use the token definitions in it.
124
125 AT_DATA_GRAMMAR([input.y],
126 [[%{
127 #include <stdio.h>
128 void yyerror (const char *s);
129 int yylex (void);
130 void print_my_token (void);
131 %}
132
133 %union
134 {
135 int val;
136 };
137 %{
138 void
139 print_my_token (void)
140 {
141 enum yytokentype my_token = MY_TOKEN;
142 printf ("%d\n", my_token);
143 }
144 %}
145 %token MY_TOKEN
146 %%
147 exp: MY_TOKEN;
148 %%
149 ]])
150
151 AT_BISON_CHECK([-o input.c input.y])
152 AT_COMPILE([input.o], [-c input.c])
153
154 AT_CLEANUP
155
156
157
158 ## ---------------- ##
159 ## Braces parsing. ##
160 ## ---------------- ##
161
162
163 AT_SETUP([Braces parsing])
164
165 AT_DATA([input.y],
166 [[/* Bison used to swallow the character after `}'. */
167
168 %%
169 exp: { tests = {{{{{{{{{{}}}}}}}}}}; };
170 %%
171 ]])
172
173 AT_BISON_CHECK([-v -o input.c input.y])
174
175 AT_CHECK([grep 'tests = {{{{{{{{{{}}}}}}}}}};' input.c], 0, [ignore])
176
177 AT_CLEANUP
178
179
180 ## ------------------ ##
181 ## Duplicate string. ##
182 ## ------------------ ##
183
184
185 AT_SETUP([Duplicate string])
186
187 AT_DATA([input.y],
188 [[/* `Bison -v' used to dump core when two tokens are defined with the same
189 string, as LE and GE below. */
190
191 %token NUM
192 %token LE "<="
193 %token GE "<="
194
195 %%
196 exp: '(' exp ')' | NUM ;
197 %%
198 ]])
199
200 AT_BISON_CHECK([-v -o input.c input.y], 0, [],
201 [[input.y:6.8-14: warning: symbol `"<="' used more than once as a literal string
202 ]])
203
204 AT_CLEANUP
205
206
207 ## ------------------- ##
208 ## Rule Line Numbers. ##
209 ## ------------------- ##
210
211 AT_SETUP([Rule Line Numbers])
212
213 AT_KEYWORDS([report])
214
215 AT_DATA([input.y],
216 [[%%
217 expr:
218 'a'
219
220 {
221
222 }
223
224 'b'
225
226 {
227
228 }
229
230 |
231
232
233 {
234
235
236 }
237
238 'c'
239
240 {
241
242 };
243 ]])
244
245 AT_BISON_CHECK([-o input.c -v input.y])
246
247 # Check the contents of the report.
248 AT_CHECK([cat input.output], [],
249 [[Grammar
250
251 0 $accept: expr $end
252
253 1 $@1: /* empty */
254
255 2 expr: 'a' $@1 'b'
256
257 3 $@2: /* empty */
258
259 4 expr: $@2 'c'
260
261
262 Terminals, with rules where they appear
263
264 $end (0) 0
265 'a' (97) 2
266 'b' (98) 2
267 'c' (99) 4
268 error (256)
269
270
271 Nonterminals, with rules where they appear
272
273 $accept (6)
274 on left: 0
275 expr (7)
276 on left: 2 4, on right: 0
277 $@1 (8)
278 on left: 1, on right: 2
279 $@2 (9)
280 on left: 3, on right: 4
281
282
283 state 0
284
285 0 $accept: . expr $end
286
287 'a' shift, and go to state 1
288
289 $default reduce using rule 3 ($@2)
290
291 expr go to state 2
292 $@2 go to state 3
293
294
295 state 1
296
297 2 expr: 'a' . $@1 'b'
298
299 $default reduce using rule 1 ($@1)
300
301 $@1 go to state 4
302
303
304 state 2
305
306 0 $accept: expr . $end
307
308 $end shift, and go to state 5
309
310
311 state 3
312
313 4 expr: $@2 . 'c'
314
315 'c' shift, and go to state 6
316
317
318 state 4
319
320 2 expr: 'a' $@1 . 'b'
321
322 'b' shift, and go to state 7
323
324
325 state 5
326
327 0 $accept: expr $end .
328
329 $default accept
330
331
332 state 6
333
334 4 expr: $@2 'c' .
335
336 $default reduce using rule 4 (expr)
337
338
339 state 7
340
341 2 expr: 'a' $@1 'b' .
342
343 $default reduce using rule 2 (expr)
344 ]])
345
346 AT_CLEANUP
347
348
349
350 ## ---------------------- ##
351 ## Mixing %token styles. ##
352 ## ---------------------- ##
353
354
355 AT_SETUP([Mixing %token styles])
356
357 # Taken from the documentation.
358 AT_DATA([input.y],
359 [[%token <operator> OR "||"
360 %token <operator> LE 134 "<="
361 %left OR "<="
362 %%
363 exp: ;
364 %%
365 ]])
366
367 AT_BISON_CHECK([-v -o input.c input.y])
368
369 AT_CLEANUP
370
371
372
373 ## ---------------- ##
374 ## Invalid inputs. ##
375 ## ---------------- ##
376
377
378 AT_SETUP([Invalid inputs])
379
380 AT_DATA([input.y],
381 [[%%
382 ?
383 default: 'a' }
384 %&
385 %a-does-not-exist
386 %-
387 %{
388 ]])
389
390 AT_BISON_CHECK([input.y], [1], [],
391 [[input.y:2.1: invalid character: `?'
392 input.y:3.14: invalid character: `}'
393 input.y:4.1: invalid character: `%'
394 input.y:4.2: invalid character: `&'
395 input.y:5.1-17: invalid directive: `%a-does-not-exist'
396 input.y:6.1: invalid character: `%'
397 input.y:6.2: invalid character: `-'
398 input.y:7.1-8.0: missing `%}' at end of file
399 input.y:7.1-8.0: syntax error, unexpected %{...%}
400 ]])
401
402 AT_CLEANUP
403
404
405 AT_SETUP([Invalid inputs with {}])
406
407 AT_DATA([input.y],
408 [[
409 %destructor
410 %initial-action
411 %lex-param
412 %parse-param
413 %printer
414 %union
415 ]])
416
417 AT_BISON_CHECK([input.y], [1], [],
418 [[input.y:3.1-15: syntax error, unexpected %initial-action, expecting {...}
419 ]])
420
421 AT_CLEANUP
422
423
424
425 ## ------------------- ##
426 ## Token definitions. ##
427 ## ------------------- ##
428
429
430 AT_SETUP([Token definitions])
431
432 # Bison managed, when fed with `%token 'f' "f"' to #define 'f'!
433 AT_DATA_GRAMMAR([input.y],
434 [%{
435 #include <stdlib.h>
436 #include <stdio.h>
437 void yyerror (const char *s);
438 int yylex (void);
439 %}
440 [%error-verbose
441 %token MYEOF 0 "end of file"
442 %token 'a' "a"
443 %token B_TOKEN "b"
444 %token C_TOKEN 'c'
445 %token 'd' D_TOKEN
446 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
447 %token SPECIAL "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!"
448 %%
449 exp: "a" "\\\'\?\"\a\b\f\n\r\t\v\001\201\x001\x000081??!";
450 %%
451 void
452 yyerror (char const *s)
453 {
454 fprintf (stderr, "%s\n", s);
455 }
456
457 int
458 yylex (void)
459 {
460 static int called;
461 if (called++)
462 abort ();
463 return SPECIAL;
464 }
465
466 int
467 main (void)
468 {
469 return yyparse ();
470 }
471 ]])
472
473 # Checking the warning message guarantees that the trigraph "??!" isn't
474 # unnecessarily escaped here even though it would need to be if encoded in a
475 # C-string literal. Also notice that unnecessary escaping, such as "\?", from
476 # the user specification is eliminated.
477 AT_BISON_CHECK([-o input.c input.y], [[0]], [[]],
478 [[input.y:22.8-14: warning: symbol SPECIAL redeclared
479 input.y:22.8-63: warning: symbol `"\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!"' used more than once as a literal string
480 ]])
481 AT_COMPILE([input])
482
483 # Checking the error message here guarantees that yytname, which does contain
484 # C-string literals, does have the trigraph escaped correctly. Thus, the
485 # symbol name reported by the parser is exactly the same as that reported by
486 # Bison itself.
487 AT_DATA([experr],
488 [[syntax error, unexpected "\\'?\"\a\b\f\n\r\t\v\001\201\001\201??!", expecting a
489 ]])
490 AT_PARSER_CHECK([./input], 1, [], [experr])
491 AT_CLEANUP
492
493
494
495 ## -------------------- ##
496 ## Characters Escapes. ##
497 ## -------------------- ##
498
499
500 AT_SETUP([Characters Escapes])
501
502 AT_DATA_GRAMMAR([input.y],
503 [%{
504 void yyerror (const char *s);
505 int yylex (void);
506 %}
507 [%%
508 exp:
509 '\'' "\'"
510 | '\"' "\""
511 | '"' "'"
512 ;
513 ]])
514 # Pacify font-lock-mode: "
515
516 AT_BISON_CHECK([-o input.c input.y])
517 AT_COMPILE([input.o], [-c input.c])
518 AT_CLEANUP
519
520
521
522 ## -------------- ##
523 ## Web2c Report. ##
524 ## -------------- ##
525
526 # The generation of the reduction was once wrong in Bison, and made it
527 # miss some reductions. In the following test case, the reduction on
528 # `undef_id_tok' was missing (it is in state 2 of the report checked
529 # below). This is stripped down from the actual web2c.y.
530
531 AT_SETUP([Web2c Report])
532
533 AT_KEYWORDS([report])
534
535 AT_DATA([input.y],
536 [[%token undef_id_tok const_id_tok
537
538 %start CONST_DEC_PART
539 \f
540 %%
541 CONST_DEC_PART:
542 CONST_DEC_LIST
543 ;
544
545 CONST_DEC_LIST:
546 CONST_DEC
547 | CONST_DEC_LIST CONST_DEC
548 ;
549
550 CONST_DEC:
551 { } undef_id_tok '=' const_id_tok ';'
552 ;
553 %%
554 ]])
555
556 AT_BISON_CHECK([-v input.y])
557 AT_CHECK([cat input.output], 0,
558 [[Grammar
559
560 0 $accept: CONST_DEC_PART $end
561
562 1 CONST_DEC_PART: CONST_DEC_LIST
563
564 2 CONST_DEC_LIST: CONST_DEC
565 3 | CONST_DEC_LIST CONST_DEC
566
567 4 $@1: /* empty */
568
569 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';'
570
571
572 Terminals, with rules where they appear
573
574 $end (0) 0
575 ';' (59) 5
576 '=' (61) 5
577 error (256)
578 undef_id_tok (258) 5
579 const_id_tok (259) 5
580
581
582 Nonterminals, with rules where they appear
583
584 $accept (7)
585 on left: 0
586 CONST_DEC_PART (8)
587 on left: 1, on right: 0
588 CONST_DEC_LIST (9)
589 on left: 2 3, on right: 1 3
590 CONST_DEC (10)
591 on left: 5, on right: 2 3
592 $@1 (11)
593 on left: 4, on right: 5
594
595
596 state 0
597
598 0 $accept: . CONST_DEC_PART $end
599
600 $default reduce using rule 4 ($@1)
601
602 CONST_DEC_PART go to state 1
603 CONST_DEC_LIST go to state 2
604 CONST_DEC go to state 3
605 $@1 go to state 4
606
607
608 state 1
609
610 0 $accept: CONST_DEC_PART . $end
611
612 $end shift, and go to state 5
613
614
615 state 2
616
617 1 CONST_DEC_PART: CONST_DEC_LIST .
618 3 CONST_DEC_LIST: CONST_DEC_LIST . CONST_DEC
619
620 undef_id_tok reduce using rule 4 ($@1)
621 $default reduce using rule 1 (CONST_DEC_PART)
622
623 CONST_DEC go to state 6
624 $@1 go to state 4
625
626
627 state 3
628
629 2 CONST_DEC_LIST: CONST_DEC .
630
631 $default reduce using rule 2 (CONST_DEC_LIST)
632
633
634 state 4
635
636 5 CONST_DEC: $@1 . undef_id_tok '=' const_id_tok ';'
637
638 undef_id_tok shift, and go to state 7
639
640
641 state 5
642
643 0 $accept: CONST_DEC_PART $end .
644
645 $default accept
646
647
648 state 6
649
650 3 CONST_DEC_LIST: CONST_DEC_LIST CONST_DEC .
651
652 $default reduce using rule 3 (CONST_DEC_LIST)
653
654
655 state 7
656
657 5 CONST_DEC: $@1 undef_id_tok . '=' const_id_tok ';'
658
659 '=' shift, and go to state 8
660
661
662 state 8
663
664 5 CONST_DEC: $@1 undef_id_tok '=' . const_id_tok ';'
665
666 const_id_tok shift, and go to state 9
667
668
669 state 9
670
671 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok . ';'
672
673 ';' shift, and go to state 10
674
675
676 state 10
677
678 5 CONST_DEC: $@1 undef_id_tok '=' const_id_tok ';' .
679
680 $default reduce using rule 5 (CONST_DEC)
681 ]])
682
683 AT_CLEANUP
684
685
686 ## --------------- ##
687 ## Web2c Actions. ##
688 ## --------------- ##
689
690 # The generation of the mapping `state -> action' was once wrong in
691 # extremely specific situations. web2c.y exhibits this situation.
692 # Below is a stripped version of the grammar. It looks like one can
693 # simplify it further, but just don't: it is tuned to exhibit a bug,
694 # which disappears when applying sane grammar transformations.
695 #
696 # It used to be wrong on yydefact only:
697 #
698 # static const yytype_uint8 yydefact[] =
699 # {
700 # - 2, 0, 1, 0, 0, 2, 3, 2, 5, 4,
701 # + 2, 0, 1, 0, 0, 0, 3, 2, 5, 4,
702 # 0, 0
703 # };
704 #
705 # but let's check all the tables.
706
707
708 AT_SETUP([Web2c Actions])
709
710 AT_KEYWORDS([report])
711
712 AT_DATA([input.y],
713 [[%%
714 statement: struct_stat;
715 struct_stat: /* empty. */ | if else;
716 if: "if" "const" "then" statement;
717 else: "else" statement;
718 %%
719 ]])
720
721 AT_BISON_CHECK([-v -o input.c input.y])
722
723 # Check only the tables.
724 [sed -n 's/ *$//;/^static const.*\[\] =/,/^}/p' input.c >tables.c]
725
726 AT_CHECK([[cat tables.c]], 0,
727 [[static const yytype_uint8 yytranslate[] =
728 {
729 0, 2, 2, 2, 2, 2, 2, 2, 2, 2,
730 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
731 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
732 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
733 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
734 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
735 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
736 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
737 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
738 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
739 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
740 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
741 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
742 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
743 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
744 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
745 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
746 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
747 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
748 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
749 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
750 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
751 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
752 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
753 2, 2, 2, 2, 2, 2, 2, 2, 2, 2,
754 2, 2, 2, 2, 2, 2, 1, 2, 3, 4,
755 5, 6
756 };
757 static const yytype_uint8 yyprhs[] =
758 {
759 0, 0, 3, 5, 6, 9, 14
760 };
761 static const yytype_int8 yyrhs[] =
762 {
763 8, 0, -1, 9, -1, -1, 10, 11, -1, 3,
764 4, 5, 8, -1, 6, 8, -1
765 };
766 static const yytype_uint8 yyrline[] =
767 {
768 0, 2, 2, 3, 3, 4, 5
769 };
770 static const char *const yytname[] =
771 {
772 "$end", "error", "$undefined", "\"if\"", "\"const\"", "\"then\"",
773 "\"else\"", "$accept", "statement", "struct_stat", "if", "else", 0
774 };
775 static const yytype_uint16 yytoknum[] =
776 {
777 0, 256, 257, 258, 259, 260, 261
778 };
779 static const yytype_uint8 yyr1[] =
780 {
781 0, 7, 8, 9, 9, 10, 11
782 };
783 static const yytype_uint8 yyr2[] =
784 {
785 0, 2, 1, 0, 2, 4, 2
786 };
787 static const yytype_uint8 yydefact[] =
788 {
789 3, 0, 0, 2, 0, 0, 1, 3, 4, 3,
790 6, 5
791 };
792 static const yytype_int8 yydefgoto[] =
793 {
794 -1, 2, 3, 4, 8
795 };
796 static const yytype_int8 yypact[] =
797 {
798 -2, -1, 4, -8, 0, 2, -8, -2, -8, -2,
799 -8, -8
800 };
801 static const yytype_int8 yypgoto[] =
802 {
803 -8, -7, -8, -8, -8
804 };
805 static const yytype_uint8 yytable[] =
806 {
807 10, 1, 11, 5, 6, 0, 7, 9
808 };
809 static const yytype_int8 yycheck[] =
810 {
811 7, 3, 9, 4, 0, -1, 6, 5
812 };
813 static const yytype_uint8 yystos[] =
814 {
815 0, 3, 8, 9, 10, 4, 0, 6, 11, 5,
816 8, 8
817 };
818 ]])
819
820 AT_CLEANUP
821
822
823 ## ------------------------- ##
824 ## yycheck Bound Violation. ##
825 ## ------------------------- ##
826
827
828 # _AT_DATA_DANCER_Y(BISON-OPTIONS)
829 # --------------------------------
830 # The following grammar, taken from Andrew Suffield's GPL'd implementation
831 # of DGMTP, the Dancer Generic Message Transport Protocol, used to violate
832 # yycheck's bounds when issuing a verbose error message. Keep this test
833 # so that bounds-checking compilers can check all the skeletons.
834 m4_define([_AT_DATA_DANCER_Y],
835 [AT_DATA_GRAMMAR([dancer.y],
836 [%{
837 static int yylex (AT_LALR1_CC_IF([int *], [void]));
838 AT_LALR1_CC_IF([],
839 [#include <stdlib.h>
840 #include <stdio.h>
841 static void yyerror (const char *);])
842 %}
843 $1
844 %token ARROW INVALID NUMBER STRING DATA
845 %defines
846 %verbose
847 %error-verbose
848 /* Grammar follows */
849 %%
850 line: header body
851 ;
852
853 header: '<' from ARROW to '>' type ':'
854 | '<' ARROW to '>' type ':'
855 | ARROW to type ':'
856 | type ':'
857 | '<' '>'
858 ;
859
860 from: DATA
861 | STRING
862 | INVALID
863 ;
864
865 to: DATA
866 | STRING
867 | INVALID
868 ;
869
870 type: DATA
871 | STRING
872 | INVALID
873 ;
874
875 body: /* empty */
876 | body member
877 ;
878
879 member: STRING
880 | DATA
881 | '+' NUMBER
882 | '-' NUMBER
883 | NUMBER
884 | INVALID
885 ;
886 %%
887 AT_LALR1_CC_IF(
888 [/* A C++ error reporting function. */
889 void
890 yy::parser::error (const location&, const std::string& m)
891 {
892 std::cerr << m << std::endl;
893 }
894
895 int
896 yyparse ()
897 {
898 yy::parser parser;
899 #if YYDEBUG
900 parser.set_debug_level (YYDEBUG);
901 #endif
902 return parser.parse ();
903 }
904 ],
905 [static void
906 yyerror (const char *s)
907 {
908 fprintf (stderr, "%s\n", s);
909 }])
910
911 static int
912 yylex (AT_LALR1_CC_IF([int *lval], [void]))
913 [{
914 static int const tokens[] =
915 {
916 ':', -1
917 };
918 static size_t toknum;
919 ]AT_LALR1_CC_IF([*lval = 0; /* Pacify GCC. */])[
920 if (! (toknum < sizeof tokens / sizeof *tokens))
921 abort ();
922 return tokens[toknum++];
923 }]
924
925 int
926 main (void)
927 {
928 return yyparse ();
929 }
930 ])
931 ])# _AT_DATA_DANCER_Y
932
933
934 # AT_CHECK_DANCER(BISON-OPTIONS)
935 # ------------------------------
936 # Generate the grammar, compile it, run it.
937 m4_define([AT_CHECK_DANCER],
938 [AT_SETUP([Dancer $1])
939 AT_BISON_OPTION_PUSHDEFS([$1])
940 _AT_DATA_DANCER_Y([$1])
941 AT_BISON_CHECK([-o dancer.c dancer.y])
942 AT_FULL_COMPILE([dancer])
943 AT_PARSER_CHECK([./dancer], 1, [],
944 [syntax error, unexpected ':'
945 ])
946 AT_BISON_OPTION_POPDEFS
947 AT_CLEANUP
948 ])
949
950 AT_CHECK_DANCER()
951 AT_CHECK_DANCER([%glr-parser])
952 AT_CHECK_DANCER([%skeleton "lalr1.cc"])
953
954
955 ## ------------------------------------------ ##
956 ## Diagnostic that expects two alternatives. ##
957 ## ------------------------------------------ ##
958
959
960 # _AT_DATA_EXPECT2_Y(BISON-OPTIONS)
961 # ---------------------------------
962 m4_define([_AT_DATA_EXPECT2_Y],
963 [AT_DATA_GRAMMAR([expect2.y],
964 [%{
965 static int yylex (AT_LALR1_CC_IF([int *], [void]));
966 AT_LALR1_CC_IF([],
967 [#include <stdio.h>
968 #include <stdlib.h>
969 static void yyerror (const char *);])
970 %}
971 $1
972 %defines
973 %error-verbose
974 %token A 1000
975 %token B
976
977 %%
978 program: /* empty */
979 | program e ';'
980 | program error ';';
981
982 e: e '+' t | t;
983 t: A | B;
984
985 %%
986 AT_LALR1_CC_IF(
987 [/* A C++ error reporting function. */
988 void
989 yy::parser::error (const location&, const std::string& m)
990 {
991 std::cerr << m << std::endl;
992 }
993
994 int
995 yyparse ()
996 {
997 yy::parser parser;
998 return parser.parse ();
999 }
1000 ],
1001 [static void
1002 yyerror (const char *s)
1003 {
1004 fprintf (stderr, "%s\n", s);
1005 }])
1006
1007 static int
1008 yylex (AT_LALR1_CC_IF([int *lval], [void]))
1009 [{
1010 static int const tokens[] =
1011 {
1012 1000, '+', '+', -1
1013 };
1014 static size_t toknum;
1015 ]AT_LALR1_CC_IF([*lval = 0; /* Pacify GCC. */])[
1016 if (! (toknum < sizeof tokens / sizeof *tokens))
1017 abort ();
1018 return tokens[toknum++];
1019 }]
1020
1021 int
1022 main (void)
1023 {
1024 return yyparse ();
1025 }
1026 ])
1027 ])# _AT_DATA_EXPECT2_Y
1028
1029
1030 # AT_CHECK_EXPECT2(BISON-OPTIONS)
1031 # -------------------------------
1032 # Generate the grammar, compile it, run it.
1033 m4_define([AT_CHECK_EXPECT2],
1034 [AT_SETUP([Expecting two tokens $1])
1035 AT_BISON_OPTION_PUSHDEFS([$1])
1036 _AT_DATA_EXPECT2_Y([$1])
1037 AT_BISON_CHECK([-o expect2.c expect2.y])
1038 AT_FULL_COMPILE([expect2])
1039 AT_PARSER_CHECK([./expect2], 1, [],
1040 [syntax error, unexpected '+', expecting A or B
1041 ])
1042 AT_BISON_OPTION_POPDEFS
1043 AT_CLEANUP
1044 ])
1045
1046 AT_CHECK_EXPECT2()
1047 AT_CHECK_EXPECT2([%glr-parser])
1048 AT_CHECK_EXPECT2([%skeleton "lalr1.cc"])
1049
1050
1051
1052 ## --------------------------------------------- ##
1053 ## Braced code in declaration in rules section. ##
1054 ## --------------------------------------------- ##
1055
1056 AT_SETUP([Braced code in declaration in rules section])
1057
1058 # Bison once mistook braced code in a declaration in the rules section to be a
1059 # rule action.
1060
1061 AT_DATA_GRAMMAR([input.y],
1062 [[%{
1063 #include <stdio.h>
1064 static void yyerror (char const *msg);
1065 static int yylex (void);
1066 %}
1067
1068 %error-verbose
1069
1070 %%
1071
1072 start:
1073 {
1074 printf ("Bison would once convert this action to a midrule because of the"
1075 " subsequent braced code.\n");
1076 }
1077 ;
1078
1079 %destructor { fprintf (stderr, "DESTRUCTOR\n"); } 'a';
1080 %printer { fprintf (yyoutput, "PRINTER"); } 'a';
1081
1082 %%
1083
1084 static void
1085 yyerror (char const *msg)
1086 {
1087 fprintf (stderr, "%s\n", msg);
1088 }
1089
1090 static int
1091 yylex (void)
1092 {
1093 return 'a';
1094 }
1095
1096 int
1097 main (void)
1098 {
1099 yydebug = 1;
1100 return !yyparse ();
1101 }
1102 ]])
1103
1104 AT_BISON_CHECK([-t -o input.c input.y])
1105 AT_COMPILE([input])
1106 AT_PARSER_CHECK([./input], 0,
1107 [[Bison would once convert this action to a midrule because of the subsequent braced code.
1108 ]],
1109 [[Starting parse
1110 Entering state 0
1111 Reducing stack by rule 1 (line 20):
1112 -> $$ = nterm start ()
1113 Stack now 0
1114 Entering state 1
1115 Reading a token: Next token is token 'a' (PRINTER)
1116 syntax error, unexpected 'a', expecting $end
1117 Error: popping nterm start ()
1118 Stack now 0
1119 Cleanup: discarding lookahead token 'a' (PRINTER)
1120 DESTRUCTOR
1121 Stack now 0
1122 ]])
1123
1124 AT_CLEANUP
1125
1126
1127
1128 ## --------------------------------- ##
1129 ## String alias declared after use. ##
1130 ## --------------------------------- ##
1131
1132 AT_SETUP([String alias declared after use])
1133
1134 # Bison once incorrectly asserted that the symbol number for either a token or
1135 # its alias was the highest symbol number so far at the point of the alias
1136 # declaration. That was true unless the declaration appeared after their first
1137 # uses and other tokens appeared in between.
1138
1139 AT_DATA([input.y],
1140 [[%%
1141 start: 'a' "A" 'b';
1142 %token 'a' "A";
1143 ]])
1144
1145 AT_BISON_CHECK([-t -o input.c input.y])
1146
1147 AT_CLEANUP
1148
1149
1150
1151 ## -------------------------------- ##
1152 ## Extra lookahead sets in report. ##
1153 ## -------------------------------- ##
1154
1155 AT_SETUP([[Extra lookahead sets in report]])
1156
1157 # Bison prints each reduction's lookahead set only next to the associated
1158 # state's one item that (1) is associated with the same rule as the reduction
1159 # and (2) has its dot at the end of its RHS. Previously, Bison also
1160 # erroneously printed the lookahead set next to all of the state's other items
1161 # associated with the same rule. This bug affected only the `.output' file and
1162 # not the generated parser source code.
1163
1164 AT_DATA([[input.y]],
1165 [[%%
1166 start: a | 'a' a 'a' ;
1167 a: 'a' ;
1168 ]])
1169
1170 AT_BISON_CHECK([[--report=all input.y]])
1171 AT_CHECK([[sed -n '/^state 1$/,/^state 2$/p' input.output]], [[0]],
1172 [[state 1
1173
1174 2 start: 'a' . a 'a'
1175 3 a: . 'a'
1176 3 | 'a' . [$end]
1177
1178 'a' shift, and go to state 4
1179
1180 $default reduce using rule 3 (a)
1181
1182 a go to state 5
1183
1184
1185 state 2
1186 ]])
1187
1188 AT_CLEANUP
1189
1190
1191
1192 ## ---------------------------------------- ##
1193 ## Token number in precedence declaration. ##
1194 ## ---------------------------------------- ##
1195
1196 AT_SETUP([[Token number in precedence declaration]])
1197
1198 # POSIX says token numbers can be declared in %left, %right, and %nonassoc, but
1199 # we lost this in Bison 1.50.
1200
1201 AT_DATA_GRAMMAR([input.y],
1202 [[%{
1203 #include <stdio.h>
1204 void yyerror (char const *);
1205 int yylex (void);
1206 %}
1207
1208 %error-verbose
1209 %left TK1 1 TK2 2 "tok alias" 3
1210
1211 %%
1212
1213 start: TK1 sr_conflict "tok alias" ;
1214
1215 sr_conflict:
1216 TK2
1217 | TK2 "tok alias"
1218 ;
1219
1220 %%
1221
1222 void
1223 yyerror (char const *msg)
1224 {
1225 fprintf (stderr, "%s\n", msg);
1226 }
1227
1228 int
1229 yylex (void)
1230 {
1231 static int const input[] = { 1, 2, 3, 0 };
1232 static int const *inputp = input;
1233 return *inputp++;
1234 }
1235
1236 int
1237 main (void)
1238 {
1239 return yyparse ();
1240 }
1241 ]])
1242
1243 AT_BISON_CHECK([[-o input.c input.y]], [[0]],,
1244 [[input.y:24.5-19: warning: rule useless in parser due to conflicts: sr_conflict: TK2 "tok alias"
1245 ]])
1246 AT_COMPILE([[input]])
1247 AT_PARSER_CHECK([[./input]])
1248
1249 AT_CLEANUP
1250
1251
1252
1253 ## ----------------------------------------------- ##
1254 ## Fix user actions without a trailing semicolon. ##
1255 ## ----------------------------------------------- ##
1256
1257 AT_SETUP([[Fix user actions without a trailing semicolon]])
1258
1259 # This feature is undocumented, but we accidentally broke it in 2.3a, and there
1260 # was a complaint at:
1261 # <http://lists.gnu.org/archive/html/bug-bison/2008-11/msg00001.html>.
1262
1263 AT_DATA([input.y],
1264 [[%%
1265 start: {asdffdsa} ;
1266 ]])
1267
1268 AT_BISON_CHECK([[-o input.c input.y]])
1269 AT_CHECK([[sed -n '/asdffdsa/s/^ *//p' input.c]], [[0]],
1270 [[{asdffdsa;}
1271 ]])
1272
1273 AT_CLEANUP