]> git.saurik.com Git - bison.git/blob - tests/input.at
* bootstrap.conf (gnulib_modules): Add config-h.
[bison.git] / tests / input.at
1 # Checking the Bison scanner. -*- Autotest -*-
2 # Copyright (C) 2002, 2003, 2004, 2005, 2006 Free Software Foundation, Inc.
3
4 # This program is free software; you can redistribute it and/or modify
5 # it under the terms of the GNU General Public License as published by
6 # the Free Software Foundation; either version 2, or (at your option)
7 # any later version.
8
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU General Public License for more details.
13
14 # You should have received a copy of the GNU General Public License
15 # along with this program; if not, write to the Free Software
16 # Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
17 # 02110-1301, USA.
18
19 AT_BANNER([[Input Processing.]])
20
21 # Mostly test that we are robust to mistakes.
22
23
24 ## ------------ ##
25 ## Invalid $n. ##
26 ## ------------ ##
27
28 AT_SETUP([Invalid \$n and @n])
29
30 AT_DATA([input.y],
31 [[%%
32 exp: { $$ = $1 ; };
33 exp: { @$ = @1 ; };
34 ]])
35
36 AT_CHECK([bison input.y], [1], [],
37 [[input.y:2.13-14: integer out of range: `$1'
38 input.y:3.13-14: integer out of range: `@1'
39 ]])
40
41 AT_CLEANUP
42
43
44 ## -------------- ##
45 ## Type Clashes. ##
46 ## -------------- ##
47
48 AT_SETUP([Type Clashes])
49
50 AT_DATA([input.y],
51 [[%union { int bar; }
52 %token foo
53 %type <bar> exp
54 %%
55 exp: foo { $$; } foo { $2; } foo
56 | foo
57 | /* Empty. */
58 ;
59 ]])
60
61 AT_CHECK([bison input.y], [1], [],
62 [[input.y:5.12-13: $$ for the midrule at $2 of `exp' has no declared type
63 input.y:5.24-25: $2 of `exp' has no declared type
64 input.y:5.6-32: warning: type clash on default action: <bar> != <>
65 input.y:6.6-8: warning: type clash on default action: <bar> != <>
66 input.y:7.5: warning: empty rule for typed nonterminal, and no action
67 ]])
68
69 AT_CLEANUP
70
71
72 # _AT_UNUSED_VALUES_DECLARATIONS()
73 # --------------------------------------------
74 # Generate the token, type, and destructor
75 # declarations for the unused values tests.
76
77 m4_define([_AT_UNUSED_VALUES_DECLARATIONS],
78 [[[%token <integer> INT;
79 %type <integer> a b c d e f g h i j k l;
80 %destructor { destroy ($$); } INT a b c d e f g h i j k l;]]])
81
82
83 # AT_CHECK_UNUSED_VALUES(DECLARATIONS_AFTER)
84 # --------------------------------------------
85 # Generate a grammar to test unused values,
86 # compile it, run it. If DECLARATIONS_AFTER
87 # is set, then the token, type, and destructor
88 # declarations are generated after the rules
89 # rather than before.
90
91 m4_define([AT_CHECK_UNUSED_VALUES],
92 [AT_DATA([input.y],
93 m4_ifval($1, [
94
95
96 ], [_AT_UNUSED_VALUES_DECLARATIONS
97 ])[[%%
98 start:
99 'a' a { $]2[ } | 'b' b { $]2[ } | 'c' c { $]2[ } | 'd' d { $]2[ } | 'e' e { $]2[ }
100 | 'f' f { $]2[ } | 'g' g { $]2[ } | 'h' h { $]2[ } | 'i' i { $]2[ } | 'j' j { $]2[ }
101 | 'k' k { $]2[ } | 'l' l { $]2[ }
102 ;
103
104 a: INT | INT { } INT { } INT { };
105 b: INT | /* empty */;
106 c: INT | INT { $]1[ } INT { } INT { };
107 d: INT | INT { } INT { $]1[ } INT { };
108 e: INT | INT { } INT { } INT { $]1[ };
109 f: INT | INT { } INT { } INT { $]$[ = $]1[ + $]3[ + $]5[; };
110 g: INT | INT { $<integer>$; } INT { $<integer>$; } INT { };
111 h: INT | INT { $<integer>$; } INT { $<integer>$ = $<integer>2; } INT { };
112 i: INT | INT INT { } { $]$[ = $]1[ + $]2[; };
113 j: INT | INT INT { $<integer>$ = 1; } { $]$[ = $]1[ + $]2[; };
114 k: INT | INT INT { $<integer>$; } { $<integer>$ = $<integer>3; } { };
115 l: INT | INT { $<integer>$ = $<integer>1; } INT { $<integer>$ = $<integer>2 + $<integer>3; } INT { $<integer>$ = $<integer>4 + $<integer>5; };]]m4_ifval($1, [
116 _AT_UNUSED_VALUES_DECLARATIONS])
117 )
118
119 AT_CHECK([bison input.y], [0], [],
120 [[input.y:11.10-32: warning: unset value: $]$[
121 input.y:11.10-32: warning: unused value: $]1[
122 input.y:11.10-32: warning: unused value: $]3[
123 input.y:11.10-32: warning: unused value: $]5[
124 input.y:12.9: warning: empty rule for typed nonterminal, and no action
125 input.y:13.10-35: warning: unset value: $]$[
126 input.y:13.10-35: warning: unused value: $]3[
127 input.y:13.10-35: warning: unused value: $]5[
128 input.y:14.10-35: warning: unset value: $]$[
129 input.y:14.10-35: warning: unused value: $]3[
130 input.y:14.10-35: warning: unused value: $]5[
131 input.y:15.10-36: warning: unset value: $]$[
132 input.y:15.10-36: warning: unused value: $]3[
133 input.y:15.10-36: warning: unused value: $]5[
134 input.y:17.10-58: warning: unset value: $]$[
135 input.y:17.10-58: warning: unused value: $]1[
136 input.y:17.10-58: warning: unused value: $]2[
137 input.y:17.10-58: warning: unused value: $]3[
138 input.y:17.10-58: warning: unused value: $]4[
139 input.y:17.10-58: warning: unused value: $]5[
140 input.y:18.10-72: warning: unset value: $]$[
141 input.y:18.10-72: warning: unused value: $]1[
142 input.y:18.10-72: warning: unused value: $]3[
143 input.y:18.10-72: warning: unused value: $]4[
144 input.y:18.10-72: warning: unused value: $]5[
145 input.y:20.10-55: warning: unused value: $]3[
146 input.y:21.10-68: warning: unset value: $]$[
147 input.y:21.10-68: warning: unused value: $]1[
148 input.y:21.10-68: warning: unused value: $]2[
149 input.y:21.10-68: warning: unused value: $]4[
150 ]])])
151
152
153 ## --------------- ##
154 ## Unused values. ##
155 ## --------------- ##
156
157 AT_SETUP([Unused values])
158 AT_CHECK_UNUSED_VALUES
159 AT_CLEANUP
160
161
162 ## ------------------------------------------ ##
163 ## Unused values before symbol declarations. ##
164 ## ------------------------------------------ ##
165
166 AT_SETUP([Unused values before symbol declarations])
167 AT_CHECK_UNUSED_VALUES([1])
168 AT_CLEANUP
169
170
171 ## --------------------------------------------- ##
172 ## Default %printer and %destructor redeclared. ##
173 ## --------------------------------------------- ##
174
175 AT_SETUP([Default %printer and %destructor redeclared])
176
177 AT_DATA([[input.y]],
178 [[%destructor { destroy ($$); } %symbol-default %symbol-default
179 %printer { destroy ($$); } %symbol-default %symbol-default
180
181 %destructor { destroy ($$); } %symbol-default
182 %printer { destroy ($$); } %symbol-default
183
184 %%
185
186 start: ;
187
188 %destructor { destroy ($$); } %symbol-default;
189 %printer { destroy ($$); } %symbol-default;
190 ]])
191
192 AT_CHECK([bison input.y], [1], [],
193 [[input.y:1.13-29: redeclaration for default %destructor
194 input.y:1.13-29: previous declaration
195 input.y:2.10-26: redeclaration for default %printer
196 input.y:2.10-26: previous declaration
197 input.y:4.13-29: redeclaration for default %destructor
198 input.y:1.13-29: previous declaration
199 input.y:5.10-26: redeclaration for default %printer
200 input.y:2.10-26: previous declaration
201 input.y:11.13-29: redeclaration for default %destructor
202 input.y:4.13-29: previous declaration
203 input.y:12.10-26: redeclaration for default %printer
204 input.y:5.10-26: previous declaration
205 ]])
206
207 AT_CLEANUP
208
209
210 ## ---------------------------------------------- ##
211 ## Per-type %printer and %destructor redeclared. ##
212 ## ---------------------------------------------- ##
213
214 AT_SETUP([Per-type %printer and %destructor redeclared])
215
216 AT_DATA([[input.y]],
217 [[%destructor { destroy ($$); } <field1> <field2>
218 %printer { destroy ($$); } <field1> <field2>
219
220 %destructor { destroy ($$); } <field1> <field1>
221 %printer { destroy ($$); } <field2> <field2>
222
223 %%
224
225 start: ;
226
227 %destructor { destroy ($$); } <field2> <field1>;
228 %printer { destroy ($$); } <field2> <field1>;
229 ]])
230
231 AT_CHECK([bison input.y], [1], [],
232 [[input.y:4.13-29: %destructor redeclaration for <field1>
233 input.y:1.13-29: previous declaration
234 input.y:4.13-29: %destructor redeclaration for <field1>
235 input.y:4.13-29: previous declaration
236 input.y:5.10-26: %printer redeclaration for <field2>
237 input.y:2.10-26: previous declaration
238 input.y:5.10-26: %printer redeclaration for <field2>
239 input.y:5.10-26: previous declaration
240 input.y:11.13-29: %destructor redeclaration for <field1>
241 input.y:4.13-29: previous declaration
242 input.y:11.13-29: %destructor redeclaration for <field2>
243 input.y:1.13-29: previous declaration
244 input.y:12.10-26: %printer redeclaration for <field1>
245 input.y:2.10-26: previous declaration
246 input.y:12.10-26: %printer redeclaration for <field2>
247 input.y:5.10-26: previous declaration
248 ]])
249
250 AT_CLEANUP
251
252
253 ## ---------------------------------------- ##
254 ## Unused values with default %destructor. ##
255 ## ---------------------------------------- ##
256
257 AT_SETUP([Unused values with default %destructor])
258
259 AT_DATA([[input.y]],
260 [[%destructor { destroy ($$); } %symbol-default
261
262 %%
263
264 start: end end { $1; } ;
265 end: { } ;
266 ]])
267
268 AT_CHECK([bison input.y], [0], [],
269 [[input.y:5.8-22: warning: unset value: $$
270 input.y:5.8-22: warning: unused value: $2
271 input.y:6.6-8: warning: unset value: $$
272 ]])
273
274 AT_CLEANUP
275
276
277 ## ----------------------------------------- ##
278 ## Unused values with per-type %destructor. ##
279 ## ----------------------------------------- ##
280
281 AT_SETUP([Unused values with per-type %destructor])
282
283 AT_DATA([[input.y]],
284 [[%destructor { destroy ($$); } <field1>
285 %type <field1> start end
286
287 %%
288
289 start: end end { $1; } ;
290 end: { } ;
291 ]])
292
293 AT_CHECK([bison input.y], [0], [],
294 [[input.y:6.8-22: warning: unset value: $$
295 input.y:6.8-22: warning: unused value: $2
296 input.y:7.6-8: warning: unset value: $$
297 ]])
298
299 AT_CLEANUP
300
301
302 ## ---------------------- ##
303 ## Incompatible Aliases. ##
304 ## ---------------------- ##
305
306 AT_SETUP([Incompatible Aliases])
307
308 AT_DATA([input.y],
309 [[%token foo "foo"
310
311 %type <bar> foo
312 %printer {bar} foo
313 %destructor {bar} foo
314 %left foo
315
316 %type <baz> "foo"
317 %printer {baz} "foo"
318 %destructor {baz} "foo"
319 %left "foo"
320
321 %%
322 exp: foo;
323 ]])
324
325 AT_CHECK([bison input.y], [1], [],
326 [[input.y:8.7-11: %type redeclaration for foo
327 input.y:3.7-11: previous declaration
328 input.y:10.13-17: %destructor redeclaration for foo
329 input.y:5.13-17: previous declaration
330 input.y:9.10-14: %printer redeclaration for foo
331 input.y:4.10-14: previous declaration
332 input.y:11.1-5: %left redeclaration for foo
333 input.y:6.1-5: previous declaration
334 ]])
335
336 AT_CLEANUP
337
338
339
340 ## ----------------------- ##
341 ## Torturing the Scanner. ##
342 ## ----------------------- ##
343
344 # Be sure to compile and run, so that the C compiler checks what
345 # we do.
346
347 AT_SETUP([Torturing the Scanner])
348
349
350 AT_DATA([input.y], [])
351 AT_CHECK([bison input.y], [1], [],
352 [[input.y:1.1: syntax error, unexpected end of file
353 ]])
354
355
356 AT_DATA([input.y],
357 [{}
358 ])
359 AT_CHECK([bison input.y], [1], [],
360 [[input.y:1.1-2: syntax error, unexpected {...}
361 ]])
362
363
364 AT_DATA_GRAMMAR([input.y],
365 [[%{
366 /* This is seen in GCC: a %{ and %} in middle of a comment. */
367 const char *foo = "So %{ and %} can be here too.";
368
369 #if 0
370 /* These examples test Bison while not stressing C compilers too much.
371 Many C compilers mishandle backslash-newlines, so this part of the
372 test is inside "#if 0". The comment and string are written so that
373 the "#endif" will be seen regardless of the C compiler bugs that we
374 know about, namely:
375
376 HP C (as of late 2002) mishandles *\[newline]\[newline]/ within a
377 comment.
378
379 The Apple Darwin compiler (as of late 2002) mishandles
380 \\[newline]' within a character constant.
381
382 */
383
384 /\
385 * A comment with backslash-newlines in it. %} *\
386 \
387 /
388 /* { Close the above comment, if the C compiler mishandled it. */
389
390 char str[] = "\\
391 " A string with backslash-newlines in it %{ %} \\
392 \
393 "";
394
395 char apostrophe = '\'';
396 #endif
397
398 #include <stdio.h>
399 %}
400 /* %{ and %} can be here too. */
401
402 %{
403 /* Exercise pre-prologue dependency to %union. */
404 typedef int value;
405 %}
406
407 /* Exercise M4 quoting: '@:>@@:>@', 0. */
408
409 /* Also exercise %union. */
410 %union
411 {
412 value ival; /* A comment to exercise an old bug. */
413 };
414
415
416 /* Exercise post-prologue dependency to %union. */
417 %{
418 static YYSTYPE value_as_yystype (value val);
419
420 /* Exercise quotes in declarations. */
421 char quote[] = "@:>@@:>@,";
422 %}
423
424 %{
425 static void yyerror (const char *s);
426 static int yylex (void);
427 %}
428
429 %type <ival> '@<:@'
430
431 /* Exercise quotes in strings. */
432 %token FAKE "fake @<:@@:>@ \a\b\f\n\r\t\v\"\'\?\\\u005B\U0000005c ??!??'??(??)??-??/??<??=??> \x1\1"
433
434 %%
435 /* Exercise M4 quoting: '@:>@@:>@', @<:@, 1. */
436 exp: '@<:@' '\1' two '$' '@' '{' oline output.or.oline.opt
437 {
438 /* Exercise quotes in braces. */
439 char tmp[] = "@<:@%c@:>@,\n";
440 printf (tmp, $1);
441 }
442 ;
443
444 two: '\x000000000000000000000000000000000000000000000000000000000000000000002';
445 oline: '@' 'o' 'l' 'i' 'n' 'e' '@' '_' '_' 'o' 'l' 'i' 'n' 'e' '_' '_';
446 output.or.oline.opt: ;|oline;;|output;;;
447 output: '#' 'o' 'u' 't' 'p' 'u' 't' ' ';
448 %%
449 /* Exercise M4 quoting: '@:>@@:>@', @<:@, 2. */
450
451 static YYSTYPE
452 value_as_yystype (value val)
453 {
454 YYSTYPE res;
455 res.ival = val;
456 return res;
457 }
458
459 static int
460 yylex (void)
461 {
462 static char const input[] = "@<:@\1\2$@{@oline@__@&t@oline__\
463 #output "; /* "
464 */
465 static size_t toknum;
466 if (! (toknum < sizeof input))
467 abort ();
468 yylval = value_as_yystype (input[toknum]);
469 return input[toknum++];
470 }
471
472 static void
473 yyerror (const char *msg)
474 {
475 fprintf (stderr, "%s\n", msg);
476 }
477 ]])
478
479 # Pacify Emacs'font-lock-mode: "
480
481 AT_DATA([main.c],
482 [[typedef int value;
483 #include "input.h"
484
485 int yyparse (void);
486
487 int
488 main (void)
489 {
490 return yyparse ();
491 }
492 ]])
493
494 AT_CHECK([bison -d -v -o input.c input.y])
495 AT_COMPILE([input.o], [-c input.c])
496 AT_COMPILE([main.o], [-c main.c])
497 AT_COMPILE([input], [input.o main.o])
498 AT_PARSER_CHECK([./input], 0,
499 [[[@<:@],
500 ]])
501
502 AT_CLEANUP
503
504
505 ## ---------------------- ##
506 ## Typed symbol aliases. ##
507 ## ---------------------- ##
508
509 AT_SETUP([Typed symbol aliases])
510
511 # Bison 2.0 broke typed symbol aliases - ensure they work.
512
513 AT_DATA_GRAMMAR([input.y],
514 [[%union
515 {
516 int val;
517 };
518 %token <val> MY_TOKEN "MY TOKEN"
519 %type <val> exp
520 %%
521 exp: "MY TOKEN";
522 %%
523 ]])
524
525 AT_CHECK([bison -o input.c input.y])
526
527 AT_CLEANUP
528
529
530 ## --------- ##
531 ## Require. ##
532 ## --------- ##
533
534 m4_define([AT_CHECK_REQUIRE],
535 [AT_SETUP([Require $1])
536 AT_DATA_GRAMMAR([input.y],
537 [[%require "$1";
538 %%
539 empty_file:;
540 ]])
541 AT_CHECK([bison -o input.c input.y], $2, [], ignore)
542 AT_CLEANUP
543 ])
544
545 AT_CHECK_REQUIRE(1.0, 0)
546 AT_CHECK_REQUIRE(AT_PACKAGE_VERSION, 0)
547 ## FIXME: Some day augment this version number.
548 AT_CHECK_REQUIRE(100.0, 63)
549
550
551 ## ------------------------------------- ##
552 ## String aliases for character tokens. ##
553 ## ------------------------------------- ##
554
555 AT_SETUP([String aliases for character tokens])
556
557 # Bison once thought a character token and its alias were different symbols
558 # with the same user token number.
559
560 AT_DATA_GRAMMAR([input.y],
561 [[%token 'a' "a"
562 %%
563 start: 'a';
564 %%
565 ]])
566
567 AT_CHECK([bison -o input.c input.y])
568
569 AT_CLEANUP
570
571
572 ## --------------------- ##
573 ## Unclosed constructs. ##
574 ## --------------------- ##
575
576 AT_SETUP([Unclosed constructs])
577
578 # Bison's scan-gram.l once forgot to STRING_FINISH some unclosed constructs, so
579 # they were prepended to whatever it STRING_GROW'ed next. It also threw them
580 # away rather than returning them to the parser. The effect was confusing
581 # subsequent error messages.
582
583 AT_DATA([input.y],
584 [[%token A "a
585 %token B "b"
586 %token AB "ab" // Used to complain that "ab" was already used.
587 %token C '1
588 %token TWO "2"
589 %token TICK_TWELVE "'12" // Used to complain that "'12" was already used.
590
591 %%
592
593 start: ;
594
595 // Used to report a syntax error because it didn't see any kind of symbol
596 // identifier.
597 %type <f> 'a
598 ;
599 %type <f> "a
600 ;
601 // Used to report a syntax error because it didn't see braced code.
602 %destructor { free ($$)
603 ]])
604
605 AT_CHECK([bison -o input.c input.y], 1, [],
606 [[input.y:1.10-2.0: missing `"' at end of line
607 input.y:4.10-5.0: missing `'' at end of line
608 input.y:14.11-15.0: missing `'' at end of line
609 input.y:16.11-17.0: missing `"' at end of line
610 input.y:19.13-20.0: missing `}' at end of file
611 input.y:20.1: syntax error, unexpected end of file
612 ]])
613
614 AT_CLEANUP
615
616
617 ## ------------------------- ##
618 ## %start after first rule. ##
619 ## ------------------------- ##
620
621 AT_SETUP([%start after first rule])
622
623 # Bison once complained that a %start after the first rule was a redeclaration
624 # of the start symbol.
625
626 AT_DATA([input.y],
627 [[%%
628 false_start: ;
629 start: false_start ;
630 %start start;
631 ]])
632
633 AT_CHECK([bison -o input.c input.y])
634
635 AT_CLEANUP