1 /* Output the generated parsing program for Bison.
3 Copyright (C) 1984, 1986, 1989, 1992, 2000-2013 Free Software Foundation, Inc.
6 This file is part of Bison, the GNU Compiler Compiler.
8 This program is free software: you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation, either version 3 of the License, or
11 (at your option) any later version.
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program. If not, see <http://www.gnu.org/licenses/>. */
24 #include <concat-filename.h>
25 #include <configmake.h>
27 #include <get-errno.h>
29 #include <spawn-pipe.h>
31 #include <wait-process.h>
37 #include "muscle-tab.h"
40 #include "scan-code.h" /* max_left_semantic_context */
41 #include "scan-skel.h"
45 static struct obstack format_obstack
;
48 /*-------------------------------------------------------------------.
49 | Create a function NAME which associates to the muscle NAME the |
50 | result of formatting the FIRST and then TABLE_DATA[BEGIN..END[ (of |
51 | TYPE), and to the muscles NAME_min and NAME_max, the smallest and |
52 | largest values found. |
53 `-------------------------------------------------------------------*/
56 #define GENERATE_MUSCLE_INSERT_TABLE(Name, Type) \
59 Name (char const *name, \
72 obstack_printf (&format_obstack, "%6d", first); \
73 for (i = begin; i < end; ++i) \
75 obstack_1grow (&format_obstack, ','); \
78 obstack_sgrow (&format_obstack, "\n "); \
83 obstack_printf (&format_obstack, "%6d", table_data[i]); \
84 if (table_data[i] < min) \
85 min = table_data[i]; \
86 if (max < table_data[i]) \
87 max = table_data[i]; \
89 muscle_insert (name, obstack_finish0 (&format_obstack)); \
93 /* Build 'NAME_min' and 'NAME_max' in the obstack. */ \
94 obstack_printf (&format_obstack, "%s_min", name); \
95 MUSCLE_INSERT_LONG_INT (obstack_finish0 (&format_obstack), lmin); \
96 obstack_printf (&format_obstack, "%s_max", name); \
97 MUSCLE_INSERT_LONG_INT (obstack_finish0 (&format_obstack), lmax); \
100 GENERATE_MUSCLE_INSERT_TABLE (muscle_insert_unsigned_int_table
, unsigned int)
101 GENERATE_MUSCLE_INSERT_TABLE (muscle_insert_int_table
, int)
102 GENERATE_MUSCLE_INSERT_TABLE (muscle_insert_base_table
, base_number
)
103 GENERATE_MUSCLE_INSERT_TABLE (muscle_insert_rule_number_table
, rule_number
)
104 GENERATE_MUSCLE_INSERT_TABLE (muscle_insert_symbol_number_table
, symbol_number
)
105 GENERATE_MUSCLE_INSERT_TABLE (muscle_insert_state_number_table
, state_number
)
107 /*----------------------------------------------------------------.
108 | Print to OUT a representation of CP quoted and escaped for M4. |
109 `----------------------------------------------------------------*/
112 quoted_output (FILE *out
, char const *cp
)
119 case '$': fputs ("$][", out
); break;
120 case '@': fputs ("@@", out
); break;
121 case '[': fputs ("@{", out
); break;
122 case ']': fputs ("@}", out
); break;
123 default: fputc (*cp
, out
); break;
129 /*----------------------------------------------------------------.
130 | Print to OUT a representation of STRING quoted and escaped both |
131 | for C and for M4. |
132 `----------------------------------------------------------------*/
135 string_output (FILE *out
, char const *string
)
137 quoted_output (out
, quotearg_style (c_quoting_style
, string
));
141 /*------------------------------------------------------------------.
142 | Prepare the muscles related to the symbols: translate, tname, and |
143 | toknum. |
144 `------------------------------------------------------------------*/
147 prepare_symbols (void)
149 MUSCLE_INSERT_INT ("tokens_number", ntokens
);
150 MUSCLE_INSERT_INT ("nterms_number", nvars
);
151 MUSCLE_INSERT_INT ("symbols_number", nsyms
);
152 MUSCLE_INSERT_INT ("undef_token_number", undeftoken
->number
);
153 MUSCLE_INSERT_INT ("user_token_number_max", max_user_token_number
);
155 muscle_insert_symbol_number_table ("translate",
157 token_translations
[0],
158 1, max_user_token_number
+ 1);
160 /* tname -- token names. */
163 /* We assume that the table will be output starting at column 2. */
165 struct quoting_options
*qo
= clone_quoting_options (0);
166 set_quoting_style (qo
, c_quoting_style
);
167 set_quoting_flags (qo
, QA_SPLIT_TRIGRAPHS
);
168 for (i
= 0; i
< nsyms
; i
++)
170 char *cp
= quotearg_alloc (symbols
[i
]->tag
, -1, qo
);
171 /* Width of the next token, including the two quotes, the
172 comma and the space. */
173 int width
= strlen (cp
) + 2;
177 obstack_sgrow (&format_obstack
, "\n ");
182 obstack_1grow (&format_obstack
, ' ');
183 obstack_escape (&format_obstack
, cp
);
185 obstack_1grow (&format_obstack
, ',');
189 obstack_sgrow (&format_obstack
, " ]b4_null[");
191 /* Finish table and store. */
192 muscle_insert ("tname", obstack_finish0 (&format_obstack
));
195 /* Output YYTOKNUM. */
198 int *values
= xnmalloc (ntokens
, sizeof *values
);
199 for (i
= 0; i
< ntokens
; ++i
)
200 values
[i
] = symbols
[i
]->user_token_number
;
201 muscle_insert_int_table ("toknum", values
,
202 values
[0], 1, ntokens
);
208 /*----------------------------------------------------------------.
209 | Prepare the muscles related to the rules: r1, r2, rline, dprec, |
210 | merger, immediate. |
211 `----------------------------------------------------------------*/
216 unsigned int *rline
= xnmalloc (nrules
, sizeof *rline
);
217 symbol_number
*r1
= xnmalloc (nrules
, sizeof *r1
);
218 unsigned int *r2
= xnmalloc (nrules
, sizeof *r2
);
219 int *dprec
= xnmalloc (nrules
, sizeof *dprec
);
220 int *merger
= xnmalloc (nrules
, sizeof *merger
);
221 int *immediate
= xnmalloc (nrules
, sizeof *immediate
);
224 for (r
= 0; r
< nrules
; ++r
)
226 /* LHS of the rule R. */
227 r1
[r
] = rules
[r
].lhs
->number
;
228 /* Length of rule R's RHS. */
229 r2
[r
] = rule_rhs_length (&rules
[r
]);
230 /* Line where rule was defined. */
231 rline
[r
] = rules
[r
].location
.start
.line
;
232 /* Dynamic precedence (GLR). */
233 dprec
[r
] = rules
[r
].dprec
;
234 /* Merger-function index (GLR). */
235 merger
[r
] = rules
[r
].merger
;
236 /* Immediate reduction flags (GLR). */
237 immediate
[r
] = rules
[r
].is_predicate
;
240 muscle_insert_unsigned_int_table ("rline", rline
, 0, 0, nrules
);
241 muscle_insert_symbol_number_table ("r1", r1
, 0, 0, nrules
);
242 muscle_insert_unsigned_int_table ("r2", r2
, 0, 0, nrules
);
243 muscle_insert_int_table ("dprec", dprec
, 0, 0, nrules
);
244 muscle_insert_int_table ("merger", merger
, 0, 0, nrules
);
245 muscle_insert_int_table ("immediate", immediate
, 0, 0, nrules
);
247 MUSCLE_INSERT_INT ("rules_number", nrules
);
248 MUSCLE_INSERT_INT ("max_left_semantic_context", max_left_semantic_context
);
258 /*--------------------------------------------.
259 | Prepare the muscles related to the states. |
260 `--------------------------------------------*/
263 prepare_states (void)
266 symbol_number
*values
= xnmalloc (nstates
, sizeof *values
);
267 for (i
= 0; i
< nstates
; ++i
)
268 values
[i
] = states
[i
]->accessing_symbol
;
269 muscle_insert_symbol_number_table ("stos", values
,
273 MUSCLE_INSERT_INT ("last", high
);
274 MUSCLE_INSERT_INT ("final_state_number", final_state
->number
);
275 MUSCLE_INSERT_INT ("states_number", nstates
);
279 /*-------------------------------------------------------.
280 | Compare two symbols by type-name, and then by number. |
281 `-------------------------------------------------------*/
284 symbol_type_name_cmp (const symbol
**lhs
, const symbol
**rhs
)
286 int res
= uniqstr_cmp ((*lhs
)->type_name
, (*rhs
)->type_name
);
288 res
= (*lhs
)->number
- (*rhs
)->number
;
293 /*----------------------------------------------------------------.
294 | Return a (malloc'ed) table of the symbols sorted by type-name. |
295 `----------------------------------------------------------------*/
298 symbols_by_type_name (void)
300 typedef int (*qcmp_type
) (const void *, const void *);
301 symbol
**res
= xmemdup (symbols
, nsyms
* sizeof *res
);
302 qsort (res
, nsyms
, sizeof *res
, (qcmp_type
) &symbol_type_name_cmp
);
307 /*------------------------------------------------------------------.
308 | Define b4_type_names, which is a list of (lists of the numbers of |
309 | symbols with the same type-name). |
310 `------------------------------------------------------------------*/
313 type_names_output (FILE *out
)
316 symbol
**syms
= symbols_by_type_name ();
317 fputs ("m4_define([b4_type_names],\n[", out
);
318 for (i
= 0; i
< nsyms
; /* nothing */)
320 /* The index of the first symbol of the current type-name. */
322 fputs (i
? ",\n[" : "[", out
);
323 for (; i
< nsyms
&& syms
[i
]->type_name
== syms
[i0
]->type_name
; ++i
)
324 fprintf (out
, "%s%d", i
!= i0
? ", " : "", syms
[i
]->number
);
327 fputs ("])\n\n", out
);
332 /*-------------------------------------.
333 | The list of all the symbol numbers. |
334 `-------------------------------------*/
337 symbol_numbers_output (FILE *out
)
340 fputs ("m4_define([b4_symbol_numbers],\n[", out
);
341 for (i
= 0; i
< nsyms
; ++i
)
342 fprintf (out
, "%s[%d]", i
? ", " : "", i
);
343 fputs ("])\n\n", out
);
347 /*---------------------------------.
348 | Output the user actions to OUT. |
349 `---------------------------------*/
352 user_actions_output (FILE *out
)
356 fputs ("m4_define([b4_actions], \n[", out
);
357 for (r
= 0; r
< nrules
; ++r
)
360 fprintf (out
, "b4_%scase(%d, [b4_syncline(%d, ",
361 rules
[r
].is_predicate
? "predicate_" : "",
362 r
+ 1, rules
[r
].action_location
.start
.line
);
363 string_output (out
, rules
[r
].action_location
.start
.file
);
364 fprintf (out
, ")\n[ %s]])\n\n", rules
[r
].action
);
366 fputs ("])\n\n", out
);
369 /*------------------------------------.
370 | Output the merge functions to OUT. |
371 `------------------------------------*/
374 merger_output (FILE *out
)
379 fputs ("m4_define([b4_mergers], \n[[", out
);
380 for (n
= 1, p
= merge_functions
; p
!= NULL
; n
+= 1, p
= p
->next
)
382 if (p
->type
[0] == '\0')
383 fprintf (out
, " case %d: *yy0 = %s (*yy0, *yy1); break;\n",
386 fprintf (out
, " case %d: yy0->%s = %s (*yy0, *yy1); break;\n",
387 n
, p
->type
, p
->name
);
389 fputs ("]])\n\n", out
);
393 /*---------------------------------------------.
394 | Prepare the muscles for symbol definitions. |
395 `---------------------------------------------*/
398 prepare_symbol_definitions (void)
401 for (i
= 0; i
< nsyms
; ++i
)
403 symbol
*sym
= symbols
[i
];
407 #define SET_KEY(Entry) \
408 obstack_printf (&format_obstack, "symbol(%d, %s)", \
410 key = obstack_finish0 (&format_obstack);
412 #define SET_KEY2(Entry, Suffix) \
413 obstack_printf (&format_obstack, "symbol(%d, %s_%s)", \
415 key = obstack_finish0 (&format_obstack);
417 /* Whether the symbol has an identifier. */
418 value
= symbol_id_get (sym
);
420 MUSCLE_INSERT_INT (key
, !!value
);
422 /* Its identifier. */
424 MUSCLE_INSERT_STRING (key
, value
? value
: "");
426 /* Its tag. Typically for documentation purpose. */
428 MUSCLE_INSERT_STRING (key
, sym
->tag
);
430 SET_KEY ("user_number");
431 MUSCLE_INSERT_INT (key
, sym
->user_token_number
);
433 SET_KEY ("is_token");
434 MUSCLE_INSERT_INT (key
,
435 i
< ntokens
&& sym
!= errtoken
&& sym
!= undeftoken
);
438 MUSCLE_INSERT_INT (key
, sym
->number
);
440 SET_KEY ("has_type");
441 MUSCLE_INSERT_INT (key
, !!sym
->type_name
);
444 MUSCLE_INSERT_STRING (key
, sym
->type_name
? sym
->type_name
: "");
448 for (j
= 0; j
< CODE_PROPS_SIZE
; ++j
)
450 /* "printer", not "%printer". */
451 char const *pname
= code_props_type_string (j
) + 1;
452 code_props
const *p
= symbol_code_props_get (sym
, j
);
453 SET_KEY2 ("has", pname
);
454 MUSCLE_INSERT_INT (key
, !!p
->code
);
458 SET_KEY2 (pname
, "file");
459 MUSCLE_INSERT_STRING (key
, p
->location
.start
.file
);
461 SET_KEY2 (pname
, "line");
462 MUSCLE_INSERT_INT (key
, p
->location
.start
.line
);
465 MUSCLE_INSERT_STRING_RAW (key
, p
->code
);
476 prepare_actions (void)
478 /* Figure out the actions for the specified state, indexed by
479 lookahead token type. */
481 muscle_insert_rule_number_table ("defact", yydefact
,
482 yydefact
[0], 1, nstates
);
484 /* Figure out what to do after reducing with each rule, depending on
485 the saved state from before the beginning of parsing the data
486 that matched this rule. */
487 muscle_insert_state_number_table ("defgoto", yydefgoto
,
488 yydefgoto
[0], 1, nsyms
- ntokens
);
492 muscle_insert_base_table ("pact", base
,
493 base
[0], 1, nstates
);
494 MUSCLE_INSERT_INT ("pact_ninf", base_ninf
);
497 muscle_insert_base_table ("pgoto", base
,
498 base
[nstates
], nstates
+ 1, nvectors
);
500 muscle_insert_base_table ("table", table
,
501 table
[0], 1, high
+ 1);
502 MUSCLE_INSERT_INT ("table_ninf", table_ninf
);
504 muscle_insert_base_table ("check", check
,
505 check
[0], 1, high
+ 1);
507 /* GLR parsing slightly modifies YYTABLE and YYCHECK (and thus
508 YYPACT) so that in states with unresolved conflicts, the default
509 reduction is not used in the conflicted entries, so that there is
510 a place to put a conflict pointer.
512 This means that YYCONFLP and YYCONFL are nonsense for a non-GLR
513 parser, so we could avoid accidents by not writing them out in
514 that case. Nevertheless, it seems even better to be able to use
515 the GLR skeletons even without the non-deterministic tables. */
516 muscle_insert_unsigned_int_table ("conflict_list_heads", conflict_table
,
517 conflict_table
[0], 1, high
+ 1);
518 muscle_insert_unsigned_int_table ("conflicting_rules", conflict_list
,
519 0, 1, conflict_list_cnt
);
523 /*--------------------------------------------.
524 | Output the definitions of all the muscles. |
525 `--------------------------------------------*/
528 muscles_output (FILE *out
)
530 fputs ("m4_init()\n", out
);
532 symbol_numbers_output (out
);
533 type_names_output (out
);
534 user_actions_output (out
);
536 muscles_m4_output (out
);
539 /*---------------------------.
540 | Call the skeleton parser. |
541 `---------------------------*/
544 output_skeleton (void)
549 /* Compute the names of the package data dir and skeleton files. */
550 char const *m4
= (m4
= getenv ("M4")) ? m4
: M4
;
551 char const *datadir
= pkgdatadir ();
552 char *m4sugar
= xconcatenated_filename (datadir
, "m4sugar/m4sugar.m4", NULL
);
553 char *m4bison
= xconcatenated_filename (datadir
, "bison.m4", NULL
);
554 char *skel
= (IS_PATH_WITH_DIR (skeleton
)
556 : xconcatenated_filename (datadir
, skeleton
, NULL
));
558 /* Test whether m4sugar.m4 is readable, to check for proper
559 installation. A faulty installation can cause deadlock, so a
560 cheap sanity check is worthwhile. */
561 xfclose (xfopen (m4sugar
, "r"));
563 /* Create an m4 subprocess connected to us via two pipes. */
565 if (trace_flag
& trace_tools
)
566 fprintf (stderr
, "running: %s %s - %s %s\n",
567 m4
, m4sugar
, m4bison
, skel
);
569 /* Some future version of GNU M4 (most likely 1.6) may treat the -dV in a
570 position-dependent manner. Keep it as the first argument so that all
571 files are traced.
573 See the thread starting at
574 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
575 for details. */
577 char const *argv
[10];
581 /* When POSIXLY_CORRECT is set, GNU M4 1.6 and later disable GNU
582 extensions, which Bison's skeletons depend on. With older M4,
583 it has no effect. M4 1.4.12 added a -g/--gnu command-line
584 option to make it explicit that a program wants GNU M4
585 extensions even when POSIXLY_CORRECT is set.
587 See the thread starting at
588 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
589 for details. */
591 argv
[i
++] = M4_GNU_OPTION
;
595 if (trace_flag
& trace_m4
)
602 aver (i
<= ARRAY_CARDINALITY (argv
));
604 /* The ugly cast is because gnulib gets the const-ness wrong. */
605 pid
= create_pipe_bidi ("m4", m4
, (char **)(void*)argv
, false, true,
613 if (trace_flag
& trace_muscles
)
614 muscles_output (stderr
);
616 FILE *out
= xfdopen (filter_fd
[1], "w");
617 muscles_output (out
);
621 /* Read and process m4's output. */
622 timevar_push (TV_M4
);
624 FILE *in
= xfdopen (filter_fd
[0], "r");
626 /* scan_skel should have read all of M4's output. Otherwise, when we
627 close the pipe, we risk letting M4 report a broken-pipe to the
628 Bison user. */
632 wait_subprocess (pid
, "m4", false, false, true, true, NULL
);
639 /* BISON_USE_PUSH_FOR_PULL is for the test suite and should not be
640 documented for the user. */
641 char const *cp
= getenv ("BISON_USE_PUSH_FOR_PULL");
642 bool use_push_for_pull_flag
= cp
&& *cp
&& strtol (cp
, 0, 10);
645 MUSCLE_INSERT_BOOL ("defines_flag", defines_flag
);
646 MUSCLE_INSERT_BOOL ("glr_flag", glr_parser
);
647 MUSCLE_INSERT_BOOL ("nondeterministic_flag", nondeterministic_parser
);
648 MUSCLE_INSERT_BOOL ("synclines_flag", !no_lines_flag
);
649 MUSCLE_INSERT_BOOL ("tag_seen_flag", tag_seen
);
650 MUSCLE_INSERT_BOOL ("token_table_flag", token_table_flag
);
651 MUSCLE_INSERT_BOOL ("use_push_for_pull_flag", use_push_for_pull_flag
);
652 MUSCLE_INSERT_BOOL ("yacc_flag", yacc_flag
);
655 if (spec_name_prefix
)
656 MUSCLE_INSERT_STRING ("prefix", spec_name_prefix
);
658 MUSCLE_INSERT_STRING ("file_name_all_but_ext", all_but_ext
);
660 #define DEFINE(Name) MUSCLE_INSERT_STRING (#Name, Name ? Name : "")
662 DEFINE (parser_file_name
);
663 DEFINE (spec_defines_file
);
664 DEFINE (spec_file_prefix
);
665 DEFINE (spec_graph_file
);
666 DEFINE (spec_name_prefix
);
667 DEFINE (spec_outfile
);
668 DEFINE (spec_verbose_file
);
671 /* Find the right skeleton file, and add muscles about the skeletons. */
673 MUSCLE_INSERT_C_STRING ("skeleton", skeleton
);
675 skeleton
= language
->skeleton
;
677 /* About the skeletons. */
679 /* b4_pkgdatadir is used inside m4_include in the skeletons, so digraphs
680 would never be expanded. Hopefully no one has M4-special characters in
681 their Bison installation path. */
682 MUSCLE_INSERT_STRING_RAW ("pkgdatadir", pkgdatadir ());
687 /*----------------------------------------------------------.
688 | Output the parsing tables and the parser code to ftable. |
689 `----------------------------------------------------------*/
694 obstack_init (&format_obstack
);
700 prepare_symbol_definitions ();
704 /* Process the selected skeleton file. */
707 obstack_free (&format_obstack
, NULL
);
713 char const *cp
= getenv ("BISON_PKGDATADIR");
714 return cp
? cp
: PKGDATADIR
;