1 /* Output the generated parsing program for Bison.
3 Copyright (C) 1984, 1986, 1989, 1992, 2000-2012 Free Software
6 This file is part of Bison, the GNU Compiler Compiler.
8 This program is free software: you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation, either version 3 of the License, or
11 (at your option) any later version.
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program. If not, see <http://www.gnu.org/licenses/>. */
24 #include <concat-filename.h>
25 #include <configmake.h>
27 #include <get-errno.h>
29 #include <spawn-pipe.h>
31 #include <wait-process.h>
37 #include "muscle-tab.h"
40 #include "scan-code.h" /* max_left_semantic_context */
41 #include "scan-skel.h"
/* Scratch obstack shared by the routines of this file: muscle keys
   and table texts are grown in it and then finished with
   obstack_finish0 before being handed to the muscle table. */
45 static struct obstack format_obstack
;
48 /*-------------------------------------------------------------------.
49 | Create a function NAME which associates to the muscle NAME the |
50 | result of formatting the FIRST and then TABLE_DATA[BEGIN..END[ (of |
51 | TYPE), and to the muscle NAME_max, the max value of the |
| TABLE_DATA; the muscle NAME_min likewise gets its min value. |
53 `-------------------------------------------------------------------*/
/* The formatted text is FIRST followed by the entries
   TABLE_DATA[BEGIN..END[, each printed with "%6d" and preceded by a
   comma.  The macro is instantiated right after its definition, once
   per element type (unsigned int, int, base_number, rule_number,
   symbol_number and state_number).  */
56 #define GENERATE_MUSCLE_INSERT_TABLE(Name, Type) \
59 Name (char const *name, \
72 obstack_printf (&format_obstack, "%6d", first); \
73 for (i = begin; i < end; ++i) \
75 obstack_1grow (&format_obstack, ','); \
78 obstack_sgrow (&format_obstack, "\n "); \
83 obstack_printf (&format_obstack, "%6d", table_data[i]); \
84 if (table_data[i] < min) \
85 min = table_data[i]; \
86 if (max < table_data[i]) \
87 max = table_data[i]; \
89 muscle_insert (name, obstack_finish0 (&format_obstack)); \
93 /* Build `NAME_min' and `NAME_max' in the obstack. */ \
94 obstack_printf (&format_obstack, "%s_min", name); \
95 MUSCLE_INSERT_LONG_INT (obstack_finish0 (&format_obstack), lmin); \
96 obstack_printf (&format_obstack, "%s_max", name); \
97 MUSCLE_INSERT_LONG_INT (obstack_finish0 (&format_obstack), lmax); \
100 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_unsigned_int_table
, unsigned int)
101 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_int_table
, int)
102 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_base_table
, base_number
)
103 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_rule_number_table
, rule_number
)
104 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_symbol_number_table
, symbol_number
)
105 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_state_number_table
, state_number
)
108 /*----------------------------------------------------------------.
109 | Print to OUT a representation of CP quoted and escaped for M4. |
110 `----------------------------------------------------------------*/
/* Escaping rules: `$' is written as "$][", `@' as "@@", `[' as "@{"
   and `]' as "@}"; any other character is copied to OUT unchanged.  */
113 quoted_output (FILE *out
, char const *cp
)
120 case '$': fputs ("$][", out
); break;
121 case '@': fputs ("@@", out
); break;
122 case '[': fputs ("@{", out
); break;
123 case ']': fputs ("@}", out
); break;
124 default: fputc (*cp
, out
); break;
130 /*----------------------------------------------------------------.
131 | Print to OUT a representation of STRING quoted and escaped both |
| for C and for M4. |
133 `----------------------------------------------------------------*/
/* STRING is first quoted in the C style by quotearg_style; that
   result is then sent through quoted_output.  */
136 string_output (FILE *out
, char const *string
)
138 quoted_output (out
, quotearg_style (c_quoting_style
, string
));
142 /*------------------------------------------------------------------.
143 | Prepare the muscles related to the symbols: translate, tname, and |
| toknum. |
145 `------------------------------------------------------------------*/
/* The counters tokens_number, nterms_number and symbols_number, as
   well as undef_token_number and user_token_number_max, are inserted
   here too.  */
148 prepare_symbols (void)
150 MUSCLE_INSERT_INT ("tokens_number", ntokens
);
151 MUSCLE_INSERT_INT ("nterms_number", nvars
);
152 MUSCLE_INSERT_INT ("symbols_number", nsyms
);
153 MUSCLE_INSERT_INT ("undef_token_number", undeftoken
->number
);
154 MUSCLE_INSERT_INT ("user_token_number_max", max_user_token_number
);
156 muscle_insert_symbol_number_table ("translate",
158 token_translations
[0],
159 1, max_user_token_number
+ 1);
161 /* tname -- token names. */
164 /* We assume that the table will be output starting at column 2. */
166 struct quoting_options
*qo
= clone_quoting_options (0);
167 set_quoting_style (qo
, c_quoting_style
);
168 set_quoting_flags (qo
, QA_SPLIT_TRIGRAPHS
);
169 for (i
= 0; i
< nsyms
; i
++)
171 char *cp
= quotearg_alloc (symbols
[i
]->tag
, -1, qo
);
172 /* Width of the next token, including the two quotes, the
173 comma and the space. */
174 int width
= strlen (cp
) + 2;
178 obstack_sgrow (&format_obstack
, "\n ");
183 obstack_1grow (&format_obstack
, ' ');
184 obstack_escape (&format_obstack
, cp
);
186 obstack_1grow (&format_obstack
, ',');
190 obstack_sgrow (&format_obstack
, " ]b4_null[");
192 /* Finish table and store. */
193 muscle_insert ("tname", obstack_finish0 (&format_obstack
));
196 /* Output YYTOKNUM. */
199 int *values
= xnmalloc (ntokens
, sizeof *values
);
200 for (i
= 0; i
< ntokens
; ++i
)
201 values
[i
] = symbols
[i
]->user_token_number
;
202 muscle_insert_int_table ("toknum", values
,
203 values
[0], 1, ntokens
);
209 /*----------------------------------------------------------------.
210 | Prepare the muscles related to the rules: r1, r2, rline, dprec, |
211 | merger, immediate. |
212 `----------------------------------------------------------------*/
/* One array of NRULES entries is allocated per muscle and filled in
   a single pass over RULES.  Each array is then inserted as a table
   made of a leading 0 followed by all of its entries.  The muscles
   rules_number and max_left_semantic_context are inserted as well.  */
217 unsigned int *rline
= xnmalloc (nrules
, sizeof *rline
);
218 symbol_number
*r1
= xnmalloc (nrules
, sizeof *r1
);
219 unsigned int *r2
= xnmalloc (nrules
, sizeof *r2
);
220 int *dprec
= xnmalloc (nrules
, sizeof *dprec
);
221 int *merger
= xnmalloc (nrules
, sizeof *merger
);
222 int *immediate
= xnmalloc (nrules
, sizeof *immediate
);
225 for (r
= 0; r
< nrules
; ++r
)
227 /* LHS of the rule R. */
228 r1
[r
] = rules
[r
].lhs
->number
;
229 /* Length of rule R's RHS. */
230 r2
[r
] = rule_rhs_length(&rules
[r
]);
231 /* Line where rule was defined. */
232 rline
[r
] = rules
[r
].location
.start
.line
;
233 /* Dynamic precedence (GLR). */
234 dprec
[r
] = rules
[r
].dprec
;
235 /* Merger-function index (GLR). */
236 merger
[r
] = rules
[r
].merger
;
237 /* Immediate reduction flags (GLR). */
238 immediate
[r
] = rules
[r
].is_predicate
;
241 muscle_insert_unsigned_int_table ("rline", rline
, 0, 0, nrules
);
242 muscle_insert_symbol_number_table ("r1", r1
, 0, 0, nrules
);
243 muscle_insert_unsigned_int_table ("r2", r2
, 0, 0, nrules
);
244 muscle_insert_int_table ("dprec", dprec
, 0, 0, nrules
);
245 muscle_insert_int_table ("merger", merger
, 0, 0, nrules
);
246 muscle_insert_int_table ("immediate", immediate
, 0, 0, nrules
);
248 MUSCLE_INSERT_INT ("rules_number", nrules
);
249 MUSCLE_INSERT_INT ("max_left_semantic_context", max_left_semantic_context
);
259 /*--------------------------------------------.
260 | Prepare the muscles related to the states. |
261 `--------------------------------------------*/
/* The accessing symbol of every state is collected into a temporary
   array and inserted as the "stos" table.  The muscles last,
   final_state_number and states_number are inserted as well.  */
264 prepare_states (void)
267 symbol_number
*values
= xnmalloc (nstates
, sizeof *values
);
268 for (i
= 0; i
< nstates
; ++i
)
269 values
[i
] = states
[i
]->accessing_symbol
;
270 muscle_insert_symbol_number_table ("stos", values
,
274 MUSCLE_INSERT_INT ("last", high
);
275 MUSCLE_INSERT_INT ("final_state_number", final_state
->number
);
276 MUSCLE_INSERT_INT ("states_number", nstates
);
280 /*-------------------------------------------------------.
281 | Compare two symbols by type-name, and then by number. |
282 `-------------------------------------------------------*/
/* LHS and RHS each point to a symbol pointer, which is what qsort
   passes when sorting an array of symbol pointers.  Type-names are
   compared with uniqstr_cmp; numbers are compared by subtraction.  */
285 symbol_type_name_cmp (const symbol
**lhs
, const symbol
**rhs
)
287 int res
= uniqstr_cmp ((*lhs
)->type_name
, (*rhs
)->type_name
);
289 res
= (*lhs
)->number
- (*rhs
)->number
;
294 /*----------------------------------------------------------------.
295 | Return a (malloc'ed) table of the symbols sorted by type-name. |
296 `----------------------------------------------------------------*/
/* The table is a copy of SYMBOLS (NSYMS entries) obtained with
   xmemdup, then sorted in place by qsort with symbol_type_name_cmp
   as the comparison function.  */
299 symbols_by_type_name (void)
301 typedef int (*qcmp_type
) (const void *, const void *);
302 symbol
**res
= xmemdup (symbols
, nsyms
* sizeof *res
);
303 qsort (res
, nsyms
, sizeof *res
, (qcmp_type
) &symbol_type_name_cmp
);
308 /*------------------------------------------------------------------.
309 | Define b4_type_names, which is a list of (lists of the numbers of |
310 | symbols with same type-name). |
311 `------------------------------------------------------------------*/
/* The symbols are taken from symbols_by_type_name, so symbols with
   the same type-name are adjacent.  Each run of consecutive symbols
   whose type_name fields compare equal with `==' is printed as one
   bracketed list of symbol numbers separated by ", ".  */
314 type_names_output (FILE *out
)
317 symbol
**syms
= symbols_by_type_name ();
318 fputs ("m4_define([b4_type_names],\n[", out
);
319 for (i
= 0; i
< nsyms
; /* nothing */)
321 // The index of the first symbol of the current type-name.
323 fputs (i
? ",\n[" : "[", out
);
324 for (; i
< nsyms
&& syms
[i
]->type_name
== syms
[i0
]->type_name
; ++i
)
325 fprintf (out
, "%s%d", i
!= i0
? ", " : "", syms
[i
]->number
);
328 fputs ("])\n\n", out
);
333 /*-------------------------------------.
334 | The list of all the symbol numbers. |
335 `-------------------------------------*/
/* Define b4_symbol_numbers on OUT as the list "[0], [1], ..." of the
   integers from 0 up to NSYMS - 1, separated by ", ".  */
338 symbol_numbers_output (FILE *out
)
341 fputs ("m4_define([b4_symbol_numbers],\n[", out
);
342 for (i
= 0; i
< nsyms
; ++i
)
343 fprintf (out
, "%s[%d]", i
? ", " : "", i
);
344 fputs ("])\n\n", out
);
348 /*---------------------------------.
349 | Output the user actions to OUT. |
350 `---------------------------------*/
/* Define b4_actions.  Each rule printed here gives a b4_case entry
   (b4_predicate_case when the rule is a predicate) numbered R + 1.
   The entry holds a b4_syncline to the start of the action's
   location, with the file name printed by string_output, followed
   by the text of the action.  */
353 user_actions_output (FILE *out
)
357 fputs ("m4_define([b4_actions], \n[", out
);
358 for (r
= 0; r
< nrules
; ++r
)
361 fprintf (out
, "b4_%scase(%d, [b4_syncline(%d, ",
362 rules
[r
].is_predicate
? "predicate_" : "",
363 r
+ 1, rules
[r
].action_location
.start
.line
);
364 string_output (out
, rules
[r
].action_location
.start
.file
);
365 fprintf (out
, ")\n[ %s]])\n\n", rules
[r
].action
);
367 fputs ("])\n\n", out
);
370 /*------------------------------------.
371 | Output the merge functions to OUT. |
372 `------------------------------------*/
/* Define b4_mergers: the list merge_functions is walked with a
   counter N starting at 1, and a `case N:' line is printed for the
   entries.  Two line formats exist: one assigns the merger's result
   to *yy0, the other stores it into the member of yy0 named by the
   entry's type; the test on the first character of the type selects
   between them.  */
375 merger_output (FILE *out
)
380 fputs ("m4_define([b4_mergers], \n[[", out
);
381 for (n
= 1, p
= merge_functions
; p
!= NULL
; n
+= 1, p
= p
->next
)
383 if (p
->type
[0] == '\0')
384 fprintf (out
, " case %d: *yy0 = %s (*yy0, *yy1); break;\n",
387 fprintf (out
, " case %d: yy0->%s = %s (*yy0, *yy1); break;\n",
388 n
, p
->type
, p
->name
);
390 fputs ("]])\n\n", out
);
394 /*---------------------------------------------.
395 | Prepare the muscles for symbol definitions. |
396 `---------------------------------------------*/
/* For each symbol, muscles whose keys have the form symbol(N, ENTRY)
   are inserted (SET_KEY builds such a key in format_obstack).  For
   each of the CODE_PROPS_SIZE code properties, SET_KEY2 builds keys
   of the form symbol(N, ENTRY_SUFFIX) instead; the property name is
   the string from code_props_type_string without its first
   character.  */
399 prepare_symbol_definitions (void)
402 for (i
= 0; i
< nsyms
; ++i
)
404 symbol
*sym
= symbols
[i
];
408 #define SET_KEY(Entry) \
409 obstack_printf (&format_obstack, "symbol(%d, %s)", \
411 key = obstack_finish0 (&format_obstack);
413 #define SET_KEY2(Entry, Suffix) \
414 obstack_printf (&format_obstack, "symbol(%d, %s_%s)", \
416 key = obstack_finish0 (&format_obstack);
418 // Whether the symbol has an identifier.
419 value
= symbol_id_get (sym
);
421 MUSCLE_INSERT_INT (key
, !!value
);
425 MUSCLE_INSERT_STRING (key
, value
? value
: "");
427 // Its tag. Typically for documentation purpose.
429 MUSCLE_INSERT_STRING (key
, sym
->tag
);
431 SET_KEY("user_number");
432 MUSCLE_INSERT_INT (key
, sym
->user_token_number
);
435 MUSCLE_INSERT_INT (key
,
436 i
< ntokens
&& sym
!= errtoken
&& sym
!= undeftoken
);
439 MUSCLE_INSERT_INT (key
, sym
->number
);
442 MUSCLE_INSERT_INT (key
, !!sym
->type_name
);
445 MUSCLE_INSERT_STRING (key
, sym
->type_name
? sym
->type_name
: "");
449 for (j
= 0; j
< CODE_PROPS_SIZE
; ++j
)
451 /* "printer", not "%printer". */
452 char const *pname
= code_props_type_string (j
) + 1;
453 code_props
const *p
= symbol_code_props_get (sym
, j
);
454 SET_KEY2("has", pname
);
455 MUSCLE_INSERT_INT (key
, !!p
->code
);
459 SET_KEY2(pname
, "file");
460 MUSCLE_INSERT_STRING (key
, p
->location
.start
.file
);
462 SET_KEY2(pname
, "line");
463 MUSCLE_INSERT_INT (key
, p
->location
.start
.line
);
466 MUSCLE_INSERT_STRING_RAW (key
, p
->code
);
/* Insert the muscles that hold the parser tables: defact, defgoto,
   pact, pgoto, table, check, conflict_list_heads and
   conflicting_rules, together with the integers pact_ninf and
   table_ninf.  Both pact and pgoto are taken from BASE: pact is
   BASE[0..NSTATES[ and pgoto is BASE[NSTATES..NVECTORS[.  */
477 prepare_actions (void)
479 /* Figure out the actions for the specified state, indexed by
480 lookahead token type. */
482 muscle_insert_rule_number_table ("defact", yydefact
,
483 yydefact
[0], 1, nstates
);
485 /* Figure out what to do after reducing with each rule, depending on
486 the saved state from before the beginning of parsing the data
487 that matched this rule. */
488 muscle_insert_state_number_table ("defgoto", yydefgoto
,
489 yydefgoto
[0], 1, nsyms
- ntokens
);
493 muscle_insert_base_table ("pact", base
,
494 base
[0], 1, nstates
);
495 MUSCLE_INSERT_INT ("pact_ninf", base_ninf
);
498 muscle_insert_base_table ("pgoto", base
,
499 base
[nstates
], nstates
+ 1, nvectors
);
501 muscle_insert_base_table ("table", table
,
502 table
[0], 1, high
+ 1);
503 MUSCLE_INSERT_INT ("table_ninf", table_ninf
);
505 muscle_insert_base_table ("check", check
,
506 check
[0], 1, high
+ 1);
508 /* GLR parsing slightly modifies YYTABLE and YYCHECK (and thus
509 YYPACT) so that in states with unresolved conflicts, the default
510 reduction is not used in the conflicted entries, so that there is
511 a place to put a conflict pointer.
513 This means that YYCONFLP and YYCONFL are nonsense for a non-GLR
514 parser, so we could avoid accidents by not writing them out in
515 that case. Nevertheless, it seems even better to be able to use
516 the GLR skeletons even without the non-deterministic tables. */
517 muscle_insert_unsigned_int_table ("conflict_list_heads", conflict_table
,
518 conflict_table
[0], 1, high
+ 1);
519 muscle_insert_unsigned_int_table ("conflicting_rules", conflict_list
,
520 0, 1, conflict_list_cnt
);
524 /*--------------------------------------------.
525 | Output the definitions of all the muscles. |
526 `--------------------------------------------*/
/* "m4_init()" is written first.  The calls shown here then run in
   this order: symbol_numbers_output, type_names_output,
   user_actions_output and muscles_m4_output, all on OUT.  */
529 muscles_output (FILE *out
)
531 fputs ("m4_init()\n", out
);
533 symbol_numbers_output (out
);
534 type_names_output (out
);
535 user_actions_output (out
);
537 muscles_m4_output (out
);
540 /*---------------------------.
541 | Call the skeleton parser. |
542 `---------------------------*/
/* The m4 program to run is the value of the M4 environment variable
   when getenv returns one, and M4 otherwise.  m4sugar.m4 and bison.m4
   are looked up under the directory returned by pkgdatadir.  The
   muscles are written to the write end of the pipe to the subprocess
   (filter_fd[1]), its output is read back from filter_fd[0], and
   wait_subprocess is finally called on the subprocess.  */
545 output_skeleton (void)
550 /* Compute the names of the package data dir and skeleton files. */
551 char const *m4
= (m4
= getenv ("M4")) ? m4
: M4
;
552 char const *datadir
= pkgdatadir ();
553 char *m4sugar
= xconcatenated_filename (datadir
, "m4sugar/m4sugar.m4", NULL
);
554 char *m4bison
= xconcatenated_filename (datadir
, "bison.m4", NULL
);
555 char *skel
= (IS_PATH_WITH_DIR (skeleton
)
557 : xconcatenated_filename (datadir
, skeleton
, NULL
));
559 /* Test whether m4sugar.m4 is readable, to check for proper
560 installation. A faulty installation can cause deadlock, so a
561 cheap sanity check is worthwhile. */
562 xfclose (xfopen (m4sugar
, "r"));
564 /* Create an m4 subprocess connected to us via two pipes. */
566 if (trace_flag
& trace_tools
)
567 fprintf (stderr
, "running: %s %s - %s %s\n",
568 m4
, m4sugar
, m4bison
, skel
);
570 /* Some future version of GNU M4 (most likely 1.6) may treat the -dV in a
571 position-dependent manner. Keep it as the first argument so that all
574 See the thread starting at
575 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
578 char const *argv
[10];
582 /* When POSIXLY_CORRECT is set, GNU M4 1.6 and later disable GNU
583 extensions, which Bison's skeletons depend on. With older M4,
584 it has no effect. M4 1.4.12 added a -g/--gnu command-line
585 option to make it explicit that a program wants GNU M4
586 extensions even when POSIXLY_CORRECT is set.
588 See the thread starting at
589 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
592 argv
[i
++] = M4_GNU_OPTION
;
596 if (trace_flag
& trace_m4
)
603 aver (i
<= ARRAY_CARDINALITY (argv
));
605 /* The ugly cast is because gnulib gets the const-ness wrong. */
606 pid
= create_pipe_bidi ("m4", m4
, (char **)(void*)argv
, false, true,
614 if (trace_flag
& trace_muscles
)
615 muscles_output (stderr
);
617 FILE *out
= xfdopen (filter_fd
[1], "w");
618 muscles_output (out
);
622 /* Read and process m4's output. */
623 timevar_push (TV_M4
);
625 FILE *in
= xfdopen (filter_fd
[0], "r");
627 /* scan_skel should have read all of M4's output. Otherwise, when we
628 close the pipe, we risk letting M4 report a broken-pipe to the
633 wait_subprocess (pid
, "m4", false, false, true, true, NULL
);
640 /* BISON_USE_PUSH_FOR_PULL is for the test suite and should not be
641 documented for the user. */
/* The flag is true only when the variable is set, is not the empty
   string, and strtol reads a nonzero base-10 value from it.  */
642 char const *cp
= getenv ("BISON_USE_PUSH_FOR_PULL");
643 bool use_push_for_pull_flag
= cp
&& *cp
&& strtol (cp
, 0, 10);
/* Boolean muscles.  */
646 MUSCLE_INSERT_BOOL ("defines_flag", defines_flag
);
647 MUSCLE_INSERT_BOOL ("glr_flag", glr_parser
);
648 MUSCLE_INSERT_BOOL ("nondeterministic_flag", nondeterministic_parser
);
649 MUSCLE_INSERT_BOOL ("synclines_flag", !no_lines_flag
);
650 MUSCLE_INSERT_BOOL ("tag_seen_flag", tag_seen
);
651 MUSCLE_INSERT_BOOL ("token_table_flag", token_table_flag
);
652 MUSCLE_INSERT_BOOL ("use_push_for_pull_flag", use_push_for_pull_flag
);
653 MUSCLE_INSERT_BOOL ("yacc_flag", yacc_flag
);
/* String muscles: the name prefix and the file names.  */
656 if (spec_name_prefix
)
657 MUSCLE_INSERT_STRING ("prefix", spec_name_prefix
);
659 MUSCLE_INSERT_STRING ("file_name_all_but_ext", all_but_ext
);
/* DEFINE (Name) inserts the string muscle called "Name" with the
   value of the variable Name, or "" when that variable is null.  */
661 #define DEFINE(Name) MUSCLE_INSERT_STRING (#Name, Name ? Name : "")
663 DEFINE (parser_file_name
);
664 DEFINE (spec_defines_file
);
665 DEFINE (spec_file_prefix
);
666 DEFINE (spec_graph_file
);
667 DEFINE (spec_name_prefix
);
668 DEFINE (spec_outfile
);
669 DEFINE (spec_verbose_file
);
672 /* Find the right skeleton file, and add muscles about the skeletons. */
674 MUSCLE_INSERT_C_STRING ("skeleton", skeleton
);
676 skeleton
= language
->skeleton
;
678 /* About the skeletons. */
680 /* b4_pkgdatadir is used inside m4_include in the skeletons, so digraphs
681 would never be expanded. Hopefully no one has M4-special characters in
682 his Bison installation path. */
683 MUSCLE_INSERT_STRING_RAW ("pkgdatadir", pkgdatadir ());
688 /*----------------------------------------------------------.
689 | Output the parsing tables and the parser code to ftable. |
690 `----------------------------------------------------------*/
/* format_obstack is initialized before the muscles are prepared, and
   it is freed at the end, after the skeleton processing step.  */
695 obstack_init (&format_obstack
);
701 prepare_symbol_definitions ();
705 /* Process the selected skeleton file. */
708 obstack_free (&format_obstack
, NULL
);
/* The package data directory: the value of the BISON_PKGDATADIR
   environment variable when getenv returns one, PKGDATADIR
   otherwise.  */
714 char const *cp
= getenv ("BISON_PKGDATADIR");
715 return cp
? cp
: PKGDATADIR
;