1 /* Output the generated parsing program for Bison.
3 Copyright (C) 1984, 1986, 1989, 1992, 2000-2012 Free Software
6 This file is part of Bison, the GNU Compiler Compiler.
8 This program is free software: you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation, either version 3 of the License, or
11 (at your option) any later version.
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program. If not, see <http://www.gnu.org/licenses/>. */
24 #include <configmake.h>
26 #include <get-errno.h>
28 #include <spawn-pipe.h>
30 #include <wait-process.h>
36 #include "muscle-tab.h"
39 #include "scan-code.h" /* max_left_semantic_context */
40 #include "scan-skel.h"
/* Number of elements in ARRAY, computed at compile time.  ARRAY must
   be an actual array object: applied to a pointer the result is
   meaningless.  */
#define ARRAY_CARDINALITY(Array) (sizeof (Array) / sizeof *(Array))
46 static struct obstack format_obstack
;
/*-------------------------------------------------------------------.
| Create a function NAME which associates to the muscle NAME the     |
| result of formatting the FIRST and then TABLE_DATA[BEGIN..END[ (of |
| TYPE), and to the muscles NAME_min and NAME_max, the min and max   |
| values of TABLE_DATA.                                              |
`-------------------------------------------------------------------*/
57 #define GENERATE_MUSCLE_INSERT_TABLE(Name, Type) \
60 Name (char const *name, \
73 obstack_fgrow1 (&format_obstack, "%6d", first); \
74 for (i = begin; i < end; ++i) \
76 obstack_1grow (&format_obstack, ','); \
79 obstack_sgrow (&format_obstack, "\n "); \
84 obstack_fgrow1 (&format_obstack, "%6d", table_data[i]); \
85 if (table_data[i] < min) \
86 min = table_data[i]; \
87 if (max < table_data[i]) \
88 max = table_data[i]; \
90 obstack_1grow (&format_obstack, 0); \
91 muscle_insert (name, obstack_finish (&format_obstack)); \
95 /* Build `NAME_min' and `NAME_max' in the obstack. */ \
96 obstack_fgrow1 (&format_obstack, "%s_min", name); \
97 obstack_1grow (&format_obstack, 0); \
98 MUSCLE_INSERT_LONG_INT (obstack_finish (&format_obstack), lmin); \
99 obstack_fgrow1 (&format_obstack, "%s_max", name); \
100 obstack_1grow (&format_obstack, 0); \
101 MUSCLE_INSERT_LONG_INT (obstack_finish (&format_obstack), lmax); \
104 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_unsigned_int_table
, unsigned int)
105 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_int_table
, int)
106 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_base_table
, base_number
)
107 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_rule_number_table
, rule_number
)
108 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_symbol_number_table
, symbol_number
)
109 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_item_number_table
, item_number
)
110 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_state_number_table
, state_number
)
113 /*--------------------------------------------------------------------.
114 | Print to OUT a representation of STRING escaped both for C and M4. |
115 `--------------------------------------------------------------------*/
118 escaped_output (FILE *out
, char const *string
)
123 for (p
= quotearg_style (c_quoting_style
, string
); *p
; p
++)
126 case '$': fputs ("$][", out
); break;
127 case '@': fputs ("@@", out
); break;
128 case '[': fputs ("@{", out
); break;
129 case ']': fputs ("@}", out
); break;
130 default: fputc (*p
, out
); break;
/*------------------------------------------------------------------.
| Prepare the muscles related to the symbols: translate, tname, and |
| toknum.                                                           |
`------------------------------------------------------------------*/
143 prepare_symbols (void)
145 MUSCLE_INSERT_INT ("tokens_number", ntokens
);
146 MUSCLE_INSERT_INT ("nterms_number", nvars
);
147 MUSCLE_INSERT_INT ("undef_token_number", undeftoken
->number
);
148 MUSCLE_INSERT_INT ("user_token_number_max", max_user_token_number
);
150 muscle_insert_symbol_number_table ("translate",
152 token_translations
[0],
153 1, max_user_token_number
+ 1);
155 /* tname -- token names. */
158 /* We assume that the table will be output starting at column 2. */
160 struct quoting_options
*qo
= clone_quoting_options (0);
161 set_quoting_style (qo
, c_quoting_style
);
162 set_quoting_flags (qo
, QA_SPLIT_TRIGRAPHS
);
163 for (i
= 0; i
< nsyms
; i
++)
165 char *cp
= quotearg_alloc (symbols
[i
]->tag
, -1, qo
);
166 /* Width of the next token, including the two quotes, the
167 comma and the space. */
168 int width
= strlen (cp
) + 2;
172 obstack_sgrow (&format_obstack
, "\n ");
177 obstack_1grow (&format_obstack
, ' ');
178 MUSCLE_OBSTACK_SGROW (&format_obstack
, cp
);
180 obstack_1grow (&format_obstack
, ',');
184 obstack_sgrow (&format_obstack
, " ]b4_null[");
186 /* Finish table and store. */
187 obstack_1grow (&format_obstack
, 0);
188 muscle_insert ("tname", obstack_finish (&format_obstack
));
191 /* Output YYTOKNUM. */
194 int *values
= xnmalloc (ntokens
, sizeof *values
);
195 for (i
= 0; i
< ntokens
; ++i
)
196 values
[i
] = symbols
[i
]->user_token_number
;
197 muscle_insert_int_table ("toknum", values
,
198 values
[0], 1, ntokens
);
204 /*-------------------------------------------------------------.
205 | Prepare the muscles related to the rules: rhs, prhs, r1, r2, |
206 | rline, dprec, merger. |
207 `-------------------------------------------------------------*/
214 item_number
*rhs
= xnmalloc (nritems
, sizeof *rhs
);
215 unsigned int *prhs
= xnmalloc (nrules
, sizeof *prhs
);
216 unsigned int *rline
= xnmalloc (nrules
, sizeof *rline
);
217 symbol_number
*r1
= xnmalloc (nrules
, sizeof *r1
);
218 unsigned int *r2
= xnmalloc (nrules
, sizeof *r2
);
219 int *dprec
= xnmalloc (nrules
, sizeof *dprec
);
220 int *merger
= xnmalloc (nrules
, sizeof *merger
);
222 for (r
= 0; r
< nrules
; ++r
)
224 item_number
*rhsp
= NULL
;
225 /* Index of rule R in RHS. */
227 /* RHS of the rule R. */
228 for (rhsp
= rules
[r
].rhs
; *rhsp
>= 0; ++rhsp
)
230 /* LHS of the rule R. */
231 r1
[r
] = rules
[r
].lhs
->number
;
232 /* Length of rule R's RHS. */
234 /* Separator in RHS. */
236 /* Line where rule was defined. */
237 rline
[r
] = rules
[r
].location
.start
.line
;
238 /* Dynamic precedence (GLR). */
239 dprec
[r
] = rules
[r
].dprec
;
240 /* Merger-function index (GLR). */
241 merger
[r
] = rules
[r
].merger
;
245 muscle_insert_item_number_table ("rhs", rhs
, ritem
[0], 1, nritems
);
246 muscle_insert_unsigned_int_table ("prhs", prhs
, 0, 0, nrules
);
247 muscle_insert_unsigned_int_table ("rline", rline
, 0, 0, nrules
);
248 muscle_insert_symbol_number_table ("r1", r1
, 0, 0, nrules
);
249 muscle_insert_unsigned_int_table ("r2", r2
, 0, 0, nrules
);
250 muscle_insert_int_table ("dprec", dprec
, 0, 0, nrules
);
251 muscle_insert_int_table ("merger", merger
, 0, 0, nrules
);
253 MUSCLE_INSERT_INT ("rules_number", nrules
);
254 MUSCLE_INSERT_INT ("max_left_semantic_context", max_left_semantic_context
);
265 /*--------------------------------------------.
266 | Prepare the muscles related to the states. |
267 `--------------------------------------------*/
270 prepare_states (void)
273 symbol_number
*values
= xnmalloc (nstates
, sizeof *values
);
274 for (i
= 0; i
< nstates
; ++i
)
275 values
[i
] = states
[i
]->accessing_symbol
;
276 muscle_insert_symbol_number_table ("stos", values
,
280 MUSCLE_INSERT_INT ("last", high
);
281 MUSCLE_INSERT_INT ("final_state_number", final_state
->number
);
282 MUSCLE_INSERT_INT ("states_number", nstates
);
287 /*---------------------------------.
288 | Output the user actions to OUT. |
289 `---------------------------------*/
292 user_actions_output (FILE *out
)
296 fputs ("m4_define([b4_actions], \n[", out
);
297 for (r
= 0; r
< nrules
; ++r
)
300 fprintf (out
, "b4_case(%d, [b4_syncline(%d, ", r
+ 1,
301 rules
[r
].action_location
.start
.line
);
302 escaped_output (out
, rules
[r
].action_location
.start
.file
);
303 fprintf (out
, ")\n[ %s]])\n\n", rules
[r
].action
);
305 fputs ("])\n\n", out
);
308 /*--------------------------------------.
309 | Output the merge functions to OUT. |
310 `--------------------------------------*/
313 merger_output (FILE *out
)
318 fputs ("m4_define([b4_mergers], \n[[", out
);
319 for (n
= 1, p
= merge_functions
; p
!= NULL
; n
+= 1, p
= p
->next
)
321 if (p
->type
[0] == '\0')
322 fprintf (out
, " case %d: *yy0 = %s (*yy0, *yy1); break;\n",
325 fprintf (out
, " case %d: yy0->%s = %s (*yy0, *yy1); break;\n",
326 n
, p
->type
, p
->name
);
328 fputs ("]])\n\n", out
);
331 /*--------------------------------------.
332 | Output the tokens definition to OUT. |
333 `--------------------------------------*/
336 token_definitions_output (FILE *out
)
339 char const *sep
= "";
341 fputs ("m4_define([b4_tokens], \n[", out
);
342 for (i
= 0; i
< ntokens
; ++i
)
344 symbol
*sym
= symbols
[i
];
345 int number
= sym
->user_token_number
;
347 /* At this stage, if there are literal string aliases, they are
348 part of SYMBOLS, so we should not find their aliased symbols
350 aver (number
!= USER_NUMBER_HAS_STRING_ALIAS
);
352 /* Skip error token. */
356 /* If this string has an alias, then it is necessarily the alias
357 which is to be output. */
361 /* Don't output literal chars or strings (when defined only as a
362 string). Note that must be done after the alias resolution:
363 think about `%token 'f' "f"'. */
364 if (sym
->tag
[0] == '\'' || sym
->tag
[0] == '\"')
367 /* Don't #define nonliteral tokens whose names contain periods,
368 dashes or '$' (as does the default value of the EOF token). */
369 if (mbschr (sym
->tag
, '.')
370 || mbschr (sym
->tag
, '-')
371 || mbschr (sym
->tag
, '$'))
374 fprintf (out
, "%s[[[%s]], %d]",
375 sep
, sym
->tag
, number
);
378 fputs ("])\n\n", out
);
382 /*---------------------------------------------------.
383 | Output the symbol destructors or printers to OUT. |
384 `---------------------------------------------------*/
387 symbol_code_props_output (FILE *out
, char const *what
,
388 code_props
const *(*get
)(symbol
const *))
391 char const *sep
= "";
393 fputs ("m4_define([b4_symbol_", out
);
395 fputs ("], \n[", out
);
396 for (i
= 0; i
< nsyms
; ++i
)
398 symbol
*sym
= symbols
[i
];
399 char const *code
= (*get
) (sym
)->code
;
402 location loc
= (*get
) (sym
)->location
;
404 Symbol-name, Symbol-number,
405 code, optional typename. */
406 fprintf (out
, "%s[", sep
);
408 escaped_output (out
, loc
.start
.file
);
409 fprintf (out
, ", %d, ", loc
.start
.line
);
410 escaped_output (out
, sym
->tag
);
411 fprintf (out
, ", %d, [[%s]]", sym
->number
, code
);
413 fprintf (out
, ", [[%s]]", sym
->type_name
);
417 fputs ("])\n\n", out
);
422 prepare_actions (void)
424 /* Figure out the actions for the specified state, indexed by
425 lookahead token type. */
427 muscle_insert_rule_number_table ("defact", yydefact
,
428 yydefact
[0], 1, nstates
);
430 /* Figure out what to do after reducing with each rule, depending on
431 the saved state from before the beginning of parsing the data
432 that matched this rule. */
433 muscle_insert_state_number_table ("defgoto", yydefgoto
,
434 yydefgoto
[0], 1, nsyms
- ntokens
);
438 muscle_insert_base_table ("pact", base
,
439 base
[0], 1, nstates
);
440 MUSCLE_INSERT_INT ("pact_ninf", base_ninf
);
443 muscle_insert_base_table ("pgoto", base
,
444 base
[nstates
], nstates
+ 1, nvectors
);
446 muscle_insert_base_table ("table", table
,
447 table
[0], 1, high
+ 1);
448 MUSCLE_INSERT_INT ("table_ninf", table_ninf
);
450 muscle_insert_base_table ("check", check
,
451 check
[0], 1, high
+ 1);
453 /* GLR parsing slightly modifies YYTABLE and YYCHECK (and thus
454 YYPACT) so that in states with unresolved conflicts, the default
455 reduction is not used in the conflicted entries, so that there is
456 a place to put a conflict pointer.
458 This means that YYCONFLP and YYCONFL are nonsense for a non-GLR
459 parser, so we could avoid accidents by not writing them out in
460 that case. Nevertheless, it seems even better to be able to use
461 the GLR skeletons even without the non-deterministic tables. */
462 muscle_insert_unsigned_int_table ("conflict_list_heads", conflict_table
,
463 conflict_table
[0], 1, high
+ 1);
464 muscle_insert_unsigned_int_table ("conflicting_rules", conflict_list
,
465 0, 1, conflict_list_cnt
);
468 /*--------------------------------------------.
469 | Output the definitions of all the muscles. |
470 `--------------------------------------------*/
473 muscles_output (FILE *out
)
475 fputs ("m4_init()\n", out
);
477 user_actions_output (out
);
479 token_definitions_output (out
);
480 symbol_code_props_output (out
, "destructors", &symbol_destructor_get
);
481 symbol_code_props_output (out
, "printers", &symbol_printer_get
);
483 muscles_m4_output (out
);
486 /*---------------------------.
487 | Call the skeleton parser. |
488 `---------------------------*/
491 output_skeleton (void)
495 char const *argv
[10];
498 /* Compute the names of the package data dir and skeleton files. */
499 char const m4sugar
[] = "m4sugar/m4sugar.m4";
500 char const m4bison
[] = "bison.m4";
505 char const *m4
= (p
= getenv ("M4")) ? p
: M4
;
506 char const *pkgdatadir
= compute_pkgdatadir ();
507 size_t skeleton_size
= strlen (skeleton
) + 1;
508 size_t pkgdatadirlen
= strlen (pkgdatadir
);
509 while (pkgdatadirlen
&& pkgdatadir
[pkgdatadirlen
- 1] == '/')
511 full_skeleton
= xmalloc (pkgdatadirlen
+ 1
512 + (skeleton_size
< sizeof m4sugar
513 ? sizeof m4sugar
: skeleton_size
));
514 memcpy (full_skeleton
, pkgdatadir
, pkgdatadirlen
);
515 full_skeleton
[pkgdatadirlen
] = '/';
516 strcpy (full_skeleton
+ pkgdatadirlen
+ 1, m4sugar
);
517 full_m4sugar
= xstrdup (full_skeleton
);
518 strcpy (full_skeleton
+ pkgdatadirlen
+ 1, m4bison
);
519 full_m4bison
= xstrdup (full_skeleton
);
520 if (mbschr (skeleton
, '/'))
521 strcpy (full_skeleton
, skeleton
);
523 strcpy (full_skeleton
+ pkgdatadirlen
+ 1, skeleton
);
525 /* Test whether m4sugar.m4 is readable, to check for proper
526 installation. A faulty installation can cause deadlock, so a
527 cheap sanity check is worthwhile. */
528 xfclose (xfopen (full_m4sugar
, "r"));
530 /* Create an m4 subprocess connected to us via two pipes. */
532 if (trace_flag
& trace_tools
)
533 fprintf (stderr
, "running: %s %s - %s %s\n",
534 m4
, full_m4sugar
, full_m4bison
, full_skeleton
);
536 /* Some future version of GNU M4 (most likely 1.6) may treat the -dV in a
537 position-dependent manner. Keep it as the first argument so that all
540 See the thread starting at
541 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
547 /* When POSIXLY_CORRECT is set, GNU M4 1.6 and later disable GNU
548 extensions, which Bison's skeletons depend on. With older M4,
549 it has no effect. M4 1.4.12 added a -g/--gnu command-line
550 option to make it explicit that a program wants GNU M4
551 extensions even when POSIXLY_CORRECT is set.
553 See the thread starting at
554 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
557 argv
[i
++] = M4_GNU_OPTION
;
560 argv
[i
++] = pkgdatadir
;
561 if (trace_flag
& trace_m4
)
563 argv
[i
++] = full_m4sugar
;
565 argv
[i
++] = full_m4bison
;
566 argv
[i
++] = full_skeleton
;
568 aver (i
<= ARRAY_CARDINALITY (argv
));
571 /* The ugly cast is because gnulib gets the const-ness wrong. */
572 pid
= create_pipe_bidi ("m4", m4
, (char **)(void*)argv
, false, true,
576 free (full_skeleton
);
578 if (trace_flag
& trace_muscles
)
579 muscles_output (stderr
);
581 FILE *out
= fdopen (filter_fd
[1], "w");
583 error (EXIT_FAILURE
, get_errno (),
585 muscles_output (out
);
589 /* Read and process m4's output. */
590 timevar_push (TV_M4
);
591 in
= fdopen (filter_fd
[0], "r");
593 error (EXIT_FAILURE
, get_errno (),
596 /* scan_skel should have read all of M4's output. Otherwise, when we
597 close the pipe, we risk letting M4 report a broken-pipe to the
601 wait_subprocess (pid
, "m4", false, false, true, true, NULL
);
608 /* BISON_USE_PUSH_FOR_PULL is for the test suite and should not be documented
610 char const *use_push_for_pull_env
= getenv ("BISON_USE_PUSH_FOR_PULL");
611 bool use_push_for_pull_flag
= false;
612 if (use_push_for_pull_env
!= NULL
613 && use_push_for_pull_env
[0] != '\0'
614 && 0 != strcmp (use_push_for_pull_env
, "0"))
615 use_push_for_pull_flag
= true;
618 MUSCLE_INSERT_BOOL ("debug_flag", debug_flag
);
619 MUSCLE_INSERT_BOOL ("defines_flag", defines_flag
);
620 MUSCLE_INSERT_BOOL ("error_verbose_flag", error_verbose
);
621 MUSCLE_INSERT_BOOL ("glr_flag", glr_parser
);
622 MUSCLE_INSERT_BOOL ("locations_flag", locations_flag
);
623 MUSCLE_INSERT_BOOL ("nondeterministic_flag", nondeterministic_parser
);
624 MUSCLE_INSERT_BOOL ("synclines_flag", !no_lines_flag
);
625 MUSCLE_INSERT_BOOL ("tag_seen_flag", tag_seen
);
626 MUSCLE_INSERT_BOOL ("token_table_flag", token_table_flag
);
627 MUSCLE_INSERT_BOOL ("use_push_for_pull_flag", use_push_for_pull_flag
);
628 MUSCLE_INSERT_BOOL ("yacc_flag", yacc_flag
);
631 if (spec_name_prefix
)
632 MUSCLE_INSERT_STRING ("prefix", spec_name_prefix
);
634 MUSCLE_INSERT_STRING ("file_name_all_but_ext", all_but_ext
);
636 #define DEFINE(Name) MUSCLE_INSERT_STRING (#Name, Name ? Name : "")
638 DEFINE (parser_file_name
);
639 DEFINE (spec_defines_file
);
640 DEFINE (spec_file_prefix
);
641 DEFINE (spec_graph_file
);
642 DEFINE (spec_name_prefix
);
643 DEFINE (spec_outfile
);
644 DEFINE (spec_verbose_file
);
647 /* Find the right skeleton file, and add muscles about the skeletons. */
649 MUSCLE_INSERT_C_STRING ("skeleton", skeleton
);
651 skeleton
= language
->skeleton
;
653 /* About the skeletons. */
655 /* b4_pkgdatadir is used inside m4_include in the skeletons, so digraphs
656 would never be expanded. Hopefully no one has M4-special characters in
657 his Bison installation path. */
658 MUSCLE_INSERT_STRING_RAW ("pkgdatadir", compute_pkgdatadir ());
663 /*----------------------------------------------------------.
664 | Output the parsing tables and the parser code to ftable. |
665 `----------------------------------------------------------*/
670 obstack_init (&format_obstack
);
679 /* Process the selected skeleton file. */
682 obstack_free (&format_obstack
, NULL
);
686 compute_pkgdatadir (void)
688 char const *pkgdatadir
= getenv ("BISON_PKGDATADIR");
689 return pkgdatadir
? pkgdatadir
: PKGDATADIR
;