1 /* Output the generated parsing program for Bison.
3 Copyright (C) 1984, 1986, 1989, 1992, 2000, 2001, 2002, 2003, 2004,
4 2005, 2006, 2007, 2008-2009 Free Software Foundation, Inc.
6 This file is part of Bison, the GNU Compiler Compiler.
8 This program is free software: you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation, either version 3 of the License, or
11 (at your option) any later version.
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program. If not, see <http://www.gnu.org/licenses/>. */
25 #include <configmake.h>
27 #include <get-errno.h>
36 #include "muscle_tab.h"
39 #include "scan-code.h" /* max_left_semantic_context */
40 #include "scan-skel.h"
/* Number of elements of ARRAY.  ARRAY must be a genuine array (such as
   the fixed-size `argv' checked further down), not a pointer.  */
44 # define ARRAY_CARDINALITY(Array) (sizeof (Array) / sizeof *(Array))
/* Scratch obstack in which muscle values are formatted before being
   passed to muscle_insert.  */
46 static struct obstack format_obstack
;
49 /*-------------------------------------------------------------------.
50 | Create a function NAME which associates to the muscle NAME the |
51 | result of formatting the FIRST and then TABLE_DATA[BEGIN..END[ (of |
52 | TYPE), and to the muscles NAME_min and NAME_max, the min and max |
| values of TABLE_DATA. |
54 `-------------------------------------------------------------------*/
57 #define GENERATE_MUSCLE_INSERT_TABLE(Name, Type) \
60 Name (char const *name, \
73 obstack_fgrow1 (&format_obstack, "%6d", first); \
74 for (i = begin; i < end; ++i) \
76 obstack_1grow (&format_obstack, ','); \
79 obstack_sgrow (&format_obstack, "\n "); \
84 obstack_fgrow1 (&format_obstack, "%6d", table_data[i]); \
85 if (table_data[i] < min) \
86 min = table_data[i]; \
87 if (max < table_data[i]) \
88 max = table_data[i]; \
90 obstack_1grow (&format_obstack, 0); \
91 muscle_insert (name, obstack_finish (&format_obstack)); \
95 /* Build `NAME_min' and `NAME_max' in the obstack. */ \
96 obstack_fgrow1 (&format_obstack, "%s_min", name); \
97 obstack_1grow (&format_obstack, 0); \
98 MUSCLE_INSERT_LONG_INT (obstack_finish (&format_obstack), lmin); \
99 obstack_fgrow1 (&format_obstack, "%s_max", name); \
100 obstack_1grow (&format_obstack, 0); \
101 MUSCLE_INSERT_LONG_INT (obstack_finish (&format_obstack), lmax); \
104 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_unsigned_int_table
, unsigned int)
/* Each invocation in this group pairs a function name with the element
   type of the tables it formats; the resulting muscle_insert_*_table
   functions are the ones called later in this file.  */
105 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_int_table
, int)
106 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_base_table
, base_number
)
107 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_rule_number_table
, rule_number
)
108 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_symbol_number_table
, symbol_number
)
109 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_item_number_table
, item_number
)
110 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_state_number_table
, state_number
)
113 /*--------------------------------------------------------------------.
114 | Print to OUT a representation of STRING escaped both for C and M4. |
115 `--------------------------------------------------------------------*/
/* STRING is first quoted by quotearg_style with c_quoting_style; the
   quoted text is then scanned character by character.  The case labels
   below rewrite `$' as "$][", `@' as "@@", `[' as "@{" and `]' as "@}",
   and copy any other character unchanged.
   NOTE(review): the statement that selects among these cases is not
   visible in this excerpt; presumably it switches on the current
   character.  */
118 escaped_output (FILE *out
, char const *string
)
123 for (p
= quotearg_style (c_quoting_style
, string
); *p
; p
++)
126 case '$': fputs ("$][", out
); break;
127 case '@': fputs ("@@", out
); break;
128 case '[': fputs ("@{", out
); break;
129 case ']': fputs ("@}", out
); break;
130 default: fputc (*p
, out
); break;
137 /*------------------------------------------------------------------.
138 | Prepare the muscles related to the symbols: translate, tname, and |
| toknum. |
140 `------------------------------------------------------------------*/
143 prepare_symbols (void)
/* Scalar muscles describing the symbol set.  */
145 MUSCLE_INSERT_BOOL ("token_table", token_table_flag
);
146 MUSCLE_INSERT_INT ("tokens_number", ntokens
);
147 MUSCLE_INSERT_INT ("nterms_number", nvars
);
148 MUSCLE_INSERT_INT ("undef_token_number", undeftoken
->number
);
149 MUSCLE_INSERT_INT ("user_token_number_max", max_user_token_number
);
/* translate: entry 0 is passed as FIRST, then indices 1 up to and
   including max_user_token_number are formatted.  */
151 muscle_insert_symbol_number_table ("translate",
153 token_translations
[0],
154 1, max_user_token_number
+ 1);
156 /* tname -- token names. */
159 /* We assume that the table will be output starting at column 2. */
/* Names are quoted with the C quoting style, with the
   QA_SPLIT_TRIGRAPHS flag set on the cloned options.  */
161 struct quoting_options
*qo
= clone_quoting_options (0);
162 set_quoting_style (qo
, c_quoting_style
);
163 set_quoting_flags (qo
, QA_SPLIT_TRIGRAPHS
);
/* The loop covers all NSYMS symbols, not only the tokens.  */
164 for (i
= 0; i
< nsyms
; i
++)
166 char *cp
= quotearg_alloc (symbols
[i
]->tag
, -1, qo
);
167 /* Width of the next token, including the two quotes, the
168 comma and the space. */
169 int width
= strlen (cp
) + 2;
173 obstack_sgrow (&format_obstack
, "\n ");
178 obstack_1grow (&format_obstack
, ' ');
179 MUSCLE_OBSTACK_SGROW (&format_obstack
, cp
);
181 obstack_1grow (&format_obstack
, ',');
185 obstack_sgrow (&format_obstack
, " ]b4_null[");
187 /* Finish table and store. */
188 obstack_1grow (&format_obstack
, 0);
189 muscle_insert ("tname", obstack_finish (&format_obstack
));
192 /* Output YYTOKNUM. */
/* VALUES holds the user token number of each of the NTOKENS tokens;
   entry 0 is passed as FIRST and the rest follow from index 1.  */
195 int *values
= xnmalloc (ntokens
, sizeof *values
);
196 for (i
= 0; i
< ntokens
; ++i
)
197 values
[i
] = symbols
[i
]->user_token_number
;
198 muscle_insert_int_table ("toknum", values
,
199 values
[0], 1, ntokens
);
205 /*-------------------------------------------------------------.
206 | Prepare the muscles related to the rules: rhs, prhs, r1, r2, |
207 | rline, dprec, merger. |
208 `-------------------------------------------------------------*/
/* Work arrays, one per table muscle: RHS has NRITEMS entries, every
   other array has NRULES entries.  */
215 item_number
*rhs
= xnmalloc (nritems
, sizeof *rhs
);
216 unsigned int *prhs
= xnmalloc (nrules
, sizeof *prhs
);
217 unsigned int *rline
= xnmalloc (nrules
, sizeof *rline
);
218 symbol_number
*r1
= xnmalloc (nrules
, sizeof *r1
);
219 unsigned int *r2
= xnmalloc (nrules
, sizeof *r2
);
220 int *dprec
= xnmalloc (nrules
, sizeof *dprec
);
221 int *merger
= xnmalloc (nrules
, sizeof *merger
);
223 for (r
= 0; r
< nrules
; ++r
)
225 item_number
*rhsp
= NULL
;
226 /* Index of rule R in RHS. */
228 /* RHS of the rule R. */
/* The walk over the rule's items stops at the first negative item.  */
229 for (rhsp
= rules
[r
].rhs
; *rhsp
>= 0; ++rhsp
)
231 /* LHS of the rule R. */
232 r1
[r
] = rules
[r
].lhs
->number
;
233 /* Length of rule R's RHS. */
235 /* Separator in RHS. */
237 /* Line where rule was defined. */
238 rline
[r
] = rules
[r
].location
.start
.line
;
239 /* Dynamic precedence (GLR). */
240 dprec
[r
] = rules
[r
].dprec
;
241 /* Merger-function index (GLR). */
242 merger
[r
] = rules
[r
].merger
;
/* `rhs' is emitted with ritem[0] as FIRST followed by indices 1 up to
   NRITEMS - 1.  The per-rule tables instead pass a literal 0 as FIRST
   with BEGIN = 0, so a 0 is printed ahead of entries 0 .. NRULES - 1.  */
246 muscle_insert_item_number_table ("rhs", rhs
, ritem
[0], 1, nritems
);
247 muscle_insert_unsigned_int_table ("prhs", prhs
, 0, 0, nrules
);
248 muscle_insert_unsigned_int_table ("rline", rline
, 0, 0, nrules
);
249 muscle_insert_symbol_number_table ("r1", r1
, 0, 0, nrules
);
250 muscle_insert_unsigned_int_table ("r2", r2
, 0, 0, nrules
);
251 muscle_insert_int_table ("dprec", dprec
, 0, 0, nrules
);
252 muscle_insert_int_table ("merger", merger
, 0, 0, nrules
);
254 MUSCLE_INSERT_INT ("rules_number", nrules
);
255 MUSCLE_INSERT_INT ("max_left_semantic_context", max_left_semantic_context
);
266 /*--------------------------------------------.
267 | Prepare the muscles related to the states. |
268 `--------------------------------------------*/
/* Builds the `stos' table from the accessing symbol of each of the
   NSTATES states, then publishes the scalar muscles `last' (from HIGH),
   `final_state_number' and `states_number'.  */
271 prepare_states (void)
274 symbol_number
*values
= xnmalloc (nstates
, sizeof *values
);
275 for (i
= 0; i
< nstates
; ++i
)
276 values
[i
] = states
[i
]->accessing_symbol
;
277 muscle_insert_symbol_number_table ("stos", values
,
281 MUSCLE_INSERT_INT ("last", high
);
282 MUSCLE_INSERT_INT ("final_state_number", final_state
->number
);
283 MUSCLE_INSERT_INT ("states_number", nstates
);
288 /*---------------------------------.
289 | Output the user actions to OUT. |
290 `---------------------------------*/
/* The output is a single m4_define of b4_actions.  Each entry written
   by the loop is a b4_case numbered R + 1, holding a b4_syncline built
   from the start line and the escaped file name of the action's
   location, followed by the action text itself.  */
293 user_actions_output (FILE *out
)
297 fputs ("m4_define([b4_actions], \n[", out
);
298 for (r
= 0; r
< nrules
; ++r
)
301 fprintf (out
, "b4_case(%d, [b4_syncline(%d, ", r
+ 1,
302 rules
[r
].action_location
.start
.line
);
303 escaped_output (out
, rules
[r
].action_location
.start
.file
);
304 fprintf (out
, ")\n[ %s]])\n\n", rules
[r
].action
);
306 fputs ("])\n\n", out
);
309 /*--------------------------------------.
310 | Output the merge functions to OUT. |
311 `--------------------------------------*/
/* Walks the merge_functions list, numbering its entries from 1, and
   writes `case N:' lines inside an m4_define of b4_mergers.  Two line
   shapes exist: one assigns the merger's result to the whole of yy0,
   the other to the yy0 member named by the entry's type.
   NOTE(review): the test on an empty type string presumably selects
   the first shape; the branch keyword between the two calls is not
   visible in this excerpt.  */
314 merger_output (FILE *out
)
319 fputs ("m4_define([b4_mergers], \n[[", out
);
320 for (n
= 1, p
= merge_functions
; p
!= NULL
; n
+= 1, p
= p
->next
)
322 if (p
->type
[0] == '\0')
323 fprintf (out
, " case %d: *yy0 = %s (*yy0, *yy1); break;\n",
326 fprintf (out
, " case %d: yy0->%s = %s (*yy0, *yy1); break;\n",
327 n
, p
->type
, p
->name
);
329 fputs ("]])\n\n", out
);
332 /*--------------------------------------.
333 | Output the tokens definition to OUT. |
334 `--------------------------------------*/
337 token_definitions_output (FILE *out
)
340 char const *sep
= "";
342 fputs ("m4_define([b4_tokens], \n[", out
);
343 for (i
= 0; i
< ntokens
; ++i
)
345 symbol
*sym
= symbols
[i
];
346 int number
= sym
->user_token_number
;
348 /* At this stage, if there are literal aliases, they are part of
349 SYMBOLS, so we should not find symbols which are the aliases
here. */
351 aver (number
!= USER_NUMBER_ALIAS
);
353 /* Skip error token. */
357 /* If this string has an alias, then it is necessarily the alias
358 which is to be output. */
362 /* Don't output literal chars or strings (when defined only as a
363 string). Note that must be done after the alias resolution:
364 think about `%token 'f' "f"'. */
365 if (sym
->tag
[0] == '\'' || sym
->tag
[0] == '\"')
368 /* Don't #define nonliteral tokens whose names contain periods
369 or '$' (as does the default value of the EOF token). */
370 if (strchr (sym
->tag
, '.') || strchr (sym
->tag
, '$'))
373 fprintf (out
, "%s[[[%s]], %d]",
374 sep
, sym
->tag
, number
);
377 fputs ("])\n\n", out
);
381 /*---------------------------------------------------.
382 | Output the symbol destructors or printers to OUT. |
383 `---------------------------------------------------*/
386 symbol_code_props_output (FILE *out
, char const *what
,
387 code_props
const *(*get
)(symbol
const *))
390 char const *sep
= "";
392 fputs ("m4_define([b4_symbol_", out
);
394 fputs ("], \n[", out
);
395 for (i
= 0; i
< nsyms
; ++i
)
397 symbol
*sym
= symbols
[i
];
398 char const *code
= (*get
) (sym
)->code
;
401 location loc
= (*get
) (sym
)->location
;
/* Filename, lineno,
403 Symbol-name, Symbol-number,
404 code, optional typename. */
405 fprintf (out
, "%s[", sep
);
407 escaped_output (out
, loc
.start
.file
);
408 fprintf (out
, ", %d, ", loc
.start
.line
);
409 escaped_output (out
, sym
->tag
);
410 fprintf (out
, ", %d, [[%s]]", sym
->number
, code
);
412 fprintf (out
, ", [[%s]]", sym
->type_name
);
416 fputs ("])\n\n", out
);
/* Publish the action-related table muscles: defact, defgoto, pact,
   pgoto, table, check, conflict_list_heads and conflicting_rules,
   together with the scalar muscles pact_ninf and table_ninf.  */
421 prepare_actions (void)
423 /* Figure out the actions for the specified state, indexed by
424 lookahead token type. */
426 muscle_insert_rule_number_table ("defact", yydefact
,
427 yydefact
[0], 1, nstates
);
429 /* Figure out what to do after reducing with each rule, depending on
430 the saved state from before the beginning of parsing the data
431 that matched this rule. */
432 muscle_insert_state_number_table ("defgoto", yydefgoto
,
433 yydefgoto
[0], 1, nsyms
- ntokens
);
/* pact: entries 0 .. NSTATES - 1 of BASE.  */
437 muscle_insert_base_table ("pact", base
,
438 base
[0], 1, nstates
);
439 MUSCLE_INSERT_INT ("pact_ninf", base_ninf
);
/* pgoto: the remaining entries of BASE, NSTATES .. NVECTORS - 1.  */
442 muscle_insert_base_table ("pgoto", base
,
443 base
[nstates
], nstates
+ 1, nvectors
);
/* table and check both cover indices 0 .. HIGH.  */
445 muscle_insert_base_table ("table", table
,
446 table
[0], 1, high
+ 1);
447 MUSCLE_INSERT_INT ("table_ninf", table_ninf
);
449 muscle_insert_base_table ("check", check
,
450 check
[0], 1, high
+ 1);
452 /* GLR parsing slightly modifies YYTABLE and YYCHECK (and thus
453 YYPACT) so that in states with unresolved conflicts, the default
454 reduction is not used in the conflicted entries, so that there is
455 a place to put a conflict pointer.
457 This means that YYCONFLP and YYCONFL are nonsense for a non-GLR
458 parser, so we could avoid accidents by not writing them out in
459 that case. Nevertheless, it seems even better to be able to use
460 the GLR skeletons even without the non-deterministic tables. */
461 muscle_insert_unsigned_int_table ("conflict_list_heads", conflict_table
,
462 conflict_table
[0], 1, high
+ 1);
/* Here FIRST is the literal 0 rather than conflict_list[0]; the
   entries from index 1 up to CONFLICT_LIST_CNT - 1 follow it.  */
463 muscle_insert_unsigned_int_table ("conflicting_rules", conflict_list
,
464 0, 1, conflict_list_cnt
);
468 /*---------------------------.
469 | Call the skeleton parser. |
470 `---------------------------*/
473 output_skeleton (void)
478 char const *argv
[10];
481 /* Compute the names of the package data dir and skeleton files. */
482 char const m4sugar
[] = "m4sugar/m4sugar.m4";
483 char const m4bison
[] = "bison.m4";
488 char const *m4
= (p
= getenv ("M4")) ? p
: M4
;
489 char const *pkgdatadir
= compute_pkgdatadir ();
490 size_t skeleton_size
= strlen (skeleton
) + 1;
491 size_t pkgdatadirlen
= strlen (pkgdatadir
);
492 while (pkgdatadirlen
&& pkgdatadir
[pkgdatadirlen
- 1] == '/')
494 full_skeleton
= xmalloc (pkgdatadirlen
+ 1
495 + (skeleton_size
< sizeof m4sugar
496 ? sizeof m4sugar
: skeleton_size
));
497 strncpy (full_skeleton
, pkgdatadir
, pkgdatadirlen
);
498 full_skeleton
[pkgdatadirlen
] = '/';
499 strcpy (full_skeleton
+ pkgdatadirlen
+ 1, m4sugar
);
500 full_m4sugar
= xstrdup (full_skeleton
);
501 strcpy (full_skeleton
+ pkgdatadirlen
+ 1, m4bison
);
502 full_m4bison
= xstrdup (full_skeleton
);
503 if (strchr (skeleton
, '/'))
504 strcpy (full_skeleton
, skeleton
);
506 strcpy (full_skeleton
+ pkgdatadirlen
+ 1, skeleton
);
508 /* Test whether m4sugar.m4 is readable, to check for proper
509 installation. A faulty installation can cause deadlock, so a
510 cheap sanity check is worthwhile. */
511 xfclose (xfopen (full_m4sugar
, "r"));
513 /* Create an m4 subprocess connected to us via two pipes. */
515 if (trace_flag
& trace_tools
)
516 fprintf (stderr
, "running: %s %s - %s %s\n",
517 m4
, full_m4sugar
, full_m4bison
, full_skeleton
);
519 /* Some future version of GNU M4 (most likely 1.6) may treat the -dV in a
520 position-dependent manner. Keep it as the first argument so that all
of the files named after it are affected by it.
523 See the thread starting at
524 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
for details. */
530 /* When POSIXLY_CORRECT is set, GNU M4 1.6 and later disable GNU
531 extensions, which Bison's skeletons depend on. With older M4,
532 it has no effect. M4 1.4.12 added a -g/--gnu command-line
533 option to make it explicit that a program wants GNU M4
534 extensions even when POSIXLY_CORRECT is set.
536 See the thread starting at
537 <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html>
for details. */
540 argv
[i
++] = M4_GNU_OPTION
;
543 argv
[i
++] = pkgdatadir
;
544 if (trace_flag
& trace_m4
)
546 argv
[i
++] = full_m4sugar
;
548 argv
[i
++] = full_m4bison
;
549 argv
[i
++] = full_skeleton
;
551 assert (i
<= ARRAY_CARDINALITY (argv
));
555 pid
= create_subpipe (argv
, filter_fd
);
558 free (full_skeleton
);
560 out
= fdopen (filter_fd
[0], "w");
562 error (EXIT_FAILURE
, get_errno (),
565 /* Output the definitions of all the muscles. */
566 fputs ("m4_init()\n", out
);
568 user_actions_output (out
);
570 token_definitions_output (out
);
571 symbol_code_props_output (out
, "destructors", &symbol_destructor_get
);
572 symbol_code_props_output (out
, "printers", &symbol_printer_get
);
574 muscles_m4_output (out
);
577 /* Read and process m4's output. */
578 timevar_push (TV_M4
);
579 end_of_output_subpipe (pid
, filter_fd
);
580 in
= fdopen (filter_fd
[1], "r");
582 error (EXIT_FAILURE
, get_errno (),
586 reap_subpipe (pid
, m4
);
593 /* BISON_USE_PUSH_FOR_PULL is for the test suite and should not be documented
for the user. */
595 char const *use_push_for_pull_env
= getenv ("BISON_USE_PUSH_FOR_PULL");
596 bool use_push_for_pull_flag
= false;
597 if (use_push_for_pull_env
!= NULL
598 && use_push_for_pull_env
[0] != '\0'
599 && 0 != strcmp (use_push_for_pull_env
, "0"))
600 use_push_for_pull_flag
= true;
603 MUSCLE_INSERT_BOOL ("debug_flag", debug_flag
);
604 MUSCLE_INSERT_BOOL ("defines_flag", defines_flag
);
605 MUSCLE_INSERT_BOOL ("error_verbose_flag", error_verbose
);
606 MUSCLE_INSERT_BOOL ("glr_flag", glr_parser
);
607 MUSCLE_INSERT_BOOL ("locations_flag", locations_flag
);
608 MUSCLE_INSERT_BOOL ("nondeterministic_flag", nondeterministic_parser
);
609 MUSCLE_INSERT_BOOL ("synclines_flag", !no_lines_flag
);
610 MUSCLE_INSERT_BOOL ("tag_seen_flag", tag_seen
);
611 MUSCLE_INSERT_BOOL ("use_push_for_pull_flag", use_push_for_pull_flag
);
612 MUSCLE_INSERT_BOOL ("yacc_flag", yacc_flag
);
615 if (spec_name_prefix
)
616 MUSCLE_INSERT_STRING ("prefix", spec_name_prefix
);
618 MUSCLE_INSERT_STRING ("file_name_all_but_ext", all_but_ext
);
620 #define DEFINE(Name) MUSCLE_INSERT_STRING (#Name, Name ? Name : "")
622 DEFINE (parser_file_name
);
623 DEFINE (spec_defines_file
);
624 DEFINE (spec_file_prefix
);
625 DEFINE (spec_graph_file
);
626 DEFINE (spec_name_prefix
);
627 DEFINE (spec_outfile
);
628 DEFINE (spec_verbose_file
);
631 /* Find the right skeleton file, and add muscles about the skeletons. */
633 MUSCLE_INSERT_C_STRING ("skeleton", skeleton
);
635 skeleton
= language
->skeleton
;
637 /* About the skeletons. */
639 /* b4_pkgdatadir is used inside m4_include in the skeletons, so digraphs
640 would never be expanded. Hopefully no one has M4-special characters in
641 his Bison installation path. */
642 MUSCLE_INSERT_STRING_RAW ("pkgdatadir", compute_pkgdatadir ());
647 /*----------------------------------------------------------.
648 | Output the parsing tables and the parser code to ftable. |
649 `----------------------------------------------------------*/
/* format_obstack is initialized at the start of this step and released
   with obstack_free at its end.  */
654 obstack_init (&format_obstack
);
663 /* Process the selected skeleton file. */
666 obstack_free (&format_obstack
, NULL
);
670 compute_pkgdatadir (void)
672 char const *pkgdatadir
= getenv ("BISON_PKGDATADIR");
673 return pkgdatadir
? pkgdatadir
: PKGDATADIR
;