1 /* Output the generated parsing program for Bison. 
   3    Copyright (C) 1984, 1986, 1989, 1992, 2000, 2001, 2002, 2003, 2004, 
   4    2005, 2006, 2007, 2008-2009 Free Software Foundation, Inc. 
   6    This file is part of Bison, the GNU Compiler Compiler. 
   8    This program is free software: you can redistribute it and/or modify 
   9    it under the terms of the GNU General Public License as published by 
  10    the Free Software Foundation, either version 3 of the License, or 
  11    (at your option) any later version. 
  13    This program is distributed in the hope that it will be useful, 
  14    but WITHOUT ANY WARRANTY; without even the implied warranty of 
  15    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the 
  16    GNU General Public License for more details. 
  18    You should have received a copy of the GNU General Public License 
  19    along with this program.  If not, see <http://www.gnu.org/licenses/>.  */ 
  25 #include <configmake.h> 
  27 #include <get-errno.h> 
  36 #include "muscle_tab.h" 
  39 #include "scan-code.h"    /* max_left_semantic_context */ 
  40 #include "scan-skel.h" 
  44 # define ARRAY_CARDINALITY(Array) (sizeof (Array) / sizeof *(Array)) 
  46 static struct obstack format_obstack
; 
  49 /*-------------------------------------------------------------------. 
  50 | Create a function NAME which associates to the muscle NAME the     | 
  51 | result of formatting the FIRST and then TABLE_DATA[BEGIN..END[ (of | 
  52 | TYPE), and to the muscle NAME_max, the max value of the            | 
  54 `-------------------------------------------------------------------*/ 
  57 #define GENERATE_MUSCLE_INSERT_TABLE(Name, Type)                        \ 
  60 Name (char const *name,                                                 \ 
  73   obstack_fgrow1 (&format_obstack, "%6d", first);                       \ 
  74   for (i = begin; i < end; ++i)                                         \ 
  76       obstack_1grow (&format_obstack, ',');                             \ 
  79           obstack_sgrow (&format_obstack, "\n  ");                      \ 
  84       obstack_fgrow1 (&format_obstack, "%6d", table_data[i]);           \ 
  85       if (table_data[i] < min)                                          \ 
  86         min = table_data[i];                                            \ 
  87       if (max < table_data[i])                                          \ 
  88         max = table_data[i];                                            \ 
  90   obstack_1grow (&format_obstack, 0);                                   \ 
  91   muscle_insert (name, obstack_finish (&format_obstack));               \ 
  95   /* Build `NAME_min' and `NAME_max' in the obstack. */                 \ 
  96   obstack_fgrow1 (&format_obstack, "%s_min", name);                     \ 
  97   obstack_1grow (&format_obstack, 0);                                   \ 
  98   MUSCLE_INSERT_LONG_INT (obstack_finish (&format_obstack), lmin);      \ 
  99   obstack_fgrow1 (&format_obstack, "%s_max", name);                     \ 
 100   obstack_1grow (&format_obstack, 0);                                   \ 
 101   MUSCLE_INSERT_LONG_INT (obstack_finish (&format_obstack), lmax);      \ 
 104 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_unsigned_int_table
, unsigned int) 
 105 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_int_table
, int) 
 106 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_base_table
, base_number
) 
 107 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_rule_number_table
, rule_number
) 
 108 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_symbol_number_table
, symbol_number
) 
 109 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_item_number_table
, item_number
) 
 110 GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_state_number_table
, state_number
) 
 113 /*--------------------------------------------------------------------. 
 114 | Print to OUT a representation of STRING escaped both for C and M4.  | 
 115 `--------------------------------------------------------------------*/ 
 118 escaped_output (FILE *out
, char const *string
) 
 123   for (p 
= quotearg_style (c_quoting_style
, string
); *p
; p
++) 
 126       case '$': fputs ("$][", out
); break; 
 127       case '@': fputs ("@@",  out
); break; 
 128       case '[': fputs ("@{",  out
); break; 
 129       case ']': fputs ("@}",  out
); break; 
 130       default: fputc (*p
, out
); break; 
 137 /*------------------------------------------------------------------. 
 138 | Prepare the muscles related to the symbols: translate, tname, and | 
 140 `------------------------------------------------------------------*/ 
 143 prepare_symbols (void) 
 145   MUSCLE_INSERT_BOOL ("token_table", token_table_flag
); 
 146   MUSCLE_INSERT_INT ("tokens_number", ntokens
); 
 147   MUSCLE_INSERT_INT ("nterms_number", nvars
); 
 148   MUSCLE_INSERT_INT ("undef_token_number", undeftoken
->number
); 
 149   MUSCLE_INSERT_INT ("user_token_number_max", max_user_token_number
); 
 151   muscle_insert_symbol_number_table ("translate", 
 153                                      token_translations
[0], 
 154                                      1, max_user_token_number 
+ 1); 
 156   /* tname -- token names.  */ 
 159     /* We assume that the table will be output starting at column 2. */ 
 161     struct quoting_options 
*qo 
= clone_quoting_options (0); 
 162     set_quoting_style (qo
, c_quoting_style
); 
 163     set_quoting_flags (qo
, QA_SPLIT_TRIGRAPHS
); 
 164     for (i 
= 0; i 
< nsyms
; i
++) 
 166         char *cp 
= quotearg_alloc (symbols
[i
]->tag
, -1, qo
); 
 167         /* Width of the next token, including the two quotes, the 
 168            comma and the space.  */ 
 169         int width 
= strlen (cp
) + 2; 
 173             obstack_sgrow (&format_obstack
, "\n "); 
 178           obstack_1grow (&format_obstack
, ' '); 
 179         MUSCLE_OBSTACK_SGROW (&format_obstack
, cp
); 
 181         obstack_1grow (&format_obstack
, ','); 
 185     obstack_sgrow (&format_obstack
, " ]b4_null["); 
 187     /* Finish table and store. */ 
 188     obstack_1grow (&format_obstack
, 0); 
 189     muscle_insert ("tname", obstack_finish (&format_obstack
)); 
 192   /* Output YYTOKNUM. */ 
 195     int *values 
= xnmalloc (ntokens
, sizeof *values
); 
 196     for (i 
= 0; i 
< ntokens
; ++i
) 
 197       values
[i
] = symbols
[i
]->user_token_number
; 
 198     muscle_insert_int_table ("toknum", values
, 
 199                              values
[0], 1, ntokens
); 
 205 /*-------------------------------------------------------------. 
 206 | Prepare the muscles related to the rules: rhs, prhs, r1, r2, | 
 207 | rline, dprec, merger.                                        | 
 208 `-------------------------------------------------------------*/ 
 215   item_number 
*rhs 
= xnmalloc (nritems
, sizeof *rhs
); 
 216   unsigned int *prhs 
= xnmalloc (nrules
, sizeof *prhs
); 
 217   unsigned int *rline 
= xnmalloc (nrules
, sizeof *rline
); 
 218   symbol_number 
*r1 
= xnmalloc (nrules
, sizeof *r1
); 
 219   unsigned int *r2 
= xnmalloc (nrules
, sizeof *r2
); 
 220   int *dprec 
= xnmalloc (nrules
, sizeof *dprec
); 
 221   int *merger 
= xnmalloc (nrules
, sizeof *merger
); 
 223   for (r 
= 0; r 
< nrules
; ++r
) 
 225       item_number 
*rhsp 
= NULL
; 
 226       /* Index of rule R in RHS. */ 
 228       /* RHS of the rule R. */ 
 229       for (rhsp 
= rules
[r
].rhs
; *rhsp 
>= 0; ++rhsp
) 
 231       /* LHS of the rule R. */ 
 232       r1
[r
] = rules
[r
].lhs
->number
; 
 233       /* Length of rule R's RHS. */ 
 235       /* Separator in RHS. */ 
 237       /* Line where rule was defined. */ 
 238       rline
[r
] = rules
[r
].location
.start
.line
; 
 239       /* Dynamic precedence (GLR).  */ 
 240       dprec
[r
] = rules
[r
].dprec
; 
 241       /* Merger-function index (GLR).  */ 
 242       merger
[r
] = rules
[r
].merger
; 
 246   muscle_insert_item_number_table ("rhs", rhs
, ritem
[0], 1, nritems
); 
 247   muscle_insert_unsigned_int_table ("prhs", prhs
, 0, 0, nrules
); 
 248   muscle_insert_unsigned_int_table ("rline", rline
, 0, 0, nrules
); 
 249   muscle_insert_symbol_number_table ("r1", r1
, 0, 0, nrules
); 
 250   muscle_insert_unsigned_int_table ("r2", r2
, 0, 0, nrules
); 
 251   muscle_insert_int_table ("dprec", dprec
, 0, 0, nrules
); 
 252   muscle_insert_int_table ("merger", merger
, 0, 0, nrules
); 
 254   MUSCLE_INSERT_INT ("rules_number", nrules
); 
 255   MUSCLE_INSERT_INT ("max_left_semantic_context", max_left_semantic_context
); 
 266 /*--------------------------------------------. 
 267 | Prepare the muscles related to the states.  | 
 268 `--------------------------------------------*/ 
 271 prepare_states (void) 
 274   symbol_number 
*values 
= xnmalloc (nstates
, sizeof *values
); 
 275   for (i 
= 0; i 
< nstates
; ++i
) 
 276     values
[i
] = states
[i
]->accessing_symbol
; 
 277   muscle_insert_symbol_number_table ("stos", values
, 
 281   MUSCLE_INSERT_INT ("last", high
); 
 282   MUSCLE_INSERT_INT ("final_state_number", final_state
->number
); 
 283   MUSCLE_INSERT_INT ("states_number", nstates
); 
 288 /*---------------------------------. 
 289 | Output the user actions to OUT.  | 
 290 `---------------------------------*/ 
 293 user_actions_output (FILE *out
) 
 297   fputs ("m4_define([b4_actions], \n[", out
); 
 298   for (r 
= 0; r 
< nrules
; ++r
) 
 301         fprintf (out
, "b4_case(%d, [b4_syncline(%d, ", r 
+ 1, 
 302                  rules
[r
].action_location
.start
.line
); 
 303         escaped_output (out
, rules
[r
].action_location
.start
.file
); 
 304         fprintf (out
, ")\n[    %s]])\n\n", rules
[r
].action
); 
 306   fputs ("])\n\n", out
); 
 309 /*--------------------------------------. 
 310 | Output the merge functions to OUT.   | 
 311 `--------------------------------------*/ 
 314 merger_output (FILE *out
) 
 319   fputs ("m4_define([b4_mergers], \n[[", out
); 
 320   for (n 
= 1, p 
= merge_functions
; p 
!= NULL
; n 
+= 1, p 
= p
->next
) 
 322       if (p
->type
[0] == '\0') 
 323         fprintf (out
, "  case %d: *yy0 = %s (*yy0, *yy1); break;\n", 
 326         fprintf (out
, "  case %d: yy0->%s = %s (*yy0, *yy1); break;\n", 
 327                  n
, p
->type
, p
->name
); 
 329   fputs ("]])\n\n", out
); 
 332 /*--------------------------------------. 
 333 | Output the tokens definition to OUT.  | 
 334 `--------------------------------------*/ 
 337 token_definitions_output (FILE *out
) 
 340   char const *sep 
= ""; 
 342   fputs ("m4_define([b4_tokens], \n[", out
); 
 343   for (i 
= 0; i 
< ntokens
; ++i
) 
 345       symbol 
*sym 
= symbols
[i
]; 
 346       int number 
= sym
->user_token_number
; 
 348       /* At this stage, if there are literal aliases, they are part of 
 349          SYMBOLS, so we should not find symbols which are the aliases 
 351       aver (number 
!= USER_NUMBER_ALIAS
); 
 353       /* Skip error token.  */ 
 357       /* If this string has an alias, then it is necessarily the alias 
 358          which is to be output.  */ 
 362       /* Don't output literal chars or strings (when defined only as a 
 363          string).  Note that must be done after the alias resolution: 
 364          think about `%token 'f' "f"'.  */ 
 365       if (sym
->tag
[0] == '\'' || sym
->tag
[0] == '\"') 
 368       /* Don't #define nonliteral tokens whose names contain periods 
 369          or '$' (as does the default value of the EOF token).  */ 
 370       if (strchr (sym
->tag
, '.') || strchr (sym
->tag
, '$')) 
 373       fprintf (out
, "%s[[[%s]], %d]", 
 374                sep
, sym
->tag
, number
); 
 377   fputs ("])\n\n", out
); 
 381 /*---------------------------------------------------. 
 382 | Output the symbol destructors or printers to OUT.  | 
 383 `---------------------------------------------------*/ 
 386 symbol_code_props_output (FILE *out
, char const *what
, 
 387                           code_props 
const *(*get
)(symbol 
const *)) 
 390   char const *sep 
= ""; 
 392   fputs ("m4_define([b4_symbol_", out
); 
 394   fputs ("], \n[", out
); 
 395   for (i 
= 0; i 
< nsyms
; ++i
) 
 397       symbol 
*sym 
= symbols
[i
]; 
 398       char const *code 
= (*get
) (sym
)->code
; 
 401           location loc 
= (*get
) (sym
)->location
; 
 403              Symbol-name, Symbol-number, 
 404              code, optional typename.  */ 
 405           fprintf (out
, "%s[", sep
); 
 407           escaped_output (out
, loc
.start
.file
); 
 408           fprintf (out
, ", %d, ", loc
.start
.line
); 
 409           escaped_output (out
, sym
->tag
); 
 410           fprintf (out
, ", %d, [[%s]]", sym
->number
, code
); 
 412             fprintf (out
, ", [[%s]]", sym
->type_name
); 
 416   fputs ("])\n\n", out
); 
 421 prepare_actions (void) 
 423   /* Figure out the actions for the specified state, indexed by 
 424      lookahead token type.  */ 
 426   muscle_insert_rule_number_table ("defact", yydefact
, 
 427                                    yydefact
[0], 1, nstates
); 
 429   /* Figure out what to do after reducing with each rule, depending on 
 430      the saved state from before the beginning of parsing the data 
 431      that matched this rule.  */ 
 432   muscle_insert_state_number_table ("defgoto", yydefgoto
, 
 433                                     yydefgoto
[0], 1, nsyms 
- ntokens
); 
 437   muscle_insert_base_table ("pact", base
, 
 438                              base
[0], 1, nstates
); 
 439   MUSCLE_INSERT_INT ("pact_ninf", base_ninf
); 
 442   muscle_insert_base_table ("pgoto", base
, 
 443                              base
[nstates
], nstates 
+ 1, nvectors
); 
 445   muscle_insert_base_table ("table", table
, 
 446                             table
[0], 1, high 
+ 1); 
 447   MUSCLE_INSERT_INT ("table_ninf", table_ninf
); 
 449   muscle_insert_base_table ("check", check
, 
 450                             check
[0], 1, high 
+ 1); 
 452   /* GLR parsing slightly modifies YYTABLE and YYCHECK (and thus 
 453      YYPACT) so that in states with unresolved conflicts, the default 
 454      reduction is not used in the conflicted entries, so that there is 
 455      a place to put a conflict pointer. 
 457      This means that YYCONFLP and YYCONFL are nonsense for a non-GLR 
 458      parser, so we could avoid accidents by not writing them out in 
 459      that case.  Nevertheless, it seems even better to be able to use 
 460      the GLR skeletons even without the non-deterministic tables.  */ 
 461   muscle_insert_unsigned_int_table ("conflict_list_heads", conflict_table
, 
 462                                     conflict_table
[0], 1, high 
+ 1); 
 463   muscle_insert_unsigned_int_table ("conflicting_rules", conflict_list
, 
 464                                     0, 1, conflict_list_cnt
); 
 468 /*---------------------------. 
 469 | Call the skeleton parser.  | 
 470 `---------------------------*/ 
 473 output_skeleton (void) 
 478   char const *argv
[10]; 
 481   /* Compute the names of the package data dir and skeleton files.  */ 
 482   char const m4sugar
[] = "m4sugar/m4sugar.m4"; 
 483   char const m4bison
[] = "bison.m4"; 
 488   char const *m4 
= (p 
= getenv ("M4")) ? p 
: M4
; 
 489   char const *pkgdatadir 
= compute_pkgdatadir (); 
 490   size_t skeleton_size 
= strlen (skeleton
) + 1; 
 491   size_t pkgdatadirlen 
= strlen (pkgdatadir
); 
 492   while (pkgdatadirlen 
&& pkgdatadir
[pkgdatadirlen 
- 1] == '/') 
 494   full_skeleton 
= xmalloc (pkgdatadirlen 
+ 1 
 495                            + (skeleton_size 
< sizeof m4sugar
 
 496                               ? sizeof m4sugar 
: skeleton_size
)); 
 497   strncpy (full_skeleton
, pkgdatadir
, pkgdatadirlen
); 
 498   full_skeleton
[pkgdatadirlen
] = '/'; 
 499   strcpy (full_skeleton 
+ pkgdatadirlen 
+ 1, m4sugar
); 
 500   full_m4sugar 
= xstrdup (full_skeleton
); 
 501   strcpy (full_skeleton 
+ pkgdatadirlen 
+ 1, m4bison
); 
 502   full_m4bison 
= xstrdup (full_skeleton
); 
 503   if (strchr (skeleton
, '/')) 
 504     strcpy (full_skeleton
, skeleton
); 
 506     strcpy (full_skeleton 
+ pkgdatadirlen 
+ 1, skeleton
); 
 508   /* Test whether m4sugar.m4 is readable, to check for proper 
 509      installation.  A faulty installation can cause deadlock, so a 
 510      cheap sanity check is worthwhile.  */ 
 511   xfclose (xfopen (full_m4sugar
, "r")); 
 513   /* Create an m4 subprocess connected to us via two pipes.  */ 
 515   if (trace_flag 
& trace_tools
) 
 516     fprintf (stderr
, "running: %s %s - %s %s\n", 
 517              m4
, full_m4sugar
, full_m4bison
, full_skeleton
); 
 519   /* Some future version of GNU M4 (most likely 1.6) may treat the -dV in a 
 520      position-dependent manner.  Keep it as the first argument so that all 
 523      See the thread starting at 
 524      <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html> 
 530     /* When POSIXLY_CORRECT is set, GNU M4 1.6 and later disable GNU 
 531        extensions, which Bison's skeletons depend on.  With older M4, 
 532        it has no effect.  M4 1.4.12 added a -g/--gnu command-line 
 533        option to make it explicit that a program wants GNU M4 
 534        extensions even when POSIXLY_CORRECT is set. 
 536        See the thread starting at 
 537        <http://lists.gnu.org/archive/html/bug-bison/2008-07/msg00000.html> 
 540       argv
[i
++] = M4_GNU_OPTION
; 
 543     argv
[i
++] = pkgdatadir
; 
 544     if (trace_flag 
& trace_m4
) 
 546     argv
[i
++] = full_m4sugar
; 
 548     argv
[i
++] = full_m4bison
; 
 549     argv
[i
++] = full_skeleton
; 
 551     assert (i 
<= ARRAY_CARDINALITY (argv
)); 
 555   pid 
= create_subpipe (argv
, filter_fd
); 
 558   free (full_skeleton
); 
 560   out 
= fdopen (filter_fd
[0], "w"); 
 562     error (EXIT_FAILURE
, get_errno (), 
 565   /* Output the definitions of all the muscles.  */ 
 566   fputs ("m4_init()\n", out
); 
 568   user_actions_output (out
); 
 570   token_definitions_output (out
); 
 571   symbol_code_props_output (out
, "destructors", &symbol_destructor_get
); 
 572   symbol_code_props_output (out
, "printers", &symbol_printer_get
); 
 574   muscles_m4_output (out
); 
 577   /* Read and process m4's output.  */ 
 578   timevar_push (TV_M4
); 
 579   end_of_output_subpipe (pid
, filter_fd
); 
 580   in 
= fdopen (filter_fd
[1], "r"); 
 582     error (EXIT_FAILURE
, get_errno (), 
 586   reap_subpipe (pid
, m4
); 
 593   /* BISON_USE_PUSH_FOR_PULL is for the test suite and should not be documented 
 595   char const *use_push_for_pull_env 
= getenv ("BISON_USE_PUSH_FOR_PULL"); 
 596   bool use_push_for_pull_flag 
= false; 
 597   if (use_push_for_pull_env 
!= NULL
 
 598       && use_push_for_pull_env
[0] != '\0' 
 599       && 0 != strcmp (use_push_for_pull_env
, "0")) 
 600     use_push_for_pull_flag 
= true; 
 603   MUSCLE_INSERT_BOOL ("debug_flag", debug_flag
); 
 604   MUSCLE_INSERT_BOOL ("defines_flag", defines_flag
); 
 605   MUSCLE_INSERT_BOOL ("error_verbose_flag", error_verbose
); 
 606   MUSCLE_INSERT_BOOL ("glr_flag", glr_parser
); 
 607   MUSCLE_INSERT_BOOL ("locations_flag", locations_flag
); 
 608   MUSCLE_INSERT_BOOL ("nondeterministic_flag", nondeterministic_parser
); 
 609   MUSCLE_INSERT_BOOL ("synclines_flag", !no_lines_flag
); 
 610   MUSCLE_INSERT_BOOL ("tag_seen_flag", tag_seen
); 
 611   MUSCLE_INSERT_BOOL ("use_push_for_pull_flag", use_push_for_pull_flag
); 
 612   MUSCLE_INSERT_BOOL ("yacc_flag", yacc_flag
); 
 615   if (spec_name_prefix
) 
 616     MUSCLE_INSERT_STRING ("prefix", spec_name_prefix
); 
 618   MUSCLE_INSERT_STRING ("file_name_all_but_ext", all_but_ext
); 
 620 #define DEFINE(Name) MUSCLE_INSERT_STRING (#Name, Name ? Name : "") 
 622   DEFINE (parser_file_name
); 
 623   DEFINE (spec_defines_file
); 
 624   DEFINE (spec_file_prefix
); 
 625   DEFINE (spec_graph_file
); 
 626   DEFINE (spec_name_prefix
); 
 627   DEFINE (spec_outfile
); 
 628   DEFINE (spec_verbose_file
); 
 631   /* Find the right skeleton file, and add muscles about the skeletons.  */ 
 633     MUSCLE_INSERT_C_STRING ("skeleton", skeleton
); 
 635     skeleton 
= language
->skeleton
; 
 637   /* About the skeletons.  */ 
 639     /* b4_pkgdatadir is used inside m4_include in the skeletons, so digraphs 
 640        would never be expanded.  Hopefully no one has M4-special characters in 
 641        his Bison installation path.  */ 
 642     MUSCLE_INSERT_STRING_RAW ("pkgdatadir", compute_pkgdatadir ()); 
 647 /*----------------------------------------------------------. 
 648 | Output the parsing tables and the parser code to ftable.  | 
 649 `----------------------------------------------------------*/ 
 654   obstack_init (&format_obstack
); 
 663   /* Process the selected skeleton file.  */ 
 666   obstack_free (&format_obstack
, NULL
); 
 670 compute_pkgdatadir (void) 
 672   char const *pkgdatadir 
= getenv ("BISON_PKGDATADIR"); 
 673   return pkgdatadir 
? pkgdatadir 
: PKGDATADIR
;