]> git.saurik.com Git - bison.git/blame - src/reader.c
Fix some memory leaks.
[bison.git] / src / reader.c
CommitLineData
35dcf428 1/* Input parser for Bison
9c4637fa 2
05ac60f3 3 Copyright (C) 1984, 1986, 1989, 1992, 1998, 2000, 2001, 2002, 2003,
00f5d575 4 2005, 2006, 2007, 2009 Free Software Foundation, Inc.
1ff442ca 5
41aca2e0 6 This file is part of Bison, the GNU Compiler Compiler.
1ff442ca 7
f16b0819 8 This program is free software: you can redistribute it and/or modify
41aca2e0 9 it under the terms of the GNU General Public License as published by
f16b0819
PE
10 the Free Software Foundation, either version 3 of the License, or
11 (at your option) any later version.
1ff442ca 12
f16b0819 13 This program is distributed in the hope that it will be useful,
41aca2e0
AD
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
1ff442ca 17
41aca2e0 18 You should have received a copy of the GNU General Public License
f16b0819 19 along with this program. If not, see <http://www.gnu.org/licenses/>. */
1ff442ca 20
2cec9080 21#include <config.h>
1ff442ca 22#include "system.h"
17ee7397 23
b9f1d9a4 24#include <quote.h>
17ee7397
PE
25#include <quotearg.h>
26
27#include "complain.h"
28#include "conflicts.h"
1ff442ca 29#include "files.h"
17ee7397 30#include "getargs.h"
1ff442ca 31#include "gram.h"
00f5d575 32#include "muscle-tab.h"
b2ca4022 33#include "reader.h"
17ee7397
PE
34#include "symlist.h"
35#include "symtab.h"
e9071366
AD
36#include "scan-gram.h"
37#include "scan-code.h"
1ff442ca 38
02d12d0d
PE
39static void check_and_convert_grammar (void);
40
17ee7397 41static symbol_list *grammar = NULL;
d0829076 42static bool start_flag = false;
676385e2 43merger_list *merge_functions;
1ff442ca 44
34f98f46 45/* Was %union seen? */
ddc8ede1
PE
46bool union_seen = false;
47
48/* Was a tag seen? */
49bool tag_seen = false;
39a06c25
PE
50
51/* Should rules have a default precedence? */
52bool default_prec = true;
0d533154 53\f
e9955c83
AD
54/*-----------------------.
55| Set the start symbol. |
56`-----------------------*/
1ff442ca 57
e9955c83 58void
a737b216 59grammar_start_symbol_set (symbol *sym, location loc)
1ff442ca
NF
60{
61 if (start_flag)
17ee7397 62 complain_at (loc, _("multiple %s declarations"), "%start");
943819bf
RS
63 else
64 {
d0829076 65 start_flag = true;
a737b216 66 startsymbol = sym;
17ee7397 67 startsymbol_location = loc;
943819bf 68 }
1ff442ca
NF
69}
70
a70083a3
AD
71\f
72
8ee5b538
JD
73/*------------------------------------------------------------------------.
74| Return the merger index for a merging function named NAME. Records the |
75| function, if new, in MERGER_LIST. |
76`------------------------------------------------------------------------*/
676385e2
PH
77
78static int
8ee5b538 79get_merge_function (uniqstr name)
676385e2
PH
80{
81 merger_list *syms;
82 merger_list head;
83 int n;
84
85 if (! glr_parser)
86 return 0;
87
676385e2 88 head.next = merge_functions;
affac613 89 for (syms = &head, n = 1; syms->next; syms = syms->next, n += 1)
17ee7397 90 if (UNIQSTR_EQ (name, syms->next->name))
676385e2 91 break;
a5d50994
AD
92 if (syms->next == NULL)
93 {
da2a7671 94 syms->next = xmalloc (sizeof syms->next[0]);
17ee7397 95 syms->next->name = uniqstr_new (name);
8ee5b538
JD
96 /* After all symbol type declarations have been parsed, packgram invokes
97 record_merge_function_type to set the type. */
98 syms->next->type = NULL;
a5d50994
AD
99 syms->next->next = NULL;
100 merge_functions = head.next;
101 }
676385e2
PH
102 return n;
103}
104
8ee5b538
JD
105/*-------------------------------------------------------------------------.
106| For the existing merging function with index MERGER, record the result |
107| type as TYPE as required by the lhs of the rule whose %merge declaration |
108| is at DECLARATION_LOC. |
109`-------------------------------------------------------------------------*/
110
111static void
112record_merge_function_type (int merger, uniqstr type, location declaration_loc)
113{
114 int merger_find;
115 merger_list *merge_function;
116
117 if (merger <= 0)
118 return;
119
120 if (type == NULL)
121 type = uniqstr_new ("");
122
123 merger_find = 1;
124 for (merge_function = merge_functions;
125 merge_function != NULL && merger_find != merger;
126 merge_function = merge_function->next)
127 merger_find += 1;
4f82b42a 128 aver (merge_function != NULL && merger_find == merger);
dd60572a 129 if (merge_function->type != NULL && !UNIQSTR_EQ (merge_function->type, type))
8ee5b538 130 {
3b452f4e
JD
131 complain_at (declaration_loc,
132 _("result type clash on merge function `%s': <%s> != <%s>"),
133 merge_function->name, type, merge_function->type);
134 complain_at (merge_function->type_declaration_location,
135 _("previous declaration"));
8ee5b538 136 }
dd60572a
JD
137 merge_function->type = uniqstr_new (type);
138 merge_function->type_declaration_location = declaration_loc;
8ee5b538
JD
139}
140
676385e2
PH
141/*--------------------------------------.
142| Free all merge-function definitions. |
143`--------------------------------------*/
144
145void
146free_merger_functions (void)
147{
affac613
AD
148 merger_list *L0 = merge_functions;
149 while (L0)
676385e2
PH
150 {
151 merger_list *L1 = L0->next;
152 free (L0);
153 L0 = L1;
154 }
155}
156
a70083a3 157\f
107f7dfb 158/*-------------------------------------------------------------------.
17ee7397 159| Parse the input grammar into a one symbol_list structure. Each |
107f7dfb
AD
160| rule is represented by a sequence of symbols: the left hand side |
161| followed by the contents of the right hand side, followed by a |
162| null pointer instead of a symbol to terminate the rule. The next |
163| symbol is the lhs of the following rule. |
164| |
fdbcd8e2
AD
165| All actions are copied out, labelled by the rule number they apply |
166| to. |
107f7dfb 167`-------------------------------------------------------------------*/
1ff442ca 168
f6d0f937 169/* The (currently) last symbol of GRAMMAR. */
04098407 170static symbol_list *grammar_end = NULL;
f6d0f937 171
52328c6e 172/* Append SYM to the grammar. */
b9f1d9a4 173static symbol_list *
17ee7397 174grammar_symbol_append (symbol *sym, location loc)
f6d0f937 175{
3be03b13 176 symbol_list *p = symbol_list_sym_new (sym, loc);
f6d0f937
AD
177
178 if (grammar_end)
179 grammar_end->next = p;
180 else
181 grammar = p;
182
183 grammar_end = p;
8f3596a6 184
e3233bf6 185 /* A null SYM stands for an end of rule; it is not an actual
8f3596a6
AD
186 part of it. */
187 if (sym)
188 ++nritems;
b9f1d9a4
AR
189
190 return p;
f6d0f937
AD
191}
192
872b52bc
AR
193static void
194assign_named_ref (symbol_list *p, named_ref *named_ref)
195{
196 symbol *sym = p->content.sym;
197
198 if (named_ref->id == sym->tag)
199 {
200 warn_at (named_ref->loc,
201 _("duplicated symbol name for %s ignored"),
202 quote (sym->tag));
203 named_ref_free (named_ref);
204 }
205 else
206 p->named_ref = named_ref;
207}
208
209
8efe435c
AD
210/* The rule currently being defined, and the previous rule.
211 CURRENT_RULE points to the first LHS of the current rule, while
212 PREVIOUS_RULE_END points to the *end* of the previous rule (NULL). */
e256e17f 213static symbol_list *current_rule = NULL;
04098407 214static symbol_list *previous_rule_end = NULL;
da4160c3
AD
215
216
8efe435c
AD
217/*----------------------------------------------.
218| Create a new rule for LHS in to the GRAMMAR. |
219`----------------------------------------------*/
da4160c3 220
e9955c83 221void
b9f1d9a4
AR
222grammar_current_rule_begin (symbol *lhs, location loc,
223 named_ref *lhs_named_ref)
da4160c3 224{
b9f1d9a4
AR
225 symbol_list* p;
226
da4160c3
AD
227 /* Start a new rule and record its lhs. */
228 ++nrules;
8efe435c 229 previous_rule_end = grammar_end;
b9f1d9a4
AR
230
231 p = grammar_symbol_append (lhs, loc);
232 if (lhs_named_ref)
872b52bc 233 assign_named_ref(p, lhs_named_ref);
b9f1d9a4 234
da4160c3
AD
235 current_rule = grammar_end;
236
237 /* Mark the rule's lhs as a nonterminal if not already so. */
da4160c3
AD
238 if (lhs->class == unknown_sym)
239 {
240 lhs->class = nterm_sym;
241 lhs->number = nvars;
242 ++nvars;
243 }
244 else if (lhs->class == token_sym)
17ee7397 245 complain_at (loc, _("rule given for %s, which is a token"), lhs->tag);
da4160c3
AD
246}
247
affac613 248
d40ba6c2 249/*----------------------------------------------------------------------.
17bd8a73
JD
250| A symbol should be used if either: |
251| 1. It has a destructor. |
252| 2. --warnings=midrule-values and the symbol is a mid-rule symbol |
253| (i.e., the generated LHS replacing a mid-rule action) that was |
254| assigned to or used, as in "exp: { $$ = 1; } { $$ = $1; }". |
d40ba6c2 255`----------------------------------------------------------------------*/
84866159
AD
256
257static bool
d40ba6c2 258symbol_should_be_used (symbol_list const *s)
84866159 259{
95021767 260 if (symbol_destructor_get (s->content.sym)->code)
17bd8a73
JD
261 return true;
262 if (warnings_flag & warnings_midrule_values)
f6857bbf 263 return ((s->midrule && s->midrule->action_props.is_value_used)
b0f4c4ea
JD
264 || (s->midrule_parent_rule
265 && symbol_list_n_get (s->midrule_parent_rule,
f6857bbf
JD
266 s->midrule_parent_rhs_index)
267 ->action_props.is_value_used));
17bd8a73 268 return false;
84866159
AD
269}
270
8f3596a6
AD
271/*----------------------------------------------------------------.
272| Check that the rule R is properly defined. For instance, there |
273| should be no type clash on the default action. |
274`----------------------------------------------------------------*/
e9955c83
AD
275
276static void
8f3596a6 277grammar_rule_check (const symbol_list *r)
e9955c83 278{
affac613 279 /* Type check.
e9955c83 280
affac613
AD
281 If there is an action, then there is nothing we can do: the user
282 is allowed to shoot herself in the foot.
3f4c0f80 283
affac613
AD
284 Don't worry about the default action if $$ is untyped, since $$'s
285 value can't be used. */
f6857bbf 286 if (!r->action_props.code && r->content.sym->type_name)
e9955c83 287 {
3be03b13 288 symbol *first_rhs = r->next->content.sym;
affac613
AD
289 /* If $$ is being set in default way, report if any type mismatch. */
290 if (first_rhs)
291 {
3be03b13 292 char const *lhs_type = r->content.sym->type_name;
affac613
AD
293 const char *rhs_type =
294 first_rhs->type_name ? first_rhs->type_name : "";
295 if (!UNIQSTR_EQ (lhs_type, rhs_type))
8f3596a6 296 warn_at (r->location,
affac613
AD
297 _("type clash on default action: <%s> != <%s>"),
298 lhs_type, rhs_type);
299 }
300 /* Warn if there is no default for $$ but we need one. */
301 else
8f3596a6 302 warn_at (r->location,
affac613
AD
303 _("empty rule for typed nonterminal, and no action"));
304 }
e3233bf6 305
d40ba6c2 306 /* Check that symbol values that should be used are in fact used. */
8f3596a6 307 {
668c5d19 308 symbol_list const *l = r;
8f3596a6 309 int n = 0;
3be03b13 310 for (; l && l->content.sym; l = l->next, ++n)
f6857bbf 311 if (! (l->action_props.is_value_used
d40ba6c2 312 || !symbol_should_be_used (l)
8f3596a6 313 /* The default action, $$ = $1, `uses' both. */
f6857bbf 314 || (!r->action_props.code && (n == 0 || n == 1))))
668c5d19
PE
315 {
316 if (n)
317 warn_at (r->location, _("unused value: $%d"), n);
318 else
319 warn_at (r->location, _("unset value: $$"));
320 }
8f3596a6 321 }
e9955c83
AD
322}
323
324
8efe435c
AD
325/*-------------------------------------.
326| End the currently being grown rule. |
327`-------------------------------------*/
e9955c83
AD
328
329void
8f3596a6 330grammar_current_rule_end (location loc)
e9955c83
AD
331{
332 /* Put an empty link in the list to mark the end of this rule */
8efe435c 333 grammar_symbol_append (NULL, grammar_end->location);
17ee7397 334 current_rule->location = loc;
e9955c83
AD
335}
336
337
8efe435c
AD
338/*-------------------------------------------------------------------.
339| The previous action turns out the be a mid-rule action. Attach it |
340| to the current rule, i.e., create a dummy symbol, attach it this |
341| mid-rule action, and append this dummy nonterminal to the current |
342| rule. |
343`-------------------------------------------------------------------*/
1485e106 344
6b702268 345void
1485e106
AD
346grammar_midrule_action (void)
347{
348 /* Since the action was written out with this rule's number, we must
349 give the new rule this number by inserting the new rule before
350 it. */
351
8efe435c
AD
352 /* Make a DUMMY nonterminal, whose location is that of the midrule
353 action. Create the MIDRULE. */
f6857bbf 354 location dummy_location = current_rule->action_props.location;
17ee7397 355 symbol *dummy = dummy_symbol_get (dummy_location);
3be03b13 356 symbol_list *midrule = symbol_list_sym_new (dummy, dummy_location);
1485e106 357
872b52bc 358 /* Remember named_ref of previous action. */
b9f1d9a4
AR
359 named_ref *named_ref = current_rule->action_props.named_ref;
360
1485e106
AD
361 /* Make a new rule, whose body is empty, before the current one, so
362 that the action just read can belong to it. */
363 ++nrules;
364 ++nritems;
8efe435c
AD
365 /* Attach its location and actions to that of the DUMMY. */
366 midrule->location = dummy_location;
f6857bbf
JD
367 code_props_rule_action_init (&midrule->action_props,
368 current_rule->action_props.code,
369 current_rule->action_props.location,
b9f1d9a4 370 midrule, 0);
f6857bbf 371 code_props_none_init (&current_rule->action_props);
1485e106 372
8efe435c
AD
373 if (previous_rule_end)
374 previous_rule_end->next = midrule;
1485e106 375 else
8efe435c 376 grammar = midrule;
1485e106 377
8efe435c 378 /* End the dummy's rule. */
3be03b13 379 midrule->next = symbol_list_sym_new (NULL, dummy_location);
84866159 380 midrule->next->next = current_rule;
1485e106 381
84866159 382 previous_rule_end = midrule->next;
1485e106 383
8efe435c 384 /* Insert the dummy nonterminal replacing the midrule action into
84866159 385 the current rule. Bind it to its dedicated rule. */
b9f1d9a4 386 grammar_current_rule_symbol_append (dummy, dummy_location, named_ref);
6ec2c0f2 387 grammar_end->midrule = midrule;
ffa4ba3a
JD
388 midrule->midrule_parent_rule = current_rule;
389 midrule->midrule_parent_rhs_index = symbol_list_length (current_rule->next);
1485e106
AD
390}
391
9af3fbce
AD
392/* Set the precedence symbol of the current rule to PRECSYM. */
393
e9955c83 394void
17ee7397 395grammar_current_rule_prec_set (symbol *precsym, location loc)
9af3fbce 396{
26b8a438 397 symbol_class_set (precsym, token_sym, loc, false);
9af3fbce 398 if (current_rule->ruleprec)
17ee7397 399 complain_at (loc, _("only one %s allowed per rule"), "%prec");
9af3fbce
AD
400 current_rule->ruleprec = precsym;
401}
402
676385e2
PH
403/* Attach dynamic precedence DPREC to the current rule. */
404
405void
17ee7397 406grammar_current_rule_dprec_set (int dprec, location loc)
676385e2
PH
407{
408 if (! glr_parser)
17ee7397 409 warn_at (loc, _("%s affects only GLR parsers"), "%dprec");
676385e2 410 if (dprec <= 0)
17ee7397 411 complain_at (loc, _("%s must be followed by positive number"), "%dprec");
39f41916 412 else if (current_rule->dprec != 0)
17ee7397 413 complain_at (loc, _("only one %s allowed per rule"), "%dprec");
676385e2
PH
414 current_rule->dprec = dprec;
415}
416
417/* Attach a merge function NAME with argument type TYPE to current
418 rule. */
419
420void
17ee7397 421grammar_current_rule_merge_set (uniqstr name, location loc)
676385e2
PH
422{
423 if (! glr_parser)
17ee7397 424 warn_at (loc, _("%s affects only GLR parsers"), "%merge");
39f41916 425 if (current_rule->merger != 0)
17ee7397 426 complain_at (loc, _("only one %s allowed per rule"), "%merge");
8ee5b538
JD
427 current_rule->merger = get_merge_function (name);
428 current_rule->merger_declaration_location = loc;
676385e2
PH
429}
430
17ee7397 431/* Attach SYM to the current rule. If needed, move the previous
2e047461
AD
432 action as a mid-rule action. */
433
e9955c83 434void
b9f1d9a4
AR
435grammar_current_rule_symbol_append (symbol *sym, location loc,
436 named_ref *named_ref)
2e047461 437{
b9f1d9a4 438 symbol_list *p;
f6857bbf 439 if (current_rule->action_props.code)
2e047461 440 grammar_midrule_action ();
b9f1d9a4 441 p = grammar_symbol_append (sym, loc);
b9f1d9a4 442 if (named_ref)
872b52bc 443 assign_named_ref(p, named_ref);
2e047461
AD
444}
445
6b702268 446/* Attach an ACTION to the current rule. */
2e047461 447
e9955c83 448void
b9f1d9a4
AR
449grammar_current_rule_action_append (const char *action, location loc,
450 named_ref *named_ref)
2e047461 451{
f6857bbf 452 if (current_rule->action_props.code)
381ecb06 453 grammar_midrule_action ();
ffa4ba3a 454 /* After all symbol declarations have been parsed, packgram invokes
f6857bbf
JD
455 code_props_translate_code. */
456 code_props_rule_action_init (&current_rule->action_props, action, loc,
b9f1d9a4 457 current_rule, named_ref);
2e047461
AD
458}
459
a70083a3 460\f
a70083a3
AD
461/*---------------------------------------------------------------.
462| Convert the rules into the representation using RRHS, RLHS and |
d9b739c3 463| RITEM. |
a70083a3 464`---------------------------------------------------------------*/
1ff442ca 465
4a120d45 466static void
118fb205 467packgram (void)
1ff442ca 468{
9222837b 469 unsigned int itemno = 0;
17ee7397
PE
470 rule_number ruleno = 0;
471 symbol_list *p = grammar;
1ff442ca 472
e9ad4aec
PE
473 ritem = xnmalloc (nritems + 1, sizeof *ritem);
474
475 /* This sentinel is used by build_relations in gram.c. */
476 *ritem++ = 0;
477
da2a7671 478 rules = xnmalloc (nrules, sizeof *rules);
1ff442ca 479
1ff442ca
NF
480 while (p)
481 {
e9071366 482 int rule_length = 0;
17ee7397 483 symbol *ruleprec = p->ruleprec;
3be03b13 484 record_merge_function_type (p->merger, p->content.sym->type_name,
8ee5b538 485 p->merger_declaration_location);
d7e1f00c 486 rules[ruleno].user_number = ruleno;
c3b407f4 487 rules[ruleno].number = ruleno;
3be03b13 488 rules[ruleno].lhs = p->content.sym;
99013900 489 rules[ruleno].rhs = ritem + itemno;
da2a7671
PE
490 rules[ruleno].prec = NULL;
491 rules[ruleno].dprec = p->dprec;
492 rules[ruleno].merger = p->merger;
493 rules[ruleno].precsym = NULL;
8efe435c 494 rules[ruleno].location = p->location;
b4afb6bb 495 rules[ruleno].useful = true;
f6857bbf
JD
496 rules[ruleno].action = p->action_props.code;
497 rules[ruleno].action_location = p->action_props.location;
1ff442ca 498
f91b1629
JD
499 /* If the midrule's $$ is set or its $n is used, remove the `$' from the
500 symbol name so that it's a user-defined symbol so that the default
501 %destructor and %printer apply. */
502 if (p->midrule_parent_rule
f6857bbf 503 && (p->action_props.is_value_used
b0f4c4ea 504 || symbol_list_n_get (p->midrule_parent_rule,
f6857bbf
JD
505 p->midrule_parent_rhs_index)
506 ->action_props.is_value_used))
f91b1629
JD
507 p->content.sym->tag += 1;
508
868d2d96
JD
509 /* Don't check the generated rule 0. It has no action, so some rhs
510 symbols may appear unused, but the parsing algorithm ensures that
511 %destructor's are invoked appropriately. */
512 if (p != grammar)
513 grammar_rule_check (p);
ffa4ba3a 514
3be03b13 515 for (p = p->next; p && p->content.sym; p = p->next)
1ff442ca 516 {
e9071366
AD
517 ++rule_length;
518
519 /* Don't allow rule_length == INT_MAX, since that might
520 cause confusion with strtol if INT_MAX == LONG_MAX. */
521 if (rule_length == INT_MAX)
522 fatal_at (rules[ruleno].location, _("rule is too long"));
523
17ee7397 524 /* item_number = symbol_number.
5fbb0954 525 But the former needs to contain more: negative rule numbers. */
3be03b13
JD
526 ritem[itemno++] =
527 symbol_number_as_item_number (p->content.sym->number);
1ff442ca 528 /* A rule gets by default the precedence and associativity
e9071366 529 of its last token. */
3be03b13
JD
530 if (p->content.sym->class == token_sym && default_prec)
531 rules[ruleno].prec = p->content.sym;
1ff442ca
NF
532 }
533
534 /* If this rule has a %prec,
a70083a3 535 the specified symbol's precedence replaces the default. */
1ff442ca
NF
536 if (ruleprec)
537 {
03b31c0c
AD
538 rules[ruleno].precsym = ruleprec;
539 rules[ruleno].prec = ruleprec;
1ff442ca 540 }
e9071366 541 /* An item ends by the rule number (negated). */
4b3d3a8e 542 ritem[itemno++] = rule_number_as_item_number (ruleno);
4f82b42a 543 aver (itemno < ITEM_NUMBER_MAX);
f3849179 544 ++ruleno;
4f82b42a 545 aver (ruleno < RULE_NUMBER_MAX);
1ff442ca 546
a70083a3
AD
547 if (p)
548 p = p->next;
1ff442ca
NF
549 }
550
4f82b42a 551 aver (itemno == nritems);
3067fbef 552
273a74fa 553 if (trace_flag & trace_sets)
3067fbef 554 ritem_print (stderr);
1ff442ca 555}
a70083a3 556\f
fdbcd8e2
AD
557/*------------------------------------------------------------------.
558| Read in the grammar specification and record it in the format |
559| described in gram.h. All actions are copied into ACTION_OBSTACK, |
560| in each case forming the body of a C function (YYACTION) which |
561| contains a switch statement to decide which action to execute. |
562`------------------------------------------------------------------*/
a70083a3
AD
563
564void
565reader (void)
566{
a70083a3 567 /* Initialize the symbol table. */
db8837cb 568 symbols_new ();
b6610515 569
88bce5a2
AD
570 /* Construct the accept symbol. */
571 accept = symbol_get ("$accept", empty_location);
572 accept->class = nterm_sym;
573 accept->number = nvars++;
30171f79 574
a70083a3 575 /* Construct the error token */
39f41916 576 errtoken = symbol_get ("error", empty_location);
d7020c20 577 errtoken->class = token_sym;
72a23c97 578 errtoken->number = ntokens++;
b6610515 579
a70083a3
AD
580 /* Construct a token that represents all undefined literal tokens.
581 It is always token number 2. */
88bce5a2 582 undeftoken = symbol_get ("$undefined", empty_location);
d7020c20 583 undeftoken->class = token_sym;
72a23c97 584 undeftoken->number = ntokens++;
a70083a3 585
2b81e969 586 gram_in = xfopen (grammar_file, "r");
e9955c83 587
473d0a75
AD
588 gram__flex_debug = trace_flag & trace_scan;
589 gram_debug = trace_flag & trace_parse;
e9071366 590 gram_scanner_initialize ();
78c3da9e 591 gram_parse ();
331dbc1b 592
ba5c6d94 593 /* Set front-end %define variable defaults. */
67212941 594 muscle_percent_define_default ("lr.keep-unreachable-states", "false");
db34f798
JD
595 {
596 char *lr_type;
ba5c6d94
JD
597 /* IELR would be a better default, but LALR is historically the
598 default. */
db34f798
JD
599 muscle_percent_define_default ("lr.type", "LALR");
600 lr_type = muscle_percent_define_get ("lr.type");
601 if (0 != strcmp (lr_type, "canonical LR"))
5bab9d08 602 muscle_percent_define_default ("lr.default-reductions", "all");
db34f798 603 else
5bab9d08 604 muscle_percent_define_default ("lr.default-reductions", "accepting");
db34f798
JD
605 free (lr_type);
606 }
7254f6a8 607
ba5c6d94 608 /* Check front-end %define variables. */
7254f6a8
JD
609 {
610 static char const * const values[] = {
db34f798 611 "lr.type", "LALR", "IELR", "canonical LR", NULL,
5bab9d08 612 "lr.default-reductions", "all", "consistent", "accepting", NULL,
7254f6a8
JD
613 NULL
614 };
615 muscle_percent_define_check_values (values);
616 }
617
02d12d0d
PE
618 if (! complaint_issued)
619 check_and_convert_grammar ();
620
621 xfclose (gram_in);
622}
623
b275314e 624
02d12d0d
PE
625/*-------------------------------------------------------------.
626| Check the grammar that has just been read, and convert it to |
627| internal form. |
628`-------------------------------------------------------------*/
629
630static void
631check_and_convert_grammar (void)
632{
633 /* Grammar has been read. Do some checking. */
e9955c83
AD
634 if (nrules == 0)
635 fatal (_("no rules in the input grammar"));
636
637 /* Report any undefined symbols and consider them nonterminals. */
638 symbols_check_defined ();
b7c49edf 639
88bce5a2
AD
640 /* If the user did not define her ENDTOKEN, do it now. */
641 if (!endtoken)
b7c49edf 642 {
88bce5a2
AD
643 endtoken = symbol_get ("$end", empty_location);
644 endtoken->class = token_sym;
645 endtoken->number = 0;
b7c49edf 646 /* Value specified by POSIX. */
88bce5a2 647 endtoken->user_token_number = 0;
b7c49edf
AD
648 }
649
4d7370cb
JD
650 /* Find the start symbol if no %start. */
651 if (!start_flag)
652 {
653 symbol_list *node;
654 for (node = grammar;
3be03b13 655 node != NULL && symbol_is_dummy (node->content.sym);
4d7370cb
JD
656 node = node->next)
657 {
658 for (node = node->next;
3be03b13 659 node != NULL && node->content.sym != NULL;
4d7370cb
JD
660 node = node->next)
661 ;
662 }
4f82b42a 663 aver (node != NULL);
3be03b13
JD
664 grammar_start_symbol_set (node->content.sym,
665 node->content.sym->location);
4d7370cb
JD
666 }
667
02d12d0d 668 /* Insert the initial rule, whose line is that of the first rule
e9955c83
AD
669 (not that of the start symbol):
670
88bce5a2 671 accept: %start EOF. */
e9955c83 672 {
3be03b13 673 symbol_list *p = symbol_list_sym_new (accept, empty_location);
8efe435c 674 p->location = grammar->location;
3be03b13
JD
675 p->next = symbol_list_sym_new (startsymbol, empty_location);
676 p->next->next = symbol_list_sym_new (endtoken, empty_location);
677 p->next->next->next = symbol_list_sym_new (NULL, empty_location);
e9955c83
AD
678 p->next->next->next->next = grammar;
679 nrules += 1;
680 nritems += 3;
681 grammar = p;
682 }
683
4f82b42a 684 aver (nsyms <= SYMBOL_NUMBER_MAXIMUM && nsyms == ntokens + nvars);
b0c4483e 685
a70083a3
AD
686 /* Assign the symbols their symbol numbers. Write #defines for the
687 token symbols into FDEFINES if requested. */
2f1afb73 688 symbols_pack ();
93ede233 689
574add85
JD
690 /* Scan rule actions after invoking symbol_check_alias_consistency (in
691 symbols_pack above) so that token types are set correctly before the rule
692 action type checking.
693
694 Before invoking grammar_rule_check (in packgram below) on any rule, make
695 sure all actions have already been scanned in order to set `used' flags.
696 Otherwise, checking that a midrule's $$ should be set will not always work
697 properly because the check must forward-reference the midrule's parent
698 rule. For the same reason, all the `used' flags must be set before
699 checking whether to remove `$' from any midrule symbol name (also in
700 packgram). */
14462c2b
JD
701 {
702 symbol_list *sym;
703 for (sym = grammar; sym; sym = sym->next)
704 code_props_translate_code (&sym->action_props);
705 }
574add85 706
a70083a3 707 /* Convert the grammar into the format described in gram.h. */
6d0ef4ec 708 packgram ();
8419d367 709
17ee7397 710 /* The grammar as a symbol_list is no longer needed. */
17bd8a73 711 symbol_list_free (grammar);
a70083a3 712}