src/reader.c

/* Input parser for Bison

   Copyright (C) 1984, 1986, 1989, 1992, 1998, 2000, 2001, 2002, 2003,
   2005, 2006 Free Software Foundation, Inc.

   This file is part of Bison, the GNU Compiler Compiler.

   Bison is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   Bison is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with Bison; see the file COPYING.  If not, write to
   the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
   Boston, MA 02110-1301, USA.  */

#include <config.h>
#include "system.h"
#include <assert.h>

#include <quotearg.h>

#include "complain.h"
#include "conflicts.h"
#include "files.h"
#include "getargs.h"
#include "gram.h"
#include "muscle_tab.h"
#include "reader.h"
#include "symlist.h"
#include "symtab.h"
#include "scan-gram.h"
#include "scan-code.h"

/* Defined later in this file; called by reader () once parsing is
   done and no complaint was issued.  */
static void check_and_convert_grammar (void);

/* Head of the symbol_list in which the rules are accumulated.  */
static symbol_list *grammar = NULL;
/* True once a start symbol has been recorded, either by
   grammar_start_symbol_set or from the LHS of the first rule.  */
static bool start_flag = false;
/* List of the merge functions recorded by get_merge_function.  */
merger_list *merge_functions;

/* Was %union seen?  */
bool typed = false;

/* Should rules have a default precedence?  When false, packgram does
   not give a rule the precedence of its last token.  */
bool default_prec = true;
\f
/*-----------------------.
| Set the start symbol.  |
`-----------------------*/

void
grammar_start_symbol_set (symbol *sym, location loc)
{
  /* Only the first start symbol is honored; once one is recorded, any
     further request is reported at LOC and otherwise ignored.  */
  if (start_flag)
    {
      complain_at (loc, _("multiple %s declarations"), "%start");
      return;
    }

  startsymbol = sym;
  startsymbol_location = loc;
  start_flag = true;
}


/*---------------------------------------------------------------------.
| There are two prologues: one before the first %union and one after.  |
|  Augment the one specified by POST.                                  |
`---------------------------------------------------------------------*/

void
prologue_augment (const char *prologue, location loc, bool post)
{
  /* Pick the obstack to grow: the post-prologue one when POST is set,
     the pre-prologue one otherwise.  */
  struct obstack *dest = &pre_prologue_obstack;
  if (post)
    dest = &post_prologue_obstack;

  /* First a b4_syncline call carrying the starting line and the quoted
     file name of LOC, then the text of the prologue itself.  */
  obstack_fgrow1 (dest, "]b4_syncline(%d, [[", loc.start.line);
  /* FIXME: Protection of M4 characters missing here.  See
     output.c:escaped_output.  */
  MUSCLE_OBSTACK_SGROW (dest,
                        quotearg_style (c_quoting_style, loc.start.file));
  obstack_sgrow (dest, "]])[\n");
  obstack_sgrow (dest, prologue);
}

\f

/*-------------------------------------------------------------------.
| Return the merger index for a merging function named NAME, whose   |
| arguments have type TYPE.  Records the function, if new, in        |
| MERGE_FUNCTIONS.                                                   |
`-------------------------------------------------------------------*/

static int
get_merge_function (uniqstr name, uniqstr type, location loc)
{
  /* SLOT designates the link under examination: first MERGE_FUNCTIONS
     itself, then the NEXT member of each node in turn.  POSITION is the
     1-based rank of the node SLOT points to.  */
  merger_list **slot;
  int position = 1;

  /* Merge functions are only recorded for GLR parsers.  */
  if (! glr_parser)
    return 0;

  /* A missing type is handled as the empty type name.  */
  if (type == NULL)
    type = uniqstr_new ("");

  /* Look for a function already recorded under NAME.  */
  for (slot = &merge_functions; *slot; slot = &(*slot)->next)
    {
      if (UNIQSTR_EQ (name, (*slot)->name))
        break;
      ++position;
    }

  if (*slot == NULL)
    {
      /* Not found: append a new entry at the end of the list, where
         SLOT stopped.  */
      merger_list *entry = xmalloc (sizeof *entry);
      entry->name = uniqstr_new (name);
      entry->type = uniqstr_new (type);
      entry->next = NULL;
      *slot = entry;
    }
  else if (!UNIQSTR_EQ (type, (*slot)->type))
    /* Found, but recorded with another type: only warn.  */
    warn_at (loc, _("result type clash on merge function %s: <%s> != <%s>"),
             name, type, (*slot)->type);

  return position;
}

/*--------------------------------------.
| Free all merge-function definitions.	|
`--------------------------------------*/

void
free_merger_functions (void)
{
  /* Release every node of the MERGE_FUNCTIONS list.  Only the nodes
     themselves are freed here, not their NAME and TYPE members.  */
  merger_list *node = merge_functions;
  while (node)
    {
      /* Fetch the successor before the node is released.  */
      merger_list *successor = node->next;
      free (node);
      node = successor;
    }

  /* Do not leave the global pointing at freed memory: this makes a
     second call harmless and lets get_merge_function start a fresh
     list instead of walking released nodes.  */
  merge_functions = NULL;
}

\f
/*-------------------------------------------------------------------.
| Parse the input grammar into one symbol_list structure.  Each      |
| rule is represented by a sequence of symbols: the left hand side   |
| followed by the contents of the right hand side, followed by a     |
| null pointer instead of a symbol to terminate the rule.  The next  |
| symbol is the lhs of the following rule.                           |
|                                                                    |
| All actions are copied out, labelled by the rule number they apply |
| to.                                                                |
`-------------------------------------------------------------------*/

/* The (currently) last node of GRAMMAR; NULL until a first node has
   been appended.  */
static symbol_list *grammar_end = NULL;

/* Append a new node for SYM, located at LOC, at the end of GRAMMAR.  */
static void
grammar_symbol_append (symbol *sym, location loc)
{
  symbol_list *node = symbol_list_new (sym, loc);

  /* Either the node starts the list, or it is hooked after the
     current tail.  In both cases it becomes the new tail.  */
  if (!grammar_end)
    grammar = node;
  else
    grammar_end->next = node;
  grammar_end = node;

  /* Only actual symbols are counted: a null SYM merely marks the end
     of a rule.  */
  if (sym != NULL)
    nritems += 1;
}

/* The rule currently being defined, and the previous rule.
   CURRENT_RULE points to the first LHS of the current rule, while
   PREVIOUS_RULE_END points to the *end* of the previous rule (NULL).
   Both are updated by grammar_current_rule_begin; PREVIOUS_RULE_END
   is also moved by grammar_midrule_action when it inserts a rule
   before the current one.  */
symbol_list *current_rule = NULL;
static symbol_list *previous_rule_end = NULL;


/*----------------------------------------------.
| Create a new rule for LHS in the GRAMMAR.     |
`----------------------------------------------*/

void
grammar_current_rule_begin (symbol *lhs, location loc)
{
  /* When no start symbol has been recorded yet, the LHS of this rule
     takes that role.  */
  if (!start_flag)
    {
      start_flag = true;
      startsymbol_location = loc;
      startsymbol = lhs;
    }

  /* Note where the previous rule stopped, then open the new rule with
     a node for its LHS; that node is what CURRENT_RULE designates.  */
  previous_rule_end = grammar_end;
  nrules += 1;
  grammar_symbol_append (lhs, loc);
  current_rule = grammar_end;

  if (lhs->class == token_sym)
    complain_at (loc, _("rule given for %s, which is a token"), lhs->tag);
  else if (lhs->class == unknown_sym)
    {
      /* LHS was not classified so far: make it a nonterminal and give
         it the next nonterminal number.  */
      lhs->class = nterm_sym;
      lhs->number = nvars++;
    }
}


/*----------------------------------------------------------------------.
| A symbol should be used if it has a destructor, or if it is a         |
| mid-rule symbol (i.e., the generated LHS replacing a mid-rule         |
| action) that was assigned to, as in "exp: { $$ = 1; } { $$ = $1; }".  |
`----------------------------------------------------------------------*/

static bool
symbol_should_be_used (symbol_list const *s)
{
  /* A symbol with a destructor qualifies unconditionally.  */
  if (s->sym->destructor)
    return true;

  /* Otherwise S must stand for a mid-rule action, and the rule bound
     to it must be flagged as used.  */
  if (s->midrule && s->midrule->used)
    return true;

  return false;
}

/*----------------------------------------------------------------.
| Check that the rule R is properly defined.  For instance, there |
| should be no type clash on the default action.                  |
`----------------------------------------------------------------*/

static void
grammar_rule_check (const symbol_list *r)
{
  /* Type check.

     If there is an action, then there is nothing we can do: the user
     is allowed to shoot herself in the foot.

     Don't worry about the default action if $$ is untyped, since $$'s
     value can't be used.  */
  if (!r->action && r->sym->type_name)
    {
      symbol *first_rhs = r->next->sym;
      /* If $$ is being set in default way, report if any type mismatch.  */
      if (first_rhs)
	{
	  char const *lhs_type = r->sym->type_name;
	  const char *rhs_type =
	    first_rhs->type_name ? first_rhs->type_name : "";
	  if (!UNIQSTR_EQ (lhs_type, rhs_type))
	    warn_at (r->location,
		     _("type clash on default action: <%s> != <%s>"),
		     lhs_type, rhs_type);
	}
      /* Warn if there is no default for $$ but we need one.  */
      else
	warn_at (r->location,
		 _("empty rule for typed nonterminal, and no action"));
    }

  /* Check that symbol values that should be used are in fact used.  */
  {
    symbol_list const *l = r;
    int n = 0;
    for (; l && l->sym; l = l->next, ++n)
      if (! (l->used
	     || !symbol_should_be_used (l)
	     /* The default action, $$ = $1, `uses' both.  */
	     || (!r->action && (n == 0 || n == 1))))
	{
	  if (n)
	    warn_at (r->location, _("unused value: $%d"), n);
	  else
	    warn_at (r->location, _("unset value: $$"));
	}
  }
}


/*-------------------------------------.
| End the currently being grown rule.  |
`-------------------------------------*/

void
grammar_current_rule_end (location loc)
{
  /* Close the rule with an empty link (null symbol), located where the
     current last node of the grammar is.  */
  location last_location = grammar_end->location;
  grammar_symbol_append (NULL, last_location);

  /* LOC becomes the location of the rule as a whole; the rule is
     checked once that location is in place, since the warnings are
     issued there.  */
  current_rule->location = loc;
  grammar_rule_check (current_rule);
}


/*-------------------------------------------------------------------.
| The previous action turns out to be a mid-rule action.  Attach it  |
| to the current rule, i.e., create a dummy symbol, attach this      |
| mid-rule action to it, and append this dummy nonterminal to the    |
| current rule.                                                      |
`-------------------------------------------------------------------*/

void
grammar_midrule_action (void)
{
  /* Since the action was written out with this rule's number, we must
     give the new rule this number by inserting the new rule before
     it.  */

  /* Make a DUMMY nonterminal, whose location is that of the midrule
     action.  Create the MIDRULE, i.e., the LHS node of the rule that
     will carry the action.  */
  location dummy_location = current_rule->action_location;
  symbol *dummy = dummy_symbol_get (dummy_location);
  symbol_list *midrule = symbol_list_new (dummy, dummy_location);

  /* Make a new rule, whose body is empty, before the current one, so
     that the action just read can belong to it.  MIDRULE is not
     created through grammar_symbol_append, hence NRITEMS has to be
     incremented by hand for it.  */
  ++nrules;
  ++nritems;
  /* Attach its location and actions to that of the DUMMY.  The
     current rule no longer has a pending action afterwards.  */
  midrule->location = dummy_location;
  midrule->action = current_rule->action;
  midrule->action_location = dummy_location;
  current_rule->action = NULL;
  /* If $$ was used in the action, the LHS of the enclosing rule was
     incorrectly flagged as used.  Move the flag to the MIDRULE.  */
  midrule->used = current_rule->used;
  current_rule->used = false;

  /* Link MIDRULE after the end of the previous rule, or make it the
     head of the grammar when there is no previous rule.  */
  if (previous_rule_end)
    previous_rule_end->next = midrule;
  else
    grammar = midrule;

  /* End the dummy's rule with a null-symbol node, check the rule, and
     chain the current rule right after it.  */
  midrule->next = symbol_list_new (NULL, dummy_location);
  grammar_rule_check (midrule);
  midrule->next->next = current_rule;

  /* The rule preceding the current one is now the dummy's rule.  */
  previous_rule_end = midrule->next;

  /* Insert the dummy nonterminal replacing the midrule action into
     the current rule.  Bind it to its dedicated rule.  This call does
     not come back here: the action of the current rule was reset to
     NULL above.  */
  grammar_current_rule_symbol_append (dummy, dummy_location);
  grammar_end->midrule = midrule;
}

/* Set the precedence symbol of the current rule to PRECSYM. */

void
grammar_current_rule_prec_set (symbol *precsym, location loc)
{
  /* A rule that already has a precedence symbol gets a complaint at
     LOC; PRECSYM is recorded in either case.  */
  bool already_set = current_rule->ruleprec != NULL;

  if (already_set)
    complain_at (loc, _("only one %s allowed per rule"), "%prec");
  current_rule->ruleprec = precsym;
}

/* Attach dynamic precedence DPREC to the current rule. */

void
grammar_current_rule_dprec_set (int dprec, location loc)
{
  if (! glr_parser)
    warn_at (loc, _("%s affects only GLR parsers"), "%dprec");

  /* A valid DPREC is positive, and a rule takes only one: a nonzero
     DPREC member means that one was already attached.  */
  if (0 < dprec)
    {
      if (current_rule->dprec != 0)
        complain_at (loc, _("only one %s allowed per rule"), "%dprec");
    }
  else
    complain_at (loc, _("%s must be followed by positive number"), "%dprec");

  /* DPREC is recorded whether or not a complaint was issued.  */
  current_rule->dprec = dprec;
}

/* Attach the merge function NAME to the current rule.  The type
   passed along with it is the type name of the rule's LHS.  */

void
grammar_current_rule_merge_set (uniqstr name, location loc)
{
  /* The type handed to get_merge_function is the type name of the
     node CURRENT_RULE points to.  */
  uniqstr lhs_type = current_rule->sym->type_name;

  if (! glr_parser)
    warn_at (loc, _("%s affects only GLR parsers"), "%merge");

  /* A nonzero MERGER means a merge function was already attached.  */
  if (current_rule->merger != 0)
    complain_at (loc, _("only one %s allowed per rule"), "%merge");

  current_rule->merger = get_merge_function (name, lhs_type, loc);
}

/* Attach SYM to the current rule.  If needed, move the previous
   action as a mid-rule action.  */

void
grammar_current_rule_symbol_append (symbol *sym, location loc)
{
  if (current_rule->action)
    grammar_midrule_action ();
  grammar_symbol_append (sym, loc);
}

/* Attach an ACTION to the current rule.  */

void
grammar_current_rule_action_append (const char *action, location loc)
{
  if (current_rule->action)
    grammar_midrule_action ();
  current_rule->action = translate_rule_action (current_rule, action, loc);
  current_rule->action_location = loc;
}

\f
/*---------------------------------------------------------------.
| Convert the rules into the representation using RRHS, RLHS and |
| RITEM.                                                         |
`---------------------------------------------------------------*/

static void
packgram (void)
{
  unsigned int itemno = 0;
  rule_number ruleno = 0;
  symbol_list *p = grammar;

  ritem = xnmalloc (nritems + 1, sizeof *ritem);

  /* This sentinel is used by build_relations in gram.c.  */
  *ritem++ = 0;

  rules = xnmalloc (nrules, sizeof *rules);

  while (p)
    {
      int rule_length = 0;
      symbol *ruleprec = p->ruleprec;
      rules[ruleno].user_number = ruleno;
      rules[ruleno].number = ruleno;
      rules[ruleno].lhs = p->sym;
      rules[ruleno].rhs = ritem + itemno;
      rules[ruleno].prec = NULL;
      rules[ruleno].dprec = p->dprec;
      rules[ruleno].merger = p->merger;
      rules[ruleno].precsym = NULL;
      rules[ruleno].location = p->location;
      rules[ruleno].useful = true;
      rules[ruleno].action = p->action;
      rules[ruleno].action_location = p->action_location;

      for (p = p->next; p && p->sym; p = p->next)
	{
	  ++rule_length;

	  /* Don't allow rule_length == INT_MAX, since that might
	     cause confusion with strtol if INT_MAX == LONG_MAX.  */
	  if (rule_length == INT_MAX)
	      fatal_at (rules[ruleno].location, _("rule is too long"));

	  /* item_number = symbol_number.
	     But the former needs to contain more: negative rule numbers. */
	  ritem[itemno++] = symbol_number_as_item_number (p->sym->number);
	  /* A rule gets by default the precedence and associativity
	     of its last token.  */
	  if (p->sym->class == token_sym && default_prec)
	    rules[ruleno].prec = p->sym;
	}

      /* If this rule has a %prec,
         the specified symbol's precedence replaces the default.  */
      if (ruleprec)
	{
	  rules[ruleno].precsym = ruleprec;
	  rules[ruleno].prec = ruleprec;
	}
      /* An item ends by the rule number (negated).  */
      ritem[itemno++] = rule_number_as_item_number (ruleno);
      assert (itemno < ITEM_NUMBER_MAX);
      ++ruleno;
      assert (ruleno < RULE_NUMBER_MAX);

      if (p)
	p = p->next;
    }

  assert (itemno == nritems);

  if (trace_flag & trace_sets)
    ritem_print (stderr);
}
\f
/*------------------------------------------------------------------.
| Read in the grammar specification and record it in the format     |
| described in gram.h.  All actions are copied into ACTION_OBSTACK, |
| in each case forming the body of a C function (YYACTION) which    |
| contains a switch statement to decide which action to execute.    |
`------------------------------------------------------------------*/

void
reader (void)
{
  /* Initialize the symbol table.  */
  symbols_new ();

  /* Construct the accept symbol. */
  accept = symbol_get ("$accept", empty_location);
  accept->class = nterm_sym;
  accept->number = nvars++;

  /* Construct the error token */
  errtoken = symbol_get ("error", empty_location);
  errtoken->class = token_sym;
  errtoken->number = ntokens++;

  /* Construct a token that represents all undefined literal tokens.
     It is always token number 2.  */
  undeftoken = symbol_get ("$undefined", empty_location);
  undeftoken->class = token_sym;
  undeftoken->number = ntokens++;

  /* Initialize the obstacks. */
  obstack_init (&pre_prologue_obstack);
  obstack_init (&post_prologue_obstack);

  gram_in = xfopen (grammar_file, "r");

  gram__flex_debug = trace_flag & trace_scan;
  gram_debug = trace_flag & trace_parse;
  gram_scanner_initialize ();
  gram_parse ();

  if (! complaint_issued)
    check_and_convert_grammar ();

  xfclose (gram_in);
}


/*-------------------------------------------------------------.
| Check the grammar that has just been read, and convert it to |
| internal form.					       |
`-------------------------------------------------------------*/

static void
check_and_convert_grammar (void)
{
  /* Grammar has been read.  Do some checking.  */
  if (nrules == 0)
    fatal (_("no rules in the input grammar"));

  /* Report any undefined symbols and consider them nonterminals.  */
  symbols_check_defined ();

  /* If the user did not define her ENDTOKEN, do it now. */
  if (!endtoken)
    {
      endtoken = symbol_get ("$end", empty_location);
      endtoken->class = token_sym;
      endtoken->number = 0;
      /* Value specified by POSIX.  */
      endtoken->user_token_number = 0;
    }

  /* Insert the initial rule, whose line is that of the first rule
     (not that of the start symbol):

     accept: %start EOF.  */
  {
    symbol_list *p = symbol_list_new (accept, empty_location);
    p->location = grammar->location;
    p->next = symbol_list_new (startsymbol, empty_location);
    p->next->next = symbol_list_new (endtoken, empty_location);
    p->next->next->next = symbol_list_new (NULL, empty_location);
    p->next->next->next->next = grammar;
    nrules += 1;
    nritems += 3;
    grammar = p;
  }

  assert (nsyms <= SYMBOL_NUMBER_MAXIMUM && nsyms == ntokens + nvars);

  /* Assign the symbols their symbol numbers.  Write #defines for the
     token symbols into FDEFINES if requested.  */
  symbols_pack ();

  /* Convert the grammar into the format described in gram.h.  */
  packgram ();

  /* The grammar as a symbol_list is no longer needed. */
  LIST_FREE (symbol_list, grammar);
}
Commit	Line	Data
	1	/* Input parser for Bison
	2
	3	Copyright (C) 1984, 1986, 1989, 1992, 1998, 2000, 2001, 2002, 2003,
	4	2005, 2006 Free Software Foundation, Inc.
	5
	6	This file is part of Bison, the GNU Compiler Compiler.
	7
	8	Bison is free software; you can redistribute it and/or modify
	9	it under the terms of the GNU General Public License as published by
	10	the Free Software Foundation; either version 2, or (at your option)
	11	any later version.
	12
	13	Bison is distributed in the hope that it will be useful,
	14	but WITHOUT ANY WARRANTY; without even the implied warranty of
	15	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	16	GNU General Public License for more details.
	17
	18	You should have received a copy of the GNU General Public License
	19	along with Bison; see the file COPYING. If not, write to
	20	the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
	21	Boston, MA 02110-1301, USA. */
	22
	23	#include <config.h>
	24	#include "system.h"
	25	#include <assert.h>
	26
	27	#include <quotearg.h>
	28
	29	#include "complain.h"
	30	#include "conflicts.h"
	31	#include "files.h"
	32	#include "getargs.h"
	33	#include "gram.h"
	34	#include "muscle_tab.h"
	35	#include "reader.h"
	36	#include "symlist.h"
	37	#include "symtab.h"
	38	#include "scan-gram.h"
	39	#include "scan-code.h"
	40
	41	static void check_and_convert_grammar (void);
	42
	43	static symbol_list *grammar = NULL;
	44	static bool start_flag = false;
	45	merger_list *merge_functions;
	46
	47	/* Was %union seen? */
	48	bool typed = false;
	49
	50	/* Should rules have a default precedence? */
	51	bool default_prec = true;
	52	\f
	53	/*-----------------------.
	54	\| Set the start symbol. \|
	55	`-----------------------*/
	56
	57	void
	58	grammar_start_symbol_set (symbol *sym, location loc)
	59	{
	60	if (start_flag)
	61	complain_at (loc, _("multiple %s declarations"), "%start");
	62	else
	63	{
	64	start_flag = true;
	65	startsymbol = sym;
	66	startsymbol_location = loc;
	67	}
	68	}
	69
	70
	71	/*---------------------------------------------------------------------.
	72	\| There are two prologues: one before the first %union and one after. \|
	73	\| Augment the one specified by POST. \|
	74	`---------------------------------------------------------------------*/
	75
	76	void
	77	prologue_augment (const char *prologue, location loc, bool post)
	78	{
	79	struct obstack *oout =
	80	!post ? &pre_prologue_obstack : &post_prologue_obstack;
	81
	82	obstack_fgrow1 (oout, "]b4_syncline(%d, [[", loc.start.line);
	83	/* FIXME: Protection of M4 characters missing here. See
	84	output.c:escaped_output. */
	85	MUSCLE_OBSTACK_SGROW (oout,
	86	quotearg_style (c_quoting_style, loc.start.file));
	87	obstack_sgrow (oout, "]])[\n");
	88	obstack_sgrow (oout, prologue);
	89	}
	90
	91	\f
	92
	93	/*-------------------------------------------------------------------.
	94	\| Return the merger index for a merging function named NAME, whose \|
	95	\| arguments have type TYPE. Records the function, if new, in \|
	96	\| MERGER_LIST. \|
	97	`-------------------------------------------------------------------*/
	98
	99	static int
	100	get_merge_function (uniqstr name, uniqstr type, location loc)
	101	{
	102	merger_list *syms;
	103	merger_list head;
	104	int n;
	105
	106	if (! glr_parser)
	107	return 0;
	108
	109	if (type == NULL)
	110	type = uniqstr_new ("");
	111
	112	head.next = merge_functions;
	113	for (syms = &head, n = 1; syms->next; syms = syms->next, n += 1)
	114	if (UNIQSTR_EQ (name, syms->next->name))
	115	break;
	116	if (syms->next == NULL)
	117	{
	118	syms->next = xmalloc (sizeof syms->next[0]);
	119	syms->next->name = uniqstr_new (name);
	120	syms->next->type = uniqstr_new (type);
	121	syms->next->next = NULL;
	122	merge_functions = head.next;
	123	}
	124	else if (!UNIQSTR_EQ (type, syms->next->type))
	125	warn_at (loc, _("result type clash on merge function %s: <%s> != <%s>"),
	126	name, type, syms->next->type);
	127	return n;
	128	}
	129
	130	/*--------------------------------------.
	131	\| Free all merge-function definitions. \|
	132	`--------------------------------------*/
	133
	134	void
	135	free_merger_functions (void)
	136	{
	137	merger_list *L0 = merge_functions;
	138	while (L0)
	139	{
	140	merger_list *L1 = L0->next;
	141	free (L0);
	142	L0 = L1;
	143	}
	144	}
	145
	146	\f
	147	/*-------------------------------------------------------------------.
	148	\| Parse the input grammar into a one symbol_list structure. Each \|
	149	\| rule is represented by a sequence of symbols: the left hand side \|
	150	\| followed by the contents of the right hand side, followed by a \|
	151	\| null pointer instead of a symbol to terminate the rule. The next \|
	152	\| symbol is the lhs of the following rule. \|
	153	\| \|
	154	\| All actions are copied out, labelled by the rule number they apply \|
	155	\| to. \|
	156	`-------------------------------------------------------------------*/
	157
	158	/* The (currently) last symbol of GRAMMAR. */
	159	static symbol_list *grammar_end = NULL;
	160
	161	/* Append SYM to the grammar. */
	162	static void
	163	grammar_symbol_append (symbol *sym, location loc)
	164	{
	165	symbol_list *p = symbol_list_new (sym, loc);
	166
	167	if (grammar_end)
	168	grammar_end->next = p;
	169	else
	170	grammar = p;
	171
	172	grammar_end = p;
	173
	174	/* A null SYM stands for an end of rule; it is not an actual
	175	part of it. */
	176	if (sym)
	177	++nritems;
	178	}
	179
	180	/* The rule currently being defined, and the previous rule.
	181	CURRENT_RULE points to the first LHS of the current rule, while
	182	PREVIOUS_RULE_END points to the end of the previous rule (NULL). */
	183	symbol_list *current_rule = NULL;
	184	static symbol_list *previous_rule_end = NULL;
	185
	186
	187	/*----------------------------------------------.
	188	\| Create a new rule for LHS in to the GRAMMAR. \|
	189	`----------------------------------------------*/
	190
	191	void
	192	grammar_current_rule_begin (symbol *lhs, location loc)
	193	{
	194	if (!start_flag)
	195	{
	196	startsymbol = lhs;
	197	startsymbol_location = loc;
	198	start_flag = true;
	199	}
	200
	201	/* Start a new rule and record its lhs. */
	202	++nrules;
	203	previous_rule_end = grammar_end;
	204	grammar_symbol_append (lhs, loc);
	205	current_rule = grammar_end;
	206
	207	/* Mark the rule's lhs as a nonterminal if not already so. */
	208	if (lhs->class == unknown_sym)
	209	{
	210	lhs->class = nterm_sym;
	211	lhs->number = nvars;
	212	++nvars;
	213	}
	214	else if (lhs->class == token_sym)
	215	complain_at (loc, _("rule given for %s, which is a token"), lhs->tag);
	216	}
	217
	218
	219	/*----------------------------------------------------------------------.
	220	\| A symbol should be used if it has a destructor, or if it is a \|
	221	\| mid-rule symbol (i.e., the generated LHS replacing a mid-rule \|
	222	\| action) that was assigned to, as in "exp: { $$ = 1; } { $$ = $1; }". \|
	223	`----------------------------------------------------------------------*/
	224
	225	static bool
	226	symbol_should_be_used (symbol_list const *s)
	227	{
	228	return (s->sym->destructor
	229	\|\| (s->midrule && s->midrule->used));
	230	}
	231
	232	/*----------------------------------------------------------------.
	233	\| Check that the rule R is properly defined. For instance, there \|
	234	\| should be no type clash on the default action. \|
	235	`----------------------------------------------------------------*/
	236
	237	static void
	238	grammar_rule_check (const symbol_list *r)
	239	{
	240	/* Type check.
	241
	242	If there is an action, then there is nothing we can do: the user
	243	is allowed to shoot herself in the foot.
	244
	245	Don't worry about the default action if $$ is untyped, since $$'s
	246	value can't be used. */
	247	if (!r->action && r->sym->type_name)
	248	{
	249	symbol *first_rhs = r->next->sym;
	250	/* If $$ is being set in default way, report if any type mismatch. */
	251	if (first_rhs)
	252	{
	253	char const *lhs_type = r->sym->type_name;
	254	const char *rhs_type =
	255	first_rhs->type_name ? first_rhs->type_name : "";
	256	if (!UNIQSTR_EQ (lhs_type, rhs_type))
	257	warn_at (r->location,
	258	_("type clash on default action: <%s> != <%s>"),
	259	lhs_type, rhs_type);
	260	}
	261	/* Warn if there is no default for $$ but we need one. */
	262	else
	263	warn_at (r->location,
	264	_("empty rule for typed nonterminal, and no action"));
	265	}
	266
	267	/* Check that symbol values that should be used are in fact used. */
	268	{
	269	symbol_list const *l = r;
	270	int n = 0;
	271	for (; l && l->sym; l = l->next, ++n)
	272	if (! (l->used
	273	\|\| !symbol_should_be_used (l)
	274	/* The default action, $$ = $1, `uses' both. */
	275	\|\| (!r->action && (n == 0 \|\| n == 1))))
	276	{
	277	if (n)
	278	warn_at (r->location, _("unused value: $%d"), n);
	279	else
	280	warn_at (r->location, _("unset value: $$"));
	281	}
	282	}
	283	}
	284
	285
	286	/*-------------------------------------.
	287	\| End the currently being grown rule. \|
	288	`-------------------------------------*/
	289
	290	void
	291	grammar_current_rule_end (location loc)
	292	{
	293	/* Put an empty link in the list to mark the end of this rule */
	294	grammar_symbol_append (NULL, grammar_end->location);
	295	current_rule->location = loc;
	296	grammar_rule_check (current_rule);
	297	}
	298
	299
	300	/*-------------------------------------------------------------------.
	301	\| The previous action turns out the be a mid-rule action. Attach it \|
	302	\| to the current rule, i.e., create a dummy symbol, attach it this \|
	303	\| mid-rule action, and append this dummy nonterminal to the current \|
	304	\| rule. \|
	305	`-------------------------------------------------------------------*/
	306
	307	void
	308	grammar_midrule_action (void)
	309	{
	310	/* Since the action was written out with this rule's number, we must
	311	give the new rule this number by inserting the new rule before
	312	it. */
	313
	314	/* Make a DUMMY nonterminal, whose location is that of the midrule
	315	action. Create the MIDRULE. */
	316	location dummy_location = current_rule->action_location;
	317	symbol *dummy = dummy_symbol_get (dummy_location);
	318	symbol_list *midrule = symbol_list_new (dummy, dummy_location);
	319
	320	/* Make a new rule, whose body is empty, before the current one, so
	321	that the action just read can belong to it. */
	322	++nrules;
	323	++nritems;
	324	/* Attach its location and actions to that of the DUMMY. */
	325	midrule->location = dummy_location;
	326	midrule->action = current_rule->action;
	327	midrule->action_location = dummy_location;
	328	current_rule->action = NULL;
	329	/* If $$ was used in the action, the LHS of the enclosing rule was
	330	incorrectly flagged as used. */
	331	midrule->used = current_rule->used;
	332	current_rule->used = false;
	333
	334	if (previous_rule_end)
	335	previous_rule_end->next = midrule;
	336	else
	337	grammar = midrule;
	338
	339	/* End the dummy's rule. */
	340	midrule->next = symbol_list_new (NULL, dummy_location);
	341	grammar_rule_check (midrule);
	342	midrule->next->next = current_rule;
	343
	344	previous_rule_end = midrule->next;
	345
	346	/* Insert the dummy nonterminal replacing the midrule action into
	347	the current rule. Bind it to its dedicated rule. */
	348	grammar_current_rule_symbol_append (dummy, dummy_location);
	349	grammar_end->midrule = midrule;
	350	}
	351
	352	/* Set the precedence symbol of the current rule to PRECSYM. */
	353
	354	void
	355	grammar_current_rule_prec_set (symbol *precsym, location loc)
	356	{
	357	if (current_rule->ruleprec)
	358	complain_at (loc, _("only one %s allowed per rule"), "%prec");
	359	current_rule->ruleprec = precsym;
	360	}
	361
	362	/* Attach dynamic precedence DPREC to the current rule. */
	363
	364	void
	365	grammar_current_rule_dprec_set (int dprec, location loc)
	366	{
	367	if (! glr_parser)
	368	warn_at (loc, _("%s affects only GLR parsers"), "%dprec");
	369	if (dprec <= 0)
	370	complain_at (loc, _("%s must be followed by positive number"), "%dprec");
	371	else if (current_rule->dprec != 0)
	372	complain_at (loc, _("only one %s allowed per rule"), "%dprec");
	373	current_rule->dprec = dprec;
	374	}
	375
	376	/* Attach a merge function NAME with argument type TYPE to current
	377	rule. */
	378
	379	void
	380	grammar_current_rule_merge_set (uniqstr name, location loc)
	381	{
	382	if (! glr_parser)
	383	warn_at (loc, _("%s affects only GLR parsers"), "%merge");
	384	if (current_rule->merger != 0)
	385	complain_at (loc, _("only one %s allowed per rule"), "%merge");
	386	current_rule->merger =
	387	get_merge_function (name, current_rule->sym->type_name, loc);
	388	}
	389
	390	/* Attach SYM to the current rule. If needed, move the previous
	391	action as a mid-rule action. */
	392
	393	void
	394	grammar_current_rule_symbol_append (symbol *sym, location loc)
	395	{
	396	if (current_rule->action)
	397	grammar_midrule_action ();
	398	grammar_symbol_append (sym, loc);
	399	}
	400
	401	/* Attach an ACTION to the current rule. */
	402
	403	void
	404	grammar_current_rule_action_append (const char *action, location loc)
	405	{
	406	if (current_rule->action)
	407	grammar_midrule_action ();
	408	current_rule->action = translate_rule_action (current_rule, action, loc);
	409	current_rule->action_location = loc;
	410	}
	411
	412	\f
	413	/*---------------------------------------------------------------.
	414	\| Convert the rules into the representation using RRHS, RLHS and \|
	415	\| RITEM. \|
	416	`---------------------------------------------------------------*/
	417
	418	static void
	419	packgram (void)
	420	{
	421	unsigned int itemno = 0;
	422	rule_number ruleno = 0;
	423	symbol_list *p = grammar;
	424
	425	ritem = xnmalloc (nritems + 1, sizeof *ritem);
	426
	427	/* This sentinel is used by build_relations in gram.c. */
	428	*ritem++ = 0;
	429
	430	rules = xnmalloc (nrules, sizeof *rules);
	431
	432	while (p)
	433	{
	434	int rule_length = 0;
	435	symbol *ruleprec = p->ruleprec;
	436	rules[ruleno].user_number = ruleno;
	437	rules[ruleno].number = ruleno;
	438	rules[ruleno].lhs = p->sym;
	439	rules[ruleno].rhs = ritem + itemno;
	440	rules[ruleno].prec = NULL;
	441	rules[ruleno].dprec = p->dprec;
	442	rules[ruleno].merger = p->merger;
	443	rules[ruleno].precsym = NULL;
	444	rules[ruleno].location = p->location;
	445	rules[ruleno].useful = true;
	446	rules[ruleno].action = p->action;
	447	rules[ruleno].action_location = p->action_location;
	448
	449	for (p = p->next; p && p->sym; p = p->next)
	450	{
	451	++rule_length;
	452
	453	/* Don't allow rule_length == INT_MAX, since that might
	454	cause confusion with strtol if INT_MAX == LONG_MAX. */
	455	if (rule_length == INT_MAX)
	456	fatal_at (rules[ruleno].location, _("rule is too long"));
	457
	458	/* item_number = symbol_number.
	459	But the former needs to contain more: negative rule numbers. */
	460	ritem[itemno++] = symbol_number_as_item_number (p->sym->number);
	461	/* A rule gets by default the precedence and associativity
	462	of its last token. */
	463	if (p->sym->class == token_sym && default_prec)
	464	rules[ruleno].prec = p->sym;
	465	}
	466
	467	/* If this rule has a %prec,
	468	the specified symbol's precedence replaces the default. */
	469	if (ruleprec)
	470	{
	471	rules[ruleno].precsym = ruleprec;
	472	rules[ruleno].prec = ruleprec;
	473	}
	474	/* An item ends by the rule number (negated). */
	475	ritem[itemno++] = rule_number_as_item_number (ruleno);
	476	assert (itemno < ITEM_NUMBER_MAX);
	477	++ruleno;
	478	assert (ruleno < RULE_NUMBER_MAX);
	479
	480	if (p)
	481	p = p->next;
	482	}
	483
	484	assert (itemno == nritems);
	485
	486	if (trace_flag & trace_sets)
	487	ritem_print (stderr);
	488	}
	489	\f
	490	/*------------------------------------------------------------------.
	491	\| Read in the grammar specification and record it in the format \|
	492	\| described in gram.h. All actions are copied into ACTION_OBSTACK, \|
	493	\| in each case forming the body of a C function (YYACTION) which \|
	494	\| contains a switch statement to decide which action to execute. \|
	495	`------------------------------------------------------------------*/
	496
	497	void
	498	reader (void)
	499	{
	500	/* Initialize the symbol table. */
	501	symbols_new ();
	502
	503	/* Construct the accept symbol. */
	504	accept = symbol_get ("$accept", empty_location);
	505	accept->class = nterm_sym;
	506	accept->number = nvars++;
	507
	508	/* Construct the error token */
	509	errtoken = symbol_get ("error", empty_location);
	510	errtoken->class = token_sym;
	511	errtoken->number = ntokens++;
	512
	513	/* Construct a token that represents all undefined literal tokens.
	514	It is always token number 2. */
	515	undeftoken = symbol_get ("$undefined", empty_location);
	516	undeftoken->class = token_sym;
	517	undeftoken->number = ntokens++;
	518
	519	/* Initialize the obstacks. */
	520	obstack_init (&pre_prologue_obstack);
	521	obstack_init (&post_prologue_obstack);
	522
	523	gram_in = xfopen (grammar_file, "r");
	524
	525	gram__flex_debug = trace_flag & trace_scan;
	526	gram_debug = trace_flag & trace_parse;
	527	gram_scanner_initialize ();
	528	gram_parse ();
	529
	530	if (! complaint_issued)
	531	check_and_convert_grammar ();
	532
	533	xfclose (gram_in);
	534	}
	535
	536
	537	/*-------------------------------------------------------------.
	538	\| Check the grammar that has just been read, and convert it to \|
	539	\| internal form. \|
	540	`-------------------------------------------------------------*/
	541
	542	static void
	543	check_and_convert_grammar (void)
	544	{
	545	/* Grammar has been read. Do some checking. */
	546	if (nrules == 0)
	547	fatal (_("no rules in the input grammar"));
	548
	549	/* Report any undefined symbols and consider them nonterminals. */
	550	symbols_check_defined ();
	551
	552	/* If the user did not define her ENDTOKEN, do it now. */
	553	if (!endtoken)
	554	{
	555	endtoken = symbol_get ("$end", empty_location);
	556	endtoken->class = token_sym;
	557	endtoken->number = 0;
	558	/* Value specified by POSIX. */
	559	endtoken->user_token_number = 0;
	560	}
	561
	562	/* Insert the initial rule, whose line is that of the first rule
	563	(not that of the start symbol):
	564
	565	accept: %start EOF. */
	566	{
	567	symbol_list *p = symbol_list_new (accept, empty_location);
	568	p->location = grammar->location;
	569	p->next = symbol_list_new (startsymbol, empty_location);
	570	p->next->next = symbol_list_new (endtoken, empty_location);
	571	p->next->next->next = symbol_list_new (NULL, empty_location);
	572	p->next->next->next->next = grammar;
	573	nrules += 1;
	574	nritems += 3;
	575	grammar = p;
	576	}
	577
	578	assert (nsyms <= SYMBOL_NUMBER_MAXIMUM && nsyms == ntokens + nvars);
	579
	580	/* Assign the symbols their symbol numbers. Write #defines for the
	581	token symbols into FDEFINES if requested. */
	582	symbols_pack ();
	583
	584	/* Convert the grammar into the format described in gram.h. */
	585	packgram ();
	586
	587	/* The grammar as a symbol_list is no longer needed. */
	588	LIST_FREE (symbol_list, grammar);
	589	}