[bison.git] / src / LR0.c

/* Generate the nondeterministic finite state machine for bison,
   Copyright 1984, 1986, 1989, 2000, 2001  Free Software Foundation, Inc.

   This file is part of Bison, the GNU Compiler Compiler.

   Bison is free software; you can redistribute it and/or modify
   it under the terms of the GNU General Public License as published by
   the Free Software Foundation; either version 2, or (at your option)
   any later version.

   Bison is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
   GNU General Public License for more details.

   You should have received a copy of the GNU General Public License
   along with Bison; see the file COPYING.  If not, write to
   the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
   Boston, MA 02111-1307, USA.  */


/* See comments in state.h for the data structures that represent it.
   The entry point is generate_states.  */

#include "system.h"
#include "getargs.h"
#include "gram.h"
#include "state.h"
#include "complain.h"
#include "closure.h"
#include "LR0.h"


/* Number of states created so far.  new_state also uses the current
   value as the number of the state it creates.  */
int nstates;
/* Number of the termination state; assigned at the end of
   augment_automaton.  */
int final_state;
/* Heads of the singly linked lists (chained through `next') of the
   states, shifts records and reductions records built by this file.  */
core *first_state = NULL;
shifts *first_shift = NULL;
reductions *first_reduction = NULL;

/* The state generate_states is currently working on.  */
static core *this_state = NULL;
/* Tails of the three lists above; new records are appended here.  */
static core *last_state = NULL;
static shifts *last_shift = NULL;
static reductions *last_reduction = NULL;

/* Number of valid entries in shift_symbol (and, after append_states,
   in shiftset) for the current state.  */
static int nshifts;
/* Symbols that can be shifted in the current state.  Shares its
   storage with the per-symbol counters built in allocate_itemsets.  */
static short *shift_symbol = NULL;

/* Scratch vector of rule numbers filled in by save_reductions.  */
static short *redset = NULL;
/* Scratch vector of target state numbers filled in by append_states.  */
static short *shiftset = NULL;

/* kernel_base[symbol] .. kernel_end[symbol] delimits, inside
   kernel_items, the item numbers active after shifting SYMBOL.
   kernel_end[symbol] is NULL when SYMBOL cannot be shifted in the
   current state (see new_itemsets).  */
static short **kernel_base = NULL;
static short **kernel_end = NULL;
static short *kernel_items = NULL;

/* hash table for states, to recognize equivalent ones.  Each bucket
   is a chain of states linked through their `link' member.  */

#define	STATE_TABLE_SIZE	1009
static core **state_table = NULL;

\f
static void
allocate_itemsets (void)
{
  short *itemp = NULL;
  int symbol;
  int i;
  int count;
  short *symbol_count = NULL;

  count = 0;
  symbol_count = XCALLOC (short, nsyms);

  itemp = ritem;
  symbol = *itemp++;
  while (symbol)
    {
      if (symbol > 0)
	{
	  count++;
	  symbol_count[symbol]++;
	}
      symbol = *itemp++;
    }

  /* See comments before new_itemsets.  All the vectors of items
     live inside KERNEL_ITEMS.  The number of active items after
     some symbol cannot be more than the number of times that symbol
     appears as an item, which is symbol_count[symbol].
     We allocate that much space for each symbol.  */

  kernel_base = XCALLOC (short *, nsyms);
  if (count)
    kernel_items = XCALLOC (short, count);

  count = 0;
  for (i = 0; i < nsyms; i++)
    {
      kernel_base[i] = kernel_items + count;
      count += symbol_count[i];
    }

  shift_symbol = symbol_count;
  kernel_end = XCALLOC (short *, nsyms);
}


/* Allocate every work area used while generating the states: the
   kernel item vectors, the per-state scratch vectors and the hash
   table of states.  Released again by free_storage.  */

static void
allocate_storage (void)
{
  allocate_itemsets ();

  /* Empty hash table: one bucket head per hash value.  */
  state_table = XCALLOC (core *, STATE_TABLE_SIZE);
  /* Scratch vectors: rule numbers and shift target states.  */
  redset = XCALLOC (short, nrules + 1);
  shiftset = XCALLOC (short, nsyms);
}


/* Release everything obtained by allocate_storage.

   Each pointer is reset to NULL once released so that no dangling
   pointer survives at file scope.  This matters in particular for
   kernel_items, which allocate_itemsets only allocates when the
   grammar has at least one item: a stale value left here would be
   freed a second time by a later call.  */

static void
free_storage (void)
{
  XFREE (shift_symbol);
  shift_symbol = NULL;
  XFREE (redset);
  redset = NULL;
  XFREE (shiftset);
  shiftset = NULL;
  XFREE (kernel_base);
  kernel_base = NULL;
  XFREE (kernel_end);
  kernel_end = NULL;
  XFREE (kernel_items);
  kernel_items = NULL;
  XFREE (state_table);
  state_table = NULL;
}


/*----------------------------------------------------------------.
| Find which symbols can be shifted in the current state, and for |
| each one record which items would be active after that shift.   |
| Uses the contents of itemset.                                   |
|                                                                 |
| shift_symbol is set to a vector of the symbols that can be      |
| shifted.  For each symbol in the grammar, kernel_base[symbol]   |
| points to a vector of item numbers activated if that symbol is  |
| shifted, and kernel_end[symbol] points after the end of that    |
| vector.                                                         |
`----------------------------------------------------------------*/

static void
new_itemsets (void)
{
  int i;
  int shiftcount;

  if (trace_flag)
    fprintf (stderr, "Entering new_itemsets, state = %d\n", nstates);

  for (i = 0; i < nsyms; i++)
    kernel_end[i] = NULL;

  shiftcount = 0;

  for (i = 0; i < itemsetend - itemset; ++i)
    {
      int symbol = ritem[itemset[i]];
      if (symbol > 0)
	{
	  short *ksp = kernel_end[symbol];

	  if (!ksp)
	    {
	      shift_symbol[shiftcount] = symbol;
	      ksp = kernel_base[symbol];
	      shiftcount++;
	    }

	  *ksp++ = itemset[i] + 1;
	  kernel_end[symbol] = ksp;
	}
    }

  nshifts = shiftcount;
}


/*-----------------------------------------------------------------.
| Subroutine of get_state.  Create a new state for those items, if |
| necessary.                                                       |
`-----------------------------------------------------------------*/

static core *
new_state (int symbol)
{
  int n;
  core *p;

  if (trace_flag)
    fprintf (stderr, "Entering new_state, state = %d, symbol = %d\n",
	     nstates, symbol);

  if (nstates >= MAXSHORT)
    fatal (_("too many states (max %d)"), MAXSHORT);

  n = kernel_end[symbol] - kernel_base[symbol];

  p = CORE_ALLOC (n);
  p->accessing_symbol = symbol;
  p->number = nstates;
  p->nitems = n;

  shortcpy (p->items, kernel_base[symbol], n);

  last_state->next = p;
  last_state = p;
  nstates++;

  return p;
}


/*--------------------------------------------------------------.
| Find the state number for the state we would get to (from the |
| current state) by shifting symbol.  Create a new state if no  |
| equivalent one exists already.  Used by append_states.        |
`--------------------------------------------------------------*/

static int
get_state (int symbol)
{
  int key;
  short *isp2;
  int i;
  core *sp;

  int n = kernel_end[symbol] - kernel_base[symbol];

  if (trace_flag)
    fprintf (stderr, "Entering get_state, state = %d, symbol = %d\n",
	     nstates, symbol);

  /* Add up the target state's active item numbers to get a hash key.
     */
  key = 0;
  for (i = 0; i < n; ++i)
    key += kernel_base[symbol][i];
  key = key % STATE_TABLE_SIZE;
  sp = state_table[key];

  if (sp)
    {
      int found = 0;
      while (!found)
	{
	  if (sp->nitems == n)
	    {
	      int i;
	      found = 1;
	      for (i = 0; i < n; ++i)
		if (kernel_base[symbol][i] != sp->items[i])
		  found = 0;
	    }

	  if (!found)
	    {
	      if (sp->link)
		{
		  sp = sp->link;
		}
	      else		/* bucket exhausted and no match */
		{
		  sp = sp->link = new_state (symbol);
		  found = 1;
		}
	    }
	}
    }
  else				/* bucket is empty */
    {
      state_table[key] = sp = new_state (symbol);
    }

  return sp->number;
}

/*------------------------------------------------------------------.
| Use the information computed by new_itemsets to find the state    |
| numbers reached by each shift transition from the current state.  |
|                                                                   |
| shiftset is set up as a vector of state numbers of those states.  |
`------------------------------------------------------------------*/

static void
append_states (void)
{
  int pos;

  if (trace_flag)
    fprintf (stderr, "Entering append_states\n");

  /* Insertion sort of shift_symbol into increasing order: each symbol
     is held aside while the larger ones before it slide up one slot.  */
  for (pos = 1; pos < nshifts; ++pos)
    {
      int pending = shift_symbol[pos];
      int hole;

      for (hole = pos; hole > 0 && shift_symbol[hole - 1] > pending; --hole)
        shift_symbol[hole] = shift_symbol[hole - 1];
      shift_symbol[hole] = pending;
    }

  /* Resolve each shifted symbol, in sorted order, to the number of
     the state it leads to; get_state creates missing states.  */
  for (pos = 0; pos < nshifts; ++pos)
    shiftset[pos] = get_state (shift_symbol[pos]);
}


static void
new_states (void)
{
  first_state = last_state = this_state = CORE_ALLOC (0);
  nstates = 1;
}


/* Record the NSHIFTS target states found in SHIFTSET as the shifts
   of the current state, and append that record to the list of
   shifts.  */

static void
save_shifts (void)
{
  shifts *entry = SHIFTS_ALLOC (nshifts);

  entry->nshifts = nshifts;
  entry->number = this_state->number;
  shortcpy (entry->shifts, shiftset, nshifts);

  /* The very first record also becomes the head of the list.  */
  if (!last_shift)
    first_shift = entry;
  else
    last_shift->next = entry;
  last_shift = entry;
}


/*------------------------------------------------------------------.
| Subroutine of augment_automaton.  Create the next-to-final state, |
| to which a shift has already been made in the initial state.      |
`------------------------------------------------------------------*/

static void
insert_start_shift (void)
{
  core *statep;
  shifts *sp;

  statep = CORE_ALLOC (0);
  statep->number = nstates;
  statep->accessing_symbol = start_symbol;

  last_state->next = statep;
  last_state = statep;

  /* Make a shift from this state to (what will be) the final state.  */
  sp = SHIFTS_ALLOC (1);
  sp->number = nstates++;
  sp->nshifts = 1;
  sp->shifts[0] = nstates;

  last_shift->next = sp;
  last_shift = sp;
}


/*------------------------------------------------------------------.
| Make sure that the initial state has a shift that accepts the     |
| grammar's start symbol and goes to the next-to-final state, which |
| has a shift going to the final state, which has a shift to the    |
| termination state.  Create such states and shifts if they don't   |
| happen to exist already.                                          |
`------------------------------------------------------------------*/

static void
augment_automaton (void)
{
  int i;
  int k;
  core *statep;
  shifts *sp;
  shifts *sp2;
  /* Predecessor of SP while walking the chain of shifts.  */
  shifts *sp1 = NULL;

  sp = first_shift;

  /* Three situations are told apart below: the initial state has
     shifts (with or without one on start_symbol), only other states
     have shifts, or no state has any shift at all.  */
  if (sp)
    {
      /* The first shifts record belongs to the initial state.  */
      if (sp->number == 0)
	{
	  k = sp->nshifts;
	  statep = first_state->next;

	  /* The states reached by shifts from first_state are numbered 1...K.
	     Look for one reached by start_symbol.  */
	  while (statep->accessing_symbol < start_symbol
		 && statep->number < k)
	    statep = statep->next;

	  if (statep->accessing_symbol == start_symbol)
	    {
	      /* We already have a next-to-final state.
	         Make sure it has a shift to what will be the final state.  */
	      k = statep->number;

	      /* Find the shifts record of state K, or the place where it
		 belongs.  The first record has number 0 and K is at least
		 1, so this loop runs at least once and SP1 is non-NULL
		 afterwards.  */
	      while (sp && sp->number < k)
		{
		  sp1 = sp;
		  sp = sp->next;
		}

	      if (sp && sp->number == k)
		{
		  /* State K already has shifts: build a copy of its record
		     with the shift to the final state put in front.  */
		  sp2 = SHIFTS_ALLOC (sp->nshifts + 1);
		  sp2->number = k;
		  sp2->nshifts = sp->nshifts + 1;
		  sp2->shifts[0] = nstates;
		  for (i = sp->nshifts; i > 0; i--)
		    sp2->shifts[i] = sp->shifts[i - 1];

		  /* Patch sp2 into the chain of shifts in place of sp,
		     following sp1.  */
		  sp2->next = sp->next;
		  sp1->next = sp2;
		  if (sp == last_shift)
		    last_shift = sp2;
		  XFREE (sp);
		}
	      else
		{
		  /* State K has no shifts yet: give it a record holding
		     only the shift to the final state.  */
		  sp2 = SHIFTS_ALLOC (1);
		  sp2->number = k;
		  sp2->nshifts = 1;
		  sp2->shifts[0] = nstates;

		  /* Patch sp2 into the chain of shifts between sp1 and sp.  */
		  sp2->next = sp;
		  sp1->next = sp2;
		  if (sp == 0)
		    last_shift = sp2;
		}
	    }
	  else
	    {
	      /* There is no next-to-final state as yet.  */
	      /* Add one more shift in first_shift,
	         going to the next-to-final state (yet to be made).  */
	      sp = first_shift;

	      /* NOTE(review): sp2->number is never assigned on this path;
		 presumably SHIFTS_ALLOC zero-fills the record so that it
		 stays 0 (the initial state) -- confirm in state.h.  */
	      sp2 = SHIFTS_ALLOC (sp->nshifts + 1);
	      sp2->nshifts = sp->nshifts + 1;

	      /* Stick this shift into the vector at the proper place.  */
	      /* I indexes the old vector and K the new one; they are equal
		 as long as the new shift has not been inserted.  STATEP
		 follows the target states in step with I.  */
	      statep = first_state->next;
	      for (k = 0, i = 0; i < sp->nshifts; k++, i++)
		{
		  if (statep->accessing_symbol > start_symbol && i == k)
		    sp2->shifts[k++] = nstates;
		  sp2->shifts[k] = sp->shifts[i];
		  statep = statep->next;
		}
	      /* Not inserted yet: the new shift goes last.  */
	      if (i == k)
		sp2->shifts[k++] = nstates;

	      /* Patch sp2 into the chain of shifts
	         in place of sp, at the beginning.  */
	      sp2->next = sp->next;
	      first_shift = sp2;
	      if (last_shift == sp)
		last_shift = sp2;

	      XFREE (sp);

	      /* Create the next-to-final state, with shift to
	         what will be the final state.  */
	      insert_start_shift ();
	    }
	}
      else
	{
	  /* The initial state didn't even have any shifts.
	     Give it one shift, to the next-to-final state.  */
	  /* NOTE(review): sp->number is left unassigned here as well;
	     presumably zero from SHIFTS_ALLOC -- confirm.  */
	  sp = SHIFTS_ALLOC (1);
	  sp->nshifts = 1;
	  sp->shifts[0] = nstates;

	  /* Patch sp into the chain of shifts at the beginning.  */
	  sp->next = first_shift;
	  first_shift = sp;

	  /* Create the next-to-final state, with shift to
	     what will be the final state.  */
	  insert_start_shift ();
	}
    }
  else
    {
      /* There are no shifts for any state.
         Make one shift, from the initial state to the next-to-final state.  */

      /* NOTE(review): sp->number is left unassigned here too;
         presumably zero from SHIFTS_ALLOC -- confirm.  */
      sp = SHIFTS_ALLOC (1);
      sp->nshifts = 1;
      sp->shifts[0] = nstates;

      /* Initialize the chain of shifts with sp.  */
      first_shift = sp;
      last_shift = sp;

      /* Create the next-to-final state, with shift to
         what will be the final state.  */
      insert_start_shift ();
    }

  /* Make the final state--the one that follows a shift from the
     next-to-final state.
     The symbol for that shift is 0 (end-of-file).  */
  statep = CORE_ALLOC (0);
  statep->number = nstates;
  last_state->next = statep;
  last_state = statep;

  /* Make the shift from the final state to the termination state.  */
  /* The record takes the final state's number; NSTATES then moves on
     to the number of the termination state, the target of the shift.  */
  sp = SHIFTS_ALLOC (1);
  sp->number = nstates++;
  sp->nshifts = 1;
  sp->shifts[0] = nstates;
  last_shift->next = sp;
  last_shift = sp;

  /* Note that the variable `final_state' refers to what we sometimes call
     the termination state.  */
  final_state = nstates;

  /* Make the termination state.  */
  statep = CORE_ALLOC (0);
  statep->number = nstates++;
  last_state->next = statep;
  last_state = statep;
}


/*----------------------------------------------------------------.
| Find which rules can be used for reduction transitions from the |
| current state and make a reductions structure for the state to  |
| record their rule numbers.                                      |
`----------------------------------------------------------------*/

static void
save_reductions (void)
{
  short *isp;
  int item;
  int count;
  reductions *p;

  short *rend;

  /* Find and count the active items that represent ends of rules. */

  count = 0;
  for (isp = itemset; isp < itemsetend; isp++)
    {
      item = ritem[*isp];
      if (item < 0)
	redset[count++] = -item;
    }

  /* Make a reductions structure and copy the data into it.  */

  if (count)
    {
      p = REDUCTIONS_ALLOC (count);

      p->number = this_state->number;
      p->nreds = count;

      shortcpy (p->rules, redset, count);

      if (last_reduction)
	last_reduction->next = p;
      else
	first_reduction = p;
      last_reduction = p;
    }
}

\f
/*-------------------------------------------------------------------.
| Compute the nondeterministic finite state machine (see state.h for |
| details) from the grammar.                                         |
`-------------------------------------------------------------------*/

void
generate_states (void)
{
  allocate_storage ();
  new_closure (nitems);
  new_states ();

  /* New states are appended to the list as they are created, so
     following the `next' links visits every state exactly once.  */
  for (; this_state; this_state = this_state->next)
    {
      /* Compute the closure of the kernel items of this state; the
         steps below read the result from itemset .. itemsetend.  */
      closure (this_state->items, this_state->nitems);

      /* Reductions possible in this state.  */
      save_reductions ();

      /* Kernel item vectors of the states reachable by one shift...  */
      new_itemsets ();
      /* ...and the numbers of those states, created when missing.  */
      append_states ();

      /* Only states that actually shift get a shifts record.  */
      if (nshifts > 0)
        save_shifts ();
    }

  /* The work areas are not needed any more.  */
  free_closure ();
  free_storage ();

  /* Add the states and shifts the parser expects around the start
     symbol and the end of input.  */
  augment_automaton ();
}
Commit	Line	Data
40675e7c	1	/* Generate the nondeterministic finite state machine for bison,
97db7bd4	2	Copyright 1984, 1986, 1989, 2000, 2001 Free Software Foundation, Inc.
40675e7c	3
2fa6973e	4	This file is part of Bison, the GNU Compiler Compiler.
40675e7c	5
2fa6973e AD	6	Bison is free software; you can redistribute it and/or modify
	7	it under the terms of the GNU General Public License as published by
	8	the Free Software Foundation; either version 2, or (at your option)
	9	any later version.
40675e7c	10
2fa6973e AD	11	Bison is distributed in the hope that it will be useful,
	12	but WITHOUT ANY WARRANTY; without even the implied warranty of
	13	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	14	GNU General Public License for more details.
40675e7c	15
2fa6973e AD	16	You should have received a copy of the GNU General Public License
	17	along with Bison; see the file COPYING. If not, write to
	18	the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
	19	Boston, MA 02111-1307, USA. */
40675e7c DM	20
	21
	22	/* See comments in state.h for the data structures that represent it.
	23	The entry point is generate_states. */
	24
40675e7c	25	#include "system.h"
9bfe901c	26	#include "getargs.h"
40675e7c DM	27	#include "gram.h"
40675e7c DM	28	#include "state.h"
a0f6b076	29	#include "complain.h"
2fa6973e	30	#include "closure.h"
403b315b	31	#include "LR0.h"
40675e7c	32
40675e7c	33
40675e7c DM	34	int nstates;
40675e7c DM	35	int final_state;
342b8b6e AD	36	core *first_state = NULL;
	37	shifts *first_shift = NULL;
	38	reductions *first_reduction = NULL;
40675e7c	39
342b8b6e AD	40	static core *this_state = NULL;
	41	static core *last_state = NULL;
	42	static shifts *last_shift = NULL;
	43	static reductions *last_reduction = NULL;
40675e7c DM	44
40675e7c DM	45	static int nshifts;
342b8b6e	46	static short *shift_symbol = NULL;
40675e7c	47
342b8b6e AD	48	static short *redset = NULL;
342b8b6e AD	49	static short *shiftset = NULL;
40675e7c	50
342b8b6e AD	51	static short **kernel_base = NULL;
	52	static short **kernel_end = NULL;
	53	static short *kernel_items = NULL;
40675e7c DM	54
	55	/* hash table for states, to recognize equivalent ones. */
	56
	57	#define STATE_TABLE_SIZE 1009
342b8b6e	58	static core **state_table = NULL;
40675e7c	59
2fa6973e	60	\f
4a120d45	61	static void
d2729d44	62	allocate_itemsets (void)
40675e7c	63	{
342b8b6e	64	short *itemp = NULL;
2fa6973e AD	65	int symbol;
	66	int i;
	67	int count;
342b8b6e	68	short *symbol_count = NULL;
40675e7c DM	69
40675e7c DM	70	count = 0;
d7913476	71	symbol_count = XCALLOC (short, nsyms);
40675e7c DM	72
	73	itemp = ritem;
	74	symbol = *itemp++;
	75	while (symbol)
	76	{
	77	if (symbol > 0)
	78	{
	79	count++;
	80	symbol_count[symbol]++;
	81	}
	82	symbol = *itemp++;
	83	}
	84
2fa6973e AD	85	/* See comments before new_itemsets. All the vectors of items
2fa6973e AD	86	live inside KERNEL_ITEMS. The number of active items after
40675e7c DM	87	some symbol cannot be more than the number of times that symbol
	88	appears as an item, which is symbol_count[symbol].
	89	We allocate that much space for each symbol. */
	90
d7913476	91	kernel_base = XCALLOC (short *, nsyms);
342b8b6e AD	92	if (count)
342b8b6e AD	93	kernel_items = XCALLOC (short, count);
40675e7c DM	94
	95	count = 0;
	96	for (i = 0; i < nsyms; i++)
	97	{
	98	kernel_base[i] = kernel_items + count;
	99	count += symbol_count[i];
	100	}
	101
	102	shift_symbol = symbol_count;
d7913476	103	kernel_end = XCALLOC (short *, nsyms);
40675e7c DM	104	}
	105
	106
4a120d45	107	static void
d2729d44	108	allocate_storage (void)
40675e7c	109	{
2fa6973e	110	allocate_itemsets ();
40675e7c	111
d7913476 AD	112	shiftset = XCALLOC (short, nsyms);
	113	redset = XCALLOC (short, nrules + 1);
	114	state_table = XCALLOC (core *, STATE_TABLE_SIZE);
40675e7c DM	115	}
	116
	117
4a120d45	118	static void
d2729d44	119	free_storage (void)
40675e7c	120	{
d7913476 AD	121	XFREE (shift_symbol);
	122	XFREE (redset);
	123	XFREE (shiftset);
	124	XFREE (kernel_base);
	125	XFREE (kernel_end);
	126	XFREE (kernel_items);
	127	XFREE (state_table);
40675e7c DM	128	}
	129
	130
	131
40675e7c	132
2fa6973e AD	133	/*----------------------------------------------------------------.
	134	\| Find which symbols can be shifted in the current state, and for \|
	135	\| each one record which items would be active after that shift. \|
	136	\| Uses the contents of itemset. \|
	137	\| \|
	138	\| shift_symbol is set to a vector of the symbols that can be \|
	139	\| shifted. For each symbol in the grammar, kernel_base[symbol] \|
	140	\| points to a vector of item numbers activated if that symbol is \|
	141	\| shifted, and kernel_end[symbol] points after the end of that \|
	142	\| vector. \|
	143	`----------------------------------------------------------------*/
40675e7c	144
4a120d45	145	static void
d2729d44	146	new_itemsets (void)
40675e7c	147	{
2fa6973e AD	148	int i;
2fa6973e AD	149	int shiftcount;
2fa6973e	150
9bfe901c AD	151	if (trace_flag)
9bfe901c AD	152	fprintf (stderr, "Entering new_itemsets, state = %d\n", nstates);
40675e7c DM	153
	154	for (i = 0; i < nsyms; i++)
	155	kernel_end[i] = NULL;
	156
	157	shiftcount = 0;
	158
97db7bd4	159	for (i = 0; i < itemsetend - itemset; ++i)
40675e7c	160	{
97db7bd4	161	int symbol = ritem[itemset[i]];
40675e7c DM	162	if (symbol > 0)
40675e7c DM	163	{
97db7bd4	164	short *ksp = kernel_end[symbol];
40675e7c	165
2fa6973e	166	if (!ksp)
40675e7c	167	{
97db7bd4	168	shift_symbol[shiftcount] = symbol;
40675e7c	169	ksp = kernel_base[symbol];
97db7bd4	170	shiftcount++;
40675e7c DM	171	}
40675e7c DM	172
97db7bd4	173	*ksp++ = itemset[i] + 1;
2fa6973e	174	kernel_end[symbol] = ksp;
40675e7c DM	175	}
	176	}
	177
	178	nshifts = shiftcount;
	179	}
	180
	181
	182
2fa6973e AD	183	/*-----------------------------------------------------------------.
	184	\| Subroutine of get_state. Create a new state for those items, if \|
	185	\| necessary. \|
	186	`-----------------------------------------------------------------*/
40675e7c	187
2fa6973e AD	188	static core *
2fa6973e AD	189	new_state (int symbol)
40675e7c	190	{
2fa6973e AD	191	int n;
2fa6973e AD	192	core *p;
40675e7c	193
9bfe901c AD	194	if (trace_flag)
	195	fprintf (stderr, "Entering new_state, state = %d, symbol = %d\n",
	196	nstates, symbol);
40675e7c	197
2fa6973e AD	198	if (nstates >= MAXSHORT)
2fa6973e AD	199	fatal (_("too many states (max %d)"), MAXSHORT);
40675e7c	200
300f275f	201	n = kernel_end[symbol] - kernel_base[symbol];
40675e7c	202
f59c437a	203	p = CORE_ALLOC (n);
2fa6973e AD	204	p->accessing_symbol = symbol;
	205	p->number = nstates;
	206	p->nitems = n;
	207
300f275f	208	shortcpy (p->items, kernel_base[symbol], n);
2fa6973e AD	209
	210	last_state->next = p;
	211	last_state = p;
2fa6973e	212	nstates++;
40675e7c	213
2fa6973e AD	214	return p;
2fa6973e AD	215	}
40675e7c	216
2fa6973e AD	217
	218	/*--------------------------------------------------------------.
	219	\| Find the state number for the state we would get to (from the \|
	220	\| current state) by shifting symbol. Create a new state if no \|
97db7bd4	221	\| equivalent one exists already. Used by append_states. \|
2fa6973e	222	`--------------------------------------------------------------*/
40675e7c	223
4a120d45	224	static int
d2729d44	225	get_state (int symbol)
40675e7c	226	{
2fa6973e	227	int key;
2fa6973e	228	short *isp2;
97db7bd4	229	int i;
2fa6973e	230	core *sp;
40675e7c	231
97db7bd4	232	int n = kernel_end[symbol] - kernel_base[symbol];
40675e7c	233
9bfe901c AD	234	if (trace_flag)
	235	fprintf (stderr, "Entering get_state, state = %d, symbol = %d\n",
	236	nstates, symbol);
40675e7c	237
97db7bd4 AD	238	/* Add up the target state's active item numbers to get a hash key.
97db7bd4 AD	239	*/
40675e7c	240	key = 0;
97db7bd4 AD	241	for (i = 0; i < n; ++i)
97db7bd4 AD	242	key += kernel_base[symbol][i];
40675e7c	243	key = key % STATE_TABLE_SIZE;
40675e7c DM	244	sp = state_table[key];
	245
	246	if (sp)
	247	{
97db7bd4	248	int found = 0;
40675e7c DM	249	while (!found)
	250	{
	251	if (sp->nitems == n)
	252	{
97db7bd4	253	int i;
40675e7c	254	found = 1;
97db7bd4 AD	255	for (i = 0; i < n; ++i)
	256	if (kernel_base[symbol][i] != sp->items[i])
	257	found = 0;
40675e7c DM	258	}
	259
	260	if (!found)
	261	{
	262	if (sp->link)
	263	{
	264	sp = sp->link;
	265	}
2fa6973e	266	else /* bucket exhausted and no match */
40675e7c	267	{
2fa6973e	268	sp = sp->link = new_state (symbol);
40675e7c DM	269	found = 1;
	270	}
	271	}
	272	}
	273	}
2fa6973e	274	else /* bucket is empty */
40675e7c	275	{
2fa6973e	276	state_table[key] = sp = new_state (symbol);
40675e7c DM	277	}
40675e7c DM	278
36281465	279	return sp->number;
40675e7c DM	280	}
40675e7c DM	281
2fa6973e AD	282	/*------------------------------------------------------------------.
	283	\| Use the information computed by new_itemsets to find the state \|
	284	\| numbers reached by each shift transition from the current state. \|
	285	\| \|
	286	\| shiftset is set up as a vector of state numbers of those states. \|
	287	`------------------------------------------------------------------*/
40675e7c	288
2fa6973e AD	289	static void
2fa6973e AD	290	append_states (void)
40675e7c	291	{
2fa6973e AD	292	int i;
	293	int j;
	294	int symbol;
40675e7c	295
9bfe901c AD	296	if (trace_flag)
	297	fprintf (stderr, "Entering append_states\n");
	298
40675e7c	299
2fa6973e	300	/* first sort shift_symbol into increasing order */
40675e7c	301
2fa6973e AD	302	for (i = 1; i < nshifts; i++)
	303	{
	304	symbol = shift_symbol[i];
	305	j = i;
	306	while (j > 0 && shift_symbol[j - 1] > symbol)
	307	{
	308	shift_symbol[j] = shift_symbol[j - 1];
	309	j--;
	310	}
	311	shift_symbol[j] = symbol;
	312	}
40675e7c	313
2fa6973e	314	for (i = 0; i < nshifts; i++)
97db7bd4	315	shiftset[i] = get_state (shift_symbol[i]);
40675e7c DM	316	}
	317
	318
4a120d45	319	static void
2fa6973e	320	new_states (void)
40675e7c	321	{
97db7bd4	322	first_state = last_state = this_state = CORE_ALLOC (0);
40675e7c DM	323	nstates = 1;
	324	}
	325
	326
4a120d45	327	static void
d2729d44	328	save_shifts (void)
40675e7c	329	{
97db7bd4	330	shifts *p = SHIFTS_ALLOC (nshifts);
40675e7c DM	331
	332	p->number = this_state->number;
	333	p->nshifts = nshifts;
	334
300f275f	335	shortcpy (p->shifts, shiftset, nshifts);
40675e7c DM	336
40675e7c DM	337	if (last_shift)
97db7bd4	338	last_shift->next = p;
40675e7c	339	else
97db7bd4 AD	340	first_shift = p;
97db7bd4 AD	341	last_shift = p;
40675e7c DM	342	}
	343
	344
2fa6973e AD	345	/*------------------------------------------------------------------.
	346	\| Subroutine of augment_automaton. Create the next-to-final state, \|
	347	\| to which a shift has already been made in the initial state. \|
	348	`------------------------------------------------------------------*/
40675e7c	349
4a120d45	350	static void
2fa6973e	351	insert_start_shift (void)
40675e7c	352	{
2fa6973e AD	353	core *statep;
2fa6973e AD	354	shifts *sp;
40675e7c	355
f59c437a	356	statep = CORE_ALLOC (0);
2fa6973e AD	357	statep->number = nstates;
2fa6973e AD	358	statep->accessing_symbol = start_symbol;
40675e7c	359
2fa6973e AD	360	last_state->next = statep;
2fa6973e AD	361	last_state = statep;
40675e7c	362
2fa6973e	363	/* Make a shift from this state to (what will be) the final state. */
f59c437a	364	sp = SHIFTS_ALLOC (1);
2fa6973e AD	365	sp->number = nstates++;
	366	sp->nshifts = 1;
	367	sp->shifts[0] = nstates;
40675e7c	368
2fa6973e AD	369	last_shift->next = sp;
2fa6973e AD	370	last_shift = sp;
40675e7c DM	371	}
	372
	373
2fa6973e AD	374	/*------------------------------------------------------------------.
	375	\| Make sure that the initial state has a shift that accepts the \|
	376	\| grammar's start symbol and goes to the next-to-final state, which \|
	377	\| has a shift going to the final state, which has a shift to the \|
	378	\| termination state. Create such states and shifts if they don't \|
	379	\| happen to exist already. \|
	380	`------------------------------------------------------------------*/
40675e7c	381
4a120d45	382	static void
d2729d44	383	augment_automaton (void)
40675e7c	384	{
2fa6973e AD	385	int i;
	386	int k;
	387	core *statep;
	388	shifts *sp;
	389	shifts *sp2;
	390	shifts *sp1 = NULL;
40675e7c DM	391
	392	sp = first_shift;
	393
	394	if (sp)
	395	{
	396	if (sp->number == 0)
	397	{
	398	k = sp->nshifts;
	399	statep = first_state->next;
	400
	401	/* The states reached by shifts from first_state are numbered 1...K.
	402	Look for one reached by start_symbol. */
	403	while (statep->accessing_symbol < start_symbol
2fa6973e	404	&& statep->number < k)
40675e7c DM	405	statep = statep->next;
	406
	407	if (statep->accessing_symbol == start_symbol)
	408	{
	409	/* We already have a next-to-final state.
2fa6973e	410	Make sure it has a shift to what will be the final state. */
40675e7c DM	411	k = statep->number;
	412
	413	while (sp && sp->number < k)
	414	{
	415	sp1 = sp;
	416	sp = sp->next;
	417	}
	418
	419	if (sp && sp->number == k)
	420	{
f59c437a	421	sp2 = SHIFTS_ALLOC (sp->nshifts + 1);
40675e7c DM	422	sp2->number = k;
	423	sp2->nshifts = sp->nshifts + 1;
	424	sp2->shifts[0] = nstates;
	425	for (i = sp->nshifts; i > 0; i--)
	426	sp2->shifts[i] = sp->shifts[i - 1];
	427
	428	/* Patch sp2 into the chain of shifts in place of sp,
	429	following sp1. */
	430	sp2->next = sp->next;
	431	sp1->next = sp2;
	432	if (sp == last_shift)
	433	last_shift = sp2;
d7913476	434	XFREE (sp);
40675e7c DM	435	}
	436	else
	437	{
f59c437a	438	sp2 = SHIFTS_ALLOC (1);
40675e7c DM	439	sp2->number = k;
	440	sp2->nshifts = 1;
	441	sp2->shifts[0] = nstates;
	442
	443	/* Patch sp2 into the chain of shifts between sp1 and sp. */
	444	sp2->next = sp;
	445	sp1->next = sp2;
	446	if (sp == 0)
	447	last_shift = sp2;
	448	}
	449	}
	450	else
	451	{
	452	/* There is no next-to-final state as yet. */
	453	/* Add one more shift in first_shift,
2fa6973e	454	going to the next-to-final state (yet to be made). */
40675e7c DM	455	sp = first_shift;
40675e7c DM	456
f59c437a	457	sp2 = SHIFTS_ALLOC (sp->nshifts + 1);
40675e7c DM	458	sp2->nshifts = sp->nshifts + 1;
	459
	460	/* Stick this shift into the vector at the proper place. */
	461	statep = first_state->next;
	462	for (k = 0, i = 0; i < sp->nshifts; k++, i++)
	463	{
	464	if (statep->accessing_symbol > start_symbol && i == k)
	465	sp2->shifts[k++] = nstates;
	466	sp2->shifts[k] = sp->shifts[i];
	467	statep = statep->next;
	468	}
	469	if (i == k)
	470	sp2->shifts[k++] = nstates;
	471
	472	/* Patch sp2 into the chain of shifts
2fa6973e	473	in place of sp, at the beginning. */
40675e7c DM	474	sp2->next = sp->next;
	475	first_shift = sp2;
	476	if (last_shift == sp)
	477	last_shift = sp2;
	478
d7913476	479	XFREE (sp);
40675e7c DM	480
40675e7c DM	481	/* Create the next-to-final state, with shift to
2fa6973e AD	482	what will be the final state. */
2fa6973e AD	483	insert_start_shift ();
40675e7c DM	484	}
	485	}
	486	else
	487	{
	488	/* The initial state didn't even have any shifts.
	489	Give it one shift, to the next-to-final state. */
f59c437a	490	sp = SHIFTS_ALLOC (1);
40675e7c DM	491	sp->nshifts = 1;
	492	sp->shifts[0] = nstates;
	493
	494	/* Patch sp into the chain of shifts at the beginning. */
	495	sp->next = first_shift;
	496	first_shift = sp;
	497
	498	/* Create the next-to-final state, with shift to
	499	what will be the final state. */
2fa6973e	500	insert_start_shift ();
40675e7c DM	501	}
	502	}
	503	else
	504	{
	505	/* There are no shifts for any state.
2fa6973e	506	Make one shift, from the initial state to the next-to-final state. */
40675e7c	507
f59c437a	508	sp = SHIFTS_ALLOC (1);
40675e7c DM	509	sp->nshifts = 1;
	510	sp->shifts[0] = nstates;
	511
	512	/* Initialize the chain of shifts with sp. */
	513	first_shift = sp;
	514	last_shift = sp;
	515
	516	/* Create the next-to-final state, with shift to
2fa6973e AD	517	what will be the final state. */
2fa6973e AD	518	insert_start_shift ();
40675e7c DM	519	}
	520
	521	/* Make the final state--the one that follows a shift from the
	522	next-to-final state.
	523	The symbol for that shift is 0 (end-of-file). */
f59c437a	524	statep = CORE_ALLOC (0);
40675e7c DM	525	statep->number = nstates;
	526	last_state->next = statep;
	527	last_state = statep;
	528
	529	/* Make the shift from the final state to the termination state. */
f59c437a	530	sp = SHIFTS_ALLOC (1);
40675e7c DM	531	sp->number = nstates++;
	532	sp->nshifts = 1;
	533	sp->shifts[0] = nstates;
	534	last_shift->next = sp;
	535	last_shift = sp;
	536
	537	/* Note that the variable `final_state' refers to what we sometimes call
	538	the termination state. */
	539	final_state = nstates;
	540
	541	/* Make the termination state. */
f59c437a	542	statep = CORE_ALLOC (0);
40675e7c DM	543	statep->number = nstates++;
	544	last_state->next = statep;
	545	last_state = statep;
	546	}
	547
	548
2fa6973e AD	549	/*----------------------------------------------------------------.
	550	\| Find which rules can be used for reduction transitions from the \|
	551	\| current state and make a reductions structure for the state to \|
	552	\| record their rule numbers. \|
	553	`----------------------------------------------------------------*/
	554
4a120d45	555	static void
2fa6973e	556	save_reductions (void)
40675e7c	557	{
2fa6973e	558	short *isp;
2fa6973e AD	559	int item;
	560	int count;
	561	reductions *p;
40675e7c	562
2fa6973e	563	short *rend;
40675e7c	564
2fa6973e	565	/* Find and count the active items that represent ends of rules. */
40675e7c	566
2fa6973e AD	567	count = 0;
	568	for (isp = itemset; isp < itemsetend; isp++)
	569	{
	570	item = ritem[*isp];
	571	if (item < 0)
	572	redset[count++] = -item;
	573	}
40675e7c	574
2fa6973e AD	575	/* Make a reductions structure and copy the data into it. */
	576
	577	if (count)
	578	{
f59c437a	579	p = REDUCTIONS_ALLOC (count);
2fa6973e AD	580
	581	p->number = this_state->number;
	582	p->nreds = count;
	583
300f275f	584	shortcpy (p->rules, redset, count);
2fa6973e AD	585
2fa6973e AD	586	if (last_reduction)
97db7bd4	587	last_reduction->next = p;
2fa6973e	588	else
97db7bd4 AD	589	first_reduction = p;
97db7bd4 AD	590	last_reduction = p;
2fa6973e AD	591	}
	592	}
	593
	594	\f
	595	/*-------------------------------------------------------------------.
	596	\| Compute the nondeterministic finite state machine (see state.h for \|
	597	\| details) from the grammar. \|
	598	`-------------------------------------------------------------------*/
	599
	600	void
	601	generate_states (void)
	602	{
	603	allocate_storage ();
	604	new_closure (nitems);
	605	new_states ();
	606
	607	while (this_state)
	608	{
	609	/* Set up ruleset and itemset for the transitions out of this
	610	state. ruleset gets a 1 bit for each rule that could reduce
	611	now. itemset gets a vector of all the items that could be
	612	accepted next. */
	613	closure (this_state->items, this_state->nitems);
	614	/* record the reductions allowed out of this state */
	615	save_reductions ();
	616	/* find the itemsets of the states that shifts can reach */
	617	new_itemsets ();
	618	/* find or create the core structures for those states */
	619	append_states ();
	620
	621	/* create the shifts structures for the shifts to those states,
	622	now that the state numbers transitioning to are known */
	623	if (nshifts > 0)
	624	save_shifts ();
	625
	626	/* states are queued when they are created; process them all */
	627	this_state = this_state->next;
	628	}
	629
	630	/* discard various storage */
	631	free_closure ();
	632	free_storage ();
	633
	634	/* set up initial and final states as parser wants them */
	635	augment_automaton ();
40675e7c	636	}