X-Git-Url: https://git.saurik.com/bison.git/blobdiff_plain/a083fbbf221545ea6e68a831da060d8834f36eca..9a636f47cee64ab6e1f7588c6261fc46ea134c39:/src/closure.c diff --git a/src/closure.c b/src/closure.c index d24fee37..05b299a7 100644 --- a/src/closure.c +++ b/src/closure.c @@ -1,351 +1,295 @@ /* Subroutines for bison - Copyright (C) 1984, 1989 Free Software Foundation, Inc. + Copyright (C) 1984, 1989, 2000, 2001, 2002 Free Software Foundation, Inc. -This file is part of Bison, the GNU Compiler Compiler. + This file is part of Bison, the GNU Compiler Compiler. -Bison is free software; you can redistribute it and/or modify -it under the terms of the GNU General Public License as published by -the Free Software Foundation; either version 2, or (at your option) -any later version. + Bison is free software; you can redistribute it and/or modify it + under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 2, or (at your option) + any later version. -Bison is distributed in the hope that it will be useful, -but WITHOUT ANY WARRANTY; without even the implied warranty of -MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the -GNU General Public License for more details. + Bison is distributed in the hope that it will be useful, but + WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + General Public License for more details. -You should have received a copy of the GNU General Public License -along with Bison; see the file COPYING. If not, write to -the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */ + You should have received a copy of the GNU General Public License + along with Bison; see the file COPYING. If not, write to the Free + Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA + 02111-1307, USA. */ - -/* subroutines of file LR0.c. - -Entry points: - - closure (items, n) - -Given a vector of item numbers items, of length n, -set up ruleset and itemset to indicate what rules could be run -and which items could be accepted when those items are the active ones. - -ruleset contains a bit for each rule. closure sets the bits -for all rules which could potentially describe the next input to be read. - -itemset is a vector of item numbers; itemsetend points to just beyond the end - of the part of it that is significant. -closure places there the indices of all items which represent units of -input that could arrive next. - - initialize_closure (n) - -Allocates the itemset and ruleset vectors, -and precomputes useful data so that closure can be called. -n is the number of elements to allocate for itemset. - - finalize_closure () - -Frees itemset, ruleset and internal data. - -*/ - -#include #include "system.h" -#include "machine.h" -#include "new.h" +#include "quotearg.h" +#include "bitset.h" +#include "bitsetv.h" +#include "getargs.h" +#include "symtab.h" #include "gram.h" +#include "reader.h" +#include "closure.h" +#include "derives.h" - -extern short **derives; -extern char **tags; - -void set_fderives(); -void set_firsts(); - -extern void RTC(); - +/* NITEMSET is the size of the array ITEMSET. */ short *itemset; -short *itemsetend; -static unsigned *ruleset; +int nritemset; -/* internal data. See comments before set_fderives and set_firsts. */ -static unsigned *fderives; -static unsigned *firsts; +static bitset ruleset; -/* number of words required to hold a bit for each rule */ -static int rulesetsize; +/* internal data. See comments before set_fderives and set_firsts. */ +static bitsetv fderives = NULL; +static bitsetv firsts = NULL; -/* number of words required to hold a bit for each variable */ -static int varsetsize; +/* Retrieve the FDERIVES/FIRSTS sets of the nonterminals numbered Var. */ +#define FDERIVES(Var) fderives[(Var) - ntokens] +#define FIRSTS(Var) firsts[(Var) - ntokens] + +/*-----------------. +| Debugging code. | +`-----------------*/ -void -initialize_closure(n) -int n; +static void +print_closure (const char *title, short *array, size_t size) { - itemset = NEW2(n, short); - - rulesetsize = WORDSIZE(nrules + 1); - ruleset = NEW2(rulesetsize, unsigned); - - set_fderives(); + size_t i; + fprintf (stderr, "Closure: %s\n", title); + for (i = 0; i < size; ++i) + { + short *rp; + fprintf (stderr, " %2d: .", array[i]); + for (rp = &ritem[array[i]]; *rp >= 0; ++rp) + fprintf (stderr, " %s", + quotearg_style (escape_quoting_style, symbols[*rp]->tag)); + fprintf (stderr, " (rule %d)\n", -*rp - 1); + } + fputs ("\n\n", stderr); } - -/* set fderives to an nvars by nrules matrix of bits - indicating which rules can help derive the beginning of the data - for each nonterminal. For example, if symbol 5 can be derived as - the sequence of symbols 8 3 20, and one of the rules for deriving - symbol 8 is rule 4, then the [5 - ntokens, 4] bit in fderives is set. */ -void -set_fderives() +static void +print_firsts (void) { - register unsigned *rrow; - register unsigned *vrow; - register int j; - register unsigned cword; - register short *rp; - register int b; - - int ruleno; - int i; - - fderives = NEW2(nvars * rulesetsize, unsigned) - ntokens * rulesetsize; - - set_firsts(); - - rrow = fderives + ntokens * rulesetsize; + int i, j; + fprintf (stderr, "FIRSTS\n"); for (i = ntokens; i < nsyms; i++) { - vrow = firsts + ((i - ntokens) * varsetsize); - cword = *vrow++; - b = 0; - for (j = ntokens; j < nsyms; j++) - { - if (cword & (1 << b)) - { - rp = derives[j]; - while ((ruleno = *rp++) > 0) - { - SETBIT(rrow, ruleno); - } - } - - b++; - if (b >= BITS_PER_WORD && j + 1 < nsyms) - { - cword = *vrow++; - b = 0; - } - } - - rrow += rulesetsize; + fprintf (stderr, "\t%s firsts\n", + quotearg_style (escape_quoting_style, symbols[i]->tag)); + for (j = 0; j < nvars; j++) + if (bitset_test (FIRSTS (i), j)) + fprintf (stderr, "\t\t%d (%s)\n", + j + ntokens, + quotearg_style (escape_quoting_style, + symbols[j + ntokens]->tag)); } - -#ifdef DEBUG - print_fderives(); -#endif - - FREE(firsts); + fprintf (stderr, "\n\n"); } - -/* set firsts to be an nvars by nvars bit matrix indicating which items - can represent the beginning of the input corresponding to which other items. - For example, if some rule expands symbol 5 into the sequence of symbols 8 3 20, - the symbol 8 can be the beginning of the data for symbol 5, - so the bit [8 - ntokens, 5 - ntokens] in firsts is set. */ -void -set_firsts() +static void +print_fderives (void) { - register unsigned *row; -/* register int done; JF unused */ - register int symbol; - register short *sp; - register int rowsize; + int i, j; - int i; - - varsetsize = rowsize = WORDSIZE(nvars); - - firsts = NEW2(nvars * rowsize, unsigned); - - row = firsts; + fprintf (stderr, "FDERIVES\n"); for (i = ntokens; i < nsyms; i++) { - sp = derives[i]; - while (*sp >= 0) - { - symbol = ritem[rrhs[*sp++]]; - if (ISVAR(symbol)) - { - symbol -= ntokens; - SETBIT(row, symbol); - } - } - - row += rowsize; + fprintf (stderr, "\t%s derives\n", + quotearg_style (escape_quoting_style, symbols[i]->tag)); + for (j = 0; j < nrules + 1; j++) + if (bitset_test (FDERIVES (i), j)) + { + short *rhsp; + fprintf (stderr, "\t\t%d:", j - 1); + for (rhsp = rules[j].rhs; *rhsp >= 0; ++rhsp) + fprintf (stderr, " %s", + quotearg_style (escape_quoting_style, + symbols[*rhsp]->tag)); + fputc ('\n', stderr); + } } - - RTC(firsts, nvars); - -#ifdef DEBUG - print_firsts(); -#endif + fprintf (stderr, "\n\n"); } +/*--------------------------------------------------------. +| Display the MATRIX array of SIZE bitsets of size SIZE. | +`--------------------------------------------------------*/ -void -closure(core, n) -short *core; -int n; +static void +bitmatrix_print (const char *title, bitsetv matrix) { - register int ruleno; - register unsigned word; - register short *csp; - register unsigned *dsp; - register unsigned *rsp; - - short *csend; - unsigned *rsend; - int symbol; - int itemno; - - rsp = ruleset; - rsend = ruleset + rulesetsize; - csend = core + n; - - if (n == 0) - { - dsp = fderives + start_symbol * rulesetsize; - while (rsp < rsend) - *rsp++ = *dsp++; - } - else - { - while (rsp < rsend) - *rsp++ = 0; - - csp = core; - while (csp < csend) - { - symbol = ritem[*csp++]; - if (ISVAR(symbol)) - { - dsp = fderives + symbol * rulesetsize; - rsp = ruleset; - while (rsp < rsend) - *rsp++ |= *dsp++; - } - } - } - - ruleno = 0; - itemsetend = itemset; - csp = core; - rsp = ruleset; - while (rsp < rsend) + size_t i, j; + size_t size = bitset_size (matrix[0]); + + /* Title. */ + fprintf (stderr, "%s BEGIN\n", title); + + /* Column numbers. */ + fputs (" ", stderr); + for (i = 0; i < size; ++i) + putc (i / 10 ? '0' + i / 10 : ' ', stderr); + putc ('\n', stderr); + fputs (" ", stderr); + for (i = 0; i < size; ++i) + fprintf (stderr, "%d", i % 10); + putc ('\n', stderr); + + /* Bar. */ + fputs (" .", stderr); + for (i = 0; i < size; ++i) + putc ('-', stderr); + fputs (".\n", stderr); + + /* Contents. */ + for (i = 0; i < size; ++i) { - word = *rsp++; - if (word == 0) - { - ruleno += BITS_PER_WORD; - } - else - { - register int b; - - for (b = 0; b < BITS_PER_WORD; b++) - { - if (word & (1 << b)) - { - itemno = rrhs[ruleno]; - while (csp < csend && *csp < itemno) - *itemsetend++ = *csp++; - *itemsetend++ = itemno; - } - - ruleno++; - } - } + fprintf (stderr, "%2d|", i); + for (j = 0; j < size; ++j) + fputs (bitset_test (matrix[i], j) ? "1" : " ", stderr); + fputs ("|\n", stderr); } - while (csp < csend) - *itemsetend++ = *csp++; + /* Bar. */ + fputs (" `", stderr); + for (i = 0; i < size; ++i) + putc ('-', stderr); + fputs ("'\n", stderr); -#ifdef DEBUG - print_closure(n); -#endif + /* End title. */ + fprintf (stderr, "%s END\n\n", title); } - - -void -finalize_closure() + +/*------------------------------------------------------------------. +| Set FIRSTS to be an NVARS array of NVARS bitsets indicating which | +| items can represent the beginning of the input corresponding to | +| which other items. | +| | +| For example, if some rule expands symbol 5 into the sequence of | +| symbols 8 3 20, the symbol 8 can be the beginning of the data for | +| symbol 5, so the bit [8 - ntokens] in first[5 - ntokens] (= FIRST | +| (5)) is set. | +`------------------------------------------------------------------*/ + +static void +set_firsts (void) { - FREE(itemset); - FREE(ruleset); - FREE(fderives + ntokens * rulesetsize); -} - + int i, j; + firsts = bitsetv_create (nvars, nvars, BITSET_FIXED); -#ifdef DEBUG + for (i = ntokens; i < nsyms; i++) + for (j = 0; derives[i][j] >= 0; ++j) + { + int symbol = rules[derives[i][j]].rhs[0]; + if (ISVAR (symbol)) + bitset_set (FIRSTS (i), symbol - ntokens); + } + + if (trace_flag) + bitmatrix_print ("RTC: Input", firsts); + bitsetv_reflexive_transitive_closure (firsts); + if (trace_flag) + bitmatrix_print ("RTC: Output", firsts); + + if (trace_flag) + print_firsts (); +} -print_closure(n) -int n; +/*-------------------------------------------------------------------. +| Set FDERIVES to an NVARS by NRULES matrix of bits indicating which | +| rules can help derive the beginning of the data for each | +| nonterminal. | +| | +| For example, if symbol 5 can be derived as the sequence of symbols | +| 8 3 20, and one of the rules for deriving symbol 8 is rule 4, then | +| the [5 - NTOKENS, 4] bit in FDERIVES is set. | +`-------------------------------------------------------------------*/ + +static void +set_fderives (void) { - register short *isp; + int i, j, k; - printf("\n\nn = %d\n\n", n); - for (isp = itemset; isp < itemsetend; isp++) - printf(" %d\n", *isp); -} + fderives = bitsetv_create (nvars, nrules + 1, BITSET_FIXED); + set_firsts (); + for (i = ntokens; i < nsyms; ++i) + for (j = ntokens; j < nsyms; ++j) + if (bitset_test (FIRSTS (i), j - ntokens)) + for (k = 0; derives[j][k] > 0; ++k) + bitset_set (FDERIVES (i), derives[j][k]); -print_firsts() -{ - register int i; - register int j; - register unsigned *rowp; + if (trace_flag) + print_fderives (); - printf(_("\n\n\nFIRSTS\n\n")); + bitsetv_free (firsts); +} + - for (i = ntokens; i < nsyms; i++) - { - printf(_("\n\n%s firsts\n\n"), tags[i]); +void +new_closure (int n) +{ + itemset = XCALLOC (short, n); - rowp = firsts + ((i - ntokens) * varsetsize); + ruleset = bitset_create (nrules + 1, BITSET_FIXED); - for (j = 0; j < nvars; j++) - if (BITISSET (rowp, j)) - printf(" %s\n", tags[j + ntokens]); - } + set_fderives (); } -print_fderives() +void +closure (short *core, int n) { - register int i; - register int j; - register unsigned *rp; + /* Index over CORE. */ + int c; - printf(_("\n\n\nFDERIVES\n")); + /* A bit index over RULESET. */ + int ruleno; - for (i = ntokens; i < nsyms; i++) + if (trace_flag) + print_closure ("input", core, n); + + bitset_zero (ruleset); + + for (c = 0; c < n; ++c) + if (ISVAR (ritem[core[c]])) + bitset_or (ruleset, ruleset, FDERIVES (ritem[core[c]])); + + nritemset = 0; + c = 0; + for (ruleno = 0; ruleno < nrules + 1; ++ruleno) + if (bitset_test (ruleset, ruleno)) + { + int itemno = rules[ruleno].rhs - ritem; + while (c < n && core[c] < itemno) + { + itemset[nritemset] = core[c]; + nritemset++; + c++; + } + itemset[nritemset] = itemno; + nritemset++; + } + + while (c < n) { - printf(_("\n\n%s derives\n\n"), tags[i]); - rp = fderives + i * rulesetsize; - - for (j = 0; j <= nrules; j++) - if (BITISSET (rp, j)) - printf(" %d\n", j); + itemset[nritemset] = core[c]; + nritemset++; + c++; } - fflush(stdout); + if (trace_flag) + print_closure ("output", itemset, nritemset); } -#endif + +void +free_closure (void) +{ + XFREE (itemset); + bitset_free (ruleset); + bitsetv_free (fderives); +}