]>
git.saurik.com Git - bison.git/blob - src/lalr.c
1 /* Compute look-ahead criteria for bison,
2 Copyright 1984, 1986, 1989, 2000, 2001 Free Software Foundation, Inc.
4 This file is part of Bison, the GNU Compiler Compiler.
6 Bison is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2, or (at your option)
11 Bison is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with Bison; see the file COPYING. If not, write to
18 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
19 Boston, MA 02111-1307, USA. */
22 /* Compute how to make the finite state machine deterministic; find
23 which rules need lookahead in each state, and which lookahead
24 tokens they accept. */
36 /* All the decorated states, indexed by the state number. Warning:
37 there is a state_TABLE in LR0.c, but it is different and static. */
39 state_t
*state_table
= NULL
;
50 /* And for the famous F variable, whose name is so descriptive that a
51 comment is hardly needed. <grin>. */
52 static unsigned *F
= NULL
;
53 #define F(Rule) (F + (Rule) * tokensetsize)
55 static short **includes
;
56 static shorts
**lookback
;
59 /*---------------------------------------------------------------.
60 | digraph & traverse. |
62 | The following variables are used as common storage between the |
63 | two. |
64 `---------------------------------------------------------------*/
68 static short *VERTICES
;
78 size_t size
= F (i
+ 1) - F(i
);
81 INDEX
[i
] = height
= top
;
84 for (j
= 0; R
[i
][j
] >= 0; ++j
)
86 if (INDEX
[R
[i
][j
]] == 0)
89 if (INDEX
[i
] > INDEX
[R
[i
][j
]])
90 INDEX
[i
] = INDEX
[R
[i
][j
]];
92 for (k
= 0; k
< size
; ++k
)
93 F (i
)[k
] |= F (R
[i
][j
])[k
];
96 if (INDEX
[i
] == height
)
105 for (k
= 0; k
< size
; ++k
)
112 digraph (short **relation
)
116 infinity
= ngotos
+ 2;
117 INDEX
= XCALLOC (short, ngotos
+ 1);
118 VERTICES
= XCALLOC (short, ngotos
+ 1);
123 for (i
= 0; i
< ngotos
; i
++)
126 for (i
= 0; i
< ngotos
; i
++)
127 if (INDEX
[i
] == 0 && R
[i
])
135 /*--------------------.
136 | Build STATE_TABLE. |
137 `--------------------*/
140 set_state_table (void)
142 /* NSTATES + 1 because lookahead for the pseudo state number NSTATES
143 might be used (see conflicts.c). It is too opaque for me to
144 provide a probably less hacky implementation. --akim */
145 state_table
= XCALLOC (state_t
, nstates
+ 1);
149 for (sp
= first_state
; sp
; sp
= sp
->next
)
151 state_table
[sp
->number
].state
= sp
;
152 state_table
[sp
->number
].accessing_symbol
= sp
->accessing_symbol
;
158 for (sp
= first_shift
; sp
; sp
= sp
->next
)
159 state_table
[sp
->number
].shifts
= sp
;
164 for (rp
= first_reduction
; rp
; rp
= rp
->next
)
165 state_table
[rp
->number
].reductions
= rp
;
168 /* Pessimization, but simplification of the code: make sure all the
169 states have a shifts, even if reduced to 0 shifts. */
172 for (i
= 0; i
< nstates
; i
++)
173 if (!state_table
[i
].shifts
)
174 state_table
[i
].shifts
= shifts_new (0);
177 /* Initializing the lookaheads members. Please note that it must be
178 performed after having set some of the other members which are
179 used below. Change with extreme caution. */
183 for (i
= 0; i
< nstates
; i
++)
186 reductions
*rp
= state_table
[i
].reductions
;
187 shifts
*sp
= state_table
[i
].shifts
;
189 state_table
[i
].lookaheads
= count
;
192 && (rp
->nreds
> 1 || (sp
->nshifts
&& SHIFT_IS_SHIFT (sp
, 0))))
195 state_table
[i
].consistent
= 1;
197 for (k
= 0; k
< sp
->nshifts
; k
++)
198 if (SHIFT_IS_ERROR (sp
, k
))
200 state_table
[i
].consistent
= 0;
204 state_table
[nstates
].lookaheads
= count
;
217 size_t nLA
= state_table
[nstates
].lookaheads
;
221 LA
= XCALLOC (unsigned, nLA
* tokensetsize
);
222 LAruleno
= XCALLOC (short, nLA
);
223 lookback
= XCALLOC (shorts
*, nLA
);
226 for (i
= 0; i
< nstates
; i
++)
227 if (!state_table
[i
].consistent
)
228 if ((rp
= state_table
[i
].reductions
))
229 for (j
= 0; j
< rp
->nreds
; j
++)
230 *np
++ = rp
->rules
[j
];
245 goto_map
= XCALLOC (short, nvars
+ 1) - ntokens
;
246 temp_map
= XCALLOC (short, nvars
+ 1) - ntokens
;
249 for (sp
= first_shift
; sp
; sp
= sp
->next
)
251 for (i
= sp
->nshifts
- 1; i
>= 0 && SHIFT_IS_GOTO (sp
, i
); --i
)
253 symbol
= state_table
[sp
->shifts
[i
]].accessing_symbol
;
255 if (ngotos
== MAXSHORT
)
256 fatal (_("too many gotos (max %d)"), MAXSHORT
);
263 for (i
= ntokens
; i
< nsyms
; i
++)
269 for (i
= ntokens
; i
< nsyms
; i
++)
270 goto_map
[i
] = temp_map
[i
];
272 goto_map
[nsyms
] = ngotos
;
273 temp_map
[nsyms
] = ngotos
;
275 from_state
= XCALLOC (short, ngotos
);
276 to_state
= XCALLOC (short, ngotos
);
278 for (sp
= first_shift
; sp
; sp
= sp
->next
)
282 for (i
= sp
->nshifts
- 1; i
>= 0 && SHIFT_IS_GOTO (sp
, i
); --i
)
284 state2
= sp
->shifts
[i
];
285 symbol
= state_table
[state2
].accessing_symbol
;
287 k
= temp_map
[symbol
]++;
288 from_state
[k
] = state1
;
289 to_state
[k
] = state2
;
293 XFREE (temp_map
+ ntokens
);
298 /*----------------------------------------------------------.
299 | Map a state/symbol pair into its numeric representation. |
300 `----------------------------------------------------------*/
303 map_goto (int state
, int symbol
)
310 low
= goto_map
[symbol
];
311 high
= goto_map
[symbol
+ 1] - 1;
315 middle
= (low
+ high
) / 2;
316 s
= from_state
[middle
];
334 short **reads
= XCALLOC (short *, ngotos
);
335 short *edge
= XCALLOC (short, ngotos
+ 1);
340 F
= XCALLOC (unsigned, ngotos
* tokensetsize
);
342 for (i
= 0; i
< ngotos
; i
++)
344 int stateno
= to_state
[i
];
345 shifts
*sp
= state_table
[stateno
].shifts
;
348 for (j
= 0; j
< sp
->nshifts
&& SHIFT_IS_SHIFT (sp
, j
); j
++)
350 int symbol
= state_table
[sp
->shifts
[j
]].accessing_symbol
;
351 SETBIT (F (i
), symbol
);
354 for (; j
< sp
->nshifts
; j
++)
356 int symbol
= state_table
[sp
->shifts
[j
]].accessing_symbol
;
357 if (nullable
[symbol
])
358 edge
[nedges
++] = map_goto (stateno
, symbol
);
363 reads
[i
] = XCALLOC (short, nedges
+ 1);
364 shortcpy (reads
[i
], edge
, nedges
);
365 reads
[i
][nedges
] = -1;
372 for (i
= 0; i
< ngotos
; i
++)
381 add_lookback_edge (int stateno
, int ruleno
, int gotono
)
388 i
= state_table
[stateno
].lookaheads
;
389 k
= state_table
[stateno
+ 1].lookaheads
;
391 while (!found
&& i
< k
)
393 if (LAruleno
[i
] == ruleno
)
401 sp
= XCALLOC (shorts
, 1);
402 sp
->next
= lookback
[i
];
409 matrix_print (FILE *out
, short **matrix
, int n
)
413 for (i
= 0; i
< n
; ++i
)
415 fprintf (out
, "%3d: ", i
);
417 for (j
= 0; matrix
[i
][j
] != -1; ++j
)
418 fprintf (out
, "%3d ", matrix
[i
][j
]);
424 /*-------------------------------------------------------------------.
425 | Return the transpose of R_ARG, of size N. Destroy R_ARG, as it is |
426 | replaced with the result. |
428 | R_ARG[I] is NULL or a -1 terminated list of numbers. |
430 | RESULT[NUM] is NULL or the -1 terminated list of the I such that NUM |
431 | is in R_ARG[I]. |
432 `-------------------------------------------------------------------*/
435 transpose (short **R_arg
, int n
)
438 short **new_R
= XCALLOC (short *, n
);
439 /* END_R[I] -- next entry of NEW_R[I]. */
440 short **end_R
= XCALLOC (short *, n
);
441 /* NEDGES[I] -- total size of NEW_R[I]. */
442 short *nedges
= XCALLOC (short, n
);
447 fputs ("transpose: input\n", stderr
);
448 matrix_print (stderr
, R_arg
, n
);
452 for (i
= 0; i
< n
; i
++)
454 for (j
= 0; R_arg
[i
][j
] >= 0; ++j
)
455 ++nedges
[R_arg
[i
][j
]];
458 for (i
= 0; i
< n
; i
++)
461 short *sp
= XCALLOC (short, nedges
[i
] + 1);
468 for (i
= 0; i
< n
; i
++)
470 for (j
= 0; R_arg
[i
][j
] >= 0; ++j
)
472 *end_R
[R_arg
[i
][j
]] = i
;
473 ++end_R
[R_arg
[i
][j
]];
479 /* Free the input: it is replaced with the result. */
480 for (i
= 0; i
< n
; i
++)
486 fputs ("transpose: output\n", stderr
);
487 matrix_print (stderr
, new_R
, n
);
495 build_relations (void)
497 short *edge
= XCALLOC (short, ngotos
+ 1);
498 short *states
= XCALLOC (short, ritem_longest_rhs () + 1);
501 includes
= XCALLOC (short *, ngotos
);
503 for (i
= 0; i
< ngotos
; i
++)
506 int state1
= from_state
[i
];
507 int symbol1
= state_table
[to_state
[i
]].accessing_symbol
;
510 for (rulep
= derives
[symbol1
]; *rulep
> 0; rulep
++)
514 int stateno
= state1
;
518 for (rp
= ritem
+ rule_table
[*rulep
].rhs
; *rp
> 0; rp
++)
520 shifts
*sp
= state_table
[stateno
].shifts
;
522 for (j
= 0; j
< sp
->nshifts
; j
++)
524 stateno
= sp
->shifts
[j
];
525 if (state_table
[stateno
].accessing_symbol
== *rp
)
529 states
[length
++] = stateno
;
532 if (!state_table
[stateno
].consistent
)
533 add_lookback_edge (stateno
, *rulep
, i
);
541 /* JF added rp>=ritem && I hope to god it's right! */
542 if (rp
>= ritem
&& ISVAR (*rp
))
544 stateno
= states
[--length
];
545 edge
[nedges
++] = map_goto (stateno
, *rp
);
555 includes
[i
] = XCALLOC (short, nedges
+ 1);
556 for (j
= 0; j
< nedges
; j
++)
557 includes
[i
][j
] = edge
[j
];
558 includes
[i
][nedges
] = -1;
565 includes
= transpose (includes
, ngotos
);
571 compute_FOLLOWS (void)
577 for (i
= 0; i
< ngotos
; i
++)
585 compute_lookaheads (void)
590 for (i
= 0; i
< state_table
[nstates
].lookaheads
; i
++)
591 for (sp
= lookback
[i
]; sp
; sp
= sp
->next
)
593 int size
= LA (i
+ 1) - LA (i
);
595 for (j
= 0; j
< size
; ++j
)
596 LA (i
)[j
] |= F (sp
->value
)[j
];
600 for (i
= 0; i
< state_table
[nstates
].lookaheads
; i
++)
601 LIST_FREE (shorts
, lookback
[i
]);
611 tokensetsize
= WORDSIZE (ntokens
);
619 compute_lookaheads ();