]>
Commit | Line | Data |
---|---|---|
d0fb370f | 1 | /* Compute look-ahead criteria for bison, |
b0299a2e AD |
2 | Copyright (C) 1984, 1986, 1989, 2000, 2001, 2002 |
3 | Free Software Foundation, Inc. | |
d0fb370f | 4 | |
340ef489 | 5 | This file is part of Bison, the GNU Compiler Compiler. |
d0fb370f | 6 | |
340ef489 AD |
7 | Bison is free software; you can redistribute it and/or modify |
8 | it under the terms of the GNU General Public License as published by | |
9 | the Free Software Foundation; either version 2, or (at your option) | |
10 | any later version. | |
d0fb370f | 11 | |
340ef489 AD |
12 | Bison is distributed in the hope that it will be useful, |
13 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
15 | GNU General Public License for more details. | |
d0fb370f | 16 | |
340ef489 AD |
17 | You should have received a copy of the GNU General Public License |
18 | along with Bison; see the file COPYING. If not, write to | |
19 | the Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
20 | Boston, MA 02111-1307, USA. */ | |
d0fb370f RS |
21 | |
22 | ||
720d742f AD |
23 | /* Compute how to make the finite state machine deterministic; find |
24 | which rules need lookahead in each state, and which lookahead | |
340ef489 | 25 | tokens they accept. */ |
d0fb370f | 26 | |
d0fb370f | 27 | #include "system.h" |
5dde5425 PE |
28 | |
29 | #include <bitset.h> | |
30 | #include <bitsetv.h> | |
31 | #include <quotearg.h> | |
32 | ||
b2ca4022 | 33 | #include "LR0.h" |
a0f6b076 | 34 | #include "complain.h" |
340ef489 | 35 | #include "derives.h" |
f67d13aa | 36 | #include "getargs.h" |
5dde5425 PE |
37 | #include "gram.h" |
38 | #include "lalr.h" | |
39 | #include "nullable.h" | |
40 | #include "reader.h" | |
41 | #include "relation.h" | |
42 | #include "symtab.h" | |
d0fb370f | 43 | |
5dde5425 PE |
44 | goto_number *goto_map = NULL; |
45 | static goto_number ngotos = 0; | |
46 | state_number *from_state = NULL; | |
47 | state_number *to_state = NULL; | |
e68e0410 AD |
48 | |
49 | /* Linked list of goto numbers. */ | |
5dde5425 | 50 | typedef struct goto_list |
e68e0410 | 51 | { |
5dde5425 PE |
52 | struct goto_list *next; |
53 | goto_number value; | |
54 | } goto_list; | |
e68e0410 AD |
55 | |
56 | ||
3325ddc4 AD |
57 | /* LA is a LR by NTOKENS matrix of bits. LA[l, i] is 1 if the rule |
58 | LArule[l] is applicable in the appropriate state when the next | |
59 | token is symbol i. If LA[l, i] and LA[l, j] are both 1 for i != j, | |
60 | it is a conflict. */ | |
61 | ||
62 | static bitsetv LA = NULL; | |
d200e455 | 63 | size_t nLA; |
9703cc49 | 64 | |
d0fb370f | 65 | |
fe961097 | 66 | /* And for the famous F variable, which name is so descriptive that a |
ddcd5fdf | 67 | comment is hardly needed. <grin>. */ |
914feea9 | 68 | static bitsetv F = NULL; |
ddcd5fdf | 69 | |
5dde5425 PE |
70 | static goto_number **includes; |
71 | static goto_list **lookback; | |
aa2aab3c AD |
72 | |
73 | ||
720d742f | 74 | |
bb527fc2 | 75 | |
4a120d45 | 76 | static void |
d2729d44 | 77 | set_goto_map (void) |
d0fb370f | 78 | { |
5dde5425 PE |
79 | state_number s; |
80 | goto_number *temp_map; | |
d0fb370f | 81 | |
5dde5425 PE |
82 | goto_map = XCALLOC (goto_number, nvars + 1) - ntokens; |
83 | temp_map = XCALLOC (goto_number, nvars + 1) - ntokens; | |
d0fb370f RS |
84 | |
85 | ngotos = 0; | |
5dde5425 | 86 | for (s = 0; s < nstates; ++s) |
7215de24 | 87 | { |
5dde5425 | 88 | transitions *sp = states[s]->transitions; |
d57650a5 | 89 | int i; |
ccaf65bc | 90 | for (i = sp->num - 1; i >= 0 && TRANSITION_IS_GOTO (sp, i); --i) |
7215de24 | 91 | { |
5dde5425 | 92 | if (ngotos >= GOTO_NUMBER_MAXIMUM) |
58a84254 | 93 | abort (); |
7215de24 | 94 | ngotos++; |
ccaf65bc | 95 | goto_map[TRANSITION_SYMBOL (sp, i)]++; |
7215de24 AD |
96 | } |
97 | } | |
d0fb370f | 98 | |
d0b0fefa AD |
99 | { |
100 | int k = 0; | |
d57650a5 | 101 | int i; |
d0b0fefa AD |
102 | for (i = ntokens; i < nsyms; i++) |
103 | { | |
104 | temp_map[i] = k; | |
105 | k += goto_map[i]; | |
106 | } | |
d0fb370f | 107 | |
d0b0fefa AD |
108 | for (i = ntokens; i < nsyms; i++) |
109 | goto_map[i] = temp_map[i]; | |
d0fb370f | 110 | |
d0b0fefa AD |
111 | goto_map[nsyms] = ngotos; |
112 | temp_map[nsyms] = ngotos; | |
113 | } | |
d0fb370f | 114 | |
5dde5425 PE |
115 | from_state = XCALLOC (state_number, ngotos); |
116 | to_state = XCALLOC (state_number, ngotos); | |
d0fb370f | 117 | |
5dde5425 | 118 | for (s = 0; s < nstates; ++s) |
d0fb370f | 119 | { |
5dde5425 | 120 | transitions *sp = states[s]->transitions; |
d57650a5 | 121 | int i; |
ccaf65bc | 122 | for (i = sp->num - 1; i >= 0 && TRANSITION_IS_GOTO (sp, i); --i) |
d0fb370f | 123 | { |
ccaf65bc | 124 | int k = temp_map[TRANSITION_SYMBOL (sp, i)]++; |
5dde5425 | 125 | from_state[k] = s; |
640748ee | 126 | to_state[k] = sp->states[i]->number; |
d0fb370f RS |
127 | } |
128 | } | |
129 | ||
d7913476 | 130 | XFREE (temp_map + ntokens); |
d0fb370f RS |
131 | } |
132 | ||
133 | ||
134 | ||
43591cec AD |
135 | /*----------------------------------------------------------. |
136 | | Map a state/symbol pair into its numeric representation. | | |
137 | `----------------------------------------------------------*/ | |
d0fb370f | 138 | |
4a120d45 | 139 | static int |
5dde5425 | 140 | map_goto (state_number s0, symbol_number sym) |
d0fb370f | 141 | { |
720d742f AD |
142 | int high; |
143 | int low; | |
144 | int middle; | |
5dde5425 | 145 | state_number s; |
d0fb370f | 146 | |
5dde5425 PE |
147 | low = goto_map[sym]; |
148 | high = goto_map[sym + 1] - 1; | |
d0fb370f | 149 | |
58a84254 | 150 | for (;;) |
d0fb370f | 151 | { |
58a84254 PE |
152 | if (high < low) |
153 | abort (); | |
d0fb370f RS |
154 | middle = (low + high) / 2; |
155 | s = from_state[middle]; | |
5dde5425 | 156 | if (s == s0) |
36281465 | 157 | return middle; |
5dde5425 | 158 | else if (s < s0) |
d0fb370f RS |
159 | low = middle + 1; |
160 | else | |
161 | high = middle - 1; | |
162 | } | |
d0fb370f RS |
163 | } |
164 | ||
165 | ||
4a120d45 | 166 | static void |
d2729d44 | 167 | initialize_F (void) |
d0fb370f | 168 | { |
5dde5425 PE |
169 | goto_number **reads = XCALLOC (goto_number *, ngotos); |
170 | goto_number *edge = XCALLOC (goto_number, ngotos + 1); | |
4d4f699c | 171 | int nedges = 0; |
d0fb370f | 172 | |
4d4f699c | 173 | int i; |
d0fb370f | 174 | |
914feea9 | 175 | F = bitsetv_create (ngotos, ntokens, BITSET_FIXED); |
d0fb370f | 176 | |
d0fb370f RS |
177 | for (i = 0; i < ngotos; i++) |
178 | { | |
5dde5425 PE |
179 | state_number stateno = to_state[i]; |
180 | transitions *sp = states[stateno]->transitions; | |
d0fb370f | 181 | |
d954473d | 182 | int j; |
640748ee | 183 | FOR_EACH_SHIFT (sp, j) |
ccaf65bc | 184 | bitset_set (F[i], TRANSITION_SYMBOL (sp, j)); |
d0fb370f | 185 | |
ccaf65bc | 186 | for (; j < sp->num; j++) |
d954473d | 187 | { |
5dde5425 PE |
188 | symbol_number sym = TRANSITION_SYMBOL (sp, j); |
189 | if (nullable[sym]) | |
190 | edge[nedges++] = map_goto (stateno, sym); | |
d954473d | 191 | } |
a0f6b076 | 192 | |
d954473d AD |
193 | if (nedges) |
194 | { | |
5dde5425 | 195 | reads[i] = XCALLOC (goto_number, nedges + 1); |
62a3e4f0 | 196 | memcpy (reads[i], edge, nedges * sizeof (edge[0])); |
d954473d AD |
197 | reads[i][nedges] = -1; |
198 | nedges = 0; | |
d0fb370f | 199 | } |
d0fb370f RS |
200 | } |
201 | ||
0e4d5753 | 202 | relation_digraph (reads, ngotos, &F); |
d0fb370f RS |
203 | |
204 | for (i = 0; i < ngotos; i++) | |
ddcd5fdf | 205 | XFREE (reads[i]); |
d0fb370f | 206 | |
d7913476 AD |
207 | XFREE (reads); |
208 | XFREE (edge); | |
d0fb370f RS |
209 | } |
210 | ||
211 | ||
4a120d45 | 212 | static void |
5dde5425 | 213 | add_lookback_edge (state *s, rule *r, int gotono) |
d0fb370f | 214 | { |
5dde5425 PE |
215 | int ri = state_reduction_find (s, r); |
216 | goto_list *sp = XCALLOC (goto_list, 1); | |
217 | sp->next = lookback[(s->reductions->lookaheads - LA) + ri]; | |
d0fb370f | 218 | sp->value = gotono; |
5dde5425 | 219 | lookback[(s->reductions->lookaheads - LA) + ri] = sp; |
d0fb370f RS |
220 | } |
221 | ||
222 | ||
d0fb370f | 223 | |
4a120d45 | 224 | static void |
720d742f | 225 | build_relations (void) |
d0fb370f | 226 | { |
5dde5425 PE |
227 | goto_number *edge = XCALLOC (goto_number, ngotos + 1); |
228 | state_number *states1 = XCALLOC (state_number, ritem_longest_rhs () + 1); | |
720d742f | 229 | int i; |
720d742f | 230 | |
5dde5425 | 231 | includes = XCALLOC (goto_number *, ngotos); |
d0fb370f RS |
232 | |
233 | for (i = 0; i < ngotos; i++) | |
234 | { | |
9887c18a | 235 | int nedges = 0; |
5dde5425 PE |
236 | symbol_number symbol1 = states[to_state[i]]->accessing_symbol; |
237 | rule **rulep; | |
d0fb370f | 238 | |
bb0027a9 | 239 | for (rulep = derives[symbol1]; *rulep; rulep++) |
720d742f | 240 | { |
9887c18a | 241 | int done; |
80a69750 | 242 | int length = 1; |
5dde5425 PE |
243 | item_number *rp; |
244 | state *s = states[from_state[i]]; | |
245 | states1[0] = s->number; | |
d0fb370f | 246 | |
bb0027a9 | 247 | for (rp = (*rulep)->rhs; *rp >= 0; rp++) |
720d742f | 248 | { |
5dde5425 PE |
249 | s = transitions_to (s->transitions, |
250 | item_number_as_symbol_number (*rp)); | |
251 | states1[length++] = s->number; | |
720d742f AD |
252 | } |
253 | ||
5dde5425 PE |
254 | if (!s->consistent) |
255 | add_lookback_edge (s, *rulep, i); | |
720d742f AD |
256 | |
257 | length--; | |
258 | done = 0; | |
259 | while (!done) | |
260 | { | |
261 | done = 1; | |
262 | rp--; | |
263 | /* JF added rp>=ritem && I hope to god its right! */ | |
264 | if (rp >= ritem && ISVAR (*rp)) | |
265 | { | |
5dde5425 | 266 | /* Downcasting from item_number to symbol_number. */ |
5fbb0954 | 267 | edge[nedges++] = map_goto (states1[--length], |
a49aecd5 | 268 | item_number_as_symbol_number (*rp)); |
720d742f AD |
269 | if (nullable[*rp]) |
270 | done = 0; | |
271 | } | |
272 | } | |
d0fb370f RS |
273 | } |
274 | ||
720d742f AD |
275 | if (nedges) |
276 | { | |
9887c18a | 277 | int j; |
5dde5425 | 278 | includes[i] = XCALLOC (goto_number, nedges + 1); |
720d742f | 279 | for (j = 0; j < nedges; j++) |
80a69750 AD |
280 | includes[i][j] = edge[j]; |
281 | includes[i][nedges] = -1; | |
720d742f | 282 | } |
d0fb370f RS |
283 | } |
284 | ||
d7913476 | 285 | XFREE (edge); |
b9f71f19 | 286 | XFREE (states1); |
9887c18a | 287 | |
0e4d5753 | 288 | relation_transpose (&includes, ngotos); |
d0fb370f RS |
289 | } |
290 | ||
291 | ||
720d742f | 292 | |
4a120d45 | 293 | static void |
720d742f | 294 | compute_FOLLOWS (void) |
d0fb370f | 295 | { |
720d742f | 296 | int i; |
d0fb370f | 297 | |
0e4d5753 | 298 | relation_digraph (includes, ngotos, &F); |
d0fb370f RS |
299 | |
300 | for (i = 0; i < ngotos; i++) | |
ddcd5fdf | 301 | XFREE (includes[i]); |
d0fb370f | 302 | |
d7913476 | 303 | XFREE (includes); |
d0fb370f RS |
304 | } |
305 | ||
306 | ||
4a120d45 | 307 | static void |
720d742f | 308 | compute_lookaheads (void) |
d0fb370f | 309 | { |
d200e455 | 310 | size_t i; |
5dde5425 | 311 | goto_list *sp; |
d0fb370f | 312 | |
d200e455 | 313 | for (i = 0; i < nLA; i++) |
ddcd5fdf | 314 | for (sp = lookback[i]; sp; sp = sp->next) |
0fb1ffb1 | 315 | bitset_or (LA[i], LA[i], F[sp->value]); |
d0fb370f | 316 | |
ddcd5fdf | 317 | /* Free LOOKBACK. */ |
d200e455 | 318 | for (i = 0; i < nLA; i++) |
5dde5425 | 319 | LIST_FREE (goto_list, lookback[i]); |
d0fb370f | 320 | |
d7913476 | 321 | XFREE (lookback); |
914feea9 | 322 | bitsetv_free (F); |
720d742f | 323 | } |
d0fb370f | 324 | |
d0fb370f | 325 | |
5dde5425 PE |
326 | /*-----------------------------------------------------------. |
327 | | Count the number of lookaheads required for S (NLOOKAHEADS | | |
328 | | member). | | |
329 | `-----------------------------------------------------------*/ | |
5edafffd | 330 | |
cd08e51e | 331 | static int |
5dde5425 | 332 | state_lookaheads_count (state *s) |
5edafffd | 333 | { |
cd08e51e AD |
334 | int k; |
335 | int nlookaheads = 0; | |
5dde5425 PE |
336 | reductions *rp = s->reductions; |
337 | transitions *sp = s->transitions; | |
cd08e51e AD |
338 | |
339 | /* We need a lookahead either to distinguish different | |
340 | reductions (i.e., there are two or more), or to distinguish a | |
341 | reduction from a shift. Otherwise, it is straightforward, | |
342 | and the state is `consistent'. */ | |
343 | if (rp->num > 1 | |
344 | || (rp->num == 1 && sp->num && | |
345 | !TRANSITION_IS_DISABLED (sp, 0) && TRANSITION_IS_SHIFT (sp, 0))) | |
346 | nlookaheads += rp->num; | |
347 | else | |
5dde5425 | 348 | s->consistent = 1; |
cd08e51e AD |
349 | |
350 | for (k = 0; k < sp->num; k++) | |
351 | if (!TRANSITION_IS_DISABLED (sp, k) && TRANSITION_IS_ERROR (sp, k)) | |
352 | { | |
5dde5425 | 353 | s->consistent = 0; |
cd08e51e AD |
354 | break; |
355 | } | |
3877f72b | 356 | |
cd08e51e | 357 | return nlookaheads; |
5edafffd AD |
358 | } |
359 | ||
7c6b64d0 | 360 | |
cd08e51e AD |
361 | /*----------------------------------------------. |
362 | | Compute LA, NLA, and the lookaheads members. | | |
363 | `----------------------------------------------*/ | |
c0263492 AD |
364 | |
365 | static void | |
cd08e51e | 366 | initialize_LA (void) |
c0263492 | 367 | { |
5dde5425 | 368 | state_number i; |
cd08e51e | 369 | bitsetv pLA; |
c0263492 | 370 | |
cd08e51e AD |
371 | /* Compute the total number of reductions requiring a lookahead. */ |
372 | nLA = 0; | |
373 | for (i = 0; i < nstates; i++) | |
374 | nLA += state_lookaheads_count (states[i]); | |
375 | /* Avoid having to special case 0. */ | |
376 | if (!nLA) | |
377 | nLA = 1; | |
378 | ||
379 | pLA = LA = bitsetv_create (nLA, ntokens, BITSET_FIXED); | |
5dde5425 | 380 | lookback = XCALLOC (goto_list *, nLA); |
cd08e51e AD |
381 | |
382 | /* Initialize the members LOOKAHEADS for each state which reductions | |
383 | require lookaheads. */ | |
c0263492 AD |
384 | for (i = 0; i < nstates; i++) |
385 | { | |
cd08e51e AD |
386 | int count = state_lookaheads_count (states[i]); |
387 | if (count) | |
388 | { | |
389 | states[i]->reductions->lookaheads = pLA; | |
390 | pLA += count; | |
391 | } | |
c0263492 AD |
392 | } |
393 | } | |
394 | ||
395 | ||
7c6b64d0 AD |
396 | /*---------------------------------------. |
397 | | Output the lookaheads for each state. | | |
398 | `---------------------------------------*/ | |
399 | ||
400 | static void | |
401 | lookaheads_print (FILE *out) | |
402 | { | |
5dde5425 | 403 | state_number i; |
602bbf31 | 404 | int j, k; |
427c0dda | 405 | fprintf (out, "Lookaheads: BEGIN\n"); |
7c6b64d0 AD |
406 | for (i = 0; i < nstates; ++i) |
407 | { | |
5dde5425 | 408 | reductions *reds = states[i]->reductions; |
613f5e1a | 409 | bitset_iterator iter; |
cd08e51e AD |
410 | int nlookaheads = 0; |
411 | ||
412 | if (reds->lookaheads) | |
413 | for (k = 0; k < reds->num; ++k) | |
414 | if (reds->lookaheads[k]) | |
415 | ++nlookaheads; | |
613f5e1a | 416 | |
427c0dda | 417 | fprintf (out, "State %d: %d lookaheads\n", |
cd08e51e | 418 | i, nlookaheads); |
7c6b64d0 | 419 | |
cd08e51e AD |
420 | if (reds->lookaheads) |
421 | for (j = 0; j < reds->num; ++j) | |
422 | BITSET_FOR_EACH (iter, reds->lookaheads[j], k, 0) | |
423 | { | |
427c0dda | 424 | fprintf (out, " on %d (%s) -> rule %d\n", |
cd08e51e AD |
425 | k, symbols[k]->tag, |
426 | reds->rules[j]->number); | |
427 | }; | |
7c6b64d0 | 428 | } |
427c0dda | 429 | fprintf (out, "Lookaheads: END\n"); |
7c6b64d0 AD |
430 | } |
431 | ||
720d742f AD |
432 | void |
433 | lalr (void) | |
434 | { | |
720d742f AD |
435 | initialize_LA (); |
436 | set_goto_map (); | |
437 | initialize_F (); | |
438 | build_relations (); | |
439 | compute_FOLLOWS (); | |
440 | compute_lookaheads (); | |
7c6b64d0 | 441 | |
273a74fa | 442 | if (trace_flag & trace_sets) |
7c6b64d0 | 443 | lookaheads_print (stderr); |
d0fb370f | 444 | } |
3325ddc4 AD |
445 | |
446 | ||
447 | void | |
448 | lalr_free (void) | |
449 | { | |
5dde5425 | 450 | state_number s; |
3325ddc4 | 451 | for (s = 0; s < nstates; ++s) |
cd08e51e | 452 | states[s]->reductions->lookaheads = NULL; |
3325ddc4 | 453 | bitsetv_free (LA); |
3325ddc4 | 454 | } |