]>
git.saurik.com Git - bison.git/blob - src/lalr.c
1 /* Compute look-ahead criteria for bison,
2 Copyright (C) 1984, 1986, 1989, 2000, 2001, 2002
3 Free Software Foundation, Inc.
5 This file is part of Bison, the GNU Compiler Compiler.
7 Bison is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2, or (at your option)
12 Bison is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with Bison; see the file COPYING. If not, write to
19 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
20 Boston, MA 02111-1307, USA. */
23 /* Compute how to make the finite state machine deterministic; find
24 which rules need lookahead in each state, and which lookahead
25 tokens they accept. */
42 /* All the decorated states, indexed by the state number. */
43 state_t
**states
= NULL
;
45 rule_t
**LArule
= NULL
;
50 short *goto_map
= NULL
;
51 state_number_t
*from_state
= NULL
;
52 state_number_t
*to_state
= NULL
;
54 /* And for the famous F variable, whose name is so descriptive that a
55 comment is hardly needed. <grin>. */
56 static bitsetv F
= NULL
;
58 static short **includes
;
59 static shorts
**lookback
;
62 /*---------------------------------------------------------------.
63 | digraph & traverse. |
65 | The following variables are used as common storage between the |
67 `---------------------------------------------------------------*/
71 static short *VERTICES
;
82 INDEX
[i
] = height
= top
;
85 for (j
= 0; R
[i
][j
] >= 0; ++j
)
87 if (INDEX
[R
[i
][j
]] == 0)
90 if (INDEX
[i
] > INDEX
[R
[i
][j
]])
91 INDEX
[i
] = INDEX
[R
[i
][j
]];
93 bitset_or (F
[i
], F
[i
], F
[R
[i
][j
]]);
96 if (INDEX
[i
] == height
)
105 bitset_copy (F
[j
], F
[i
]);
111 digraph (short **relation
)
115 infinity
= ngotos
+ 2;
116 INDEX
= XCALLOC (short, ngotos
+ 1);
117 VERTICES
= XCALLOC (short, ngotos
+ 1);
122 for (i
= 0; i
< ngotos
; i
++)
125 for (i
= 0; i
< ngotos
; i
++)
126 if (INDEX
[i
] == 0 && R
[i
])
141 /* Avoid having to special case 0. */
145 LA
= bitsetv_create (nLA
, ntokens
, BITSET_FIXED
);
146 LArule
= XCALLOC (rule_t
*, nLA
);
147 lookback
= XCALLOC (shorts
*, nLA
);
150 for (i
= 0; i
< nstates
; i
++)
151 if (!states
[i
]->consistent
)
152 for (j
= 0; j
< states
[i
]->reductions
->nreds
; j
++)
153 *np
++ = &rules
[states
[i
]->reductions
->rules
[j
]];
160 state_number_t state
;
163 goto_map
= XCALLOC (short, nvars
+ 1) - ntokens
;
164 temp_map
= XCALLOC (short, nvars
+ 1) - ntokens
;
167 for (state
= 0; state
< nstates
; ++state
)
169 shifts
*sp
= states
[state
]->shifts
;
171 for (i
= sp
->nshifts
- 1; i
>= 0 && SHIFT_IS_GOTO (sp
, i
); --i
)
173 if (ngotos
== SHRT_MAX
)
174 fatal (_("too many gotos (max %d)"), SHRT_MAX
);
177 goto_map
[SHIFT_SYMBOL (sp
, i
)]++;
184 for (i
= ntokens
; i
< nsyms
; i
++)
190 for (i
= ntokens
; i
< nsyms
; i
++)
191 goto_map
[i
] = temp_map
[i
];
193 goto_map
[nsyms
] = ngotos
;
194 temp_map
[nsyms
] = ngotos
;
197 from_state
= XCALLOC (state_number_t
, ngotos
);
198 to_state
= XCALLOC (state_number_t
, ngotos
);
200 for (state
= 0; state
< nstates
; ++state
)
202 shifts
*sp
= states
[state
]->shifts
;
204 for (i
= sp
->nshifts
- 1; i
>= 0 && SHIFT_IS_GOTO (sp
, i
); --i
)
206 int k
= temp_map
[SHIFT_SYMBOL (sp
, i
)]++;
207 from_state
[k
] = state
;
208 to_state
[k
] = sp
->shifts
[i
];
212 XFREE (temp_map
+ ntokens
);
217 /*----------------------------------------------------------.
218 | Map a state/symbol pair into its numeric representation. |
219 `----------------------------------------------------------*/
222 map_goto (state_number_t state
, symbol_number_t symbol
)
229 low
= goto_map
[symbol
];
230 high
= goto_map
[symbol
+ 1] - 1;
234 middle
= (low
+ high
) / 2;
235 s
= from_state
[middle
];
253 short **reads
= XCALLOC (short *, ngotos
);
254 short *edge
= XCALLOC (short, ngotos
+ 1);
259 F
= bitsetv_create (ngotos
, ntokens
, BITSET_FIXED
);
261 for (i
= 0; i
< ngotos
; i
++)
263 state_number_t stateno
= to_state
[i
];
264 shifts
*sp
= states
[stateno
]->shifts
;
267 for (j
= 0; j
< sp
->nshifts
&& SHIFT_IS_SHIFT (sp
, j
); j
++)
268 bitset_set (F
[i
], SHIFT_SYMBOL (sp
, j
));
270 for (; j
< sp
->nshifts
; j
++)
272 symbol_number_t symbol
= SHIFT_SYMBOL (sp
, j
);
273 if (nullable
[symbol
])
274 edge
[nedges
++] = map_goto (stateno
, symbol
);
279 reads
[i
] = XCALLOC (short, nedges
+ 1);
280 memcpy (reads
[i
], edge
, nedges
* sizeof (edge
[0]));
281 reads
[i
][nedges
] = -1;
288 for (i
= 0; i
< ngotos
; i
++)
297 add_lookback_edge (state_t
*state
, int ruleno
, int gotono
)
302 for (i
= 0; i
< state
->nlookaheads
; ++i
)
303 if (state
->lookaheads_rule
[i
]->number
== ruleno
)
306 assert (state
->lookaheads_rule
[i
]->number
== ruleno
);
308 sp
= XCALLOC (shorts
, 1);
309 sp
->next
= lookback
[(state
->lookaheads
- LA
) + i
];
311 lookback
[(state
->lookaheads
- LA
) + i
] = sp
;
316 matrix_print (FILE *out
, short **matrix
, int n
)
320 for (i
= 0; i
< n
; ++i
)
322 fprintf (out
, "%3d: ", i
);
324 for (j
= 0; matrix
[i
][j
] != -1; ++j
)
325 fprintf (out
, "%3d ", matrix
[i
][j
]);
331 /*-------------------------------------------------------------------.
332 | Return the transpose of R_ARG, of size N. Destroy R_ARG, as it is |
333 | replaced with the result. |
335 | R_ARG[I] is NULL or a -1 terminated list of numbers. |
337 | RESULT[NUM] is NULL or the -1 terminated list of the I such that NUM |
339 `-------------------------------------------------------------------*/
342 transpose (short **R_arg
, int n
)
345 short **new_R
= XCALLOC (short *, n
);
346 /* END_R[I] -- next entry of NEW_R[I]. */
347 short **end_R
= XCALLOC (short *, n
);
348 /* NEDGES[I] -- total size of NEW_R[I]. */
349 short *nedges
= XCALLOC (short, n
);
354 fputs ("transpose: input\n", stderr
);
355 matrix_print (stderr
, R_arg
, n
);
359 for (i
= 0; i
< n
; i
++)
361 for (j
= 0; R_arg
[i
][j
] >= 0; ++j
)
362 ++nedges
[R_arg
[i
][j
]];
365 for (i
= 0; i
< n
; i
++)
368 short *sp
= XCALLOC (short, nedges
[i
] + 1);
375 for (i
= 0; i
< n
; i
++)
377 for (j
= 0; R_arg
[i
][j
] >= 0; ++j
)
379 *end_R
[R_arg
[i
][j
]] = i
;
380 ++end_R
[R_arg
[i
][j
]];
386 /* Free the input: it is replaced with the result. */
387 for (i
= 0; i
< n
; i
++)
393 fputs ("transpose: output\n", stderr
);
394 matrix_print (stderr
, new_R
, n
);
402 build_relations (void)
404 short *edge
= XCALLOC (short, ngotos
+ 1);
405 state_number_t
*states1
= XCALLOC (state_number_t
, ritem_longest_rhs () + 1);
408 includes
= XCALLOC (short *, ngotos
);
410 for (i
= 0; i
< ngotos
; i
++)
413 symbol_number_t symbol1
= states
[to_state
[i
]]->accessing_symbol
;
416 for (rulep
= derives
[symbol1
]; *rulep
> 0; rulep
++)
421 state_t
*state
= states
[from_state
[i
]];
422 states1
[0] = state
->number
;
424 for (rp
= rules
[*rulep
].rhs
; *rp
>= 0; rp
++)
426 shifts
*sp
= state
->shifts
;
428 for (j
= 0; j
< sp
->nshifts
; j
++)
430 state
= states
[sp
->shifts
[j
]];
431 if (state
->accessing_symbol
432 == item_number_as_symbol_number (*rp
))
436 states1
[length
++] = state
->number
;
439 if (!state
->consistent
)
440 add_lookback_edge (state
, *rulep
, i
);
448 /* JF added rp>=ritem && I hope to god it's right! */
449 if (rp
>= ritem
&& ISVAR (*rp
))
451 /* Downcasting from item_number_t to symbol_number_t. */
452 edge
[nedges
++] = map_goto (states1
[--length
],
453 item_number_as_symbol_number (*rp
));
463 includes
[i
] = XCALLOC (short, nedges
+ 1);
464 for (j
= 0; j
< nedges
; j
++)
465 includes
[i
][j
] = edge
[j
];
466 includes
[i
][nedges
] = -1;
473 includes
= transpose (includes
, ngotos
);
479 compute_FOLLOWS (void)
485 for (i
= 0; i
< ngotos
; i
++)
493 compute_lookaheads (void)
498 for (i
= 0; i
< nLA
; i
++)
499 for (sp
= lookback
[i
]; sp
; sp
= sp
->next
)
500 bitset_or (LA
[i
], LA
[i
], F
[sp
->value
]);
503 for (i
= 0; i
< nLA
; i
++)
504 LIST_FREE (shorts
, lookback
[i
]);
511 /*-------------------------------------------------------------.
512 | Count the number of lookaheads required for each state |
513 | (NLOOKAHEADS member). Compute the total number of LA, NLA. |
514 `-------------------------------------------------------------*/
517 states_lookaheads_count (void)
523 for (i
= 0; i
< nstates
; i
++)
527 reductions
*rp
= states
[i
]->reductions
;
528 shifts
*sp
= states
[i
]->shifts
;
530 /* We need a lookahead either to distinguish different
531 reductions (i.e., there are two or more), or to distinguish a
532 reduction from a shift. Otherwise, it is straightforward,
533 and the state is `consistent'. */
535 || (rp
->nreds
== 1 && sp
->nshifts
&& SHIFT_IS_SHIFT (sp
, 0)))
536 nlookaheads
+= rp
->nreds
;
538 states
[i
]->consistent
= 1;
540 for (k
= 0; k
< sp
->nshifts
; k
++)
541 if (SHIFT_IS_ERROR (sp
, k
))
543 states
[i
]->consistent
= 0;
547 states
[i
]->nlookaheads
= nlookaheads
;
553 /*--------------------------------------.
554 | Initializing the lookaheads members. |
555 `--------------------------------------*/
558 states_lookaheads_initialize (void)
562 rule_t
**pLArule
= LArule
;
564 /* Initialize the members LOOKAHEADS and LOOKAHEADS_RULE for each
566 for (i
= 0; i
< nstates
; i
++)
568 states
[i
]->lookaheads
= pLA
;
569 states
[i
]->lookaheads_rule
= pLArule
;
570 pLA
+= states
[i
]->nlookaheads
;
571 pLArule
+= states
[i
]->nlookaheads
;
576 /*---------------------------------------.
577 | Output the lookaheads for each state. |
578 `---------------------------------------*/
581 lookaheads_print (FILE *out
)
585 fprintf (out
, "Lookaheads: BEGIN\n");
586 for (i
= 0; i
< nstates
; ++i
)
588 fprintf (out
, "State %d: %d lookaheads\n",
589 i
, states
[i
]->nlookaheads
);
591 for (j
= 0; j
< states
[i
]->nlookaheads
; ++j
)
592 for (k
= 0; k
< ntokens
; ++k
)
593 if (bitset_test (states
[i
]->lookaheads
[j
], k
))
594 fprintf (out
, " on %d (%s) -> rule %d\n",
595 k
, symbol_tag_get (symbols
[k
]),
596 states
[i
]->lookaheads_rule
[j
]->number
- 1);
598 fprintf (out
, "Lookaheads: END\n");
604 states_lookaheads_count ();
606 states_lookaheads_initialize ();
611 compute_lookaheads ();
614 lookaheads_print (stderr
);