]> git.saurik.com Git - bison.git/blame - src/output.c
Have Bison grammars parsed by a Bison grammar.
[bison.git] / src / output.c
CommitLineData
c3e23647 1/* Output the generated parsing program for bison,
5bb18f9a 2 Copyright (C) 1984, 1986, 1989, 1992, 2000, 2001, 2002
255ef638 3 Free Software Foundation, Inc.
c3e23647 4
9ee3c97b 5 This file is part of Bison, the GNU Compiler Compiler.
c3e23647 6
9ee3c97b
AD
7 Bison is free software; you can redistribute it and/or modify it
8 under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2, or (at your option)
10 any later version.
c3e23647 11
9ee3c97b
AD
12 Bison is distributed in the hope that it will be useful, but
13 WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 General Public License for more details.
c3e23647 16
9ee3c97b
AD
17 You should have received a copy of the GNU General Public License
18 along with Bison; see the file COPYING. If not, write to the Free
19 Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
20 02111-1307, USA. */
c3e23647
RS
21
22
255ef638
AD
23/* The parser tables consist of these tables. Marked ones needed only
24 for the semantic parser. Double marked are output only if switches
25 are set.
c3e23647 26
255ef638
AD
27 YYTRANSLATE = vector mapping yylex's token numbers into bison's
28 token numbers.
c3e23647 29
255ef638 30 ++ YYTNAME = vector of string-names indexed by bison token number.
c3e23647 31
255ef638
AD
32 ++ YYTOKNUM = vector of yylex token numbers corresponding to
33 entries in YYTNAME.
c3e23647 34
255ef638
AD
35 YYRLINE = vector of line-numbers of all rules. For yydebug
36 printouts.
c3e23647 37
255ef638
AD
38 YYRHS = vector of items of all rules. This is exactly what RITEMS
39 contains. For yydebug and for semantic parser.
c3e23647 40
255ef638 41 YYPRHS[R] = index in YYRHS of first item for rule R.
c3e23647 42
255ef638 43 YYR1[R] = symbol number of symbol that rule R derives.
c3e23647 44
255ef638 45 YYR2[R] = number of symbols composing right hand side of rule R.
c3e23647 46
255ef638
AD
47 + YYSTOS[S] = the symbol number of the symbol that leads to state
48 S.
e372befa 49
255ef638
AD
50 YYDEFACT[S] = default rule to reduce with in state s, when YYTABLE
51 doesn't specify something else to do. Zero means the default is an
52 error.
c3e23647 53
255ef638
AD
54 YYDEFGOTO[I] = default state to go to after a reduction of a rule
55 that generates variable NTOKENS + I, except when YYTABLE specifies
56 something else to do.
c3e23647 57
255ef638
AD
58 YYPACT[S] = index in YYTABLE of the portion describing state S.
59 The lookahead token's type is used to index that portion to find
60 out what to do.
c3e23647 61
255ef638
AD
62 If the value in YYTABLE is positive, we shift the token and go to
63 that state.
c3e23647 64
6c89f1c1 65 If the value is negative, it is minus a rule number to reduce by.
c3e23647 66
255ef638
AD
67 If the value is zero, the default action from YYDEFACT[S] is used.
68
69 YYPGOTO[I] = the index in YYTABLE of the portion describing what to
70 do after reducing a rule that derives variable I + NTOKENS. This
71 portion is indexed by the parser state number, S, as of before the
72 text for this nonterminal was read. The value from YYTABLE is the
73 state to go to if the corresponding value in YYCHECK is S.
74
75 YYTABLE = a vector filled with portions for different uses, found
76 via YYPACT and YYPGOTO.
77
78 YYCHECK = a vector indexed in parallel with YYTABLE. It indicates,
79 in a roundabout way, the bounds of the portion you are trying to
80 examine.
81
82 Suppose that the portion of yytable starts at index P and the index
83 to be examined within the portion is I. Then if YYCHECK[P+I] != I,
84 I is outside the bounds of what is actually allocated, and the
85 default (from YYDEFACT or YYDEFGOTO) should be used. Otherwise,
86 YYTABLE[P+I] should be used.
87
88 YYFINAL = the state number of the termination state. YYFLAG = most
89 negative short int. Used to flag ?? */
c3e23647 90
c3e23647 91#include "system.h"
914feea9 92#include "bitsetv.h"
14d3eb9b 93#include "quotearg.h"
be2a1a68 94#include "error.h"
ceed8467 95#include "getargs.h"
c3e23647
RS
96#include "files.h"
97#include "gram.h"
b2ca4022 98#include "LR0.h"
a0f6b076 99#include "complain.h"
6c89f1c1 100#include "output.h"
720d742f 101#include "lalr.h"
a70083a3 102#include "reader.h"
ad949da9 103#include "symtab.h"
0619caf0 104#include "conflicts.h"
11d82f03 105#include "muscle_tab.h"
be2a1a68
AD
106
107/* From lib/readpipe.h. */
108FILE *readpipe PARAMS ((const char *, ...));
109
110/* From src/scan-skel.l. */
111int skel_lex PARAMS ((void));
112extern FILE *skel_in;
d019d655 113
c3e23647
RS
114static int nvectors;
115static int nentries;
342b8b6e
AD
116static short **froms = NULL;
117static short **tos = NULL;
118static short *tally = NULL;
119static short *width = NULL;
120static short *actrow = NULL;
121static short *state_count = NULL;
122static short *order = NULL;
123static short *base = NULL;
124static short *pos = NULL;
133c20e2
AD
125
126/* TABLE_SIZE is the allocated size of both TABLE and CHECK.
127 We start with the original hard-coded value: SHRT_MAX
128 (yes, not USHRT_MAX). */
129static size_t table_size = SHRT_MAX;
342b8b6e
AD
130static short *table = NULL;
131static short *check = NULL;
c3e23647
RS
132static int lowzero;
133static int high;
134
11d82f03 135struct obstack muscle_obstack;
f87685c3 136static struct obstack format_obstack;
c3e23647 137
c7925b99
MA
138int error_verbose = 0;
139
f0440388 140
133c20e2
AD
141/*----------------------------------------------------------------.
142| If TABLE (and CHECK) appear to be small to be addressed at |
143| DESIRED, grow them. Note that TABLE[DESIRED] is to be used, so |
144| the desired size is at least DESIRED + 1. |
145`----------------------------------------------------------------*/
146
147static void
148table_grow (size_t desired)
149{
150 size_t old_size = table_size;
151
152 while (table_size <= desired)
153 table_size *= 2;
154
155 if (trace_flag)
156 fprintf (stderr, "growing table and check from: %d to %d\n",
157 old_size, table_size);
158
159 table = XREALLOC (table, short, table_size);
160 check = XREALLOC (check, short, table_size);
161
162 for (/* Nothing. */; old_size < table_size; ++old_size)
163 {
164 table[old_size] = 0;
165 check[old_size] = -1;
166 }
167}
168
169
5372019f
AD
170/*-------------------------------------------------------------------.
171| Create a function NAME which associates to the muscle NAME the |
172| result of formatting the FIRST and then TABLE_DATA[BEGIN..END[ (of |
173| TYPE), and to the muscle NAME_max, the max value of the |
174| TABLE_DATA. |
175`-------------------------------------------------------------------*/
62a3e4f0 176
62a3e4f0 177
5372019f 178#define GENERATE_MUSCLE_INSERT_TABLE(Name, Type) \
5fbb0954 179 \
5372019f
AD
180static void \
181Name (const char *name, \
5fbb0954
AD
182 Type *table_data, \
183 Type first, \
184 int begin, \
185 int end) \
186{ \
0c2d3f4c 187 Type max = first; \
5fbb0954
AD
188 int i; \
189 int j = 1; \
190 \
5372019f 191 obstack_fgrow1 (&format_obstack, "%6d", first); \
5fbb0954
AD
192 for (i = begin; i < end; ++i) \
193 { \
5372019f 194 obstack_1grow (&format_obstack, ','); \
5fbb0954
AD
195 if (j >= 10) \
196 { \
5372019f 197 obstack_sgrow (&format_obstack, "\n "); \
5fbb0954
AD
198 j = 1; \
199 } \
200 else \
201 ++j; \
5372019f 202 obstack_fgrow1 (&format_obstack, "%6d", table_data[i]); \
5fbb0954
AD
203 if (table_data[i] > max) \
204 max = table_data[i]; \
205 } \
5372019f
AD
206 obstack_1grow (&format_obstack, 0); \
207 muscle_insert (name, obstack_finish (&format_obstack)); \
5fbb0954 208 \
5372019f
AD
209 /* Build `NAME_max' in the obstack. */ \
210 obstack_fgrow1 (&format_obstack, "%s_max", name); \
211 obstack_1grow (&format_obstack, 0); \
0c2d3f4c
AD
212 MUSCLE_INSERT_LONG_INT (obstack_finish (&format_obstack), \
213 (long int) max); \
62a3e4f0
AD
214}
215
5372019f
AD
216GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_unsigned_int_table, unsigned int)
217GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_short_table, short)
a49aecd5 218GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_symbol_number_table, symbol_number_t)
5372019f 219GENERATE_MUSCLE_INSERT_TABLE(muscle_insert_item_number_table, item_number_t)
c3e23647
RS
220
221
b0940840
AD
222/*-----------------------------------------------------------------.
223| Prepare the muscles related to the tokens: translate, tname, and |
224| toknum. |
225`-----------------------------------------------------------------*/
226
4a120d45 227static void
b0940840 228prepare_tokens (void)
c3e23647 229{
a49aecd5 230 muscle_insert_symbol_number_table ("translate",
5372019f
AD
231 token_translations,
232 0, 1, max_user_token_number + 1);
c3e23647 233
b0940840
AD
234 {
235 int i;
236 int j = 0;
237 for (i = 0; i < nsyms; i++)
238 {
239 /* Be sure not to use twice the same quotearg slot. */
240 const char *cp =
241 quotearg_n_style (1, c_quoting_style,
242 quotearg_style (escape_quoting_style,
243 symbols[i]->tag));
244 /* Width of the next token, including the two quotes, the coma
245 and the space. */
246 int strsize = strlen (cp) + 2;
247
248 if (j + strsize > 75)
249 {
250 obstack_sgrow (&format_obstack, "\n ");
251 j = 2;
252 }
253
254 obstack_sgrow (&format_obstack, cp);
255 obstack_sgrow (&format_obstack, ", ");
256 j += strsize;
257 }
258 /* Add a NULL entry to list of tokens (well, 0, as NULL might not be
259 defined). */
260 obstack_sgrow (&format_obstack, "0");
c3e23647 261
b0940840
AD
262 /* Finish table and store. */
263 obstack_1grow (&format_obstack, 0);
264 muscle_insert ("tname", obstack_finish (&format_obstack));
265 }
266
267 /* Output YYTOKNUM. */
b2ed6e58
AD
268 {
269 int i;
b0940840
AD
270 short *values = XCALLOC (short, ntokens + 1);
271 for (i = 0; i < ntokens + 1; ++i)
272 values[i] = symbols[i]->user_token_number;
5372019f
AD
273 muscle_insert_short_table ("toknum", values,
274 0, 1, ntokens + 1);
b0940840 275 free (values);
b2ed6e58 276 }
b0940840 277}
b2ed6e58 278
b0940840
AD
279
280/*-------------------------------------------------------------.
281| Prepare the muscles related to the rules: rhs, prhs, r1, r2, |
282| rline. |
283`-------------------------------------------------------------*/
284
285static void
286prepare_rules (void)
287{
b0940840 288 int r;
5df5f6d5 289 unsigned int i = 0;
62a3e4f0 290 item_number_t *rhs = XMALLOC (item_number_t, nritems);
5df5f6d5
AD
291 unsigned int *prhs = XMALLOC (unsigned int, nrules + 1);
292 unsigned int *rline = XMALLOC (unsigned int, nrules + 1);
a49aecd5 293 symbol_number_t *r1 = XMALLOC (symbol_number_t, nrules + 1);
5df5f6d5 294 unsigned int *r2 = XMALLOC (unsigned int, nrules + 1);
b0940840
AD
295
296 for (r = 1; r < nrules + 1; ++r)
297 {
5df5f6d5 298 item_number_t *rhsp;
b0940840
AD
299 /* Index of rule R in RHS. */
300 prhs[r] = i;
301 /* RHS of the rule R. */
302 for (rhsp = rules[r].rhs; *rhsp >= 0; ++rhsp)
303 rhs[i++] = *rhsp;
304 /* LHS of the rule R. */
305 r1[r] = rules[r].lhs->number;
306 /* Length of rule R's RHS. */
307 r2[r] = i - prhs[r];
308 /* Separator in RHS. */
309 rhs[i++] = -1;
310 /* Line where rule was defined. */
311 rline[r] = rules[r].line;
312 }
313 assert (i == nritems);
314
5372019f
AD
315 muscle_insert_item_number_table ("rhs", rhs, ritem[0], 1, nritems);
316 muscle_insert_unsigned_int_table ("prhs", prhs, 0, 1, nrules + 1);
317 muscle_insert_unsigned_int_table ("rline", rline, 0, 1, nrules + 1);
a49aecd5 318 muscle_insert_symbol_number_table ("r1", r1, 0, 1, nrules + 1);
5372019f 319 muscle_insert_unsigned_int_table ("r2", r2, 0, 1, nrules + 1);
796d61fb 320
b0940840
AD
321 free (rhs);
322 free (prhs);
5df5f6d5
AD
323 free (rline);
324 free (r1);
b0940840 325 free (r2);
c3e23647
RS
326}
327
b0940840
AD
328/*--------------------------------------------.
329| Prepare the muscles related to the states. |
330`--------------------------------------------*/
c3e23647 331
4a120d45 332static void
b0940840 333prepare_states (void)
c3e23647 334{
602bbf31 335 size_t i;
a49aecd5
AD
336 symbol_number_t *values =
337 (symbol_number_t *) alloca (sizeof (symbol_number_t) * nstates);
9703cc49 338 for (i = 0; i < nstates; ++i)
29e88316 339 values[i] = states[i]->accessing_symbol;
a49aecd5 340 muscle_insert_symbol_number_table ("stos", values,
5372019f 341 0, 1, nstates);
c3e23647
RS
342}
343
344
6c89f1c1
AD
345/*------------------------------------------------------------------.
346| Decide what to do for each type of token if seen as the lookahead |
347| token in specified state. The value returned is used as the |
348| default action (yydefact) for the state. In addition, actrow is |
349| filled with what to do for each kind of token, index by symbol |
350| number, with zero meaning do the default action. The value |
62a3e4f0 351| SHRT_MIN, a very negative number, means this situation is an |
6c89f1c1
AD
352| error. The parser recognizes this value specially. |
353| |
354| This is where conflicts are resolved. The loop over lookahead |
355| rules considered lower-numbered rules last, and the last rule |
356| considered that likes a token gets to handle it. |
357`------------------------------------------------------------------*/
c3e23647 358
4a120d45 359static int
f9507c28 360action_row (state_t *state)
c3e23647 361{
6c89f1c1 362 int i;
837491d8 363 int default_rule = 0;
f9507c28 364 reductions *redp = state->reductions;
f9507c28
AD
365 shifts *shiftp = state->shifts;
366 errs *errp = state->errs;
837491d8
AD
367 /* set nonzero to inhibit having any default reduction */
368 int nodefault = 0;
c3e23647
RS
369
370 for (i = 0; i < ntokens; i++)
371 actrow[i] = 0;
372
80dac38c 373 if (redp->nreds >= 1)
c3e23647 374 {
837491d8
AD
375 int j;
376 /* loop over all the rules available here which require
377 lookahead */
f9507c28 378 for (i = state->nlookaheads - 1; i >= 0; --i)
837491d8
AD
379 /* and find each token which the rule finds acceptable
380 to come next */
381 for (j = 0; j < ntokens; j++)
382 /* and record this rule as the rule to use if that
383 token follows. */
602bbf31 384 if (bitset_test (LA[state->lookaheadsp + i], j))
b0299a2e 385 actrow[j] = -LArule[state->lookaheadsp + i]->number;
c3e23647
RS
386 }
387
36281465
AD
388 /* Now see which tokens are allowed for shifts in this state. For
389 them, record the shift as the thing to do. So shift is preferred
390 to reduce. */
d954473d 391 for (i = 0; i < shiftp->nshifts; i++)
c3e23647 392 {
a49aecd5 393 symbol_number_t symbol;
837491d8 394 int shift_state = shiftp->shifts[i];
d954473d
AD
395 if (!shift_state)
396 continue;
c3e23647 397
29e88316 398 symbol = states[shift_state]->accessing_symbol;
c3e23647 399
d954473d
AD
400 if (ISVAR (symbol))
401 break;
c3e23647 402
d954473d 403 actrow[symbol] = shift_state;
c3e23647 404
d954473d
AD
405 /* Do not use any default reduction if there is a shift for
406 error */
007a50a4 407 if (symbol == errtoken->number)
d954473d 408 nodefault = 1;
c3e23647
RS
409 }
410
36281465 411 /* See which tokens are an explicit error in this state (due to
62a3e4f0 412 %nonassoc). For them, record SHRT_MIN as the action. */
2cec70b9
AD
413 for (i = 0; i < errp->nerrs; i++)
414 {
415 int symbol = errp->errs[i];
62a3e4f0 416 actrow[symbol] = SHRT_MIN;
2cec70b9 417 }
c3e23647 418
36281465
AD
419 /* Now find the most common reduction and make it the default action
420 for this state. */
c3e23647 421
80dac38c 422 if (redp->nreds >= 1 && !nodefault)
c3e23647 423 {
f9507c28 424 if (state->consistent)
c3e23647
RS
425 default_rule = redp->rules[0];
426 else
427 {
7a5350ba 428 int max = 0;
f9507c28 429 for (i = 0; i < state->nlookaheads; i++)
c3e23647 430 {
7a5350ba 431 int count = 0;
b0299a2e 432 int rule = -LArule[state->lookaheadsp + i]->number;
837491d8 433 int j;
9ee3c97b 434
c3e23647 435 for (j = 0; j < ntokens; j++)
837491d8
AD
436 if (actrow[j] == rule)
437 count++;
9ee3c97b 438
c3e23647
RS
439 if (count > max)
440 {
441 max = count;
442 default_rule = rule;
443 }
444 }
9ee3c97b 445
c3e23647
RS
446 /* actions which match the default are replaced with zero,
447 which means "use the default" */
9ee3c97b 448
c3e23647
RS
449 if (max > 0)
450 {
837491d8 451 int j;
c3e23647 452 for (j = 0; j < ntokens; j++)
837491d8
AD
453 if (actrow[j] == default_rule)
454 actrow[j] = 0;
9ee3c97b 455
ceed8467 456 default_rule = -default_rule;
c3e23647
RS
457 }
458 }
459 }
460
461 /* If have no default rule, the default is an error.
462 So replace any action which says "error" with "use default". */
463
464 if (default_rule == 0)
837491d8 465 for (i = 0; i < ntokens; i++)
62a3e4f0 466 if (actrow[i] == SHRT_MIN)
837491d8 467 actrow[i] = 0;
c3e23647 468
36281465 469 return default_rule;
c3e23647
RS
470}
471
472
4a120d45 473static void
d2729d44 474save_row (int state)
c3e23647 475{
6c89f1c1
AD
476 int i;
477 int count;
478 short *sp;
479 short *sp1;
480 short *sp2;
c3e23647
RS
481
482 count = 0;
483 for (i = 0; i < ntokens; i++)
796d61fb
AD
484 if (actrow[i] != 0)
485 count++;
c3e23647
RS
486
487 if (count == 0)
488 return;
489
d7913476
AD
490 froms[state] = sp1 = sp = XCALLOC (short, count);
491 tos[state] = sp2 = XCALLOC (short, count);
c3e23647
RS
492
493 for (i = 0; i < ntokens; i++)
796d61fb
AD
494 if (actrow[i] != 0)
495 {
496 *sp1++ = i;
497 *sp2++ = actrow[i];
498 }
c3e23647
RS
499
500 tally[state] = count;
501 width[state] = sp1[-1] - sp[0] + 1;
502}
503
504
6c89f1c1
AD
505/*------------------------------------------------------------------.
506| Figure out the actions for the specified state, indexed by |
507| lookahead token type. |
508| |
f2acea59
AD
509| The YYDEFACT table is output now. The detailed info is saved for |
510| putting into YYTABLE later. |
6c89f1c1 511`------------------------------------------------------------------*/
c3e23647 512
4a120d45 513static void
6c89f1c1 514token_actions (void)
c3e23647 515{
602bbf31 516 size_t i;
d7913476 517 short *yydefact = XCALLOC (short, nstates);
c3e23647 518
d7913476 519 actrow = XCALLOC (short, ntokens);
f2acea59 520 for (i = 0; i < nstates; ++i)
c3e23647 521 {
29e88316 522 yydefact[i] = action_row (states[i]);
6c89f1c1 523 save_row (i);
c3e23647 524 }
bbb5bcc6 525
5372019f
AD
526 muscle_insert_short_table ("defact", yydefact,
527 yydefact[0], 1, nstates);
26f609ff 528 XFREE (actrow);
d7913476 529 XFREE (yydefact);
c3e23647
RS
530}
531
532
3f96f4dc
AD
533/*-----------------------------.
534| Output the actions to OOUT. |
535`-----------------------------*/
536
9b3add5b 537void
be2a1a68 538actions_output (FILE *out)
3f96f4dc
AD
539{
540 int rule;
541 for (rule = 1; rule < nrules + 1; ++rule)
1a2b5d37 542 if (rules[rule].action)
3f96f4dc 543 {
ea52d706 544 fprintf (out, " case %d:\n", rule);
3f96f4dc
AD
545
546 if (!no_lines_flag)
ea52d706 547 fprintf (out, muscle_find ("linef"),
1a2b5d37 548 rules[rule].action_line,
ea52d706
AD
549 quotearg_style (c_quoting_style,
550 muscle_find ("filename")));
e9955c83
AD
551 fprintf (out, " %s\n break;\n\n",
552 rules[rule].action);
3f96f4dc
AD
553 }
554}
555
556
091e20bb
AD
557/*---------------------------------------.
558| Output the tokens definition to OOUT. |
559`---------------------------------------*/
560
9b3add5b 561void
be2a1a68 562token_definitions_output (FILE *out)
091e20bb
AD
563{
564 int i;
0d8bed56 565 int first = 1;
091e20bb
AD
566 for (i = 0; i < ntokens; ++i)
567 {
db8837cb 568 symbol_t *symbol = symbols[i];
091e20bb
AD
569 int number = symbol->user_token_number;
570
b87f8b21
AD
571 /* At this stage, if there are literal aliases, they are part of
572 SYMBOLS, so we should not find symbols which are the aliases
573 here. */
574 assert (number != USER_NUMBER_ALIAS);
575
091e20bb 576 /* Skip error token. */
007a50a4 577 if (symbol == errtoken)
091e20bb 578 continue;
b87f8b21
AD
579
580 /* If this string has an alias, then it is necessarily the alias
581 which is to be output. */
582 if (symbol->alias)
583 symbol = symbol->alias;
584
585 /* Don't output literal chars or strings (when defined only as a
586 string). Note that must be done after the alias resolution:
587 think about `%token 'f' "f"'. */
588 if (symbol->tag[0] == '\'' || symbol->tag[0] == '\"')
589 continue;
091e20bb
AD
590
591 /* Don't #define nonliteral tokens whose names contain periods
592 or '$' (as does the default value of the EOF token). */
593 if (strchr (symbol->tag, '.') || strchr (symbol->tag, '$'))
594 continue;
595
83ccf991 596 fprintf (out, "%s[[[%s]], [%d]]",
0d8bed56 597 first ? "" : ",\n", symbol->tag, number);
b87f8b21 598
0d8bed56 599 first = 0;
091e20bb
AD
600 }
601}
602
603
4a120d45 604static void
d2729d44 605save_column (int symbol, int default_state)
c3e23647 606{
6c89f1c1 607 int i;
6c89f1c1
AD
608 short *sp;
609 short *sp1;
610 short *sp2;
611 int count;
837491d8 612 int symno = symbol - ntokens + nstates;
c3e23647 613
43591cec
AD
614 short begin = goto_map[symbol];
615 short end = goto_map[symbol + 1];
c3e23647
RS
616
617 count = 0;
43591cec 618 for (i = begin; i < end; i++)
796d61fb
AD
619 if (to_state[i] != default_state)
620 count++;
c3e23647
RS
621
622 if (count == 0)
623 return;
624
d7913476
AD
625 froms[symno] = sp1 = sp = XCALLOC (short, count);
626 tos[symno] = sp2 = XCALLOC (short, count);
c3e23647 627
43591cec 628 for (i = begin; i < end; i++)
796d61fb
AD
629 if (to_state[i] != default_state)
630 {
631 *sp1++ = from_state[i];
632 *sp2++ = to_state[i];
633 }
c3e23647
RS
634
635 tally[symno] = count;
636 width[symno] = sp1[-1] - sp[0] + 1;
637}
638
6c89f1c1
AD
639static int
640default_goto (int symbol)
641{
602bbf31
AD
642 size_t i;
643 size_t m = goto_map[symbol];
644 size_t n = goto_map[symbol + 1];
837491d8
AD
645 int default_state = -1;
646 int max = 0;
6c89f1c1
AD
647
648 if (m == n)
649 return -1;
650
651 for (i = 0; i < nstates; i++)
652 state_count[i] = 0;
653
654 for (i = m; i < n; i++)
655 state_count[to_state[i]]++;
656
6c89f1c1 657 for (i = 0; i < nstates; i++)
796d61fb
AD
658 if (state_count[i] > max)
659 {
660 max = state_count[i];
661 default_state = i;
662 }
6c89f1c1
AD
663
664 return default_state;
665}
666
667
668/*-------------------------------------------------------------------.
669| Figure out what to do after reducing with each rule, depending on |
670| the saved state from before the beginning of parsing the data that |
671| matched this rule. |
672| |
673| The YYDEFGOTO table is output now. The detailed info is saved for |
674| putting into YYTABLE later. |
675`-------------------------------------------------------------------*/
676
677static void
678goto_actions (void)
679{
43591cec 680 int i;
bbb5bcc6 681 short *yydefgoto = XMALLOC (short, nsyms - ntokens);
bbb5bcc6 682
26f609ff 683 state_count = XCALLOC (short, nstates);
43591cec 684 for (i = ntokens; i < nsyms; ++i)
6c89f1c1 685 {
43591cec
AD
686 int default_state = default_goto (i);
687 save_column (i, default_state);
688 yydefgoto[i - ntokens] = default_state;
6c89f1c1
AD
689 }
690
5372019f
AD
691 muscle_insert_short_table ("defgoto", yydefgoto,
692 yydefgoto[0], 1, nsyms - ntokens);
d7913476 693 XFREE (state_count);
43591cec 694 XFREE (yydefgoto);
6c89f1c1 695}
c3e23647
RS
696
697
9ee3c97b
AD
698/* The next few functions decide how to pack the actions and gotos
699 information into yytable. */
c3e23647 700
4a120d45 701static void
d2729d44 702sort_actions (void)
c3e23647 703{
6c89f1c1 704 int i;
c3e23647 705
d7913476 706 order = XCALLOC (short, nvectors);
c3e23647
RS
707 nentries = 0;
708
709 for (i = 0; i < nvectors; i++)
796d61fb
AD
710 if (tally[i] > 0)
711 {
837491d8
AD
712 int k;
713 int t = tally[i];
714 int w = width[i];
715 int j = nentries - 1;
c3e23647 716
796d61fb
AD
717 while (j >= 0 && (width[order[j]] < w))
718 j--;
c3e23647 719
796d61fb
AD
720 while (j >= 0 && (width[order[j]] == w) && (tally[order[j]] < t))
721 j--;
c3e23647 722
796d61fb
AD
723 for (k = nentries - 1; k > j; k--)
724 order[k + 1] = order[k];
c3e23647 725
796d61fb
AD
726 order[j + 1] = i;
727 nentries++;
728 }
c3e23647
RS
729}
730
731
4a120d45 732static int
d2729d44 733matching_state (int vector)
c3e23647 734{
837491d8 735 int i = order[vector];
6c89f1c1
AD
736 int t;
737 int w;
6c89f1c1 738 int prev;
c3e23647 739
602bbf31 740 if (i >= (int) nstates)
36281465 741 return -1;
c3e23647
RS
742
743 t = tally[i];
744 w = width[i];
745
746 for (prev = vector - 1; prev >= 0; prev--)
747 {
837491d8
AD
748 int j = order[prev];
749 int k;
750 int match = 1;
751
c3e23647 752 if (width[j] != w || tally[j] != t)
36281465 753 return -1;
c3e23647 754
c3e23647 755 for (k = 0; match && k < t; k++)
796d61fb
AD
756 if (tos[j][k] != tos[i][k] || froms[j][k] != froms[i][k])
757 match = 0;
c3e23647
RS
758
759 if (match)
36281465 760 return j;
c3e23647
RS
761 }
762
36281465 763 return -1;
c3e23647
RS
764}
765
766
4a120d45 767static int
d2729d44 768pack_vector (int vector)
c3e23647 769{
837491d8 770 int i = order[vector];
6c89f1c1 771 int j;
837491d8 772 int t = tally[i];
6c89f1c1 773 int loc = 0;
837491d8
AD
774 short *from = froms[i];
775 short *to = tos[i];
c3e23647 776
340ef489 777 assert (t);
c3e23647 778
133c20e2 779 for (j = lowzero - from[0]; j < (int) table_size; j++)
c3e23647 780 {
837491d8
AD
781 int k;
782 int ok = 1;
c3e23647
RS
783
784 for (k = 0; ok && k < t; k++)
785 {
786 loc = j + from[k];
133c20e2
AD
787 if (loc > (int) table_size)
788 table_grow (loc);
c3e23647
RS
789
790 if (table[loc] != 0)
791 ok = 0;
792 }
793
794 for (k = 0; ok && k < vector; k++)
796d61fb
AD
795 if (pos[k] == j)
796 ok = 0;
c3e23647
RS
797
798 if (ok)
799 {
800 for (k = 0; k < t; k++)
801 {
802 loc = j + from[k];
803 table[loc] = to[k];
804 check[loc] = from[k];
805 }
806
807 while (table[lowzero] != 0)
808 lowzero++;
809
810 if (loc > high)
811 high = loc;
812
36281465 813 return j;
c3e23647
RS
814 }
815 }
275fc3ad
AD
816#define pack_vector_succeeded 0
817 assert (pack_vector_succeeded);
3843c413 818 return 0;
c3e23647
RS
819}
820
821
6c89f1c1
AD
822static void
823pack_table (void)
824{
825 int i;
826 int place;
827 int state;
828
d7913476
AD
829 base = XCALLOC (short, nvectors);
830 pos = XCALLOC (short, nentries);
133c20e2
AD
831 table = XCALLOC (short, table_size);
832 check = XCALLOC (short, table_size);
6c89f1c1
AD
833
834 lowzero = 0;
835 high = 0;
836
837 for (i = 0; i < nvectors; i++)
62a3e4f0 838 base[i] = SHRT_MIN;
6c89f1c1 839
133c20e2 840 for (i = 0; i < (int) table_size; i++)
6c89f1c1
AD
841 check[i] = -1;
842
843 for (i = 0; i < nentries; i++)
844 {
845 state = matching_state (i);
846
847 if (state < 0)
848 place = pack_vector (i);
849 else
850 place = base[state];
851
852 pos[i] = place;
853 base[order[i]] = place;
854 }
855
856 for (i = 0; i < nvectors; i++)
857 {
796d61fb
AD
858 XFREE (froms[i]);
859 XFREE (tos[i]);
6c89f1c1
AD
860 }
861
d7913476
AD
862 XFREE (froms);
863 XFREE (tos);
864 XFREE (pos);
6c89f1c1 865}
c3e23647
RS
866
867/* the following functions output yytable, yycheck
868 and the vectors whose elements index the portion starts */
869
4a120d45 870static void
d2729d44 871output_base (void)
c3e23647 872{
26f609ff 873 /* Output pact. */
5372019f
AD
874 muscle_insert_short_table ("pact", base,
875 base[0], 1, nstates);
c3e23647 876
26f609ff 877 /* Output pgoto. */
5372019f
AD
878 muscle_insert_short_table ("pgoto", base,
879 base[nstates], nstates + 1, nvectors);
d7913476 880 XFREE (base);
c3e23647
RS
881}
882
883
4a120d45 884static void
d2729d44 885output_table (void)
c3e23647 886{
5372019f
AD
887 muscle_insert_short_table ("table", table,
888 table[0], 1, high + 1);
d7913476 889 XFREE (table);
c3e23647
RS
890}
891
892
4a120d45 893static void
d2729d44 894output_check (void)
c3e23647 895{
5372019f
AD
896 muscle_insert_short_table ("check", check,
897 check[0], 1, high + 1);
d7913476 898 XFREE (check);
c3e23647
RS
899}
900
b0940840
AD
901/*-----------------------------------------------------------------.
902| Compute and output yydefact, yydefgoto, yypact, yypgoto, yytable |
903| and yycheck. |
904`-----------------------------------------------------------------*/
6c89f1c1
AD
905
906static void
907output_actions (void)
908{
602bbf31 909 size_t i;
6c89f1c1 910 nvectors = nstates + nvars;
c3e23647 911
d7913476
AD
912 froms = XCALLOC (short *, nvectors);
913 tos = XCALLOC (short *, nvectors);
914 tally = XCALLOC (short, nvectors);
915 width = XCALLOC (short, nvectors);
6c89f1c1
AD
916
917 token_actions ();
914feea9 918 bitsetv_free (LA);
b0299a2e 919 free (LArule);
6c89f1c1
AD
920
921 goto_actions ();
d7913476
AD
922 XFREE (goto_map + ntokens);
923 XFREE (from_state);
924 XFREE (to_state);
6c89f1c1
AD
925
926 sort_actions ();
927 pack_table ();
4e5caae2 928
6c89f1c1
AD
929 output_base ();
930 output_table ();
4e5caae2 931
6c89f1c1 932 output_check ();
49701457
AD
933
934 for (i = 0; i < nstates; ++i)
935 {
29e88316
AD
936 free (states[i]->shifts);
937 XFREE (states[i]->reductions);
938 free (states[i]->errs);
939 free (states[i]);
49701457 940 }
29e88316 941 XFREE (states);
6c89f1c1 942}
c3e23647 943
652def80 944\f
1239777d
AD
945/*---------------------------.
946| Call the skeleton parser. |
947`---------------------------*/
c3e23647 948
4a120d45 949static void
1239777d 950output_skeleton (void)
9b3add5b 951{
be2a1a68 952 /* Store the definition of all the muscles. */
d0039cbc 953 const char *tempdir = getenv ("TMPDIR");
381fb12e
AD
954 char *tempfile = NULL;
955 FILE *out = NULL;
381fb12e
AD
956 int fd;
957
958 if (tempdir == NULL)
959 tempdir = DEFAULT_TMPDIR;
960 tempfile = xmalloc (strlen (tempdir) + 11);
961 sprintf (tempfile, "%s/bsnXXXXXX", tempdir);
962 fd = mkstemp (tempfile);
963 if (fd == -1)
964 error (EXIT_FAILURE, errno, "%s", tempfile);
965
966 out = fdopen (fd, "w");
967 if (out == NULL)
968 error (EXIT_FAILURE, errno, "%s", tempfile);
969
970 /* There are no comments, especially not `#': we do want M4 expansion
971 after `#': think of CPP macros! */
972 fputs ("m4_changecom()\n", out);
973 fputs ("m4_init()\n", out);
974
975 fputs ("m4_define([b4_actions], \n[[", out);
976 actions_output (out);
977 fputs ("]])\n\n", out);
978
0d8bed56 979 fputs ("m4_define([b4_tokens], \n[", out);
381fb12e 980 token_definitions_output (out);
0d8bed56 981 fputs ("])\n\n", out);
be2a1a68 982
381fb12e 983 muscles_m4_output (out);
be2a1a68 984
381fb12e
AD
985 fputs ("m4_wrap([m4_divert_pop(0)])\n", out);
986 fputs ("m4_divert_push(0)dnl\n", out);
987 xfclose (out);
be2a1a68
AD
988
989 /* Invoke m4 on the definition of the muscles, and the skeleton. */
990 {
991 const char *bison_pkgdatadir = getenv ("BISON_PKGDATADIR");
abe017f6 992 const char *m4 = getenv ("M4");
7067cb36
PH
993 int pkg_data_len;
994 char *full_skeleton;
995
abe017f6
AD
996 if (!m4)
997 m4 = M4;
be2a1a68
AD
998 if (!bison_pkgdatadir)
999 bison_pkgdatadir = PKGDATADIR;
7067cb36 1000 pkg_data_len = strlen (bison_pkgdatadir);
670ddffd 1001 full_skeleton = XMALLOC (char, pkg_data_len + strlen (skeleton) + 2);
7067cb36
PH
1002 if (bison_pkgdatadir[pkg_data_len-1] == '/')
1003 sprintf (full_skeleton, "%s%s", bison_pkgdatadir, skeleton);
1004 else
1005 sprintf (full_skeleton, "%s/%s", bison_pkgdatadir, skeleton);
381fb12e
AD
1006 if (trace_flag)
1007 fprintf (stderr,
abe017f6 1008 "running: %s -I %s m4sugar/m4sugar.m4 %s %s\n",
7067cb36 1009 m4, bison_pkgdatadir, tempfile, full_skeleton);
abe017f6
AD
1010 skel_in = readpipe (m4,
1011 "-I", bison_pkgdatadir,
be2a1a68 1012 "m4sugar/m4sugar.m4",
381fb12e 1013 tempfile,
7067cb36 1014 full_skeleton,
be2a1a68 1015 NULL);
7067cb36 1016 XFREE (full_skeleton);
be2a1a68
AD
1017 if (!skel_in)
1018 error (EXIT_FAILURE, errno, "cannot run m4");
1019 skel_lex ();
381fb12e
AD
1020
1021 /* If `debugging', keep this file alive. */
1022 if (!trace_flag)
1023 unlink (tempfile);
be2a1a68 1024 }
26f609ff
RA
1025}
1026
1027static void
1028prepare (void)
1029{
11d82f03 1030 MUSCLE_INSERT_INT ("last", high);
62a3e4f0 1031 MUSCLE_INSERT_INT ("flag", SHRT_MIN);
11d82f03
MA
1032 MUSCLE_INSERT_INT ("pure", pure_parser);
1033 MUSCLE_INSERT_INT ("nsym", nsyms);
1034 MUSCLE_INSERT_INT ("debug", debug_flag);
1035 MUSCLE_INSERT_INT ("final", final_state);
007a50a4
AD
1036 MUSCLE_INSERT_INT ("undef_token_number", undeftoken->number);
1037 MUSCLE_INSERT_INT ("user_token_number_max", max_user_token_number);
be2a1a68 1038 MUSCLE_INSERT_INT ("error_verbose", error_verbose);
b5b61c61 1039 MUSCLE_INSERT_STRING ("prefix", spec_name_prefix ? spec_name_prefix : "yy");
11d82f03 1040
b85810ae
AD
1041 /* FIXME: This is wrong: the muscles should decide whether they hold
1042 a copy or not, but the situation is too obscure currently. */
be2a1a68
AD
1043 MUSCLE_INSERT_STRING ("output_infix", output_infix ? output_infix : "");
1044 MUSCLE_INSERT_STRING ("output_prefix", short_base_name);
1045 MUSCLE_INSERT_STRING ("output_parser_name", parser_file_name);
1046 MUSCLE_INSERT_STRING ("output_header_name", spec_defines_file);
b85810ae 1047
11d82f03
MA
1048 MUSCLE_INSERT_INT ("nnts", nvars);
1049 MUSCLE_INSERT_INT ("nrules", nrules);
1050 MUSCLE_INSERT_INT ("nstates", nstates);
1051 MUSCLE_INSERT_INT ("ntokens", ntokens);
1052
be2a1a68
AD
1053 MUSCLE_INSERT_INT ("locations_flag", locations_flag);
1054 MUSCLE_INSERT_INT ("defines_flag", defines_flag);
381fb12e
AD
1055
1056 /* Copy definitions in directive. */
0dd1580a
RA
1057 obstack_1grow (&pre_prologue_obstack, 0);
1058 obstack_1grow (&post_prologue_obstack, 0);
1059 muscle_insert ("pre_prologue", obstack_finish (&pre_prologue_obstack));
1060 muscle_insert ("post_prologue", obstack_finish (&post_prologue_obstack));
381fb12e
AD
1061
1062 /* Find the right skeleton file. */
1063 if (!skeleton)
fdbcd8e2 1064 skeleton = "bison.simple";
381fb12e
AD
1065
1066 /* Parse the skeleton file and output the needed parsers. */
1067 muscle_insert ("skeleton", skeleton);
26f609ff 1068}
c3e23647 1069
93ede233 1070
6c89f1c1
AD
1071/*----------------------------------------------------------.
1072| Output the parsing tables and the parser code to ftable. |
1073`----------------------------------------------------------*/
c3e23647 1074
6c89f1c1
AD
1075void
1076output (void)
1077{
f87685c3 1078 obstack_init (&format_obstack);
dd60faec 1079
b0940840
AD
1080 prepare_tokens ();
1081 prepare_rules ();
1082 prepare_states ();
6c89f1c1 1083 output_actions ();
342b8b6e 1084
26f609ff 1085 prepare ();
652def80 1086
9b3add5b
RA
1087 /* Process the selected skeleton file. */
1088 output_skeleton ();
1089
f499b062
AD
1090 obstack_free (&muscle_obstack, NULL);
1091 obstack_free (&format_obstack, NULL);
1092 obstack_free (&action_obstack, NULL);
0dd1580a
RA
1093 obstack_free (&pre_prologue_obstack, NULL);
1094 obstack_free (&post_prologue_obstack, NULL);
c3e23647 1095}