src/reader.c

   1 /* Input parser for bison
   2    Copyright (C) 1984, 1986, 1989, 1992 Free Software Foundation, Inc.
   3
   4 This file is part of Bison, the GNU Compiler Compiler.
   5
   6 Bison is free software; you can redistribute it and/or modify
   7 it under the terms of the GNU General Public License as published by
   8 the Free Software Foundation; either version 2, or (at your option)
   9 any later version.
  10
  11 Bison is distributed in the hope that it will be useful,
  12 but WITHOUT ANY WARRANTY; without even the implied warranty of
  13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
  14 GNU General Public License for more details.
  15
  16 You should have received a copy of the GNU General Public License
  17 along with Bison; see the file COPYING.  If not, write to
  18 the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.  */
  19
  20
  21 /* read in the grammar specification and record it in the format described in gram.h.
  22   All guards are copied into the fguard file and all actions into faction,
  23   in each case forming the body of a C function (yyguard or yyaction)
  24   which contains a switch statement to decide which guard or action to execute.
  25
  26 The entry point is reader().  */
  27
  28 #include <stdio.h>
  29 #include <ctype.h>
  30 #include "system.h"
  31 #include "files.h"
  32 #include "alloc.h"
  33 #include "symtab.h"
  34 #include "lex.h"
  35 #include "gram.h"
  36 #include "machine.h"
  37
  38 #define LTYPESTR        "\n#ifndef YYLTYPE\ntypedef\n  struct yyltype\n\
  39     {\n      int timestamp;\n      int first_line;\n      int first_column;\
  40 \n      int last_line;\n      int last_column;\n      char *text;\n   }\n\
  41   yyltype;\n\n#define YYLTYPE yyltype\n#endif\n\n"
  42
  43 /* Number of slots allocated (but not necessarily used yet) in `rline'  */
  44 int rline_allocated;
  45
  46 extern char *program_name;
  47 extern int definesflag;
  48 extern int nolinesflag;
  49 extern int noparserflag;
  50 extern int rawtoknumflag;
  51 extern bucket *symval;
  52 extern int numval;
  53 extern int expected_conflicts;
  54 extern char *token_buffer;
  55
  56 extern void init_lex();
  57 extern void tabinit();
  58 extern void output_headers();
  59 extern void output_trailers();
  60 extern void free_symtab();
  61 extern void open_extra_files();
  62 extern char *int_to_string();
  63 extern void fatal();
  64 extern void fatals();
  65 extern void warn();
  66 extern void warni();
  67 extern void warns();
  68 extern void warnss();
  69 extern void warnsss();
  70 extern void unlex();
  71 extern void done();
  72
  73 extern int skip_white_space();
  74 extern int parse_percent_token();
  75 extern int lex();
  76
  77 void reader_output_yylsp();
  78 void read_declarations();
  79 void copy_definition();
  80 void parse_token_decl();
  81 void parse_start_decl();
  82 void parse_type_decl();
  83 void parse_assoc_decl();
  84 void parse_union_decl();
  85 void parse_expect_decl();
  86 void parse_thong_decl();
  87 void copy_action();
  88 void readgram();
  89 void record_rule_line();
  90 void packsymbols();
  91 void output_token_defines();
  92 void packgram();
  93 int read_signed_integer();
  94 static int get_type();
  95
  96 typedef
  97   struct symbol_list
  98     {
  99       struct symbol_list *next;
 100       bucket *sym;
 101       bucket *ruleprec;
 102     }
 103   symbol_list;
 104
 105
 106
 107 int lineno;
 108 symbol_list *grammar;
 109 int start_flag;
 110 bucket *startval;
 111 char **tags;
 112 int *user_toknums;
 113
 114 /* Nonzero if components of semantic values are used, implying
 115    they must be unions.  */
 116 static int value_components_used;
 117
 118 static int typed;  /* nonzero if %union has been seen.  */
 119
 120 static int lastprec;  /* incremented for each %left, %right or %nonassoc seen */
 121
 122 static int gensym_count;  /* incremented for each generated symbol */
 123
 124 static bucket *errtoken;
 125
 126 /* Nonzero if any action or guard uses the @n construct.  */
 127 static int yylsp_needed;
 128
 129 extern char *version_string;
 130
 131
 132 static void
 133 skip_to_char(target)
 134      int target;
 135 {
 136   int c;
 137   if (target == '\n')
 138     warn(_("   Skipping to next \\n"));
 139   else
 140     warni(_("   Skipping to next %c"), target);
 141
 142   do
 143     c = skip_white_space();
 144   while (c != target && c != EOF);
 145   if (c != EOF)
 146     ungetc(c, finput);
 147 }
 148
 149
 150 void
 151 reader()
 152 {
 153   start_flag = 0;
 154   startval = NULL;  /* start symbol not specified yet. */
 155
 156 #if 0
 157   translations = 0;  /* initially assume token number translation not needed.  */
 158 #endif
 159   /* Nowadays translations is always set to 1,
 160      since we give `error' a user-token-number
 161      to satisfy the Posix demand for YYERRCODE==256.  */
 162   translations = 1;
 163
 164   nsyms = 1;
 165   nvars = 0;
 166   nrules = 0;
 167   nitems = 0;
 168   rline_allocated = 10;
 169   rline = NEW2(rline_allocated, short);
 170
 171   typed = 0;
 172   lastprec = 0;
 173
 174   gensym_count = 0;
 175
 176   semantic_parser = 0;
 177   pure_parser = 0;
 178   yylsp_needed = 0;
 179
 180   grammar = NULL;
 181
 182   init_lex();
 183   lineno = 1;
 184
 185   /* initialize the symbol table.  */
 186   tabinit();
 187   /* construct the error token */
 188   errtoken = getsym("error");
 189   errtoken->class = STOKEN;
 190   errtoken->user_token_number = 256; /* Value specified by posix.  */
 191   /* construct a token that represents all undefined literal tokens. */
 192   /* it is always token number 2.  */
 193   getsym("$undefined.")->class = STOKEN;
 194   /* Read the declaration section.  Copy %{ ... %} groups to ftable and fdefines file.
 195      Also notice any %token, %left, etc. found there.  */
 196   if (noparserflag)
 197     fprintf(ftable, "\n/*  Bison-generated parse tables, made from %s\n",
 198                 infile);
 199   else
 200     fprintf(ftable, "\n/*  A Bison parser, made from %s\n", infile);
 201   fprintf(ftable, " by  %s  */\n\n", version_string);
 202   fprintf(ftable, "#define YYBISON 1  /* Identify Bison output.  */\n\n");
 203   read_declarations();
 204   /* start writing the guard and action files, if they are needed.  */
 205   output_headers();
 206   /* read in the grammar, build grammar in list form.  write out guards and actions.  */
 207   readgram();
 208   /* Now we know whether we need the line-number stack.
 209      If we do, write its type into the .tab.h file.  */
 210   if (fdefines)
 211     reader_output_yylsp(fdefines);
 212   /* write closing delimiters for actions and guards.  */
 213   output_trailers();
 214   if (yylsp_needed)
 215     fprintf(ftable, "#define YYLSP_NEEDED\n\n");
 216   /* assign the symbols their symbol numbers.
 217      Write #defines for the token symbols into fdefines if requested.  */
 218   packsymbols();
 219   /* convert the grammar into the format described in gram.h.  */
 220   packgram();
 221   /* free the symbol table data structure
 222      since symbols are now all referred to by symbol number.  */
 223   free_symtab();
 224 }
 225
 226 void
 227 reader_output_yylsp(f)
 228      FILE *f;
 229 {
 230   if (yylsp_needed)
 231     fprintf(f, LTYPESTR);
 232 }
 233
 234 /* read from finput until %% is seen.  Discard the %%.
 235 Handle any % declarations,
 236 and copy the contents of any %{ ... %} groups to fattrs.  */
 237
 238 void
 239 read_declarations ()
 240 {
 241   register int c;
 242   register int tok;
 243
 244   for (;;)
 245     {
 246       c = skip_white_space();
 247
 248       if (c == '%')
 249         {
 250           tok = parse_percent_token();
 251
 252           switch (tok)
 253             {
 254             case TWO_PERCENTS:
 255               return;
 256
 257             case PERCENT_LEFT_CURLY:
 258               copy_definition();
 259               break;
 260
 261             case TOKEN:
 262               parse_token_decl (STOKEN, SNTERM);
 263               break;
 264
 265             case NTERM:
 266               parse_token_decl (SNTERM, STOKEN);
 267               break;
 268
 269             case TYPE:
 270               parse_type_decl();
 271               break;
 272
 273             case START:
 274               parse_start_decl();
 275               break;
 276
 277             case UNION:
 278               parse_union_decl();
 279               break;
 280
 281             case EXPECT:
 282               parse_expect_decl();
 283               break;
 284             case THONG:
 285               parse_thong_decl();
 286               break;
 287             case LEFT:
 288               parse_assoc_decl(LEFT_ASSOC);
 289               break;
 290
 291             case RIGHT:
 292               parse_assoc_decl(RIGHT_ASSOC);
 293               break;
 294
 295             case NONASSOC:
 296               parse_assoc_decl(NON_ASSOC);
 297               break;
 298
 299             case SEMANTIC_PARSER:
 300               if (semantic_parser == 0)
 301                 {
 302                   semantic_parser = 1;
 303                   open_extra_files();
 304                 }
 305               break;
 306
 307             case PURE_PARSER:
 308               pure_parser = 1;
 309               break;
 310
 311             case NOOP:
 312               break;
 313
 314             default:
 315               warns(_("unrecognized: %s"), token_buffer);
 316               skip_to_char('%');
 317           }
 318         }
 319       else if (c == EOF)
 320         fatal(_("no input grammar"));
 321       else
 322         {
 323                 char buff[100];
 324                 sprintf(buff, _("unknown character: %s"), printable_version(c));
 325                 warn(buff);
 326                 skip_to_char('%');
 327         }
 328     }
 329 }
 330
 331
 332 /* copy the contents of a %{ ... %} into the definitions file.
 333 The %{ has already been read.  Return after reading the %}.  */
 334
 335 void
 336 copy_definition ()
 337 {
 338   register int c;
 339   register int match;
 340   register int ended;
 341   register int after_percent;  /* -1 while reading a character if prev char was % */
 342   int cplus_comment;
 343
 344   if (!nolinesflag)
 345     fprintf(fattrs, "#line %d \"%s\"\n", lineno, infile);
 346
 347   after_percent = 0;
 348
 349   c = getc(finput);
 350
 351   for (;;)
 352     {
 353       switch (c)
 354         {
 355         case '\n':
 356           putc(c, fattrs);
 357           lineno++;
 358           break;
 359
 360         case '%':
 361           after_percent = -1;
 362           break;
 363
 364         case '\'':
 365         case '"':
 366           match = c;
 367           putc(c, fattrs);
 368           c = getc(finput);
 369
 370           while (c != match)
 371             {
 372               if (c == EOF)
 373                 fatal(_("unterminated string at end of file"));
 374               if (c == '\n')
 375                 {
 376                   warn(_("unterminated string"));
 377                   ungetc(c, finput);
 378                   c = match;
 379                   continue;
 380                 }
 381
 382               putc(c, fattrs);
 383
 384               if (c == '\\')
 385                 {
 386                   c = getc(finput);
 387                   if (c == EOF)
 388                     fatal(_("unterminated string at end of file"));
 389                   putc(c, fattrs);
 390                   if (c == '\n')
 391                     lineno++;
 392                 }
 393
 394               c = getc(finput);
 395             }
 396
 397           putc(c, fattrs);
 398           break;
 399
 400         case '/':
 401           putc(c, fattrs);
 402           c = getc(finput);
 403           if (c != '*' && c != '/')
 404             continue;
 405
 406           cplus_comment = (c == '/');
 407           putc(c, fattrs);
 408           c = getc(finput);
 409
 410           ended = 0;
 411           while (!ended)
 412             {
 413               if (!cplus_comment && c == '*')
 414                 {
 415                   while (c == '*')
 416                     {
 417                       putc(c, fattrs);
 418                       c = getc(finput);
 419                     }
 420
 421                   if (c == '/')
 422                     {
 423                       putc(c, fattrs);
 424                       ended = 1;
 425                     }
 426                 }
 427               else if (c == '\n')
 428                 {
 429                   lineno++;
 430                   putc(c, fattrs);
 431                   if (cplus_comment)
 432                     ended = 1;
 433                   else
 434                     c = getc(finput);
 435                 }
 436               else if (c == EOF)
 437                 fatal(_("unterminated comment in `%{' definition"));
 438               else
 439                 {
 440                   putc(c, fattrs);
 441                   c = getc(finput);
 442                 }
 443             }
 444
 445           break;
 446
 447         case EOF:
 448           fatal(_("unterminated `%{' definition"));
 449
 450         default:
 451           putc(c, fattrs);
 452         }
 453
 454       c = getc(finput);
 455
 456       if (after_percent)
 457         {
 458           if (c == '}')
 459             return;
 460           putc('%', fattrs);
 461         }
 462       after_percent = 0;
 463
 464     }
 465
 466 }
 467
 468
 469
 470 /* parse what comes after %token or %nterm.
 471 For %token, what_is is STOKEN and what_is_not is SNTERM.
 472 For %nterm, the arguments are reversed.  */
 473
 474 void
 475 parse_token_decl (what_is, what_is_not)
 476      int what_is, what_is_not;
 477 {
 478   register int token = 0;
 479   register char *typename = 0;
 480   register struct bucket *symbol = NULL;  /* pts to symbol being defined */
 481   int k;
 482
 483   for (;;)
 484     {
 485       if(ungetc(skip_white_space(), finput) == '%')
 486         return;
 487       token = lex();
 488       if (token == COMMA)
 489         {
 490           symbol = NULL;
 491           continue;
 492         }
 493       if (token == TYPENAME)
 494         {
 495           k = strlen(token_buffer);
 496           typename = NEW2(k + 1, char);
 497           strcpy(typename, token_buffer);
 498           value_components_used = 1;
 499           symbol = NULL;
 500         }
 501       else if (token == IDENTIFIER && *symval->tag == '\"'
 502                 && symbol)
 503         {
 504           translations = 1;
 505           symval->class = STOKEN;
 506           symval->type_name = typename;
 507           symval->user_token_number = symbol->user_token_number;
 508           symbol->user_token_number = SALIAS;
 509
 510           symval->alias = symbol;
 511           symbol->alias = symval;
 512           symbol = NULL;
 513
 514           nsyms--;   /* symbol and symval combined are only one symbol */
 515         }
 516       else if (token == IDENTIFIER)
 517         {
 518           int oldclass = symval->class;
 519           symbol = symval;
 520
 521           if (symbol->class == what_is_not)
 522             warns(_("symbol %s redefined"), symbol->tag);
 523           symbol->class = what_is;
 524           if (what_is == SNTERM && oldclass != SNTERM)
 525             symbol->value = nvars++;
 526
 527           if (typename)
 528             {
 529               if (symbol->type_name == NULL)
 530                 symbol->type_name = typename;
 531               else if (strcmp(typename, symbol->type_name) != 0)
 532                 warns(_("type redeclaration for %s"), symbol->tag);
 533             }
 534         }
 535       else if (symbol && token == NUMBER)
 536         {
 537           symbol->user_token_number = numval;
 538           translations = 1;
 539         }
 540       else
 541         {
 542           warnss(_("`%s' is invalid in %s"),
 543                 token_buffer,
 544                 (what_is == STOKEN) ? "%token" : "%nterm");
 545           skip_to_char('%');
 546         }
 547     }
 548
 549 }
 550
 551 /* parse what comes after %thong
 552         the full syntax is
 553                 %thong <type> token number literal
 554  the <type> or number may be omitted.  The number specifies the
 555  user_token_number.
 556
 557  Two symbols are entered in the table, one for the token symbol and
 558  one for the literal.  Both are given the <type>, if any, from the declaration.
 559  The ->user_token_number of the first is SALIAS and the ->user_token_number
 560  of the second is set to the number, if any, from the declaration.
 561  The two symbols are linked via pointers in their ->alias fields.
 562
 563  during output_defines_table, the symbol is reported
 564  thereafter, only the literal string is retained
 565  it is the literal string that is output to yytname
 566 */
 567
 568 void
 569 parse_thong_decl ()
 570 {
 571   register int token;
 572   register struct bucket *symbol;
 573   register char *typename = 0;
 574   int k, usrtoknum;
 575
 576   translations = 1;
 577   token = lex();                /* fetch typename or first token */
 578   if (token == TYPENAME) {
 579     k = strlen(token_buffer);
 580     typename = NEW2(k + 1, char);
 581     strcpy(typename, token_buffer);
 582     value_components_used = 1;
 583     token = lex();              /* fetch first token */
 584   }
 585
 586   /* process first token */
 587
 588   if (token != IDENTIFIER)
 589     {
 590       warns(_("unrecognized item %s, expected an identifier"),
 591             token_buffer);
 592       skip_to_char('%');
 593       return;
 594     }
 595   symval->class = STOKEN;
 596   symval->type_name = typename;
 597   symval->user_token_number = SALIAS;
 598   symbol = symval;
 599
 600   token = lex();                /* get number or literal string */
 601
 602   if (token == NUMBER) {
 603     usrtoknum = numval;
 604     token = lex();              /* okay, did number, now get literal */
 605   }
 606   else usrtoknum = 0;
 607
 608   /* process literal string token */
 609
 610   if (token != IDENTIFIER || *symval->tag != '\"')
 611     {
 612       warns(_("expected string constant instead of %s"),
 613             token_buffer);
 614       skip_to_char('%');
 615       return;
 616     }
 617   symval->class = STOKEN;
 618   symval->type_name = typename;
 619   symval->user_token_number = usrtoknum;
 620
 621   symval->alias = symbol;
 622   symbol->alias = symval;
 623
 624   nsyms--;                      /* symbol and symval combined are only one symbol */
 625 }
 626
 627
 628 /* parse what comes after %start */
 629
 630 void
 631 parse_start_decl ()
 632 {
 633   if (start_flag)
 634     warn(_("multiple %start declarations"));
 635   if (lex() != IDENTIFIER)
 636     warn(_("invalid %start declaration"));
 637   else
 638     {
 639       start_flag = 1;
 640       startval = symval;
 641     }
 642 }
 643
 644
 645
 646 /* read in a %type declaration and record its information for get_type_name to access */
 647
 648 void
 649 parse_type_decl ()
 650 {
 651   register int k;
 652   register char *name;
 653
 654   if (lex() != TYPENAME)
 655     {
 656       warn(_("%type declaration has no <typename>"));
 657       skip_to_char('%');
 658       return;
 659     }
 660
 661   k = strlen(token_buffer);
 662   name = NEW2(k + 1, char);
 663   strcpy(name, token_buffer);
 664
 665   for (;;)
 666     {
 667       register int t;
 668
 669       if(ungetc(skip_white_space(), finput) == '%')
 670         return;
 671
 672       t = lex();
 673
 674       switch (t)
 675         {
 676
 677         case COMMA:
 678         case SEMICOLON:
 679           break;
 680
 681         case IDENTIFIER:
 682           if (symval->type_name == NULL)
 683             symval->type_name = name;
 684           else if (strcmp(name, symval->type_name) != 0)
 685             warns(_("type redeclaration for %s"), symval->tag);
 686
 687           break;
 688
 689         default:
 690           warns(_("invalid %%type declaration due to item: `%s'"), token_buffer);
 691           skip_to_char('%');
 692         }
 693     }
 694 }
 695
 696
 697
 698 /* read in a %left, %right or %nonassoc declaration and record its information.  */
 699 /* assoc is either LEFT_ASSOC, RIGHT_ASSOC or NON_ASSOC.  */
 700
 701 void
 702 parse_assoc_decl (assoc)
 703 int assoc;
 704 {
 705   register int k;
 706   register char *name = NULL;
 707   register int prev = 0;
 708
 709   lastprec++;  /* Assign a new precedence level, never 0.  */
 710
 711   for (;;)
 712     {
 713       register int t;
 714
 715       if(ungetc(skip_white_space(), finput) == '%')
 716         return;
 717
 718       t = lex();
 719
 720       switch (t)
 721         {
 722
 723         case TYPENAME:
 724           k = strlen(token_buffer);
 725           name = NEW2(k + 1, char);
 726           strcpy(name, token_buffer);
 727           break;
 728
 729         case COMMA:
 730           break;
 731
 732         case IDENTIFIER:
 733           if (symval->prec != 0)
 734             warns(_("redefining precedence of %s"), symval->tag);
 735           symval->prec = lastprec;
 736           symval->assoc = assoc;
 737           if (symval->class == SNTERM)
 738             warns(_("symbol %s redefined"), symval->tag);
 739           symval->class = STOKEN;
 740           if (name)
 741             { /* record the type, if one is specified */
 742               if (symval->type_name == NULL)
 743                 symval->type_name = name;
 744               else if (strcmp(name, symval->type_name) != 0)
 745                 warns(_("type redeclaration for %s"), symval->tag);
 746             }
 747           break;
 748
 749         case NUMBER:
 750           if (prev == IDENTIFIER)
 751             {
 752               symval->user_token_number = numval;
 753               translations = 1;
 754             }
 755           else
 756             {
 757               warns(_("invalid text (%s) - number should be after identifier"),
 758                         token_buffer);
 759               skip_to_char('%');
 760             }
 761           break;
 762
 763         case SEMICOLON:
 764           return;
 765
 766         default:
 767           warns(_("unexpected item: %s"), token_buffer);
 768           skip_to_char('%');
 769         }
 770
 771       prev = t;
 772
 773     }
 774 }
 775
 776
 777
 778 /* copy the union declaration into fattrs (and fdefines),
 779    where it is made into the
 780    definition of YYSTYPE, the type of elements of the parser value stack.  */
 781
 782 void
 783 parse_union_decl()
 784 {
 785   register int c;
 786   register int count;
 787   register int in_comment;
 788   int cplus_comment;
 789
 790   if (typed)
 791     warn(_("multiple %union declarations"));
 792
 793   typed = 1;
 794
 795   if (!nolinesflag)
 796     fprintf(fattrs, "\n#line %d \"%s\"\n", lineno, infile);
 797   else
 798     fprintf(fattrs, "\n");
 799
 800   fprintf(fattrs, "typedef union");
 801   if (fdefines)
 802     fprintf(fdefines, "typedef union");
 803
 804   count = 0;
 805   in_comment = 0;
 806
 807   c = getc(finput);
 808
 809   while (c != EOF)
 810     {
 811       putc(c, fattrs);
 812       if (fdefines)
 813         putc(c, fdefines);
 814
 815       switch (c)
 816         {
 817         case '\n':
 818           lineno++;
 819           break;
 820
 821         case '/':
 822           c = getc(finput);
 823           if (c != '*' && c != '/')
 824             ungetc(c, finput);
 825           else
 826             {
 827               putc(c, fattrs);
 828               if (fdefines)
 829                 putc(c, fdefines);
 830               cplus_comment = (c == '/');
 831               in_comment = 1;
 832               c = getc(finput);
 833               while (in_comment)
 834                 {
 835                   putc(c, fattrs);
 836                   if (fdefines)
 837                     putc(c, fdefines);
 838
 839                   if (c == '\n')
 840                     {
 841                       lineno++;
 842                       if (cplus_comment)
 843                         {
 844                           in_comment = 0;
 845                           break;
 846                         }
 847                     }
 848                   if (c == EOF)
 849                     fatal(_("unterminated comment at end of file"));
 850
 851                   if (!cplus_comment && c == '*')
 852                     {
 853                       c = getc(finput);
 854                       if (c == '/')
 855                         {
 856                           putc('/', fattrs);
 857                           if (fdefines)
 858                             putc('/', fdefines);
 859                           in_comment = 0;
 860                         }
 861                     }
 862                   else
 863                     c = getc(finput);
 864                 }
 865             }
 866           break;
 867
 868
 869         case '{':
 870           count++;
 871           break;
 872
 873         case '}':
 874           if (count == 0)
 875             warn (_("unmatched close-brace (`}')"));
 876           count--;
 877           if (count <= 0)
 878             {
 879               fprintf(fattrs, " YYSTYPE;\n");
 880               if (fdefines)
 881                 fprintf(fdefines, " YYSTYPE;\n");
 882               /* JF don't choke on trailing semi */
 883               c=skip_white_space();
 884               if(c!=';') ungetc(c,finput);
 885               return;
 886             }
 887         }
 888
 889       c = getc(finput);
 890     }
 891 }
 892
 893 /* parse the declaration %expect N which says to expect N
 894    shift-reduce conflicts.  */
 895
 896 void
 897 parse_expect_decl()
 898 {
 899   register int c;
 900   register int count;
 901   char buffer[20];
 902
 903   c = getc(finput);
 904   while (c == ' ' || c == '\t')
 905     c = getc(finput);
 906
 907   count = 0;
 908   while (c >= '0' && c <= '9')
 909     {
 910       if (count < 20)
 911         buffer[count++] = c;
 912       c = getc(finput);
 913     }
 914   buffer[count] = 0;
 915
 916   ungetc (c, finput);
 917
 918   if (count <= 0 || count > 10)
 919         warn(_("argument of %expect is not an integer"));
 920   expected_conflicts = atoi (buffer);
 921 }
 922
 923 /* that's all of parsing the declaration section */
 924 \f
 925 /* Get the data type (alternative in the union) of the value for symbol n in rule rule.  */
 926
 927 char *
 928 get_type_name(n, rule)
 929 int n;
 930 symbol_list *rule;
 931 {
 932   static char *msg = N_("invalid $ value");
 933
 934   register int i;
 935   register symbol_list *rp;
 936
 937   if (n < 0)
 938     {
 939       warn(_(msg));
 940       return NULL;
 941     }
 942
 943   rp = rule;
 944   i = 0;
 945
 946   while (i < n)
 947     {
 948       rp = rp->next;
 949       if (rp == NULL || rp->sym == NULL)
 950         {
 951           warn(_(msg));
 952           return NULL;
 953         }
 954       i++;
 955     }
 956
 957   return (rp->sym->type_name);
 958 }
 959
 960
 961 /* after %guard is seen in the input file,
 962 copy the actual guard into the guards file.
 963 If the guard is followed by an action, copy that into the actions file.
 964 stack_offset is the number of values in the current rule so far,
 965 which says where to find $0 with respect to the top of the stack,
 966 for the simple parser in which the stack is not popped until after the guard is run.  */
 967
 968 void
 969 copy_guard(rule, stack_offset)
 970 symbol_list *rule;
 971 int stack_offset;
 972 {
 973   register int c;
 974   register int n;
 975   register int count;
 976   register int match;
 977   register int ended;
 978   register char *type_name;
 979   int brace_flag = 0;
 980   int cplus_comment;
 981
 982   /* offset is always 0 if parser has already popped the stack pointer */
 983   if (semantic_parser) stack_offset = 0;
 984
 985   fprintf(fguard, "\ncase %d:\n", nrules);
 986   if (!nolinesflag)
 987     fprintf(fguard, "#line %d \"%s\"\n", lineno, infile);
 988   putc('{', fguard);
 989
 990   count = 0;
 991   c = getc(finput);
 992
 993   while (brace_flag ? (count > 0) : (c != ';'))
 994     {
 995       switch (c)
 996         {
 997         case '\n':
 998           putc(c, fguard);
 999           lineno++;
1000           break;
1001
1002         case '{':
1003           putc(c, fguard);
1004           brace_flag = 1;
1005           count++;
1006           break;
1007
1008         case '}':
1009           putc(c, fguard);
1010           if (count > 0)
1011             count--;
1012           else
1013             {
1014               warn(_("unmatched right brace (`}')"));
1015               c = getc(finput); /* skip it */
1016             }
1017           break;
1018
1019         case '\'':
1020         case '"':
1021           match = c;
1022           putc(c, fguard);
1023           c = getc(finput);
1024
1025           while (c != match)
1026             {
1027               if (c == EOF)
1028                 fatal(_("unterminated string at end of file"));
1029               if (c == '\n')
1030                 {
1031                   warn(_("unterminated string"));
1032                   ungetc(c, finput);
1033                   c = match;            /* invent terminator */
1034                   continue;
1035                 }
1036
1037               putc(c, fguard);
1038
1039               if (c == '\\')
1040                 {
1041                   c = getc(finput);
1042                   if (c == EOF)
1043                     fatal(_("unterminated string"));
1044                   putc(c, fguard);
1045                   if (c == '\n')
1046                     lineno++;
1047                 }
1048
1049               c = getc(finput);
1050             }
1051
1052           putc(c, fguard);
1053           break;
1054
1055         case '/':
1056           putc(c, fguard);
1057           c = getc(finput);
1058           if (c != '*' && c != '/')
1059             continue;
1060
1061           cplus_comment = (c == '/');
1062           putc(c, fguard);
1063           c = getc(finput);
1064
1065           ended = 0;
1066           while (!ended)
1067             {
1068               if (!cplus_comment && c == '*')
1069                 {
1070                   while (c == '*')
1071                     {
1072                       putc(c, fguard);
1073                       c = getc(finput);
1074                     }
1075
1076                   if (c == '/')
1077                     {
1078                       putc(c, fguard);
1079                       ended = 1;
1080                     }
1081                 }
1082               else if (c == '\n')
1083                 {
1084                   lineno++;
1085                   putc(c, fguard);
1086                   if (cplus_comment)
1087                     ended = 1;
1088                   else
1089                     c = getc(finput);
1090                 }
1091               else if (c == EOF)
1092                 fatal(_("unterminated comment"));
1093               else
1094                 {
1095                   putc(c, fguard);
1096                   c = getc(finput);
1097                 }
1098             }
1099
1100           break;
1101
1102         case '$':
1103           c = getc(finput);
1104           type_name = NULL;
1105
1106           if (c == '<')
1107             {
1108               register char *cp = token_buffer;
1109
1110               while ((c = getc(finput)) != '>' && c > 0)
1111                 *cp++ = c;
1112               *cp = 0;
1113               type_name = token_buffer;
1114
1115               c = getc(finput);
1116             }
1117
1118           if (c == '$')
1119             {
1120               fprintf(fguard, "yyval");
1121               if (!type_name) type_name = rule->sym->type_name;
1122               if (type_name)
1123                 fprintf(fguard, ".%s", type_name);
1124               if(!type_name && typed)
1125                 warns(_("$$ of `%s' has no declared type"), rule->sym->tag);
1126             }
1127
1128           else if (isdigit(c) || c == '-')
1129             {
1130               ungetc (c, finput);
1131               n = read_signed_integer(finput);
1132               c = getc(finput);
1133
1134               if (!type_name && n > 0)
1135                 type_name = get_type_name(n, rule);
1136
1137               fprintf(fguard, "yyvsp[%d]", n - stack_offset);
1138               if (type_name)
1139                 fprintf(fguard, ".%s", type_name);
1140               if(!type_name && typed)
1141                 warnss(_("$%s of `%s' has no declared type"), int_to_string(n), rule->sym->tag);
1142               continue;
1143             }
1144           else
1145             warns(_("$%s is invalid"), printable_version(c));
1146
1147           break;
1148
1149         case '@':
1150           c = getc(finput);
1151           if (isdigit(c) || c == '-')
1152             {
1153               ungetc (c, finput);
1154               n = read_signed_integer(finput);
1155               c = getc(finput);
1156             }
1157           else
1158             {
1159               warns(_("@%s is invalid"), printable_version(c));
1160               n = 1;
1161             }
1162
1163           fprintf(fguard, "yylsp[%d]", n - stack_offset);
1164           yylsp_needed = 1;
1165
1166           continue;
1167
1168         case EOF:
1169           fatal(_("unterminated %%guard clause"));
1170
1171         default:
1172           putc(c, fguard);
1173         }
1174
1175       if (c != '}' || count != 0)
1176         c = getc(finput);
1177     }
1178
1179   c = skip_white_space();
1180
1181   fprintf(fguard, ";\n    break;}");
1182   if (c == '{')
1183     copy_action(rule, stack_offset);
1184   else if (c == '=')
1185     {
1186       c = getc(finput); /* why not skip_white_space -wjh */
1187       if (c == '{')
1188         copy_action(rule, stack_offset);
1189     }
1190   else
1191     ungetc(c, finput);
1192 }
1193
1194
1195
1196 /* Assuming that a { has just been seen, copy everything up to the matching }
1197 into the actions file.
1198 stack_offset is the number of values in the current rule so far,
1199 which says where to find $0 with respect to the top of the stack.  */
1200
1201 void
1202 copy_action(rule, stack_offset)
1203 symbol_list *rule;
1204 int stack_offset;
1205 {
1206   register int c;
1207   register int n;
1208   register int count;
1209   register int match;
1210   register int ended;
1211   register char *type_name;
1212   int cplus_comment;
1213
1214   /* offset is always 0 if parser has already popped the stack pointer */
1215   if (semantic_parser) stack_offset = 0;
1216
1217   fprintf(faction, "\ncase %d:\n", nrules);
1218   if (!nolinesflag)
1219     fprintf(faction, "#line %d \"%s\"\n", lineno, infile);
1220   putc('{', faction);
1221
1222   count = 1;
1223   c = getc(finput);
1224
1225   while (count > 0)
1226     {
1227       while (c != '}')
1228         {
1229           switch (c)
1230             {
1231             case '\n':
1232               putc(c, faction);
1233               lineno++;
1234               break;
1235
1236             case '{':
1237               putc(c, faction);
1238               count++;
1239               break;
1240
1241             case '\'':
1242             case '"':
1243               match = c;
1244               putc(c, faction);
1245               c = getc(finput);
1246
1247               while (c != match)
1248                 {
1249                   if (c == '\n')
1250                     {
1251                       warn(_("unterminated string"));
1252                       ungetc(c, finput);
1253                       c = match;
1254                       continue;
1255                     }
1256                   else if (c == EOF)
1257                     fatal(_("unterminated string at end of file"));
1258
1259                   putc(c, faction);
1260
1261                   if (c == '\\')
1262                     {
1263                       c = getc(finput);
1264                       if (c == EOF)
1265                         fatal(_("unterminated string"));
1266                       putc(c, faction);
1267                       if (c == '\n')
1268                         lineno++;
1269                     }
1270
1271                   c = getc(finput);
1272                 }
1273
1274               putc(c, faction);
1275               break;
1276
1277             case '/':
1278               putc(c, faction);
1279               c = getc(finput);
1280               if (c != '*' && c != '/')
1281                 continue;
1282
1283               cplus_comment = (c == '/');
1284               putc(c, faction);
1285               c = getc(finput);
1286
1287               ended = 0;
1288               while (!ended)
1289                 {
1290                   if (!cplus_comment && c == '*')
1291                     {
1292                       while (c == '*')
1293                         {
1294                           putc(c, faction);
1295                           c = getc(finput);
1296                         }
1297
1298                       if (c == '/')
1299                         {
1300                           putc(c, faction);
1301                           ended = 1;
1302                         }
1303                     }
1304                   else if (c == '\n')
1305                     {
1306                       lineno++;
1307                       putc(c, faction);
1308                       if (cplus_comment)
1309                         ended = 1;
1310                       else
1311                         c = getc(finput);
1312                     }
1313                   else if (c == EOF)
1314                     fatal(_("unterminated comment"));
1315                   else
1316                     {
1317                       putc(c, faction);
1318                       c = getc(finput);
1319                     }
1320                 }
1321
1322               break;
1323
1324             case '$':
1325               c = getc(finput);
1326               type_name = NULL;
1327
1328               if (c == '<')
1329                 {
1330                   register char *cp = token_buffer;
1331
1332                   while ((c = getc(finput)) != '>' && c > 0)
1333                     *cp++ = c;
1334                   *cp = 0;
1335                   type_name = token_buffer;
1336                   value_components_used = 1;
1337
1338                   c = getc(finput);
1339                 }
1340               if (c == '$')
1341                 {
1342                   fprintf(faction, "yyval");
1343                   if (!type_name) type_name = get_type_name(0, rule);
1344                   if (type_name)
1345                     fprintf(faction, ".%s", type_name);
1346                   if(!type_name && typed)
1347                     warns(_("$$ of `%s' has no declared type"), rule->sym->tag);
1348                 }
1349               else if (isdigit(c) || c == '-')
1350                 {
1351                   ungetc (c, finput);
1352                   n = read_signed_integer(finput);
1353                   c = getc(finput);
1354
1355                   if (!type_name && n > 0)
1356                     type_name = get_type_name(n, rule);
1357
1358                   fprintf(faction, "yyvsp[%d]", n - stack_offset);
1359                   if (type_name)
1360                     fprintf(faction, ".%s", type_name);
1361                   if(!type_name && typed)
1362                     warnss(_("$%s of `%s' has no declared type"),
1363                                 int_to_string(n), rule->sym->tag);
1364                   continue;
1365                 }
1366               else
1367                 warns(_("$%s is invalid"), printable_version(c));
1368
1369               break;
1370
1371             case '@':
1372               c = getc(finput);
1373               if (isdigit(c) || c == '-')
1374                 {
1375                   ungetc (c, finput);
1376                   n = read_signed_integer(finput);
1377                   c = getc(finput);
1378                 }
1379               else
1380                 {
1381                   warn(_("invalid @-construct"));
1382                   n = 1;
1383                 }
1384
1385               fprintf(faction, "yylsp[%d]", n - stack_offset);
1386               yylsp_needed = 1;
1387
1388               continue;
1389
1390             case EOF:
1391               fatal(_("unmatched `{'"));
1392
1393             default:
1394               putc(c, faction);
1395             }
1396
1397           c = getc(finput);
1398         }
1399
1400       /* above loop exits when c is '}' */
1401
1402       if (--count)
1403         {
1404           putc(c, faction);
1405           c = getc(finput);
1406         }
1407     }
1408
1409   fprintf(faction, ";\n    break;}");
1410 }
1411
1412
1413
1414 /* generate a dummy symbol, a nonterminal,
1415 whose name cannot conflict with the user's names. */
1416
1417 bucket *
1418 gensym()
1419 {
1420   register bucket *sym;
1421
1422   sprintf (token_buffer, "@%d", ++gensym_count);
1423   sym = getsym(token_buffer);
1424   sym->class = SNTERM;
1425   sym->value = nvars++;
1426   return (sym);
1427 }
1428
1429 /* Parse the input grammar into a one symbol_list structure.
1430 Each rule is represented by a sequence of symbols: the left hand side
1431 followed by the contents of the right hand side, followed by a null pointer
1432 instead of a symbol to terminate the rule.
1433 The next symbol is the lhs of the following rule.
1434
1435 All guards and actions are copied out to the appropriate files,
1436 labelled by the rule number they apply to.  */
1437
1438 void
1439 readgram()
1440 {
1441   register int t;
1442   register bucket *lhs;
1443   register symbol_list *p;
1444   register symbol_list *p1;
1445   register bucket *bp;
1446
1447   symbol_list *crule;   /* points to first symbol_list of current rule.  */
1448                         /* its symbol is the lhs of the rule.   */
1449   symbol_list *crule1;  /* points to the symbol_list preceding crule.  */
1450
1451   p1 = NULL;
1452
1453   t = lex();
1454
1455   while (t != TWO_PERCENTS && t != ENDFILE)
1456     {
1457       if (t == IDENTIFIER || t == BAR)
1458         {
1459           register int actionflag = 0;
1460           int rulelength = 0;  /* number of symbols in rhs of this rule so far  */
1461           int xactions = 0;     /* JF for error checking */
1462           bucket *first_rhs = 0;
1463
1464           if (t == IDENTIFIER)
1465             {
1466               lhs = symval;
1467
1468               if (!start_flag)
1469                 {
1470                   startval = lhs;
1471                   start_flag = 1;
1472                 }
1473
1474               t = lex();
1475               if (t != COLON)
1476                 {
1477                   warn(_("ill-formed rule: initial symbol not followed by colon"));
1478                   unlex(t);
1479                 }
1480             }
1481
1482           if (nrules == 0 && t == BAR)
1483             {
1484               warn(_("grammar starts with vertical bar"));
1485               lhs = symval;     /* BOGUS: use a random symval */
1486             }
1487           /* start a new rule and record its lhs.  */
1488
1489           nrules++;
1490           nitems++;
1491
1492           record_rule_line ();
1493
1494           p = NEW(symbol_list);
1495           p->sym = lhs;
1496
1497           crule1 = p1;
1498           if (p1)
1499             p1->next = p;
1500           else
1501             grammar = p;
1502
1503           p1 = p;
1504           crule = p;
1505
1506           /* mark the rule's lhs as a nonterminal if not already so.  */
1507
1508           if (lhs->class == SUNKNOWN)
1509             {
1510               lhs->class = SNTERM;
1511               lhs->value = nvars;
1512               nvars++;
1513             }
1514           else if (lhs->class == STOKEN)
1515             warns(_("rule given for %s, which is a token"), lhs->tag);
1516
1517           /* read the rhs of the rule.  */
1518
1519           for (;;)
1520             {
1521               t = lex();
1522               if (t == PREC)
1523                 {
1524                   t = lex();
1525                   crule->ruleprec = symval;
1526                   t = lex();
1527                 }
1528
1529               if (! (t == IDENTIFIER || t == LEFT_CURLY)) break;
1530
1531               /* If next token is an identifier, see if a colon follows it.
1532                  If one does, exit this rule now.  */
1533               if (t == IDENTIFIER)
1534                 {
1535                   register bucket *ssave;
1536                   register int t1;
1537
1538                   ssave = symval;
1539                   t1 = lex();
1540                   unlex(t1);
1541                   symval = ssave;
1542                   if (t1 == COLON) break;
1543
1544                   if(!first_rhs)        /* JF */
1545                     first_rhs = symval;
1546                   /* Not followed by colon =>
1547                      process as part of this rule's rhs.  */
1548                 }
1549
1550               /* If we just passed an action, that action was in the middle
1551                  of a rule, so make a dummy rule to reduce it to a
1552                  non-terminal.  */
1553               if (actionflag)
1554                 {
1555                   register bucket *sdummy;
1556
1557                   /* Since the action was written out with this rule's */
1558                   /* number, we must give the new rule this number */
1559                   /* by inserting the new rule before it.  */
1560
1561                   /* Make a dummy nonterminal, a gensym.  */
1562                   sdummy = gensym();
1563
1564                   /* Make a new rule, whose body is empty,
1565                      before the current one, so that the action
1566                      just read can belong to it.  */
1567                   nrules++;
1568                   nitems++;
1569                   record_rule_line ();
1570                   p = NEW(symbol_list);
1571                   if (crule1)
1572                     crule1->next = p;
1573                   else grammar = p;
1574                   p->sym = sdummy;
1575                   crule1 = NEW(symbol_list);
1576                   p->next = crule1;
1577                   crule1->next = crule;
1578
1579                   /* insert the dummy generated by that rule into this rule.  */
1580                   nitems++;
1581                   p = NEW(symbol_list);
1582                   p->sym = sdummy;
1583                   p1->next = p;
1584                   p1 = p;
1585
1586                   actionflag = 0;
1587                 }
1588
1589               if (t == IDENTIFIER)
1590                 {
1591                   nitems++;
1592                   p = NEW(symbol_list);
1593                   p->sym = symval;
1594                   p1->next = p;
1595                   p1 = p;
1596                 }
1597               else /* handle an action.  */
1598                 {
1599                   copy_action(crule, rulelength);
1600                   actionflag = 1;
1601                   xactions++;   /* JF */
1602                 }
1603               rulelength++;
1604             }   /* end of  read rhs of rule */
1605
1606           /* Put an empty link in the list to mark the end of this rule  */
1607           p = NEW(symbol_list);
1608           p1->next = p;
1609           p1 = p;
1610
1611           if (t == PREC)
1612             {
1613               warn(_("two @prec's in a row"));
1614               t = lex();
1615               crule->ruleprec = symval;
1616               t = lex();
1617             }
1618           if (t == GUARD)
1619             {
1620               if (! semantic_parser)
1621                 warn(_("%%guard present but %%semantic_parser not specified"));
1622
1623               copy_guard(crule, rulelength);
1624               t = lex();
1625             }
1626           else if (t == LEFT_CURLY)
1627             {
1628                 /* This case never occurs -wjh */
1629               if (actionflag)  warn(_("two actions at end of one rule"));
1630               copy_action(crule, rulelength);
1631               actionflag = 1;
1632               xactions++;       /* -wjh */
1633               t = lex();
1634             }
1635           /* If $$ is being set in default way,
1636              warn if any type mismatch.  */
1637           else if (!xactions && first_rhs && lhs->type_name != first_rhs->type_name)
1638             {
1639               if (lhs->type_name == 0 || first_rhs->type_name == 0
1640                   || strcmp(lhs->type_name,first_rhs->type_name))
1641                 warnss(_("type clash (`%s' `%s') on default action"),
1642                         lhs->type_name ? lhs->type_name : "",
1643                         first_rhs->type_name ? first_rhs->type_name : "");
1644             }
1645           /* Warn if there is no default for $$ but we need one.  */
1646           else if (!xactions && !first_rhs && lhs->type_name != 0)
1647             warn(_("empty rule for typed nonterminal, and no action"));
1648           if (t == SEMICOLON)
1649             t = lex();
1650         }
1651 #if 0
1652   /* these things can appear as alternatives to rules.  */
1653 /* NO, they cannot.
1654         a) none of the documentation allows them
1655         b) most of them scan forward until finding a next %
1656                 thus they may swallow lots of intervening rules
1657 */
1658       else if (t == TOKEN)
1659         {
1660           parse_token_decl(STOKEN, SNTERM);
1661           t = lex();
1662         }
1663       else if (t == NTERM)
1664         {
1665           parse_token_decl(SNTERM, STOKEN);
1666           t = lex();
1667         }
1668       else if (t == TYPE)
1669         {
1670           t = get_type();
1671         }
1672       else if (t == UNION)
1673         {
1674           parse_union_decl();
1675           t = lex();
1676         }
1677       else if (t == EXPECT)
1678         {
1679           parse_expect_decl();
1680           t = lex();
1681         }
1682       else if (t == START)
1683         {
1684           parse_start_decl();
1685           t = lex();
1686         }
1687 #endif
1688
1689       else
1690         {
1691           warns(_("invalid input: %s"), token_buffer);
1692           t = lex();
1693         }
1694     }
1695
1696   /* grammar has been read.  Do some checking */
1697
1698   if (nsyms > MAXSHORT)
1699     fatals(_("too many symbols (tokens plus nonterminals); maximum %s"),
1700            int_to_string(MAXSHORT));
1701   if (nrules == 0)
1702     fatal(_("no rules in the input grammar"));
1703
1704   if (typed == 0        /* JF put out same default YYSTYPE as YACC does */
1705       && !value_components_used)
1706     {
1707       /* We used to use `unsigned long' as YYSTYPE on MSDOS,
1708          but it seems better to be consistent.
1709          Most programs should declare their own type anyway.  */
1710       fprintf(fattrs, "#ifndef YYSTYPE\n#define YYSTYPE int\n#endif\n");
1711       if (fdefines)
1712         fprintf(fdefines, "#ifndef YYSTYPE\n#define YYSTYPE int\n#endif\n");
1713     }
1714
1715   /* Report any undefined symbols and consider them nonterminals.  */
1716
1717   for (bp = firstsymbol; bp; bp = bp->next)
1718     if (bp->class == SUNKNOWN)
1719       {
1720         warns(_("symbol %s is used, but is not defined as a token and has no rules"),
1721                         bp->tag);
1722         bp->class = SNTERM;
1723         bp->value = nvars++;
1724       }
1725
1726   ntokens = nsyms - nvars;
1727 }
1728
1729
1730 void
1731 record_rule_line ()
1732 {
1733   /* Record each rule's source line number in rline table.  */
1734
1735   if (nrules >= rline_allocated)
1736     {
1737       rline_allocated = nrules * 2;
1738       rline = (short *) xrealloc (rline,
1739                                  rline_allocated * sizeof (short));
1740     }
1741   rline[nrules] = lineno;
1742 }
1743
1744
1745 /* read in a %type declaration and record its information for get_type_name to access */
1746 /* this is unused.  it is only called from the #if 0 part of readgram */
1747 static int
1748 get_type()
1749 {
1750   register int k;
1751   register int t;
1752   register char *name;
1753
1754   t = lex();
1755
1756   if (t != TYPENAME)
1757     {
1758       warn(_("ill-formed %type declaration"));
1759       return t;
1760     }
1761
1762   k = strlen(token_buffer);
1763   name = NEW2(k + 1, char);
1764   strcpy(name, token_buffer);
1765
1766   for (;;)
1767     {
1768       t = lex();
1769
1770       switch (t)
1771         {
1772         case SEMICOLON:
1773           return (lex());
1774
1775         case COMMA:
1776           break;
1777
1778         case IDENTIFIER:
1779           if (symval->type_name == NULL)
1780             symval->type_name = name;
1781           else if (strcmp(name, symval->type_name) != 0)
1782             warns(_("type redeclaration for %s"), symval->tag);
1783
1784           break;
1785
1786         default:
1787           return (t);
1788         }
1789     }
1790 }
1791
1792
1793
1794 /* assign symbol numbers, and write definition of token names into fdefines.
1795 Set up vectors tags and sprec of names and precedences of symbols.  */
1796
1797 void
1798 packsymbols()
1799 {
1800   register bucket *bp;
1801   register int tokno = 1;
1802   register int i;
1803   register int last_user_token_number;
1804
1805   /* int lossage = 0; JF set but not used */
1806
1807   tags = NEW2(nsyms + 1, char *);
1808   tags[0] = "$";
1809   user_toknums = NEW2(nsyms + 1, int);
1810   user_toknums[0] = 0;
1811
1812   sprec = NEW2(nsyms, short);
1813   sassoc = NEW2(nsyms, short);
1814
1815   max_user_token_number = 256;
1816   last_user_token_number = 256;
1817
1818   for (bp = firstsymbol; bp; bp = bp->next)
1819     {
1820       if (bp->class == SNTERM)
1821         {
1822           bp->value += ntokens;
1823         }
1824       else if (bp->alias)
1825         {
1826                 /* this symbol and its alias are a single token defn.
1827                   allocate a tokno, and assign to both
1828                   check agreement of ->prec and ->assoc fields
1829                         and make both the same
1830                 */
1831                 if (bp->value == 0)
1832                         bp->value = bp->alias->value = tokno++;
1833
1834                 if (bp->prec != bp->alias->prec) {
1835                         if (bp->prec != 0 && bp->alias->prec != 0
1836                                         && bp->user_token_number == SALIAS)
1837                                 warnss(_("conflicting precedences for %s and %s"),
1838                                         bp->tag, bp->alias->tag);
1839                         if (bp->prec != 0) bp->alias->prec = bp->prec;
1840                         else bp->prec = bp->alias->prec;
1841                 }
1842
1843                 if (bp->assoc != bp->alias->assoc) {
1844                         if (bp->assoc != 0 && bp->alias->assoc != 0
1845                                         && bp->user_token_number == SALIAS)
1846                                 warnss(_("conflicting assoc values for %s and %s"),
1847                                         bp->tag, bp->alias->tag);
1848                         if (bp->assoc != 0) bp->alias->assoc = bp->assoc;
1849                         else bp->assoc = bp->alias->assoc;
1850                 }
1851
1852                 if (bp->user_token_number == SALIAS)
1853                         continue;  /* do not do processing below for SALIASs */
1854
1855         }
1856       else  /* bp->class == STOKEN */
1857         {
1858           bp->value = tokno++;
1859         }
1860
1861       if (bp->class == STOKEN)
1862         {
1863           if (translations && !(bp->user_token_number))
1864             bp->user_token_number = ++last_user_token_number;
1865           if (bp->user_token_number > max_user_token_number)
1866             max_user_token_number = bp->user_token_number;
1867         }
1868
1869       tags[bp->value] = bp->tag;
1870       user_toknums[bp->value] = bp->user_token_number;
1871       sprec[bp->value] = bp->prec;
1872       sassoc[bp->value] = bp->assoc;
1873
1874     }
1875
1876   if (translations)
1877     {
1878       register int i;
1879
1880       token_translations = NEW2(max_user_token_number+1, short);
1881
1882       /* initialize all entries for literal tokens to 2,
1883          the internal token number for $undefined.,
1884          which represents all invalid inputs.  */
1885       for (i = 0; i <= max_user_token_number; i++)
1886         token_translations[i] = 2;
1887
1888       for (bp = firstsymbol; bp; bp = bp->next)
1889         {
1890           if (bp->value >= ntokens) continue;             /* non-terminal */
1891           if (bp->user_token_number == SALIAS) continue;
1892           if (token_translations[bp->user_token_number] != 2)
1893             warnsss(_("tokens %s and %s both assigned number %s"),
1894                               tags[token_translations[bp->user_token_number]],
1895                               bp->tag,
1896                               int_to_string(bp->user_token_number));
1897           token_translations[bp->user_token_number] = bp->value;
1898         }
1899     }
1900
1901   error_token_number = errtoken->value;
1902
1903   if (! noparserflag)
1904     output_token_defines(ftable);
1905
1906   if (startval->class == SUNKNOWN)
1907     fatals(_("the start symbol %s is undefined"), startval->tag);
1908   else if (startval->class == STOKEN)
1909     fatals(_("the start symbol %s is a token"), startval->tag);
1910
1911   start_symbol = startval->value;
1912
1913   if (definesflag)
1914     {
1915       output_token_defines(fdefines);
1916
1917       if (!pure_parser)
1918         {
1919           if (spec_name_prefix)
1920             fprintf(fdefines, "\nextern YYSTYPE %slval;\n", spec_name_prefix);
1921           else
1922             fprintf(fdefines, "\nextern YYSTYPE yylval;\n");
1923         }
1924
1925       if (semantic_parser)
1926         for (i = ntokens; i < nsyms; i++)
1927           {
1928             /* don't make these for dummy nonterminals made by gensym.  */
1929             if (*tags[i] != '@')
1930               fprintf(fdefines, "#define\tNT%s\t%d\n", tags[i], i);
1931           }
1932 #if 0
1933       /* `fdefines' is now a temporary file, so we need to copy its
1934          contents in `done', so we can't close it here.  */
1935       fclose(fdefines);
1936       fdefines = NULL;
1937 #endif
1938     }
1939 }
1940
1941 /* For named tokens, but not literal ones, define the name.
1942    The value is the user token number.
1943 */
1944 void
1945 output_token_defines(file)
1946 FILE *file;
1947 {
1948   bucket *bp;
1949   register char *cp, *symbol;
1950   register char c;
1951
1952   for (bp = firstsymbol; bp; bp = bp->next)
1953     {
1954       symbol = bp->tag;                         /* get symbol */
1955
1956       if (bp->value >= ntokens) continue;
1957       if (bp->user_token_number == SALIAS) continue;
1958       if ('\'' == *symbol) continue;    /* skip literal character */
1959       if (bp == errtoken) continue;     /* skip error token */
1960       if ('\"' == *symbol)
1961         {
1962                 /* use literal string only if given a symbol with an alias */
1963                 if (bp->alias)
1964                         symbol = bp->alias->tag;
1965                 else
1966                         continue;
1967         }
1968
1969       /* Don't #define nonliteral tokens whose names contain periods.  */
1970       cp = symbol;
1971       while ((c = *cp++) && c != '.');
1972       if (c != '\0')  continue;
1973
1974       fprintf(file, "#define\t%s\t%d\n", symbol,
1975                 ((translations && ! rawtoknumflag)
1976                         ? bp->user_token_number
1977                         : bp->value));
1978       if (semantic_parser)
1979         fprintf(file, "#define\tT%s\t%d\n", symbol, bp->value);
1980     }
1981
1982   putc('\n', file);
1983 }
1984
1985
1986
1987 /* convert the rules into the representation using rrhs, rlhs and ritems.  */
1988
1989 void
1990 packgram()
1991 {
1992   register int itemno;
1993   register int ruleno;
1994   register symbol_list *p;
1995 /*  register bucket *bp; JF unused */
1996
1997   bucket *ruleprec;
1998
1999   ritem = NEW2(nitems + 1, short);
2000   rlhs = NEW2(nrules, short) - 1;
2001   rrhs = NEW2(nrules, short) - 1;
2002   rprec = NEW2(nrules, short) - 1;
2003   rprecsym = NEW2(nrules, short) - 1;
2004   rassoc = NEW2(nrules, short) - 1;
2005
2006   itemno = 0;
2007   ruleno = 1;
2008
2009   p = grammar;
2010   while (p)
2011     {
2012       rlhs[ruleno] = p->sym->value;
2013       rrhs[ruleno] = itemno;
2014       ruleprec = p->ruleprec;
2015
2016       p = p->next;
2017       while (p && p->sym)
2018         {
2019           ritem[itemno++] = p->sym->value;
2020           /* A rule gets by default the precedence and associativity
2021              of the last token in it.  */
2022           if (p->sym->class == STOKEN)
2023             {
2024               rprec[ruleno] = p->sym->prec;
2025               rassoc[ruleno] = p->sym->assoc;
2026             }
2027           if (p) p = p->next;
2028         }
2029
2030       /* If this rule has a %prec,
2031          the specified symbol's precedence replaces the default.  */
2032       if (ruleprec)
2033         {
2034           rprec[ruleno] = ruleprec->prec;
2035           rassoc[ruleno] = ruleprec->assoc;
2036           rprecsym[ruleno] = ruleprec->value;
2037         }
2038
2039       ritem[itemno++] = -ruleno;
2040       ruleno++;
2041
2042       if (p) p = p->next;
2043     }
2044
2045   ritem[itemno] = 0;
2046 }
2047 \f
2048 /* Read a signed integer from STREAM and return its value.  */
2049
2050 int
2051 read_signed_integer (stream)
2052      FILE *stream;
2053 {
2054   register int c = getc(stream);
2055   register int sign = 1;
2056   register int n;
2057
2058   if (c == '-')
2059     {
2060       c = getc(stream);
2061       sign = -1;
2062     }
2063   n = 0;
2064   while (isdigit(c))
2065     {
2066       n = 10*n + (c - '0');
2067       c = getc(stream);
2068     }
2069
2070   ungetc(c, stream);
2071
2072   return n * sign;
2073 }