1 /* Compute lookahead criteria for Bison. 
   3    Copyright (C) 1984, 1986, 1989, 2000, 2001, 2002, 2003, 2004, 2005, 
   4    2006, 2007, 2008, 2009 Free Software Foundation, Inc. 
   6    This file is part of Bison, the GNU Compiler Compiler. 
   8    This program is free software: you can redistribute it and/or modify 
   9    it under the terms of the GNU General Public License as published by 
  10    the Free Software Foundation, either version 3 of the License, or 
  11    (at your option) any later version. 
  13    This program is distributed in the hope that it will be useful, 
  14    but WITHOUT ANY WARRANTY; without even the implied warranty of 
  15    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the 
  16    GNU General Public License for more details. 
  18    You should have received a copy of the GNU General Public License 
  19    along with this program.  If not, see <http://www.gnu.org/licenses/>.  */ 
  22 /* Compute how to make the finite state machine deterministic; find 
  23    which rules need lookahead in each state, and which lookahead 
  24    tokens they accept.  */ 
  39 #include "muscle_tab.h" 
  45 goto_number 
*goto_map
; 
  46 static goto_number ngotos
; 
  47 state_number 
*from_state
; 
  48 state_number 
*to_state
; 
  50 /* Linked list of goto numbers.  */ 
  51 typedef struct goto_list
 
  53   struct goto_list 
*next
; 
  58 /* LA is an NLA by NTOKENS matrix of bits.  LA[l, i] is 1 if the rule 
  59    LArule[l] is applicable in the appropriate state when the next 
  60    token is symbol i.  If LA[l, i] and LA[l, j] are both 1 for i != j, 
        it is a conflict.  */ 
  63 static bitsetv LA 
= NULL
; 
  67 /* And for the famous F variable, whose name is so descriptive that a 
  68    comment is hardly needed.  <grin>.  */ 
  69 static bitsetv F 
= NULL
; 
  71 static goto_number 
**includes
; 
  72 static goto_list 
**lookback
; 
  81   goto_number 
*temp_map
; 
  83   goto_map 
= xcalloc (nvars 
+ 1, sizeof *goto_map
); 
  84   temp_map 
= xnmalloc (nvars 
+ 1, sizeof *temp_map
); 
  87   for (s 
= 0; s 
< nstates
; ++s
) 
  89       transitions 
*sp 
= states
[s
]->transitions
; 
  91       for (i 
= sp
->num 
- 1; i 
>= 0 && TRANSITION_IS_GOTO (sp
, i
); --i
) 
  95           /* Abort if (ngotos + 1) would overflow.  */ 
  96           aver (ngotos 
!= GOTO_NUMBER_MAXIMUM
); 
  98           goto_map
[TRANSITION_SYMBOL (sp
, i
) - ntokens
]++; 
 105     for (i 
= ntokens
; i 
< nsyms
; i
++) 
 107         temp_map
[i 
- ntokens
] = k
; 
 108         k 
+= goto_map
[i 
- ntokens
]; 
 111     for (i 
= ntokens
; i 
< nsyms
; i
++) 
 112       goto_map
[i 
- ntokens
] = temp_map
[i 
- ntokens
]; 
 114     goto_map
[nsyms 
- ntokens
] = ngotos
; 
 115     temp_map
[nsyms 
- ntokens
] = ngotos
; 
 118   from_state 
= xcalloc (ngotos
, sizeof *from_state
); 
 119   to_state 
= xcalloc (ngotos
, sizeof *to_state
); 
 121   for (s 
= 0; s 
< nstates
; ++s
) 
 123       transitions 
*sp 
= states
[s
]->transitions
; 
 125       for (i 
= sp
->num 
- 1; i 
>= 0 && TRANSITION_IS_GOTO (sp
, i
); --i
) 
 127           goto_number k 
= temp_map
[TRANSITION_SYMBOL (sp
, i
) - ntokens
]++; 
 129           to_state
[k
] = sp
->states
[i
]->number
; 
 138 /*----------------------------------------------------------. 
 139 | Map a state/symbol pair into its numeric representation.  | 
 140 `----------------------------------------------------------*/ 
 143 map_goto (state_number s0
, symbol_number sym
) 
 150   low 
= goto_map
[sym 
- ntokens
]; 
 151   high 
= goto_map
[sym 
- ntokens 
+ 1] - 1; 
 156       middle 
= (low 
+ high
) / 2; 
 157       s 
= from_state
[middle
]; 
 171   goto_number 
**reads 
= xnmalloc (ngotos
, sizeof *reads
); 
 172   goto_number 
*edge 
= xnmalloc (ngotos 
+ 1, sizeof *edge
); 
 173   goto_number nedges 
= 0; 
 177   F 
= bitsetv_create (ngotos
, ntokens
, BITSET_FIXED
); 
 179   for (i 
= 0; i 
< ngotos
; i
++) 
 181       state_number stateno 
= to_state
[i
]; 
 182       transitions 
*sp 
= states
[stateno
]->transitions
; 
 185       FOR_EACH_SHIFT (sp
, j
) 
 186         bitset_set (F
[i
], TRANSITION_SYMBOL (sp
, j
)); 
 188       for (; j 
< sp
->num
; j
++) 
 190           symbol_number sym 
= TRANSITION_SYMBOL (sp
, j
); 
 191           if (nullable
[sym 
- ntokens
]) 
 192             edge
[nedges
++] = map_goto (stateno
, sym
); 
 199           reads
[i
] = xnmalloc (nedges 
+ 1, sizeof reads
[i
][0]); 
 200           memcpy (reads
[i
], edge
, nedges 
* sizeof edge
[0]); 
 201           reads
[i
][nedges
] = END_NODE
; 
 206   relation_digraph (reads
, ngotos
, &F
); 
 208   for (i 
= 0; i 
< ngotos
; i
++) 
 217 add_lookback_edge (state 
*s
, rule 
*r
, goto_number gotono
) 
 219   int ri 
= state_reduction_find (s
, r
); 
 220   goto_list 
*sp 
= xmalloc (sizeof *sp
); 
 221   sp
->next 
= lookback
[(s
->reductions
->lookahead_tokens 
- LA
) + ri
]; 
 223   lookback
[(s
->reductions
->lookahead_tokens 
- LA
) + ri
] = sp
; 
 229 build_relations (void) 
 231   goto_number 
*edge 
= xnmalloc (ngotos 
+ 1, sizeof *edge
); 
 232   state_number 
*states1 
= xnmalloc (ritem_longest_rhs () + 1, sizeof *states1
); 
 235   includes 
= xnmalloc (ngotos
, sizeof *includes
); 
 237   for (i 
= 0; i 
< ngotos
; i
++) 
 240       symbol_number symbol1 
= states
[to_state
[i
]]->accessing_symbol
; 
 243       for (rulep 
= derives
[symbol1 
- ntokens
]; *rulep
; rulep
++) 
 247           item_number 
const *rp
; 
 248           state 
*s 
= states
[from_state
[i
]]; 
 249           states1
[0] = s
->number
; 
 251           for (rp 
= (*rulep
)->rhs
; ! item_number_is_rule_number (*rp
); rp
++) 
 253               s 
= transitions_to (s
->transitions
, 
 254                                   item_number_as_symbol_number (*rp
)); 
 255               states1
[length
++] = s
->number
; 
 259             add_lookback_edge (s
, *rulep
, i
); 
 266               /* Each rhs ends in a rule number, and there is a 
 267                  sentinel before the first rhs, so it is safe to 
 268                  decrement RP here.  */ 
 272                   /* Downcasting from item_number to symbol_number.  */ 
 273                   edge
[nedges
++] = map_goto (states1
[--length
], 
 274                                              item_number_as_symbol_number (*rp
)); 
 275                   if (nullable
[*rp 
- ntokens
]) 
 286           includes
[i
] = xnmalloc (nedges 
+ 1, sizeof includes
[i
][0]); 
 287           for (j 
= 0; j 
< nedges
; j
++) 
 288             includes
[i
][j
] = edge
[j
]; 
 289           includes
[i
][nedges
] = END_NODE
; 
 296   relation_transpose (&includes
, ngotos
); 
 302 compute_FOLLOWS (void) 
 306   relation_digraph (includes
, ngotos
, &F
); 
 308   for (i 
= 0; i 
< ngotos
; i
++) 
 316 compute_lookahead_tokens (void) 
 321   for (i 
= 0; i 
< nLA
; i
++) 
 322     for (sp 
= lookback
[i
]; sp
; sp 
= sp
->next
) 
 323       bitset_or (LA
[i
], LA
[i
], F
[sp
->value
]); 
 326   for (i 
= 0; i 
< nLA
; i
++) 
 327     LIST_FREE (goto_list
, lookback
[i
]); 
 334 /*----------------------------------------------------. 
 335 | Count the number of lookahead tokens required for S | 
 336 | (N_LOOKAHEAD_TOKENS member).                        | 
 337 `----------------------------------------------------*/ 
 340 state_lookahead_tokens_count (state 
*s
, bool default_rule_only_for_accept
) 
 342   int n_lookahead_tokens 
= 0; 
 343   reductions 
*rp 
= s
->reductions
; 
 344   transitions 
*sp 
= s
->transitions
; 
 346   /* Transitions are only disabled during conflict resolution, and that 
 347      hasn't happened yet, so there should be no need to check that 
 348      transition 0 hasn't been disabled before checking if it is a shift. 
 349      However, this check was performed at one time, so we leave it as an 
          aver.  */ 
 351   aver (sp
->num 
== 0 || !TRANSITION_IS_DISABLED (sp
, 0)); 
 353   /* We need a lookahead either to distinguish different reductions 
 354      (i.e., there are two or more), or to distinguish a reduction from a 
 355      shift.  Otherwise, it is straightforward, and the state is 
 356      `consistent'.  However, for states that have any rules, treat only 
 357      the accepting state as consistent (since there is never a lookahead 
 358      token that makes sense there, and so no lookahead token should be 
 359      read) if the user has otherwise disabled default rules.  */ 
 361       || (rp
->num 
== 1 && sp
->num 
&& TRANSITION_IS_SHIFT (sp
, 0)) 
 362       || (rp
->num 
== 1 && rp
->rules
[0]->number 
!= 0 
 363           && default_rule_only_for_accept
)) 
 364     n_lookahead_tokens 
+= rp
->num
; 
 368   return n_lookahead_tokens
; 
 372 /*----------------------------------------------------. 
 373 | Compute LA, NLA, and the lookahead_tokens members.  | 
 374 `----------------------------------------------------*/ 
 381   bool default_rule_only_for_accept
; 
 383     char *default_rules 
= muscle_percent_define_get ("lr.default_rules"); 
 384     default_rule_only_for_accept 
= 0 == strcmp (default_rules
, "accepting"); 
 385     free (default_rules
); 
 388   /* Compute the total number of reductions requiring a lookahead.  */ 
 390   for (i 
= 0; i 
< nstates
; i
++) 
 392       state_lookahead_tokens_count (states
[i
], default_rule_only_for_accept
); 
 393   /* Avoid having to special case 0.  */ 
 397   pLA 
= LA 
= bitsetv_create (nLA
, ntokens
, BITSET_FIXED
); 
 398   lookback 
= xcalloc (nLA
, sizeof *lookback
); 
 400   /* Initialize the members LOOKAHEAD_TOKENS for each state whose reductions 
 401      require lookahead tokens.  */ 
 402   for (i 
= 0; i 
< nstates
; i
++) 
 405         state_lookahead_tokens_count (states
[i
], default_rule_only_for_accept
); 
 408           states
[i
]->reductions
->lookahead_tokens 
= pLA
; 
 415 /*---------------------------------------------. 
 416 | Output the lookahead tokens for each state.  | 
 417 `---------------------------------------------*/ 
 420 lookahead_tokens_print (FILE *out
) 
 424   fprintf (out
, "Lookahead tokens: BEGIN\n"); 
 425   for (i 
= 0; i 
< nstates
; ++i
) 
 427       reductions 
*reds 
= states
[i
]->reductions
; 
 428       bitset_iterator iter
; 
 429       int n_lookahead_tokens 
= 0; 
 431       if (reds
->lookahead_tokens
) 
 432         for (k 
= 0; k 
< reds
->num
; ++k
) 
 433           if (reds
->lookahead_tokens
[k
]) 
 434             ++n_lookahead_tokens
; 
 436       fprintf (out
, "State %d: %d lookahead tokens\n", 
 437                i
, n_lookahead_tokens
); 
 439       if (reds
->lookahead_tokens
) 
 440         for (j 
= 0; j 
< reds
->num
; ++j
) 
 441           BITSET_FOR_EACH (iter
, reds
->lookahead_tokens
[j
], k
, 0) 
 443             fprintf (out
, "   on %d (%s) -> rule %d\n", 
 445                      reds
->rules
[j
]->number
); 
 448   fprintf (out
, "Lookahead tokens: END\n"); 
 459   compute_lookahead_tokens (); 
 461   if (trace_flag 
& trace_sets
) 
 462     lookahead_tokens_print (stderr
); 
 467 lalr_update_state_numbers (state_number old_to_new
[], state_number nstates_old
) 
 469   goto_number ngotos_reachable 
= 0; 
 470   symbol_number nonterminal 
= 0; 
 471   aver (nsyms 
== nvars 
+ ntokens
); 
 474     for (i 
= 0; i 
< ngotos
; ++i
) 
 476         while (i 
== goto_map
[nonterminal
]) 
 477           goto_map
[nonterminal
++] = ngotos_reachable
; 
 478         /* If old_to_new[from_state[i]] = nstates_old, remove this goto 
                entry.  */ 
 480         if (old_to_new
[from_state
[i
]] != nstates_old
) 
 482             /* from_state[i] is not removed, so it and thus to_state[i] are 
 483                reachable, so to_state[i] != nstates_old.  */ 
 484             aver (old_to_new
[to_state
[i
]] != nstates_old
); 
 485             from_state
[ngotos_reachable
] = old_to_new
[from_state
[i
]]; 
 486             to_state
[ngotos_reachable
] = old_to_new
[to_state
[i
]]; 
 491   while (nonterminal 
<= nvars
) 
 493       aver (ngotos 
== goto_map
[nonterminal
]); 
 494       goto_map
[nonterminal
++] = ngotos_reachable
; 
 496   ngotos 
= ngotos_reachable
; 
 504   for (s 
= 0; s 
< nstates
; ++s
) 
 505     states
[s
]->reductions
->lookahead_tokens 
= NULL
;