]>
Commit | Line | Data |
---|---|---|
d0fb370f | 1 | /* Type definitions for nondeterministic finite state machine for bison, |
d954473d | 2 | Copyright 1984, 1989, 2000, 2001 Free Software Foundation, Inc. |
d0fb370f | 3 | |
a70083a3 | 4 | This file is part of Bison, the GNU Compiler Compiler. |
d0fb370f | 5 | |
a70083a3 AD |
6 | Bison is free software; you can redistribute it and/or modify |
7 | it under the terms of the GNU General Public License as published by | |
8 | the Free Software Foundation; either version 2, or (at your option) | |
9 | any later version. | |
d0fb370f | 10 | |
a70083a3 AD |
11 | Bison is distributed in the hope that it will be useful, |
12 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
13 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
14 | GNU General Public License for more details. | |
d0fb370f | 15 | |
a70083a3 AD |
16 | You should have received a copy of the GNU General Public License |
17 | along with Bison; see the file COPYING. If not, write to | |
18 | the Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
19 | Boston, MA 02111-1307, USA. */ | |
d0fb370f RS |
20 | |
21 | ||
22 | /* These type definitions are used to represent a nondeterministic | |
a70083a3 AD |
23 | finite state machine that parses the specified grammar. This |
24 | information is generated by the function generate_states in the | |
25 | file LR0. | |
26 | ||
27 | Each state of the machine is described by a set of items -- | |
28 | particular positions in particular rules -- that are the possible | |
29 | places where parsing could continue when the machine is in this | |
30 | state. The symbols at these items are the allowable inputs that | |
31 | can follow now. | |
32 | ||
33 | A core represents one state. States are numbered in the number | |
34 | field. When generate_states is finished, the starting state is | |
35 | state 0 and nstates is the number of states. (A transition to a | |
36 | state whose state number is nstates indicates termination.) All | |
37 | the cores are chained together and first_state points to the first | |
38 | one (state 0). | |
39 | ||
40 | For each state there is a particular symbol which must have been | |
41 | the last thing accepted to reach that state. It is the | |
42 | accessing_symbol of the core. | |
43 | ||
44 | Each core contains a vector of nitems items which are the indices | |
45 | in the ritems vector of the items that are selected in this state. | |
46 | ||
47 | The link field is used for chaining buckets that hash states by | |
48 | their itemsets. This is for recognizing equivalent states and | |
49 | combining them when the states are generated. | |
50 | ||
51 | The two types of transitions are shifts (push the lookahead token | |
52 | and read another) and reductions (combine the last n things on the | |
53 | stack via a rule, replace them with the symbol that the rule | |
54 | derives, and leave the lookahead token alone). When the states are | |
55 | generated, these transitions are represented in two other lists. | |
56 | ||
57 | Each shifts structure describes the possible shift transitions out | |
58 | of one state, the state whose number is in the number field. The | |
59 | shifts structures are linked through next and first_shift points to | |
60 | them. Each contains a vector of numbers of the states that shift | |
61 | transitions can go to. The accessing_symbol fields of those | |
62 | states' cores say what kind of input leads to them. | |
63 | ||
64 | A shift to state zero should be ignored. Conflict resolution | |
65 | deletes shifts by changing them to zero. | |
66 | ||
67 | Each reductions structure describes the possible reductions at the | |
68 | state whose number is in the number field. The data is a list of | |
69 | nreds rules, represented by their rule numbers. first_reduction | |
70 | points to the list of these structures. | |
71 | ||
72 | Conflict resolution can decide that certain tokens in certain | |
73 | states should explicitly be errors (for implementing %nonassoc). | |
74 | For each state, the tokens that are errors for this reason are | |
75 | recorded in an errs structure, which is reached through the errs | |
76 | field of its state. The errs structure holds nerrs token | |
77 | numbers. | |
78 | ||
79 | There is at least one shift transition present in state zero. It | |
80 | leads to a next-to-final state whose accessing_symbol is the | |
81 | grammar's start symbol. The next-to-final state has one shift to | |
82 | the final state, whose accessing_symbol is zero (end of input). | |
83 | The final state has one shift, which goes to the termination state | |
84 | (whose number is nstates-1). The reason for the extra state at the | |
85 | end is to placate the parser's strategy of making all decisions one | |
86 | token ahead of its actions. */ | |
87 | ||
88 | #ifndef STATE_H_ | |
89 | # define STATE_H_ | |
90 | ||
aa2aab3c | 91 | |
aa2aab3c AD |
92 | /*---------. |
93 | | Shifts. | | |
94 | `---------*/ | |
95 | ||
/* The shift transitions out of one state.

   NEXT links the shifts structures together, NUMBER is the number of
   the state the transitions leave, and SHIFTS holds NSHIFTS
   destination state numbers.  SHIFTS is declared with a single slot;
   SHIFTS_ALLOC over-allocates the structure so that the vector can
   hold NSHIFTS entries.  */

typedef struct shifts
{
  struct shifts *next;
  short number;
  short nshifts;
  short shifts[1];
} shifts;


/* Allocate, through xcalloc, a shifts structure whose trailing vector
   has room for NSHIFTS entries.  One slot is already counted in
   sizeof (shifts), hence the `- 1'.

   The argument and the whole expansion are parenthesized so that any
   expression may be passed as NSHIFTS and so that the result may be
   used directly as an operand, e.g. `SHIFTS_ALLOC (n)->nshifts'.  */

#define SHIFTS_ALLOC(Nshifts)                                           \
  ((shifts *) xcalloc ((unsigned) (sizeof (shifts)                      \
                                   + ((Nshifts) - 1) * sizeof (short)), 1))
a70083a3 | 108 | |
d954473d AD |
109 | shifts * shifts_new PARAMS ((int n)); |
110 | ||
111 | ||
/* The symbol labelling the transition SHIFTS->shifts[Shift], i.e. the
   accessing_symbol of the destination state as looked up in
   state_table.  It can be a token (the error token included) or, in
   the case of a goto, a nonterminal.

   Both arguments are parenthesized so that arbitrary expressions
   (`&obj', `i + 1', a conditional...) can be passed.  */

#define SHIFT_SYMBOL(Shifts, Shift) \
  (state_table[(Shifts)->shifts[(Shift)]]->accessing_symbol)

/* Is SHIFTS->shifts[Shift] a real shift, i.e. is its symbol a token
   (as opposed to a goto)?  */

#define SHIFT_IS_SHIFT(Shifts, Shift) \
  (ISTOKEN (SHIFT_SYMBOL (Shifts, Shift)))

/* Is SHIFTS->shifts[Shift] a goto?  */

#define SHIFT_IS_GOTO(Shifts, Shift) \
  (!SHIFT_IS_SHIFT (Shifts, Shift))

/* Is SHIFTS->shifts[Shift] the handling of the error token?  */

#define SHIFT_IS_ERROR(Shifts, Shift) \
  (SHIFT_SYMBOL (Shifts, Shift) == error_token_number)
aa2aab3c | 133 | |
/* When a shift/reduce conflict is resolved in favor of the reduction,
   the shift is disabled.  A disabled shift is represented by a
   destination of state 0, so disabling stores 0 in the slot and the
   predicate compares the slot against 0.

   Both arguments are parenthesized so that arbitrary expressions can
   be passed (e.g. `SHIFT_DISABLE (&obj, i + 1)').  */

#define SHIFT_DISABLE(Shifts, Shift) \
  ((Shifts)->shifts[(Shift)] = 0)

#define SHIFT_IS_DISABLED(Shifts, Shift) \
  ((Shifts)->shifts[(Shift)] == 0)
142 | ||
aa2aab3c AD |
143 | |
144 | /*-------. | |
145 | | Errs. | | |
146 | `-------*/ | |
a70083a3 AD |
147 | |
/* The tokens that conflict resolution turned into explicit errors in
   one state.  ERRS holds NERRS token numbers; it is declared with a
   single slot and over-allocated by ERRS_ALLOC.  */

typedef struct errs
{
  short nerrs;
  short errs[1];
} errs;

/* Allocate, through xcalloc, an errs structure whose trailing vector
   has room for NERRS entries.  One slot is already counted in
   sizeof (errs), hence the `- 1'.

   The argument and the whole expansion are parenthesized so that any
   expression may be passed as NERRS and so that the result may be
   used directly as an operand.  */

#define ERRS_ALLOC(Nerrs)                                               \
  ((errs *) xcalloc ((unsigned) (sizeof (errs)                          \
                                 + ((Nerrs) - 1) * sizeof (short)), 1))
157 | ||
a70083a3 | 158 | |
aa2aab3c AD |
159 | /*-------------. |
160 | | Reductions. | | |
161 | `-------------*/ | |
a70083a3 AD |
162 | |
/* The possible reductions in one state.

   NEXT links the reductions structures together, NUMBER is the number
   of the state they belong to, and RULES holds NREDS rule numbers.
   RULES is declared with a single slot and over-allocated by
   REDUCTIONS_ALLOC.  */

typedef struct reductions
{
  struct reductions *next;
  short number;
  short nreds;
  short rules[1];
} reductions;

/* Allocate, through xcalloc, a reductions structure whose trailing
   vector has room for NREDUCTIONS entries.  One slot is already
   counted in sizeof (reductions), hence the `- 1'.

   The argument and the whole expansion are parenthesized so that any
   expression may be passed as NREDUCTIONS and so that the result may
   be used directly as an operand.  */

#define REDUCTIONS_ALLOC(Nreductions)                                   \
  ((reductions *) xcalloc ((unsigned) (sizeof (reductions)              \
                                       + ((Nreductions) - 1)            \
                                         * sizeof (short)), 1))
174 | ||
f693ad14 AD |
175 | |
176 | ||
177 | /*----------. | |
178 | | State_t. | | |
179 | `----------*/ | |
180 | ||
/* One state of the automaton.

   The shifts, reductions and errs members are declared through their
   struct tags (the same types as the typedef names) so that this
   definition does not depend on the typedefs being in scope.  */

typedef struct state_s
{
  /* NEXT chains the states together; LINK chains the states that
     fall in the same hash bucket (see the introductory comment of
     this file).  */
  struct state_s *next;
  struct state_s *link;

  /* The state number, and the symbol that must have been accepted
     last to reach this state.  */
  short number;
  short accessing_symbol;

  /* The transitions, reductions and explicit errors of this state.  */
  struct shifts *shifts;
  struct reductions *reductions;
  struct errs *errs;

  /* Nonzero if no lookahead is needed to decide what to do in state S.  */
  char consistent;

  /* Used in LALR, not LR(0).  */
  short lookaheads;

  /* Its items: NITEMS entries in ITEMS, which is declared with a
     single slot and over-allocated by STATE_ALLOC.  */
  short nitems;
  short items[1];
} state_t;

/* Allocate, through xcalloc, a state_t whose trailing item vector has
   room for NITEMS entries.  One slot is already counted in
   sizeof (state_t), hence the `- 1'.

   The argument and the whole expansion are parenthesized so that any
   expression may be passed as NITEMS and so that the result may be
   used directly as an operand.  */

#define STATE_ALLOC(Nitems)                                             \
  ((state_t *) xcalloc ((unsigned) (sizeof (state_t)                    \
                                    + ((Nitems) - 1) * sizeof (short)), 1))
206 | ||
a70083a3 | 207 | #endif /* !STATE_H_ */ |