]>
Commit | Line | Data |
---|---|---|
1 | /* Definitions for symtab.c and callers, part of Bison. | |
2 | ||
3 | Copyright (C) 1984, 1989, 1992, 2000-2002, 2004-2013 Free Software | |
4 | Foundation, Inc. | |
5 | ||
6 | This file is part of Bison, the GNU Compiler Compiler. | |
7 | ||
8 | This program is free software: you can redistribute it and/or modify | |
9 | it under the terms of the GNU General Public License as published by | |
10 | the Free Software Foundation, either version 3 of the License, or | |
11 | (at your option) any later version. | |
12 | ||
13 | This program is distributed in the hope that it will be useful, | |
14 | but WITHOUT ANY WARRANTY; without even the implied warranty of | |
15 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
16 | GNU General Public License for more details. | |
17 | ||
18 | You should have received a copy of the GNU General Public License | |
19 | along with this program. If not, see <http://www.gnu.org/licenses/>. */ | |
20 | ||
21 | /** | |
22 | * \file symtab.h | |
23 | * \brief Manipulating ::symbol. | |
24 | */ | |
25 | ||
26 | #ifndef SYMTAB_H_ | |
27 | # define SYMTAB_H_ | |
28 | ||
29 | # include "assoc.h" | |
30 | # include "location.h" | |
31 | # include "scan-code.h" | |
32 | # include "uniqstr.h" | |
33 | ||
34 | /*----------. | |
35 | | Symbols. | | |
36 | `----------*/ | |
37 | ||
38 | /** Symbol classes: terminal, non-terminal, or undefined. */ | |
39 | typedef enum | |
40 | { | |
41 | unknown_sym, /**< Undefined. */ | |
42 | token_sym, /**< Terminal. */ | |
43 | nterm_sym /**< Non-terminal. */ | |
44 | } symbol_class; | |
45 | ||
46 | ||
47 | /** Internal token numbers (the type of symbol::number). */ | |
48 | typedef int symbol_number; | |
49 | # define SYMBOL_NUMBER_MAXIMUM INT_MAX /* Largest value a symbol_number can hold. */ | |
50 | ||
51 | ||
52 | typedef struct symbol symbol; /* Forward declaration; struct symbol is defined below. */ | |
53 | ||
54 | /* Declaration status of a symbol (also used for semantic types). | |
55 | ||
56 | First, it is "undeclared". Then, if "undeclared" and used in a | |
57 | %printer/%destructor, it is "used". If not "declared" but used in | |
58 | a rule, it is "needed". Finally, if declared (via a rule for | |
59 | nonterminals, or %token), it is "declared". | |
60 | ||
61 | When statuses are checked at the end, "declared" symbols are fine, | |
62 | "used" symbols trigger warnings, and any other status is an error. */ | |
63 | ||
64 | typedef enum | |
65 | { | |
66 | /** Used in the input file for an unknown reason (error). */ | |
67 | undeclared, | |
68 | /** Used by %destructor/%printer but not defined (warning). */ | |
69 | used, | |
70 | /** Used in the grammar (rules) but not defined (error). */ | |
71 | needed, | |
72 | /** Defined with %type or %token (good). */ | |
73 | declared, | |
74 | } status; | |
75 | ||
76 | typedef enum code_props_type code_props_type; /* Kind of code property: \%destructor or \%printer. */ | |
77 | enum code_props_type | |
78 | { | |
79 | destructor = 0, /**< A \c \%destructor. */ | |
80 | printer = 1, /**< A \c \%printer. */ | |
81 | }; | |
82 | ||
83 | enum { CODE_PROPS_SIZE = 2 }; /* Size of the \c props arrays in symbol and semantic_type. */ | |
84 | ||
85 | /* When extending this structure, be sure to complete | |
86 | symbol_check_alias_consistency. */ | |
87 | struct symbol | |
88 | { | |
89 | /** The key, name of the symbol. */ | |
90 | uniqstr tag; | |
91 | /** The location of its first occurrence. */ | |
92 | location location; | |
93 | ||
94 | /** Its \c \%type. | |
95 | ||
96 | Beware that this is the type_name as was entered by the user, | |
97 | including silly things such as "]" if she entered "%token <]> t". | |
98 | Therefore, when outputting type_name to M4, be sure to escape it | |
99 | into "@}". See quoted_output for instance. */ | |
100 | uniqstr type_name; | |
101 | ||
102 | /** Its \c \%type's location. */ | |
103 | location type_location; | |
104 | ||
105 | /** Any \c \%destructor (resp. \%printer) declared specifically for this | |
106 | symbol. | |
107 | ||
108 | Access this field only through <tt>symbol</tt>'s interface functions. For | |
109 | example, if no \c \%destructor (resp. \%printer) was declared for this | |
110 | symbol, a default or a per-type one may apply instead; | |
111 | \c symbol_code_props_get will compute the correct one. */ | |
112 | code_props props[CODE_PROPS_SIZE]; | |
113 | ||
114 | symbol_number number; /**< Internal symbol number. */ | |
115 | location prec_location; /**< Location associated with \c prec -- presumably that of the precedence declaration; confirm. */ | |
116 | int prec; /**< Precedence (see symbol_precedence_set). */ | |
117 | assoc assoc; /**< Associativity (see symbol_precedence_set). */ | |
118 | int user_token_number; /**< User token number, or one of the USER_NUMBER_* special values. */ | |
119 | ||
120 | /* Points to the other in the symbol-string pair for an alias. | |
121 | The symbol half of such a pair has its user_token_number set to | |
122 | the special value USER_NUMBER_HAS_STRING_ALIAS. */ | |
123 | symbol *alias; | |
124 | symbol_class class; /**< Terminal, non-terminal, or undefined. */ | |
125 | status status; /**< Declaration status. */ | |
126 | }; | |
127 | ||
128 | /** Undefined user number. NOTE(review): unlike NUMBER_UNDEFINED, this expansion and that of USER_NUMBER_HAS_STRING_ALIAS are not parenthesized. */ | |
129 | # define USER_NUMBER_UNDEFINED -1 | |
130 | ||
131 | /* 'symbol->user_token_number == USER_NUMBER_HAS_STRING_ALIAS' means | |
132 | this symbol has a literal string alias. For instance, '%token foo | |
133 | "foo"' has '"foo"' numbered regularly, and 'foo' numbered as | |
134 | USER_NUMBER_HAS_STRING_ALIAS. */ | |
135 | # define USER_NUMBER_HAS_STRING_ALIAS -9991 | |
136 | ||
137 | /** Undefined internal token number (see symbol_number). */ | |
138 | # define NUMBER_UNDEFINED (-1) | |
139 | ||
140 | /** Fetch (or create) the symbol associated to KEY. */ | |
141 | symbol *symbol_from_uniqstr (const uniqstr key, location loc); | |
142 | ||
143 | /** Fetch (or create) the symbol associated to KEY. */ | |
144 | symbol *symbol_get (const char *key, location loc); | |
145 | ||
146 | /** Generate a dummy nonterminal. | |
147 | ||
148 | Its name cannot conflict with the user's names. */ | |
149 | symbol *dummy_symbol_get (location loc); | |
150 | ||
151 | ||
152 | /*--------------------. | |
153 | | Methods on symbol. | | |
154 | `--------------------*/ | |
155 | ||
156 | /** Print a symbol (for debugging). */ | |
157 | void symbol_print (symbol const *s, FILE *f); | |
158 | ||
159 | /** Is this a dummy nonterminal? */ | |
160 | bool symbol_is_dummy (const symbol *sym); | |
161 | ||
162 | /** The name of the code_props type: "\%destructor" or "\%printer". */ | |
163 | char const *code_props_type_string (code_props_type kind); | |
164 | ||
165 | /** The name of the symbol that can be used as an identifier. | |
166 | ** Consider the alias if needed. | |
167 | ** Return 0 if there is none (e.g., the symbol is only defined as | |
168 | ** a string). */ | |
169 | uniqstr symbol_id_get (symbol const *sym); | |
170 | ||
171 | /** | |
172 | * Make \c str the literal string alias of \c sym. Copy token number, | |
173 | * symbol number, and type from \c sym to \c str. | |
174 | */ | |
175 | void symbol_make_alias (symbol *sym, symbol *str, location loc); | |
176 | ||
177 | /** Set the \c type_name associated with \c sym. | |
178 | ||
179 | Do nothing if passed 0 as \c type_name. */ | |
180 | void symbol_type_set (symbol *sym, uniqstr type_name, location loc); | |
181 | ||
182 | /** Set the \c \%destructor or \c \%printer associated with \c sym. */ | |
183 | void symbol_code_props_set (symbol *sym, code_props_type kind, | |
184 | code_props const *destructor); | |
185 | ||
186 | /** Get the computed \c \%destructor or \c \%printer for \c sym, which was | |
187 | initialized with \c code_props_none_init if there's no \c \%destructor or | |
188 | \c \%printer. */ | |
189 | code_props *symbol_code_props_get (symbol *sym, code_props_type kind); | |
190 | ||
191 | /** Set the \c precedence associated with \c sym. | |
192 | ||
193 | Ensure that \a sym is a terminal. | |
194 | Do nothing if invoked with \c undef_assoc as \c assoc. */ | |
195 | void symbol_precedence_set (symbol *sym, int prec, assoc a, location loc); | |
196 | ||
197 | /** Set the \c class associated with \c sym. */ | |
198 | void symbol_class_set (symbol *sym, symbol_class class, location loc, | |
199 | bool declaring); | |
200 | ||
201 | /** Set the \c user_token_number associated with \c sym. */ | |
202 | void symbol_user_token_number_set (symbol *sym, int user_number, location loc); | |
203 | ||
204 | ||
205 | ||
206 | /*------------------. | |
207 | | Special symbols. | | |
208 | `------------------*/ | |
209 | ||
210 | /** The error token. */ | |
211 | extern symbol *errtoken; | |
212 | /** The token for unknown tokens. */ | |
213 | extern symbol *undeftoken; | |
214 | /** The end of input token. */ | |
215 | extern symbol *endtoken; | |
216 | /** The genuine start symbol. | |
217 | ||
218 | $accept: start-symbol $end */ | |
219 | extern symbol *accept; | |
220 | ||
221 | /** The user start symbol. */ | |
222 | extern symbol *startsymbol; | |
223 | /** The location of the \c \%start declaration. */ | |
224 | extern location startsymbol_location; | |
225 | ||
226 | ||
227 | ||
228 | /*-------------------. | |
229 | | Symbol Relations. | | |
230 | `-------------------*/ | |
231 | ||
232 | /* The symbol relations are represented by a directed graph. */ | |
233 | ||
234 | /* The id of a node of the symbol relation graph. */ | |
235 | typedef int graphid; | |
236 | ||
237 | typedef struct symgraphlink symgraphlink; /* Element of the succ/pred lists of a symgraph node. */ | |
238 | ||
239 | struct symgraphlink | |
240 | { | |
241 | /** The second \c symbol or group of a precedence relation. | |
242 | * See \c symgraph. */ | |
243 | graphid id; | |
244 | ||
245 | symgraphlink *next; /**< Next link in the list. */ | |
246 | }; | |
247 | ||
248 | /* Node of the symbol precedence graph, which stores the used precedence | |
249 | * relations between symbols. */ | |
250 | ||
251 | typedef struct symgraph symgraph; | |
252 | ||
253 | struct symgraph | |
254 | { | |
255 | /** Identifier for the node: equal to the number of the symbol. */ | |
256 | graphid id; | |
257 | ||
258 | /** The list of related symbols that have a smaller precedence. */ | |
259 | symgraphlink *succ; | |
260 | ||
261 | /** The list of related symbols that have a greater precedence. */ | |
262 | symgraphlink *pred; | |
263 | }; | |
264 | ||
265 | /** Register a new precedence relation as used. */ | |
266 | ||
267 | void register_precedence (graphid first, graphid snd); | |
268 | ||
269 | /** Print a warning for each symbol whose precedence and/or associativity | |
270 | * is useless. */ | |
271 | ||
272 | void print_precedence_warnings (void); | |
273 | ||
274 | /*----------------------. | |
275 | | Symbol associativity | | |
276 | `----------------------*/ | |
277 | ||
278 | void register_assoc (graphid i, graphid j); | |
279 | ||
280 | /*-----------------. | |
281 | | Semantic types. | | |
282 | `-----------------*/ | |
283 | ||
284 | /** A semantic type and its associated \c \%destructor and \c \%printer. | |
285 | ||
286 | Access the fields of this struct only through the interface functions in | |
287 | this file. \sa symbol::props */ | |
288 | typedef struct { | |
289 | /** The key, name of the semantic type. */ | |
290 | uniqstr tag; | |
291 | ||
292 | /** The location of its first occurrence. */ | |
293 | location location; | |
294 | ||
295 | /** Its status: "undeclared", "used" or "declared". | |
296 | It cannot be "needed". */ | |
297 | status status; | |
298 | ||
299 | /** Any \c \%destructor and \c \%printer declared for this | |
300 | semantic type. */ | |
301 | code_props props[CODE_PROPS_SIZE]; | |
302 | ||
303 | } semantic_type; | |
304 | ||
305 | /** Fetch (or create) the semantic type associated to KEY. */ | |
306 | semantic_type *semantic_type_from_uniqstr (const uniqstr key, | |
307 | const location *loc); | |
308 | ||
309 | /** Fetch (or create) the semantic type associated to KEY. */ | |
310 | semantic_type *semantic_type_get (const char *key, const location *loc); | |
311 | ||
312 | /** Set the \c \%destructor or \c \%printer associated with \c type. */ | |
313 | void semantic_type_code_props_set (semantic_type *type, | |
314 | code_props_type kind, | |
315 | code_props const *code); | |
316 | ||
317 | /*----------------------------------. | |
318 | | Symbol and semantic type tables. | | |
319 | `----------------------------------*/ | |
320 | ||
321 | /** Create the symbol and semantic type tables. */ | |
322 | void symbols_new (void); | |
323 | ||
324 | /** Free all the memory allocated for symbols and semantic types. */ | |
325 | void symbols_free (void); | |
326 | ||
327 | /** Check that all the symbols are defined. | |
328 | ||
329 | Report any undefined symbols and consider them nonterminals. */ | |
330 | void symbols_check_defined (void); | |
331 | ||
332 | /** Sanity checks and #token_translations construction. | |
333 | ||
334 | Perform various sanity checks, assign symbol numbers, and set up | |
335 | #token_translations. */ | |
336 | void symbols_pack (void); | |
337 | ||
338 | #endif /* !SYMTAB_H_ */ |