]>
Commit | Line | Data |
---|---|---|
2cc6b612 PE |
1 | /* Definitions for symtab.c and callers, part of Bison. |
2 | ||
7d6bad19 | 3 | Copyright (C) 1984, 1989, 1992, 2000-2002, 2004-2013 Free Software |
575619af | 4 | Foundation, Inc. |
f7d4d87a | 5 | |
340ef489 | 6 | This file is part of Bison, the GNU Compiler Compiler. |
f7d4d87a | 7 | |
f16b0819 | 8 | This program is free software: you can redistribute it and/or modify |
340ef489 | 9 | it under the terms of the GNU General Public License as published by |
f16b0819 PE |
10 | the Free Software Foundation, either version 3 of the License, or |
11 | (at your option) any later version. | |
f7d4d87a | 12 | |
f16b0819 | 13 | This program is distributed in the hope that it will be useful, |
340ef489 AD |
14 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
15 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
16 | GNU General Public License for more details. | |
f7d4d87a | 17 | |
340ef489 | 18 | You should have received a copy of the GNU General Public License |
f16b0819 | 19 | along with this program. If not, see <http://www.gnu.org/licenses/>. */ |
f7d4d87a | 20 | |
2073e1b6 AD |
21 | /** |
22 | * \file symtab.h | |
23 | * \brief Manipulating ::symbol. | |
24 | */ | |
25 | ||
340ef489 AD |
26 | #ifndef SYMTAB_H_ |
27 | # define SYMTAB_H_ | |
f7d4d87a | 28 | |
a945ec39 | 29 | # include "assoc.h" |
7486e51b | 30 | # include "location.h" |
95021767 | 31 | # include "scan-code.h" |
7486e51b | 32 | # include "uniqstr.h" |
8efe435c | 33 | |
2f1afb73 AD |
34 | /*----------. |
35 | | Symbols. | | |
36 | `----------*/ | |
f7d4d87a | 37 | |
2073e1b6 | 38 | /** Symbol classes. */ |
d7020c20 AD |
39 | typedef enum |
40 | { | |
2073e1b6 | 41 | unknown_sym, /**< Undefined. */ |
e9690142 JD |
42 | token_sym, /**< Terminal. */ |
43 | nterm_sym /**< Non-terminal. */ | |
d7020c20 | 44 | } symbol_class; |
340ef489 | 45 | |
b87f8b21 | 46 | |
2073e1b6 | 47 | /** Internal token numbers. */ |
f6fbd3da | 48 | typedef int symbol_number; |
a99ec53e | 49 | # define SYMBOL_NUMBER_MAXIMUM INT_MAX |
5fbb0954 | 50 | |
5fbb0954 | 51 | |
7486e51b | 52 | typedef struct symbol symbol; |
df09ef2e | 53 | |
3b0b682f AD |
54 | /* Declaration status of a symbol. |
55 | ||
56 | First, it is "undeclared". Then, if "undeclared" and used in a | |
3edfae04 AD |
57 | %printer/%destructor, it is "used". If not "declared" but used in |
58 | a rule, it is "needed". Finally, if declared (via a rule for | |
59 | nonterminals, or %token), it is "declared". | |
3b0b682f AD |
60 | |
61 | When status are checked at the end, "declared" symbols are fine, | |
3edfae04 | 62 | "used" symbols trigger warnings, otherwise it's an error. */ |
3b0b682f | 63 | |
b921d92f VS |
64 | typedef enum |
65 | { | |
3b0b682f AD |
66 | /** Used in the input file for an unknown reason (error). */ |
67 | undeclared, | |
68 | /** Used by %destructor/%printer but not defined (warning). */ | |
69 | used, | |
70 | /** Used in the gramar (rules) but not defined (error). */ | |
71 | needed, | |
72 | /** Defined with %type or %token (good). */ | |
73 | declared, | |
b921d92f VS |
74 | } status; |
75 | ||
71da68b3 VS |
76 | typedef enum code_props_type code_props_type; |
77 | enum code_props_type | |
78 | { | |
79 | destructor = 0, | |
80 | printer = 1, | |
81 | }; | |
82 | ||
83 | enum { CODE_PROPS_SIZE = 2 }; | |
84 | ||
df09ef2e AD |
85 | /* When extending this structure, be sure to complete |
86 | symbol_check_alias_consistency. */ | |
7486e51b | 87 | struct symbol |
340ef489 | 88 | { |
2073e1b6 | 89 | /** The key, name of the symbol. */ |
7486e51b | 90 | uniqstr tag; |
2073e1b6 | 91 | /** The location of its first occurrence. */ |
7486e51b | 92 | location location; |
1e0bab92 | 93 | |
9a86ee60 AD |
94 | /** Its \c \%type. |
95 | ||
96 | Beware that this is the type_name as was entered by the user, | |
97 | including silly things such as "]" if she entered "%token <]> t". | |
98 | Therefore, when outputting type_name to M4, be sure to escape it | |
99 | into "@}". See quoted_output for instance. */ | |
7486e51b | 100 | uniqstr type_name; |
9c46ba16 | 101 | |
ec5479ce | 102 | /** Its \c \%type's location. */ |
df09ef2e AD |
103 | location type_location; |
104 | ||
71da68b3 VS |
105 | /** Any \c \%destructor (resp. \%printer) declared specificially for this |
106 | symbol. | |
ec5479ce | 107 | |
71da68b3 | 108 | Access this field only through <tt>symbol</tt>'s interface functions. For |
4323e0da | 109 | example, if <tt>symbol::destructor = NULL</tt> (resp. <tt>symbol::printer |
71da68b3 | 110 | = NULL</tt>), a default \c \%destructor (resp. \%printer) or a per-type |
4323e0da | 111 | \c symbol_destructor_printer_get will compute the correct one. */ |
71da68b3 | 112 | code_props props[CODE_PROPS_SIZE]; |
ee000ba4 | 113 | |
7486e51b | 114 | symbol_number number; |
df09ef2e | 115 | location prec_location; |
f6fbd3da | 116 | int prec; |
7486e51b | 117 | assoc assoc; |
62a3e4f0 | 118 | int user_token_number; |
3f96f4dc | 119 | |
dfaa4860 JD |
120 | /* Points to the other in the symbol-string pair for an alias. |
121 | Special value USER_NUMBER_HAS_STRING_ALIAS in the symbol half of the | |
122 | symbol-string pair for an alias. */ | |
7486e51b | 123 | symbol *alias; |
d7020c20 | 124 | symbol_class class; |
b921d92f | 125 | status status; |
db8837cb AD |
126 | }; |
127 | ||
2073e1b6 | 128 | /** Undefined user number. */ |
a99ec53e | 129 | # define USER_NUMBER_UNDEFINED -1 |
b87f8b21 | 130 | |
dfaa4860 JD |
131 | /* `symbol->user_token_number == USER_NUMBER_HAS_STRING_ALIAS' means |
132 | this symbol has a literal string alias. For instance, `%token foo | |
b87f8b21 | 133 | "foo"' has `"foo"' numbered regularly, and `foo' numbered as |
dfaa4860 | 134 | USER_NUMBER_HAS_STRING_ALIAS. */ |
a99ec53e | 135 | # define USER_NUMBER_HAS_STRING_ALIAS -9991 |
b87f8b21 AD |
136 | |
137 | /* Undefined internal token number. */ | |
a99ec53e | 138 | # define NUMBER_UNDEFINED (-1) |
b87f8b21 | 139 | |
2073e1b6 | 140 | /** Fetch (or create) the symbol associated to KEY. */ |
203b9274 AD |
141 | symbol *symbol_from_uniqstr (const uniqstr key, location loc); |
142 | ||
2073e1b6 | 143 | /** Fetch (or create) the symbol associated to KEY. */ |
7486e51b | 144 | symbol *symbol_get (const char *key, location loc); |
39f41916 | 145 | |
2073e1b6 AD |
146 | /** Generate a dummy nonterminal. |
147 | ||
148 | Its name cannot conflict with the user's names. */ | |
7486e51b | 149 | symbol *dummy_symbol_get (location loc); |
2f1afb73 | 150 | |
aea10ef4 AD |
151 | |
152 | /*--------------------. | |
153 | | Methods on symbol. | | |
154 | `--------------------*/ | |
155 | ||
156 | /** Print a symbol (for debugging). */ | |
c5289832 | 157 | void symbol_print (symbol const *s, FILE *f); |
aea10ef4 | 158 | |
4d7370cb JD |
159 | /** Is this a dummy nonterminal? */ |
160 | bool symbol_is_dummy (const symbol *sym); | |
161 | ||
6a0655d9 AD |
162 | /** The name of the code_props type: "\%destructor" or "\%printer". */ |
163 | char const *code_props_type_string (code_props_type kind); | |
164 | ||
165 | /** The name of the symbol that can be used as an identifier. | |
aea10ef4 AD |
166 | ** Consider the alias if needed. |
167 | ** Return 0 if there is none (e.g., the symbol is only defined as | |
168 | ** a string). */ | |
169 | uniqstr symbol_id_get (symbol const *sym); | |
170 | ||
dfaa4860 JD |
171 | /** |
172 | * Make \c str the literal string alias of \c sym. Copy token number, | |
173 | * symbol number, and type from \c sym to \c str. | |
174 | */ | |
175 | void symbol_make_alias (symbol *sym, symbol *str, location loc); | |
2f1afb73 | 176 | |
2073e1b6 AD |
177 | /** Set the \c type_name associated with \c sym. |
178 | ||
179 | Do nothing if passed 0 as \c type_name. */ | |
7486e51b | 180 | void symbol_type_set (symbol *sym, uniqstr type_name, location loc); |
3ae2b51f | 181 | |
71da68b3 VS |
182 | /** Set the \c \%destructor or \c \%printer associated with \c sym. */ |
183 | void symbol_code_props_set (symbol *sym, code_props_type kind, | |
184 | code_props const *destructor); | |
db06f0ce | 185 | |
71da68b3 | 186 | /** Get the computed \c \%destructor or \c %printer for \c sym, which was |
0560fa24 AD |
187 | initialized with \c code_props_none_init if there's no \c \%destructor or |
188 | \c %printer. */ | |
70946cff | 189 | code_props *symbol_code_props_get (symbol *sym, code_props_type kind); |
ec5479ce | 190 | |
0560fa24 | 191 | /** Set the \c precedence associated with \c sym. |
2073e1b6 | 192 | |
0560fa24 AD |
193 | Ensure that \a symbol is a terminal. |
194 | Do nothing if invoked with \c undef_assoc as \c assoc. */ | |
7486e51b | 195 | void symbol_precedence_set (symbol *sym, int prec, assoc a, location loc); |
3ae2b51f | 196 | |
2073e1b6 | 197 | /** Set the \c class associated with \c sym. */ |
073f9288 | 198 | void symbol_class_set (symbol *sym, symbol_class class, location loc, |
e9690142 | 199 | bool declaring); |
44536b35 | 200 | |
2073e1b6 | 201 | /** Set the \c user_token_number associated with \c sym. */ |
7486e51b | 202 | void symbol_user_token_number_set (symbol *sym, int user_number, location loc); |
44536b35 AD |
203 | |
204 | ||
aea10ef4 AD |
205 | |
206 | /*------------------. | |
207 | | Special symbols. | | |
208 | `------------------*/ | |
209 | ||
2073e1b6 | 210 | /** The error token. */ |
7486e51b | 211 | extern symbol *errtoken; |
2073e1b6 | 212 | /** The token for unknown tokens. */ |
7486e51b | 213 | extern symbol *undeftoken; |
2073e1b6 | 214 | /** The end of input token. */ |
7486e51b | 215 | extern symbol *endtoken; |
2073e1b6 AD |
216 | /** The genuine start symbol. |
217 | ||
218 | $accept: start-symbol $end */ | |
7486e51b | 219 | extern symbol *accept; |
2073e1b6 AD |
220 | |
221 | /** The user start symbol. */ | |
7486e51b | 222 | extern symbol *startsymbol; |
ec5479ce | 223 | /** The location of the \c \%start declaration. */ |
7486e51b | 224 | extern location startsymbol_location; |
f7d4d87a | 225 | |
340ef489 | 226 | |
284bc49c VT |
227 | |
228 | /*-------------------. | |
229 | | Symbol Relations. | | |
230 | `-------------------*/ | |
231 | ||
232 | /* The symbol relations are represented by a directed graph. */ | |
233 | ||
234 | /* The id of a node */ | |
235 | typedef int graphid; | |
236 | ||
237 | typedef struct symgraphlink symgraphlink; | |
238 | ||
239 | struct symgraphlink | |
240 | { | |
241 | /** The second \c symbol or group of a precedence relation. | |
242 | * See \c symgraph. */ | |
243 | graphid id; | |
244 | ||
245 | symgraphlink *next; | |
246 | }; | |
247 | ||
248 | /* Symbol precedence graph, to store the used precedence relations between | |
249 | * symbols. */ | |
250 | ||
251 | typedef struct symgraph symgraph; | |
252 | ||
253 | struct symgraph | |
254 | { | |
255 | /** Identifier for the node: equal to the number of the symbol. */ | |
256 | graphid id; | |
257 | ||
258 | /** The list of related symbols that have a smaller precedence. */ | |
259 | symgraphlink *succ; | |
260 | ||
261 | /** The list of related symbols that have a greater precedence. */ | |
262 | symgraphlink *pred; | |
263 | }; | |
264 | ||
265 | /** Register a new precedence relation as used. */ | |
266 | ||
267 | void register_precedence (graphid first, graphid snd); | |
268 | ||
cc2235ac VT |
269 | /** Print a warning for each symbol whose precedence and/or associativity |
270 | * is useless. */ | |
284bc49c VT |
271 | |
272 | void print_precedence_warnings (void); | |
273 | ||
e8f7155d VT |
274 | /*----------------------. |
275 | | Symbol associativity | | |
276 | `----------------------*/ | |
277 | ||
cc2235ac | 278 | void register_assoc (graphid i, graphid j); |
e8f7155d | 279 | |
b2a0b7ca JD |
280 | /*-----------------. |
281 | | Semantic types. | | |
282 | `-----------------*/ | |
283 | ||
284 | /** A semantic type and its associated \c \%destructor and \c \%printer. | |
db06f0ce | 285 | |
b2a0b7ca JD |
286 | Access the fields of this struct only through the interface functions in |
287 | this file. \sa symbol::destructor */ | |
db06f0ce | 288 | typedef struct { |
b2a0b7ca JD |
289 | /** The key, name of the semantic type. */ |
290 | uniqstr tag; | |
291 | ||
9641b918 VS |
292 | /** The location of its first occurence. */ |
293 | location location; | |
294 | ||
295 | /** Its status : "undeclared", "used" or "declared". | |
296 | It cannot be "needed". */ | |
297 | status status; | |
298 | ||
71da68b3 VS |
299 | /** Any \c %destructor and %printer declared for this |
300 | semantic type. */ | |
301 | code_props props[CODE_PROPS_SIZE]; | |
302 | ||
b2a0b7ca JD |
303 | } semantic_type; |
304 | ||
305 | /** Fetch (or create) the semantic type associated to KEY. */ | |
9641b918 VS |
306 | semantic_type *semantic_type_from_uniqstr (const uniqstr key, |
307 | const location *loc); | |
b2a0b7ca JD |
308 | |
309 | /** Fetch (or create) the semantic type associated to KEY. */ | |
9641b918 | 310 | semantic_type *semantic_type_get (const char *key, const location *loc); |
b2a0b7ca | 311 | |
71da68b3 VS |
312 | /** Set the \c destructor or \c printer associated with \c type. */ |
313 | void semantic_type_code_props_set (semantic_type *type, | |
314 | code_props_type kind, | |
315 | code_props const *code); | |
2f1afb73 | 316 | |
b2a0b7ca JD |
317 | /*----------------------------------. |
318 | | Symbol and semantic type tables. | | |
319 | `----------------------------------*/ | |
2f1afb73 | 320 | |
b2a0b7ca | 321 | /** Create the symbol and semantic type tables. */ |
d33cb3ae | 322 | void symbols_new (void); |
2f1afb73 | 323 | |
b2a0b7ca | 324 | /** Free all the memory allocated for symbols and semantic types. */ |
d33cb3ae | 325 | void symbols_free (void); |
340ef489 | 326 | |
2073e1b6 AD |
327 | /** Check that all the symbols are defined. |
328 | ||
329 | Report any undefined symbols and consider them nonterminals. */ | |
d33cb3ae | 330 | void symbols_check_defined (void); |
2f1afb73 | 331 | |
2073e1b6 AD |
332 | /** Sanity checks and #token_translations construction. |
333 | ||
334 | Perform various sanity checks, assign symbol numbers, and set up | |
335 | #token_translations. */ | |
d33cb3ae | 336 | void symbols_pack (void); |
2f1afb73 | 337 | |
340ef489 | 338 | #endif /* !SYMTAB_H_ */ |