X-Git-Url: https://git.saurik.com/bison.git/blobdiff_plain/95612cfa608188fc323ed3f8560cc6aea953ff32..c98b5143b071e351bdb820565681890046a6b45a:/src/symtab.h
diff --git a/src/symtab.h b/src/symtab.h
index 23a73351..bcc74951 100644
--- a/src/symtab.h
+++ b/src/symtab.h
@@ -1,162 +1,338 @@
-/* Definitions for symtab.c and callers, part of bison,
- Copyright (C) 1984, 1989, 1992, 2000, 2001, 2002
- Free Software Foundation, Inc.
+/* Definitions for symtab.c and callers, part of Bison.
+
+ Copyright (C) 1984, 1989, 1992, 2000-2002, 2004-2013 Free Software
+ Foundation, Inc.
This file is part of Bison, the GNU Compiler Compiler.
- Bison is free software; you can redistribute it and/or modify
+ This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 2, or (at your option)
- any later version.
+ the Free Software Foundation, either version 3 of the License, or
+ (at your option) any later version.
- Bison is distributed in the hope that it will be useful,
+ This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
- along with Bison; see the file COPYING. If not, write to
- the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
- Boston, MA 02111-1307, USA. */
+ along with this program. If not, see <http://www.gnu.org/licenses/>. */
+
+/**
+ * \file symtab.h
+ * \brief Manipulating ::symbol.
+ */
#ifndef SYMTAB_H_
# define SYMTAB_H_
-# include "struniq.h"
-# include "location.h"
# include "assoc.h"
+# include "location.h"
+# include "scan-code.h"
+# include "uniqstr.h"
/*----------.
| Symbols. |
`----------*/
-/* Symbol classes. */
+/** Symbol classes. */
typedef enum
{
- unknown_sym,
- token_sym, /* terminal symbol */
- nterm_sym /* non-terminal */
+ unknown_sym, /**< Undefined. */
+ token_sym, /**< Terminal. */
+ nterm_sym /**< Non-terminal. */
} symbol_class;
-/* Internal token numbers. */
-typedef short symbol_number_t;
-#define SYMBOL_NUMBER_MAX ((symbol_number_t) SHRT_MAX)
+/** Internal token numbers. */
+typedef int symbol_number;
+# define SYMBOL_NUMBER_MAXIMUM INT_MAX
+
+
+typedef struct symbol symbol;
+
+/* Declaration status of a symbol.
+ First, it is "undeclared". Then, if "undeclared" and used in a
+ %printer/%destructor, it is "used". If not "declared" but used in
+ a rule, it is "needed". Finally, if declared (via a rule for
+ nonterminals, or %token), it is "declared".
-typedef struct symbol_s symbol_t;
-struct symbol_s
+ When status are checked at the end, "declared" symbols are fine,
+ "used" symbols trigger warnings, otherwise it's an error. */
+
+typedef enum
+ {
+ /** Used in the input file for an unknown reason (error). */
+ undeclared,
+ /** Used by \%destructor/\%printer but not defined (warning). */
+ used,
+ /** Used in the grammar (rules) but not defined (error). */
+ needed,
+ /** Defined with \%type or \%token (good). */
+ declared,
+ } status;
+
+typedef enum code_props_type code_props_type; /* NOTE(review): forward reference to an enum tag; a GNU C extension, not ISO C. */
+enum code_props_type
+ {
+ destructor = 0, /**< Selects the \%destructor code. */
+ printer = 1, /**< Selects the \%printer code. */
+ };
+
+enum { CODE_PROPS_SIZE = 2 }; /* Number of code_props_type values; dimension of the props[] arrays. */
+
+/* When extending this structure, be sure to complete
+ symbol_check_alias_consistency. */
+struct symbol
{
- /* The key, name of the symbol. */
- struniq_t tag;
- /* The location of its first occurence. */
- location_t location;
-
- /* Its %type and associated printer and destructor. */
- struniq_t type_name;
- char *destructor;
- location_t destructor_location;
- char *printer;
- location_t printer_location;
-
- symbol_number_t number;
- short prec;
- assoc_t assoc;
+ /** The key, name of the symbol. */
+ uniqstr tag;
+ /** The location of its first occurrence. */
+ location location;
+
+ /** Its \c \%type.
+
+ Beware that this is the type_name as was entered by the user,
+ including silly things such as "]" if she entered "%token <]> t".
+ Therefore, when outputting type_name to M4, be sure to escape it
+ into "@}". See quoted_output for instance. */
+ uniqstr type_name;
+
+ /** Its \c \%type's location. */
+ location type_location;
+
+ /** Any \c \%destructor (resp. \%printer) declared specifically for this
+ symbol.
+
+ Access this field only through symbol's interface functions. For
+ example, if symbol::destructor = NULL (resp. symbol::printer
+ = NULL), a default \c \%destructor (resp. \%printer) or a per-type
+ \c symbol_destructor_printer_get will compute the correct one. */
+ code_props props[CODE_PROPS_SIZE];
+
+ symbol_number number;
+ location prec_location;
+ int prec;
+ assoc assoc;
int user_token_number;
- /* Points to the other in the identifier-symbol pair for an alias.
- Special value USER_NUMBER_ALIAS in the identifier half of the
- identifier-symbol pair for an alias. */
- symbol_t *alias;
+ /* Points to the other in the symbol-string pair for an alias.
+ Special value USER_NUMBER_HAS_STRING_ALIAS in the symbol half of the
+ symbol-string pair for an alias. */
+ symbol *alias;
symbol_class class;
+ status status;
};
-/* Undefined user number. */
-#define USER_NUMBER_UNDEFINED -1
+/** Undefined user number. */
+# define USER_NUMBER_UNDEFINED -1
-/* `symbol->user_token_number == USER_NUMBER_ALIAS' means this symbol
- *has* (not is) a string literal alias. For instance, `%token foo
- "foo"' has `"foo"' numbered regularly, and `foo' numbered as
- USER_NUMBER_ALIAS. */
-#define USER_NUMBER_ALIAS -9991
+/* 'symbol->user_token_number == USER_NUMBER_HAS_STRING_ALIAS' means
+ this symbol has a literal string alias. For instance, '%token foo
+ "foo"' has '"foo"' numbered regularly, and 'foo' numbered as
+ USER_NUMBER_HAS_STRING_ALIAS. */
+# define USER_NUMBER_HAS_STRING_ALIAS -9991
/* Undefined internal token number. */
-#define NUMBER_UNDEFINED ((symbol_number_t) -1)
+# define NUMBER_UNDEFINED (-1)
+/** Fetch (or create) the symbol associated to KEY. */
+symbol *symbol_from_uniqstr (const uniqstr key, location loc);
-/* Fetch (or create) the symbol associated to KEY. */
-symbol_t *symbol_get (const char *key, location_t location);
+/** Fetch (or create) the symbol associated to KEY. */
+symbol *symbol_get (const char *key, location loc);
-/* Generate a dummy nonterminal, whose name cannot conflict with the
- user's names. */
-symbol_t *dummy_symbol_get (location_t location);
+/** Generate a dummy nonterminal.
-/* Declare the new SYMBOL. Make it an alias of SYMVAL. */
-void symbol_make_alias (symbol_t *symbol, symbol_t *symval,
- location_t location);
+ Its name cannot conflict with the user's names. */
+symbol *dummy_symbol_get (location loc);
-/* Set the TYPE_NAME associated to SYMBOL. Does nothing if passed 0 as
- TYPE_NAME. */
-void symbol_type_set (symbol_t *symbol,
- struniq_t type_name, location_t location);
-/* Set the DESTRUCTOR associated to SYMBOL. */
-void symbol_destructor_set (symbol_t *symbol,
- char *destructor, location_t location);
+/*--------------------.
+| Methods on symbol. |
+`--------------------*/
-/* Set the PRINTER associated to SYMBOL. */
-void symbol_printer_set (symbol_t *symbol,
- char *printer, location_t location);
+/** Print a symbol (for debugging). */
+void symbol_print (symbol const *s, FILE *f);
-/* Set the PRECEDENCE associated to SYMBOL. Ensures that SYMBOL is a
- terminal. Does nothing if invoked with UNDEF_ASSOC as ASSOC. */
-void symbol_precedence_set (symbol_t *symbol,
- int prec, assoc_t assoc, location_t location);
+/** Is this a dummy nonterminal? */
+bool symbol_is_dummy (const symbol *sym);
-/* Set the CLASS associated to SYMBOL. */
-void symbol_class_set (symbol_t *symbol,
- symbol_class class, location_t location);
+/** The name of the code_props type: "\%destructor" or "\%printer". */
+char const *code_props_type_string (code_props_type kind);
-/* Set the USER_TOKEN_NUMBER associated to SYMBOL. */
-void symbol_user_token_number_set (symbol_t *symbol,
- int user_number, location_t location);
+/** The name of the symbol that can be used as an identifier.
+ ** Consider the alias if needed.
+ ** Return 0 if there is none (e.g., the symbol is only defined as
+ ** a string). */
+uniqstr symbol_id_get (symbol const *sym);
+/**
+ * Make \c str the literal string alias of \c sym. Copy token number,
+ * symbol number, and type from \c sym to \c str.
+ */
+void symbol_make_alias (symbol *sym, symbol *str, location loc);
-/* Distinguished symbols. AXIOM is the real start symbol, that used
- by the automaton. STARTSYMBOL is the one specified by the user.
- */
-extern symbol_t *errtoken;
-extern symbol_t *undeftoken;
-extern symbol_t *endtoken;
-extern symbol_t *accept;
-extern symbol_t *startsymbol;
-extern location_t startsymbol_location;
+/** Set the \c type_name associated with \c sym.
+ Do nothing if passed 0 as \c type_name. */
+void symbol_type_set (symbol *sym, uniqstr type_name, location loc);
-/*---------------.
-| Symbol table. |
-`---------------*/
+/** Set the \c \%destructor or \c \%printer associated with \c sym. */
+void symbol_code_props_set (symbol *sym, code_props_type kind,
+ code_props const *destructor);
+/** Get the computed \c \%destructor or \c \%printer for \c sym, which was
+ initialized with \c code_props_none_init if there's no \c \%destructor or
+ \c \%printer. */
+code_props *symbol_code_props_get (symbol *sym, code_props_type kind);
+
+/** Set the \c precedence associated with \c sym.
+
+ Ensure that \a sym is a terminal.
+ Do nothing if invoked with \c undef_assoc as \c assoc. */
+void symbol_precedence_set (symbol *sym, int prec, assoc a, location loc);
+
+/** Set the \c class associated with \c sym. */
+void symbol_class_set (symbol *sym, symbol_class class, location loc,
+ bool declaring);
+
+/** Set the \c user_token_number associated with \c sym. */
+void symbol_user_token_number_set (symbol *sym, int user_number, location loc);
-/* Create the symbol table. */
-void symbols_new (void);
-/* A function to apply to each symbol. */
-typedef bool (*symbol_processor) (symbol_t *);
-/* Apply PROCESSOR to all the symbols. PROCESSOR must return true: on
- false, the processing stops. */
-void symbols_do (symbol_processor processor, void *processor_data);
+/*------------------.
+| Special symbols. |
+`------------------*/
+
+/** The error token. */
+extern symbol *errtoken;
+/** The token for unknown tokens. */
+extern symbol *undeftoken;
+/** The end of input token. */
+extern symbol *endtoken;
+/** The genuine start symbol.
+
+ $accept: start-symbol $end */
+extern symbol *accept;
+
+/** The user start symbol. */
+extern symbol *startsymbol;
+/** The location of the \c \%start declaration. */
+extern location startsymbol_location;
+
+
+
+/*-------------------.
+| Symbol Relations. |
+`-------------------*/
+
+/* The symbol relations are represented by a directed graph. */
+
+/* The id of a node */
+typedef int graphid;
+
+typedef struct symgraphlink symgraphlink;
+
+struct symgraphlink
+{
+ /** The second \c symbol or group of a precedence relation.
+ * See \c symgraph. */
+ graphid id;
+
+ symgraphlink *next;
+};
+
+/* Symbol precedence graph, to store the used precedence relations between
+ * symbols. */
-/* Free all the memory allocated for symbols. */
+typedef struct symgraph symgraph;
+
+struct symgraph
+{
+ /** Identifier for the node: equal to the number of the symbol. */
+ graphid id;
+
+ /** The list of related symbols that have a smaller precedence. */
+ symgraphlink *succ;
+
+ /** The list of related symbols that have a greater precedence. */
+ symgraphlink *pred;
+};
+
+/** Register a new precedence relation as used. */
+
+void register_precedence (graphid first, graphid snd);
+
+/** Print a warning for each symbol whose precedence and/or associativity
+ * is useless. */
+
+void print_precedence_warnings (void);
+
+/*----------------------.
+| Symbol associativity |
+`----------------------*/
+
+void register_assoc (graphid i, graphid j);
+
+/*-----------------.
+| Semantic types. |
+`-----------------*/
+
+/** A semantic type and its associated \c \%destructor and \c \%printer.
+
+ Access the fields of this struct only through the interface functions in
+ this file. \sa symbol::props */
+typedef struct {
+ /** The key, name of the semantic type. */
+ uniqstr tag;
+
+ /** The location of its first occurrence. */
+ location location;
+
+ /** Its status: "undeclared", "used" or "declared".
+ It cannot be "needed". */
+ status status;
+
+ /** Any \c \%destructor and \c \%printer declared for this
+ semantic type. */
+ code_props props[CODE_PROPS_SIZE];
+
+} semantic_type;
+
+/** Fetch (or create) the semantic type associated to KEY. */
+semantic_type *semantic_type_from_uniqstr (const uniqstr key,
+ const location *loc);
+
+/** Fetch (or create) the semantic type associated to KEY. */
+semantic_type *semantic_type_get (const char *key, const location *loc);
+
+/** Set the \c destructor or \c printer associated with \c type. */
+void semantic_type_code_props_set (semantic_type *type,
+ code_props_type kind,
+ code_props const *code);
+
+/*----------------------------------.
+| Symbol and semantic type tables. |
+`----------------------------------*/
+
+/** Create the symbol and semantic type tables. */
+void symbols_new (void);
+
+/** Free all the memory allocated for symbols and semantic types. */
void symbols_free (void);
-/* Check that all the symbols are defined. Report any undefined
- symbols and consider them nonterminals. */
+/** Check that all the symbols are defined.
+
+ Report any undefined symbols and consider them nonterminals. */
void symbols_check_defined (void);
-/* Perform various sanity checks, assign symbol numbers, and set up
- TOKEN_TRANSLATIONS. */
+/** Sanity checks and #token_translations construction.
+
+ Perform various sanity checks, assign symbol numbers, and set up
+ #token_translations. */
void symbols_pack (void);
#endif /* !SYMTAB_H_ */