api.namespace: demonstrate and use {...} values instead of "..." values

[bison.git] / doc / bison.texi
diff --git a/doc/bison.texi b/doc/bison.texi

index 912c678233152bf0491fa582e8622778c1777604..1351a6c1c4d4858c73d18fb97e64f70ea3929e8f 100644 (file)
--- a/doc/bison.texi
+++ b/doc/bison.texi
@@ -186,7 +186,6 @@ Bison Grammar Files
  * Grammar Outline::    Overall layout of the grammar file.
  * Symbols::            Terminal and nonterminal symbols.
  * Rules::              How to write grammar rules.
-* Recursion::          Writing recursive rules.
  * Semantics::          Semantic values and actions.
  * Tracking Locations:: Locations and actions.
  * Named References::   Using named references in actions.
@@ -201,6 +200,13 @@ Outline of a Bison Grammar
  * Grammar Rules::         Syntax and usage of the grammar rules section.
  * Epilogue::              Syntax and usage of the epilogue.
  
+Grammar Rules
+
+* Rules Syntax::   Syntax of the rules.
+* Empty Rules::    Symbols that can match the empty string.
+* Recursion::      Writing recursive rules.
+
+
  Defining Language Semantics
  
  * Value Type::        Specifying one data type for all semantic values.
@@ -1007,7 +1013,7 @@ Let's consider an example, vastly simplified from a C++ grammar.
  %%
  
  prog:
-  /* Nothing.  */
+  %empty
  | prog stmt   @{ printf ("\n"); @}
  ;
  
@@ -1538,6 +1544,7 @@ calculator.  As in C, comments are placed between @samp{/*@dots{}*/}.
  @example
  /* Reverse polish notation calculator.  */
  
+@group
  %@{
    #define YYSTYPE double
    #include <stdio.h>
@@ -1545,6 +1552,7 @@ calculator.  As in C, comments are placed between @samp{/*@dots{}*/}.
    int yylex (void);
    void yyerror (char const *);
  %@}
+@end group
  
  %token NUM
  
@@ -1589,7 +1597,7 @@ Here are the grammar rules for the reverse polish notation calculator.
  @example
  @group
  input:
-  /* empty */
+  %empty
  | input line
  ;
  @end group
@@ -1646,7 +1654,7 @@ Consider the definition of @code{input}:
  
  @example
  input:
-  /* empty */
+  %empty
  | input line
  ;
  @end example
@@ -1661,8 +1669,9 @@ The first alternative is empty because there are no symbols between the
  colon and the first @samp{|}; this means that @code{input} can match an
  empty string of input (no tokens).  We write the rules this way because it
  is legitimate to type @kbd{Ctrl-d} right after you start the calculator.
-It's conventional to put an empty alternative first and write the comment
-@samp{/* empty */} in it.
+It's conventional to put an empty alternative first and to use the
+(optional) @code{%empty} directive, or to write the comment @samp{/* empty
+*/} in it (@pxref{Empty Rules}).
  
  The second alternate rule (@code{input line}) handles all nontrivial input.
  It means, ``After reading any number of lines, read one more line if
@@ -2002,7 +2011,7 @@ parentheses nested to arbitrary depth.  Here is the Bison code for
  %% /* The grammar follows.  */
  @group
  input:
-  /* empty */
+  %empty
  | input line
  ;
  @end group
@@ -2182,7 +2191,7 @@ wrong expressions or subexpressions.
  @example
  @group
  input:
-  /* empty */
+  %empty
  | input line
  ;
  @end group
@@ -2394,7 +2403,7 @@ Here are the C and Bison declarations for the multi-function calculator.
  %@{
    #include <stdio.h>  /* For printf, etc. */
    #include <math.h>   /* For pow, used in the grammar.  */
-  #include "calc.h"   /* Contains definition of `symrec'.  */
+  #include "calc.h"   /* Contains definition of 'symrec'.  */
    int yylex (void);
    void yyerror (char const *);
  %@}
@@ -2411,7 +2420,7 @@ Here are the C and Bison declarations for the multi-function calculator.
  %type  <val>  exp
  
  @group
-%right '='
+%precedence '='
  %left '-' '+'
  %left '*' '/'
  %precedence NEG /* negation--unary minus */
@@ -2453,7 +2462,7 @@ those which mention @code{VAR} or @code{FNCT}, are new.
  %% /* The grammar follows.  */
  @group
  input:
-  /* empty */
+  %empty
  | input line
  ;
  @end group
@@ -2523,7 +2532,7 @@ struct symrec
  @group
  typedef struct symrec symrec;
  
-/* The symbol table: a chain of `struct symrec'.  */
+/* The symbol table: a chain of 'struct symrec'.  */
  extern symrec *sym_table;
  
  symrec *putsym (char const *, int);
@@ -2558,7 +2567,7 @@ struct init const arith_fncts[] =
  @end group
  
  @group
-/* The symbol table: a chain of `struct symrec'.  */
+/* The symbol table: a chain of 'struct symrec'.  */
  symrec *sym_table;
  @end group
  
@@ -2787,7 +2796,6 @@ The Bison grammar file conventionally has a name ending in @samp{.y}.
  * Grammar Outline::    Overall layout of the grammar file.
  * Symbols::            Terminal and nonterminal symbols.
  * Rules::              How to write grammar rules.
-* Recursion::          Writing recursive rules.
  * Semantics::          Semantic values and actions.
  * Tracking Locations:: Locations and actions.
  * Named References::   Using named references in actions.
@@ -2857,21 +2865,27 @@ can be done with two @var{Prologue} blocks, one before and one after the
  @code{%union} declaration.
  
  @example
+@group
  %@{
    #define _GNU_SOURCE
    #include <stdio.h>
    #include "ptypes.h"
  %@}
+@end group
  
+@group
  %union @{
    long int n;
    tree t;  /* @r{@code{tree} is defined in @file{ptypes.h}.} */
  @}
+@end group
  
+@group
  %@{
    static void print_token_value (FILE *, int, YYSTYPE);
    #define YYPRINT(F, N, L) print_token_value (F, N, L)
  %@}
+@end group
  
  @dots{}
  @end example
@@ -2903,21 +2917,27 @@ location, or it can be one of @code{requires}, @code{provides},
  Look again at the example of the previous section:
  
  @example
+@group
  %@{
    #define _GNU_SOURCE
    #include <stdio.h>
    #include "ptypes.h"
  %@}
+@end group
  
+@group
  %union @{
    long int n;
    tree t;  /* @r{@code{tree} is defined in @file{ptypes.h}.} */
  @}
+@end group
  
+@group
  %@{
    static void print_token_value (FILE *, int, YYSTYPE);
    #define YYPRINT(F, N, L) print_token_value (F, N, L)
  %@}
+@end group
  
  @dots{}
  @end example
@@ -2955,7 +2975,7 @@ Let's go ahead and add the new @code{YYLTYPE} definition and the
    #include <stdio.h>
  
    /* WARNING: The following code really belongs
-   * in a `%code requires'; see below.  */
+   * in a '%code requires'; see below.  */
  
    #include "ptypes.h"
    #define YYLTYPE YYLTYPE
@@ -2969,16 +2989,20 @@ Let's go ahead and add the new @code{YYLTYPE} definition and the
    @} YYLTYPE;
  @}
  
+@group
  %union @{
    long int n;
    tree t;  /* @r{@code{tree} is defined in @file{ptypes.h}.} */
  @}
+@end group
  
+@group
  %code @{
    static void print_token_value (FILE *, int, YYSTYPE);
    #define YYPRINT(F, N, L) print_token_value (F, N, L)
    static void trace_token (enum yytokentype token, YYLTYPE loc);
  @}
+@end group
  
  @dots{}
  @end example
@@ -3389,7 +3413,18 @@ value of the error token is 256, unless you explicitly assigned 256 to
  one of your tokens with a @code{%token} declaration.
  
  @node Rules
-@section Syntax of Grammar Rules
+@section Grammar Rules
+
+A Bison grammar is a list of rules.
+
+@menu
+* Rules Syntax::   Syntax of the rules.
+* Empty Rules::    Symbols that can match the empty string.
+* Recursion::      Writing recursive rules.
+@end menu
+
+@node Rules Syntax
+@subsection Syntax of Grammar Rules
  @cindex rule syntax
  @cindex grammar rule syntax
  @cindex syntax of grammar rules
@@ -3463,33 +3498,57 @@ be joined with the vertical-bar character @samp{|} as follows:
  @noindent
  They are still considered distinct rules even when joined in this way.
  
-If @var{components} in a rule is empty, it means that @var{result} can
-match the empty string.  For example, here is how to define a
-comma-separated sequence of zero or more @code{exp} groupings:
+@node Empty Rules
+@subsection Empty Rules
+@cindex empty rule
+@cindex rule, empty
+@findex %empty
+
+A rule is said to be @dfn{empty} if its right-hand side (@var{components})
+is empty.  It means that @var{result} can match the empty string.  For
+example, here is how to define an optional semicolon:
+
+@example
+semicolon.opt: | ";";
+@end example
+
+@noindent
+It is easy to overlook an empty rule, especially when @code{|} is used.  The
+@code{%empty} directive lets you make explicit that a rule is empty on
+purpose:
  
  @example
  @group
-expseq:
-  /* empty */
-| expseq1
+semicolon.opt:
+  %empty
+| ";"
  ;
  @end group
+@end example
+
+Flagging a non-empty rule with @code{%empty} is an error.  If run with
+@option{-Wempty-rule}, @command{bison} will report empty rules without
+@code{%empty}.  Using @code{%empty} enables this warning, unless
+@option{-Wno-empty-rule} was specified.
+
+The @code{%empty} directive is a Bison extension; it does not work with
+Yacc.  To remain compatible with POSIX Yacc, it is customary to write a
+comment @samp{/* empty */} in each rule with no components:
  
+@example
  @group
-expseq1:
-  exp
-| expseq1 ',' exp
+semicolon.opt:
+  /* empty */
+| ";"
  ;
  @end group
  @end example
  
-@noindent
-It is customary to write a comment @samp{/* empty */} in each rule
-with no components.
  
  @node Recursion
-@section Recursive Rules
+@subsection Recursive Rules
  @cindex recursive rule
+@cindex rule, recursive
  
  A rule is called @dfn{recursive} when its @var{result} nonterminal
  appears also on its right hand side.  Nearly all Bison grammars need to
@@ -3739,7 +3798,7 @@ foo:
  
  @group
  bar:
-  /* empty */    @{ previous_expr = $0; @}
+  %empty    @{ previous_expr = $0; @}
  ;
  @end group
  @end example
@@ -3916,16 +3975,20 @@ declare a destructor for that symbol:
  @group
  %type <context> let
  %destructor @{ pop_context ($$); @} let
+@end group
  
  %%
  
+@group
  stmt:
    let stmt
      @{
        $$ = $2;
        pop_context ($let);
      @};
+@end group
  
+@group
  let:
    "let" '(' var ')'
      @{
@@ -3960,9 +4023,9 @@ exp: @{ a(); @} "b" @{ c(); @} @{ d(); @} "e" @{ f(); @};
  is translated into:
  
  @example
-$@@1: /* empty */ @{ a(); @};
-$@@2: /* empty */ @{ c(); @};
-$@@3: /* empty */ @{ d(); @};
+$@@1: %empty @{ a(); @};
+$@@2: %empty @{ c(); @};
+$@@3: %empty @{ d(); @};
  exp: $@@1 "b" $@@2 $@@3 "e" @{ f(); @};
  @end example
  
@@ -3981,9 +4044,9 @@ exp: @{ a(); @} "b" @{ $$ = c(); @} @{ d(); @} "e" @{ f = $1; @};
  is translated into
  
  @example
-@@1: /* empty */ @{ a(); @};
-@@2: /* empty */ @{ $$ = c(); @};
-$@@3: /* empty */ @{ d(); @};
+@@1: %empty @{ a(); @};
+@@2: %empty @{ $$ = c(); @};
+$@@3: %empty @{ d(); @};
  exp: @@1 "b" @@2 $@@3 "e" @{ f = $1; @}
  @end example
  
@@ -4092,7 +4155,7 @@ serves as a subroutine:
  @example
  @group
  subroutine:
-  /* empty */  @{ prepare_for_local_variables (); @}
+  %empty  @{ prepare_for_local_variables (); @}
  ;
  @end group
  
@@ -5333,7 +5396,7 @@ For instance with @samp{%define api.prefix "calc"} and @samp{%defines
  @end deffn
  
  @deffn {Directive} %defines @var{defines-file}
-Same as above, but save in the file @var{defines-file}.
+Same as above, but save in the file @file{@var{defines-file}}.
  @end deffn
  
  @deffn {Directive} %destructor
@@ -5396,7 +5459,7 @@ own right.
  @end deffn
  
  @deffn {Directive} %output "@var{file}"
-Specify @var{file} for the parser implementation file.
+Generate the parser implementation in @file{@var{file}}.
  @end deffn
  
  @deffn {Directive} %pure-parser
@@ -5523,7 +5586,7 @@ Summary,,%skeleton}).
  Unaccepted @var{variable}s produce an error.
  Some of the accepted @var{variable}s are described below.
  
-@deffn Directive {%define api.namespace} "@var{namespace}"
+@deffn Directive {%define api.namespace} @{@var{namespace}@}
  @itemize
  @item Language(s): C++
  
@@ -5531,7 +5594,7 @@ Some of the accepted @var{variable}s are described below.
  For example, if you specify:
  
  @example
-%define api.namespace "foo::bar"
+%define api.namespace @{foo::bar@}
  @end example
  
  Bison uses @code{foo::bar} verbatim in references such as:
@@ -5564,7 +5627,7 @@ api.namespace} so that @code{%name-prefix} @emph{only} affects the
  lexical analyzer function.  For example, if you specify:
  
  @example
-%define api.namespace "foo"
+%define api.namespace @{foo@}
  %name-prefix "bar::"
  @end example
  
@@ -5831,7 +5894,7 @@ More user feedback will help to stabilize it.)
  @end deffn
  
  @c ================================================== namespace
-@deffn Directive %define namespace @var{namespace}
+@deffn Directive %define namespace @{@var{namespace}@}
  Obsoleted by @code{api.namespace}
  @c namespace
  @end deffn
@@ -6372,7 +6435,7 @@ yylex (void)
      return 0;
    @dots{}
    if (c == '+' || c == '-')
-    return c;      /* Assume token type for `+' is '+'.  */
+    return c;      /* Assume token type for '+' is '+'.  */
    @dots{}
    return INT;      /* Return the type of the token.  */
    @dots{}
@@ -7469,7 +7532,7 @@ of zero or more @code{word} groupings.
  @example
  @group
  sequence:
-  /* empty */    @{ printf ("empty sequence\n"); @}
+  %empty         @{ printf ("empty sequence\n"); @}
  | maybeword
  | sequence word  @{ printf ("added word %s\n", $2); @}
  ;
@@ -7477,8 +7540,8 @@ sequence:
  
  @group
  maybeword:
-  /* empty */   @{ printf ("empty maybeword\n"); @}
-| word          @{ printf ("single word %s\n", $1); @}
+  %empty    @{ printf ("empty maybeword\n"); @}
+| word      @{ printf ("single word %s\n", $1); @}
  ;
  @end group
  @end example
@@ -7509,7 +7572,7 @@ proper way to define @code{sequence}:
  @example
  @group
  sequence:
-  /* empty */    @{ printf ("empty sequence\n"); @}
+  %empty         @{ printf ("empty sequence\n"); @}
  | sequence word  @{ printf ("added word %s\n", $2); @}
  ;
  @end group
@@ -7520,7 +7583,7 @@ Here is another common error that yields a reduce/reduce conflict:
  @example
  @group
  sequence:
-  /* empty */
+  %empty
  | sequence words
  | sequence redirects
  ;
@@ -7528,14 +7591,14 @@ sequence:
  
  @group
  words:
-  /* empty */
+  %empty
  | words word
  ;
  @end group
  
  @group
  redirects:
-  /* empty */
+  %empty
  | redirects redirect
  ;
  @end group
@@ -7558,7 +7621,7 @@ of sequence:
  
  @example
  sequence:
-  /* empty */
+  %empty
  | sequence word
  | sequence redirect
  ;
@@ -7570,7 +7633,7 @@ from being empty:
  @example
  @group
  sequence:
-  /* empty */
+  %empty
  | sequence words
  | sequence redirects
  ;
@@ -7614,7 +7677,7 @@ rule:
  %%
  @group
  sequence:
-  /* empty */
+  %empty
  | sequence word      %prec "sequence"
  | sequence redirect  %prec "sequence"
  ;
@@ -7636,7 +7699,7 @@ rule with the same precedence, but make them right-associative:
  %%
  @group
  sequence:
-  /* empty */
+  %empty
  | sequence word      %prec "word"
  | sequence redirect  %prec "redirect"
  ;
@@ -8333,7 +8396,7 @@ For example:
  
  @example
  stmts:
-  /* empty string */
+  %empty
  | stmts '\n'
  | stmts exp '\n'
  | stmts error '\n'
@@ -9635,7 +9698,7 @@ Here is a list of options that can be used with Bison, alphabetized by
  short option.  It is followed by a cross key alphabetized by long
  option.
  
-@c Please, keep this ordered as in `bison --help'.
+@c Please, keep this ordered as in 'bison --help'.
  @noindent
  Operations modes:
  @table @option
@@ -9716,6 +9779,72 @@ no effect on the conflict report.
  Deprecated constructs whose support will be removed in future versions of
  Bison.
  
+@item empty-rule
+Empty rules without @code{%empty}.  @xref{Empty Rules}.  Disabled by
+default, but enabled by uses of @code{%empty}, unless
+@option{-Wno-empty-rule} was specified.
+
+@item precedence
+Useless precedence and associativity directives.  Disabled by default.
+
+Consider for instance the following grammar:
+
+@example
+@group
+%nonassoc "="
+%left "+"
+%left "*"
+%precedence "("
+@end group
+%%
+@group
+stmt:
+  exp
+| "var" "=" exp
+;
+@end group
+
+@group
+exp:
+  exp "+" exp
+| exp "*" "num"
+| "(" exp ")"
+| "num"
+;
+@end group
+@end example
+
+Bison reports:
+
+@c cannot leave the location and the [-Wprecedence] for lack of
+@c width in PDF.
+@example
+@group
+warning: useless precedence and associativity for "="
+ %nonassoc "="
+           ^^^
+@end group
+@group
+warning: useless associativity for "*", use %precedence
+ %left "*"
+       ^^^
+@end group
+@group
+warning: useless precedence for "("
+ %precedence "("
+             ^^^
+@end group
+@end example
+
+One would get the exact same parser with the following directives instead:
+
+@example
+@group
+%left "+"
+%precedence "*"
+@end group
+@end example
+
  @item other
  All warnings not categorized above.  These warnings are enabled by default.
  
@@ -9724,9 +9853,11 @@ releases of Bison may move warnings from this category to new, more specific
  categories.
  
  @item all
-All the warnings.
+All the warnings except @code{yacc}.
+
  @item none
  Turn off all the warnings.
+
  @item error
  See @option{-Werror}, below.
  @end table
@@ -10207,14 +10338,6 @@ therefore, since, as far as we know, @code{double} is the most demanding
  type on all platforms, alignments are enforced for @code{double} whatever
  types are actually used.  This may waste space in some cases.
  
-@item
-Our implementation is not conforming with strict aliasing rules.  Alias
-analysis is a technique used in optimizing compilers to detect when two
-pointers are disjoint (they cannot ``meet'').  Our implementation breaks
-some of the rules that G++ 4.4 uses in its alias analysis, so @emph{strict
-alias analysis must be disabled}.  Use the option
-@option{-fno-strict-aliasing} to compile the generated parser.
-
  @item
  There might be portability issues we are not aware of.
  @end itemize
@@ -10967,7 +11090,7 @@ Location Tracking Calculator: @code{ltcalc}}).
  unit: assignments exp  @{ driver.result = $2; @};
  
  assignments:
-  /* Nothing.  */        @{@}
+  %empty                 @{@}
  | assignments assignment @{@};
  
  assignment:
@@ -11036,7 +11159,7 @@ Finally, we enable scanner tracing.
  
  @comment file: calc++-scanner.ll
  @example
-%option noyywrap nounput batch debug
+%option noyywrap nounput batch debug noinput
  @end example
  
  @noindent
@@ -12142,7 +12265,7 @@ operating system's name and version and your compiler's name and
  version.  If you have trouble compiling, you should also include a
  transcript of the build session, starting with the invocation of
  `configure'.  Depending on the nature of the bug, you may be asked to
-send additional files as well (such as `config.h' or `config.cache').
+send additional files as well (such as @file{config.h} or @file{config.cache}).
  
  Patches are most welcome, but not required.  That is, do not hesitate to
  send a bug report just because you cannot provide a fix.
@@ -12357,6 +12480,11 @@ time to resolve reduce/reduce conflicts.  @xref{GLR Parsers, ,Writing
  GLR Parsers}.
  @end deffn
  
+@deffn {Directive} %empty
+Bison declaration to make explicit that a rule has an empty
+right-hand side.  @xref{Empty Rules}.
+@end deffn
+
  @deffn {Symbol} $end
  The predefined token marking the end of the token stream.  It cannot be
  used in the grammar.