* data/lalr1.cc: Move the body of the ctor and dtor into the

[bison.git] / doc / bison.texinfo
diff --git a/doc/bison.texinfo b/doc/bison.texinfo

index 380bc152acabff3ef2d0be9a7cd8b0fcd83111c1..01dccb418bcea8ca898ef758154f4c9234e39512 100644 (file)
--- a/doc/bison.texinfo
+++ b/doc/bison.texinfo
@@ -145,9 +145,9 @@ The Concepts of Bison
  
  Writing @acronym{GLR} Parsers
  
-* Simple GLR Parsers::          Using @acronym{GLR} parsers on unambiguous grammars
-* Merging GLR Parses::          Using @acronym{GLR} parsers to resolve ambiguities
-* Compiler Requirements::       @acronym{GLR} parsers require a modern C compiler
+* Simple GLR Parsers::       Using @acronym{GLR} parsers on unambiguous grammars
+* Merging GLR Parses::       Using @acronym{GLR} parsers to resolve ambiguities
+* Compiler Requirements::    @acronym{GLR} parsers require a modern C compiler
  
  Examples
  
@@ -225,6 +225,7 @@ Tracking Locations
  
  Bison Declarations
  
+* Require Decl::      Requiring a Bison version.
  * Token Decl::        Declaring terminal symbols.
  * Precedence Decl::   Declaring terminals with precedence and associativity.
  * Union Decl::        Declaring the set of all semantic value types.
@@ -243,6 +244,8 @@ Parser C-Language Interface
                          which reads tokens.
  * Error Reporting::   You must supply a function @code{yyerror}.
  * Action Features::   Special features for use in actions.
+* Internationalization::  How to let the parser speak in the user's
+                        native language.
  
  The Lexical Analyzer Function @code{yylex}
  
@@ -265,7 +268,7 @@ The Bison Parser Algorithm
  * Reduce/Reduce::     When two rules are applicable in the same situation.
  * Mystery Conflicts::  Reduce/reduce conflicts that look unjustified.
  * Generalized LR Parsing::  Parsing arbitrary context-free grammars.
-* Stack Overflow::    What happens when stack gets full.  How to avoid it.
+* Memory Management:: What happens when memory is exhausted.  How to avoid it.
  
  Operator Precedence
  
@@ -316,7 +319,7 @@ A Complete C++ Example
  
  Frequently Asked Questions
  
-* Parser Stack Overflow::      Breaking the Stack Limits
+* Memory Exhausted::           Breaking the Stack Limits
  * How Can I Reset the Parser:: @code{yyparse} Keeps some State
  * Strings are Destroyed::      @code{yylval} Loses Track of Strings
  * Implementing Gotos/Loops::   Control Flow in the Calculator
@@ -730,9 +733,9 @@ user-defined function on the resulting values to produce an arbitrary
  merged result.
  
  @menu
-* Simple GLR Parsers::          Using @acronym{GLR} parsers on unambiguous grammars
-* Merging GLR Parses::          Using @acronym{GLR} parsers to resolve ambiguities
-* Compiler Requirements::       @acronym{GLR} parsers require a modern C compiler
+* Simple GLR Parsers::       Using @acronym{GLR} parsers on unambiguous grammars
+* Merging GLR Parses::       Using @acronym{GLR} parsers to resolve ambiguities
+* Compiler Requirements::    @acronym{GLR} parsers require a modern C compiler
  @end menu
  
  @node Simple GLR Parsers
@@ -1187,14 +1190,7 @@ start with a function called @code{main}; you have to provide this, and
  arrange for it to call @code{yyparse} or the parser will never run.
  @xref{Interface, ,Parser C-Language Interface}.
  
-If your code defines a C preprocessor macro @code{_} (a single
-underscore), Bison assumes that it can be used to translate
-English-language strings to the user's preferred language using a
-function-like syntax, e.g., @code{_("syntax error")}.  Otherwise,
-Bison defines a no-op macro by that name that merely returns its
-argument, so strings are not translated.
-
-Aside from @code{_} and the token type names and the symbols in the actions you
+Aside from the token type names and the symbols in the actions you
  write, all symbols defined in the Bison parser file itself
  begin with @samp{yy} or @samp{YY}.  This includes interface functions
  such as the lexical analyzer function @code{yylex}, the error reporting
@@ -1202,13 +1198,17 @@ function @code{yyerror} and the parser function @code{yyparse} itself.
  This also includes numerous identifiers used for internal purposes.
  Therefore, you should avoid using C identifiers starting with @samp{yy}
  or @samp{YY} in the Bison grammar file except for the ones defined in
-this manual.
+this manual.  Also, you should avoid using the C identifiers
+@samp{malloc} and @samp{free} for anything other than their usual
+meanings.
  
  In some cases the Bison parser file includes system headers, and in
  those cases your code should respect the identifiers reserved by those
-headers.  On some non-@acronym{GNU} hosts, @code{<alloca.h>},
+headers.  On some non-@acronym{GNU} hosts, @code{<alloca.h>}, @code{<malloc.h>},
  @code{<stddef.h>}, and @code{<stdlib.h>} are included as needed to
-declare memory allocators and related types.  Other system headers may
+declare memory allocators and related types.  @code{<libintl.h>} is
+included if message translation is in use
+(@pxref{Internationalization}).  Other system headers may
  be included if you define @code{YYDEBUG} to a nonzero value
  (@pxref{Tracing, ,Tracing Your Parser}).
  
@@ -1719,12 +1719,12 @@ With all the source in a single file, you use the following command to
  convert it into a parser file:
  
  @example
-bison @var{file_name}.y
+bison @var{file}.y
  @end example
  
  @noindent
  In this example the file was called @file{rpcalc.y} (for ``Reverse Polish
-@sc{calc}ulator'').  Bison produces a file named @file{@var{file_name}.tab.c},
+@sc{calc}ulator'').  Bison produces a file named @file{@var{file}.tab.c},
  removing the @samp{.y} from the original file name.  The file output by
  Bison contains the source code for @code{yyparse}.  The additional
  functions in the input file (@code{yylex}, @code{yyerror} and @code{main})
@@ -3549,6 +3549,7 @@ it explicitly (@pxref{Language and Grammar, ,Languages and Context-Free
  Grammars}).
  
  @menu
+* Require Decl::      Requiring a Bison version.
  * Token Decl::        Declaring terminal symbols.
  * Precedence Decl::   Declaring terminals with precedence and associativity.
  * Union Decl::        Declaring the set of all semantic value types.
@@ -3561,6 +3562,20 @@ Grammars}).
  * Decl Summary::      Table of all Bison declarations.
  @end menu
  
+@node Require Decl
+@subsection Require a Version of Bison
+@cindex version requirement
+@cindex requiring a version of Bison
+@findex %require
+
+You may require a minimum version of Bison to process the grammar.  If
+the requirement is not met, @command{bison} exits with an error (exit
+status 63).
+
+@example
+%require "@var{version}"
+@end example
+
  @node Token Decl
  @subsection Token Type Names
  @cindex declaring token type names
@@ -3782,10 +3797,10 @@ Declare that the @var{code} must be invoked before parsing each time
  For instance, if your locations use a file name, you may use
  
  @example
-%parse-param @{ const char *filename @};
+%parse-param @{ char const *file_name @};
  %initial-action
  @{
-  @@$.begin.filename = @@$.end.filename = filename;
+  @@$.begin.filename = @@$.end.filename = file_name;
  @};
  @end example
  
@@ -3795,28 +3810,31 @@ For instance, if your locations use a file name, you may use
  @cindex freeing discarded symbols
  @findex %destructor
  
-Some symbols can be discarded by the parser.  For instance, during error
-recovery (@pxref{Error Recovery}), embarrassing symbols already pushed
-on the stack, and embarrassing tokens coming from the rest of the file
-are thrown away until the parser falls on its feet.  If these symbols
-convey heap based information, this memory is lost.  While this behavior
-can be tolerable for batch parsers, such as in compilers, it is not for
-possibly ``never ending'' parsers such as shells, or implementations of
-communication protocols.
+Some symbols can be discarded by the parser.  During error recovery
+(@pxref{Error Recovery}), symbols already pushed on the stack and tokens
+coming from the rest of the file are discarded until the parser falls on
+its feet.  If the parser runs out of memory, all the symbols on the
+stack must be discarded.  Even if the parser succeeds, it must discard
+the start symbol.
+
+When discarded symbols convey heap-based information, this memory is
+lost.  While this behavior can be tolerable for batch parsers, such as
+in traditional compilers, it is unacceptable for programs like shells or
+protocol implementations that may parse and execute indefinitely.
  
-The @code{%destructor} directive allows for the definition of code that
-is called when a symbol is thrown away.
+The @code{%destructor} directive defines code that
+is called when a symbol is discarded.
  
  @deffn {Directive} %destructor @{ @var{code} @} @var{symbols}
  @findex %destructor
-Declare that the @var{code} must be invoked for each of the
-@var{symbols} that will be discarded by the parser.  The @var{code}
-should use @code{$$} to designate the semantic value associated to the
-@var{symbols}.  The additional parser parameters are also available
-(@pxref{Parser Function, , The Parser Function @code{yyparse}}).
-
-@strong{Warning:} as of Bison 1.875, this feature is still considered as
-experimental, as there was not enough user feedback.  In particular,
+Invoke @var{code} whenever the parser discards one of the @var{symbols}.
+Within @var{code}, @code{$$} designates the semantic value associated
+with the discarded symbol.  The additional parser parameters are also
+available (@pxref{Parser Function, , The Parser Function
+@code{yyparse}}).
+
+@strong{Warning:} as of Bison 2.1, this feature is still
+experimental, as there has not been enough user feedback.  In particular,
  the syntax might still change.
  @end deffn
  
@@ -3833,7 +3851,7 @@ For instance:
  @end smallexample
  
  @noindent
-guarantees that when a @code{STRING} or a @code{string} will be discarded,
+guarantees that when a @code{STRING} or a @code{string} is discarded,
  its associated memory will be freed.
  
  Note that in the future, Bison might also consider that right hand side
@@ -3865,8 +3883,11 @@ stacked symbols popped during the first phase of error recovery,
  @item
  incoming terminals during the second phase of error recovery,
  @item
-the current look-ahead when the parser aborts (either via an explicit
-call to @code{YYABORT}, or as a consequence of a failed error recovery).
+the current look-ahead and the entire stack when the parser aborts
+(either via an explicit call to @code{YYABORT}, or as a consequence of
+a failed error recovery or of memory exhaustion), and
+@item
+the start symbol, when the parser succeeds.
  @end itemize
  
  
@@ -4088,7 +4109,7 @@ above-mentioned declarations and to the token type codes.
  @end deffn
  
  @deffn {Directive} %destructor
-Specifying how the parser should reclaim the memory associated to
+Specify how the parser should reclaim the memory associated with
  discarded symbols.  @xref{Destructor Decl, , Freeing Discarded Symbols}.
  @end deffn
  
@@ -4130,7 +4151,7 @@ parser file contains just @code{#define} directives and static variable
  declarations.
  
  This option also tells Bison to write the C code for the grammar actions
-into a file named @file{@var{filename}.act}, in the form of a
+into a file named @file{@var{file}.act}, in the form of a
  brace-surrounded body fit for a @code{switch} statement.
  @end deffn
  
@@ -4143,8 +4164,8 @@ associate errors with the parser file, treating it an independent source
  file in its own right.
  @end deffn
  
-@deffn {Directive} %output="@var{filename}"
-Specify the @var{filename} for the parser file.
+@deffn {Directive} %output="@var{file}"
+Specify @var{file} for the parser file.
  @end deffn
  
  @deffn {Directive} %pure-parser
@@ -4152,6 +4173,11 @@ Request a pure (reentrant) parser program (@pxref{Pure Decl, ,A Pure
  (Reentrant) Parser}).
  @end deffn
  
+@deffn {Directive} %require "@var{version}"
+Require version @var{version} or higher of Bison.  @xref{Require Decl, ,
+Require a Version of Bison}.
+@end deffn
+
  @deffn {Directive} %token-table
  Generate an array of token names in the parser file.  The name of the
  array is @code{yytname}; @code{yytname[@var{i}]} is the name of the
@@ -4161,15 +4187,14 @@ three elements of @code{yytname} correspond to the predefined tokens
  @code{"error"}, and @code{"$undefined"}; after these come the symbols
  defined in the grammar file.
  
-For single-character literal tokens and literal string tokens, the name
-in the table includes the single-quote or double-quote characters: for
-example, @code{"'+'"} is a single-character literal and @code{"\"<=\""}
-is a literal string token.  All the characters of the literal string
-token appear verbatim in the string found in the table; even
-double-quote characters are not escaped.  For example, if the token
-consists of three characters @samp{*"*}, its string in @code{yytname}
-contains @samp{"*"*"}.  (In C, that would be written as
-@code{"\"*\"*\""}).
+The name in the table includes all the characters needed to represent
+the token in Bison.  For single-character literals and literal
+strings, this includes the surrounding quoting characters and any
+escape sequences.  For example, the Bison single-character literal
+@code{'+'} corresponds to a three-character name, represented in C as
+@code{"'+'"}; and the Bison two-character literal string @code{"\\/"}
+corresponds to a five-character name, represented in C as
+@code{"\"\\\\/\""}.
  
  When you specify @code{%token-table}, Bison also generates macro
  definitions for macros @code{YYNTOKENS}, @code{YYNNTS}, and
@@ -4250,6 +4275,8 @@ in the grammar file, you are likely to run into trouble.
                          which reads tokens.
  * Error Reporting::   You must supply a function @code{yyerror}.
  * Action Features::   Special features for use in actions.
+* Internationalization::  How to let the parser speak in the user's
+                        native language.
  @end menu
  
  @node Parser Function
@@ -4267,7 +4294,11 @@ without reading further.
  The value returned by @code{yyparse} is 0 if parsing was successful (return
  is due to end-of-input).
  
-The value is 1 if parsing failed (return is due to a syntax error).
+The value is 1 if parsing failed because of invalid input, i.e., input
+that contains a syntax error or that causes @code{YYABORT} to be
+invoked.
+
+The value is 2 if parsing failed due to memory exhaustion.
  @end deftypefun
  
  In an action, you can cause immediate return from @code{yyparse} by using
@@ -4408,11 +4439,13 @@ the grammar file has no effect on @code{yylex}.
  table.  The index of the token in the table is the token type's code.
  The name of a multicharacter token is recorded in @code{yytname} with a
  double-quote, the token's characters, and another double-quote.  The
-token's characters are not escaped in any way; they appear verbatim in
-the contents of the string in the table.
+token's characters are escaped as necessary to be suitable as input
+to Bison.
  
-Here's code for looking up a token in @code{yytname}, assuming that the
-characters of the token are stored in @code{token_buffer}.
+Here's code for looking up a multicharacter token in @code{yytname},
+assuming that the characters of the token are stored in
+@code{token_buffer}, and assuming that the token does not contain any
+characters like @samp{"} that require escaping.
  
  @smallexample
  for (i = 0; i < YYNTOKENS; i++)
@@ -4593,13 +4626,16 @@ declarations section (@pxref{Bison Declarations, ,The Bison Declarations
  Section}), then Bison provides a more verbose and specific error message
  string instead of just plain @w{@code{"syntax error"}}.
  
-The parser can detect one other kind of error: stack overflow.  This
-happens when the input contains constructions that are very deeply
+The parser can detect one other kind of error: memory exhaustion.  This
+can happen when the input contains constructions that are very deeply
  nested.  It isn't likely you will encounter this, since the Bison
-parser extends its stack automatically up to a very large limit.  But
-if overflow happens, @code{yyparse} calls @code{yyerror} in the usual
-fashion, except that the argument string is @w{@code{"parser stack
-overflow"}}.
+parser normally extends its stack automatically up to a very large limit.  But
+if memory is exhausted, @code{yyparse} calls @code{yyerror} in the usual
+fashion, except that the argument string is @w{@code{"memory exhausted"}}.
+
+In some cases diagnostics like @w{@code{"syntax error"}} are
+translated automatically from English to some other language before
+they are passed to @code{yyerror}.  @xref{Internationalization}.
  
  The following definition suffices in simple programs:
  
@@ -4680,7 +4716,7 @@ preferable since it more accurately describes the return type for
  
  @vindex yynerrs
  The variable @code{yynerrs} contains the number of syntax errors
-encountered so far.  Normally this variable is global; but if you
+reported so far.  Normally this variable is global; but if you
  request a pure parser (@pxref{Pure Decl, ,A Pure (Reentrant) Parser})
  then it is a local variable which only the actions can access.
  
@@ -4812,6 +4848,90 @@ of the @var{n}th component of the current rule.  @xref{Locations, ,
  Tracking Locations}.
  @end deffn
  
+@node Internationalization
+@section Parser Internationalization
+@cindex internationalization
+@cindex i18n
+@cindex NLS
+@cindex gettext
+@cindex bison-po
+
+A Bison-generated parser can print diagnostics, including error and
+tracing messages.  By default, they appear in English.  However, Bison
+also supports outputting diagnostics in the user's native language.
+To make this work, the user should set the usual environment
+variables.  @xref{Users, , The User's View, gettext, GNU
+@code{gettext} utilities}.  For
+example, the shell command @samp{export LC_ALL=fr_CA.UTF-8} might set
+the user's locale to French Canadian using the @acronym{UTF}-8
+encoding.  The exact set of available locales depends on the user's
+installation.
+
+The maintainer of a package that uses a Bison-generated parser enables
+the internationalization of the parser's output through the following
+steps.  Here we assume a package that uses @acronym{GNU} Autoconf and
+@acronym{GNU} Automake.
+
+@enumerate
+@item
+@cindex bison-i18n.m4
+Into the directory containing the @acronym{GNU} Autoconf macros used
+by the package---often called @file{m4}---copy the
+@file{bison-i18n.m4} file installed by Bison under
+@samp{share/aclocal/bison-i18n.m4} in Bison's installation directory.
+For example:
+
+@example
+cp /usr/local/share/aclocal/bison-i18n.m4 m4/bison-i18n.m4
+@end example
+
+@item
+@findex BISON_I18N
+@vindex BISON_LOCALEDIR
+@vindex YYENABLE_NLS
+In the top-level @file{configure.ac}, after the @code{AM_GNU_GETTEXT}
+invocation, add an invocation of @code{BISON_I18N}.  This macro is
+defined in the file @file{bison-i18n.m4} that you copied earlier.  It
+causes @samp{configure} to find the value of the
+@code{BISON_LOCALEDIR} variable, and it defines the source-language
+symbol @code{YYENABLE_NLS} to enable translations in the
+Bison-generated parser.
+
+@item
+In the @code{main} function of your program, designate the directory
+containing Bison's runtime message catalog, through a call to
+@samp{bindtextdomain} with domain name @samp{bison-runtime}.
+For example:
+
+@example
+bindtextdomain ("bison-runtime", BISON_LOCALEDIR);
+@end example
+
+Typically this appears after any other call @code{bindtextdomain
+(PACKAGE, LOCALEDIR)} that your package already has.  Here we rely on
+@samp{BISON_LOCALEDIR} being defined as a string through the
+@file{Makefile}.
+
+@item
+In the @file{Makefile.am} that controls the compilation of the @code{main}
+function, make @samp{BISON_LOCALEDIR} available as a C preprocessor macro,
+either in @samp{DEFS} or in @samp{AM_CPPFLAGS}.  For example:
+
+@example
+DEFS = @@DEFS@@ -DBISON_LOCALEDIR='"$(BISON_LOCALEDIR)"'
+@end example
+
+or:
+
+@example
+AM_CPPFLAGS = -DBISON_LOCALEDIR='"$(BISON_LOCALEDIR)"'
+@end example
+
+@item
+Finally, invoke the command @command{autoreconf} to generate the build
+infrastructure.
+@end enumerate
+
  
  @node Algorithm
  @chapter The Bison Parser Algorithm
@@ -4878,7 +4998,7 @@ This kind of parser is known in the literature as a bottom-up parser.
  * Reduce/Reduce::     When two rules are applicable in the same situation.
  * Mystery Conflicts::  Reduce/reduce conflicts that look unjustified.
  * Generalized LR Parsing::  Parsing arbitrary context-free grammars.
-* Stack Overflow::    What happens when stack gets full.  How to avoid it.
+* Memory Management:: What happens when memory is exhausted.  How to avoid it.
  @end menu
  
  @node Look-Ahead
@@ -5496,6 +5616,13 @@ return_spec:
          ;
  @end example
  
+For a more detailed exposition of @acronym{LALR}(1) parsers and parser
+generators, please see:
+Frank DeRemer and Thomas Pennello, Efficient Computation of
+@acronym{LALR}(1) Look-Ahead Sets, @cite{@acronym{ACM} Transactions on
+Programming Languages and Systems}, Vol.@: 4, No.@: 4 (October 1982),
+pp.@: 615--649 @uref{http://doi.acm.org/10.1145/69622.357187}.
+
  @node Generalized LR Parsing
  @section Generalized @acronym{LR} (@acronym{GLR}) Parsing
  @cindex @acronym{GLR} parsing
@@ -5582,16 +5709,17 @@ London, Department of Computer Science, TR-00-12,
  @uref{http://www.cs.rhul.ac.uk/research/languages/publications/tomita_style_1.ps},
  (2000-12-24).
  
-@node Stack Overflow
-@section Stack Overflow, and How to Avoid It
+@node Memory Management
+@section Memory Management, and How to Avoid Memory Exhaustion
+@cindex memory exhaustion
+@cindex memory management
  @cindex stack overflow
  @cindex parser stack overflow
  @cindex overflow of parser stack
  
-The Bison parser stack can overflow if too many tokens are shifted and
+The Bison parser stack can run out of memory if too many tokens are shifted and
  not reduced.  When this happens, the parser function @code{yyparse}
-returns a nonzero value, pausing only to call @code{yyerror} to report
-the overflow.
+calls @code{yyerror} and then returns 2.
  
  Because Bison parsers have growing stacks, hitting the upper limit
  usually results from using a right recursion instead of a left
@@ -5599,12 +5727,12 @@ recursion, @xref{Recursion, ,Recursive Rules}.
  
  @vindex YYMAXDEPTH
  By defining the macro @code{YYMAXDEPTH}, you can control how deep the
-parser stack can become before a stack overflow occurs.  Define the
+parser stack can become before memory is exhausted.  Define the
  macro with a value that is an integer.  This value is the maximum number
  of tokens that can be shifted (and not reduced) before overflow.
  
  The stack space allowed is not necessarily allocated.  If you specify a
-large value for @code{YYMAXDEPTH}, the parser actually allocates a small
+large value for @code{YYMAXDEPTH}, the parser normally allocates a small
  stack at first, and then makes it bigger by stages as needed.  This
  increasing allocation happens automatically and silently.  Therefore,
  you do not need to make @code{YYMAXDEPTH} painfully small merely to save
@@ -5626,17 +5754,14 @@ macro @code{YYINITDEPTH} to a positive integer.  For the C
  unless you are assuming C99 or some other target language or compiler
  that allows variable-length arrays.  The default is 200.
  
-Do not allow @code{YYINITDEPTH} to be a value so large that arithmetic
-overflow would occur when calculating the size of the stack space.
-Also, do not allow @code{YYINITDEPTH} to be greater than
-@code{YYMAXDEPTH}.
+Do not allow @code{YYINITDEPTH} to be greater than @code{YYMAXDEPTH}.
  
  @c FIXME: C++ output.
  Because of semantical differences between C and C++, the
-@acronym{LALR}(1) parsers in C produced by Bison by compiled as C++
-cannot grow.  In this precise case (compiling a C parser as C++) you are
-suggested to grow @code{YYINITDEPTH}.  In the near future, a C++ output
-output will be provided which addresses this issue.
+@acronym{LALR}(1) parsers in C produced by Bison cannot grow when compiled
+by C++ compilers.  In this precise case (compiling a C parser as C++) you are
+advised to increase @code{YYINITDEPTH}.  The Bison maintainers hope to fix
+this deficiency in a future release.
  
  @node Error Recovery
  @chapter Error Recovery
@@ -6507,14 +6632,15 @@ bison @var{infile}
  
  Here @var{infile} is the grammar file name, which usually ends in
  @samp{.y}.  The parser file's name is made by replacing the @samp{.y}
-with @samp{.tab.c}.  Thus, the @samp{bison foo.y} filename yields
-@file{foo.tab.c}, and the @samp{bison hack/foo.y} filename yields
-@file{hack/foo.tab.c}.  It's also possible, in case you are writing
+with @samp{.tab.c} and removing any leading directory.  Thus, the
+@samp{bison foo.y} file name yields
+@file{foo.tab.c}, and the @samp{bison hack/foo.y} file name yields
+@file{foo.tab.c}.  It's also possible, in case you are writing
  C++ code instead of C in your grammar file, to name it @file{foo.ypp}
  or @file{foo.y++}.  Then, the output files will take an extension like
  the given one as input (respectively @file{foo.tab.cpp} and
  @file{foo.tab.c++}).
-This feature takes effect with all options that manipulate filenames like
+This feature takes effect with all options that manipulate file names like
  @samp{-o} or @samp{-d}.
  
  For example :
@@ -6568,6 +6694,9 @@ Print a summary of the command-line options to Bison and exit.
  @itemx --version
  Print the version number of Bison and exit.
  
+@item --print-localedir
+Print the name of the directory containing locale-dependent data.
+
  @need 1750
  @item -y
  @itemx --yacc
@@ -6669,11 +6798,11 @@ Pretend that @code{%verbose} was specified, i.e, write an extra output
  file containing verbose descriptions of the grammar and
  parser.  @xref{Decl Summary}.
  
-@item -o @var{filename}
-@itemx --output=@var{filename}
-Specify the @var{filename} for the parser file.
+@item -o @var{file}
+@itemx --output=@var{file}
+Specify the @var{file} for the parser file.
  
-The other output files' names are constructed from @var{filename} as
+The other output files' names are constructed from @var{file} as
  described under the @samp{-v} and @samp{-d} options.
  
  @item -g
@@ -6685,7 +6814,7 @@ be @file{foo.vcg}.
  @item --graph=@var{graph-file}
  The behavior of @var{--graph} is the same than @samp{-g}.  The only
  difference is that it has an optional argument which is the name of
-the output graph filename.
+the output graph file.
  @end table
  
  @node Option Cross Key
@@ -6707,6 +6836,7 @@ the corresponding short option.
  \line{ --no-lines \leaderfill -l}
  \line{ --no-parser \leaderfill -n}
  \line{ --output \leaderfill -o}
+\line{ --print-localedir}
  \line{ --token-table \leaderfill -k}
  \line{ --verbose \leaderfill -v}
  \line{ --version \leaderfill -V}
@@ -6725,6 +6855,7 @@ the corresponding short option.
  --no-lines                            -l
  --no-parser                           -n
  --output=@var{outfile}                      -o @var{outfile}
+--print-localedir
  --token-table                         -k
  --verbose                             -v
  --version                             -V
@@ -6785,7 +6916,7 @@ int yyparse (void);
  @c - Always pure
  @c - initial action
  
-The C++ parser LALR(1) skeleton is named @file{lalr1.cc}.  To select
+The C++ parser @acronym{LALR}(1) skeleton is named @file{lalr1.cc}.  To select
  it, you may either pass the option @option{--skeleton=lalr1.cc} to
  Bison, or include the directive @samp{%skeleton "lalr1.cc"} in the
  grammar preamble.  When run, @command{bison} will create several
@@ -6799,13 +6930,13 @@ used for location tracking.  @xref{C++ Location Values}.
  @item stack.hh
  An auxiliary class @code{stack} used by the parser.
  
-@item @var{filename}.hh
-@itemx @var{filename}.cc
+@item @var{file}.hh
+@itemx @var{file}.cc
  The declaration and implementation of the C++ parser class.
-@var{filename} is the name of the output file.  It follows the same
+@var{file} is the name of the output file.  It follows the same
  rules as with regular C parsers.
  
-Note that @file{@var{filename}.hh} is @emph{mandatory}, the C++ cannot
+Note that @file{@var{file}.hh} is @emph{mandatory}: the C++ parser cannot
  work without the parser class declaration.  Therefore, you must either
  pass @option{-d}/@option{--defines} to @command{bison}, or use the
  @samp{%defines} directive.
@@ -6823,12 +6954,13 @@ for a complete and accurate documentation.
  The @code{%union} directive works as for C, see @ref{Union Decl, ,The
  Collection of Value Types}.  In particular it produces a genuine
  @code{union}@footnote{In the future techniques to allow complex types
-within pseudo-unions (variants) might be implemented to alleviate
-these issues.}, which have a few specific features in C++.
+within pseudo-unions (similar to Boost variants) might be implemented to
+alleviate these issues.}, which has a few specific features in C++.
  @itemize @minus
  @item
-The name @code{YYSTYPE} also denotes @samp{union YYSTYPE}.  You may
-forward declare it just with @samp{union YYSTYPE;}.
+The type @code{YYSTYPE} is defined but its use is discouraged: rather
+you should refer to the parser's encapsulated type
+@code{yy::parser::semantic_type}.
  @item
  Non POD (Plain Old Data) types cannot be used.  C++ forbids any
  instance of classes with constructors in unions: only @emph{pointers}
@@ -6854,7 +6986,7 @@ auxiliary classes define a @code{position}, a single point in a file,
  and a @code{location}, a range composed of a pair of
  @code{position}s (possibly spanning several files).
  
-@deftypemethod {position} {std::string*} filename
+@deftypemethod {position} {std::string*} file
  The name of the file.  It will always be handled as a pointer, the
  parser will never duplicate nor deallocate it.  As an experimental
  feature you may change it to @samp{@var{type}*} using @samp{%define
@@ -6886,8 +7018,8 @@ Various forms of syntactic sugar for @code{columns}.
  
  @deftypemethod {position} {position} operator<< (std::ostream @var{o}, const position& @var{p})
  Report @var{p} on @var{o} like this:
-@samp{@var{filename}:@var{line}.@var{column}}, or
-@samp{@var{line}.@var{column}} if @var{filename} is null.
+@samp{@var{file}:@var{line}.@var{column}}, or
+@samp{@var{line}.@var{column}} if @var{file} is null.
  @end deftypemethod
  
  @deftypemethod {location} {position} begin
@@ -7029,38 +7161,32 @@ transforming the simple parsing context structure into a fully blown
  
  The declaration of this driver class, @file{calc++-driver.hh}, is as
  follows.  The first part includes the CPP guard and imports the
-required standard library components.
+required standard library components, and the declaration of the parser
+class.
  
+@comment file: calc++-driver.hh
  @example
  #ifndef CALCXX_DRIVER_HH
  # define CALCXX_DRIVER_HH
  # include <string>
  # include <map>
+# include "calc++-parser.hh"
  @end example
  
-@noindent
-Then come forward declarations.  Because the parser uses the parsing
-driver and reciprocally, simple inclusions of header files will not
-do.  Because the driver's declaration is the one that will be imported
-by the rest of the project, it is saner to forward declare the
-parser's information here.
-
-@example
-// Forward declarations.
-union YYSTYPE;
-namespace yy @{ class calcxx_parser; @}
-class calcxx_driver;
-@end example
  
  @noindent
  Then comes the declaration of the scanning function.  Flex expects
  the signature of @code{yylex} to be defined in the macro
  @code{YY_DECL}, and the C++ parser expects it to be declared.  We can
  factor both as follows.
+
+@comment file: calc++-driver.hh
  @example
  // Announce to Flex the prototype we want for lexing function, ...
-# define YY_DECL                                               \
-  int yylex (YYSTYPE* yylval, yy::location* yylloc, calcxx_driver& driver)
+# define YY_DECL                                                \
+  int yylex (yy::calcxx_parser::semantic_type* yylval,           \
+             yy::calcxx_parser::location_type* yylloc,           \
+             calcxx_driver& driver)
  // ... and declare it for the parser's sake.
  YY_DECL;
  @end example
@@ -7069,6 +7195,7 @@ YY_DECL;
  The @code{calcxx_driver} class is then declared with its most obvious
  members.
  
+@comment file: calc++-driver.hh
  @example
  // Conducting the whole scanning and parsing of Calc++.
  class calcxx_driver
@@ -7087,6 +7214,7 @@ To encapsulate the coordination with the Flex scanner, it is useful to
  have two member functions to open and close the scanning phase.
  members.
  
+@comment file: calc++-driver.hh
  @example
    // Handling the scanner.
    void scan_begin ();
@@ -7097,6 +7225,7 @@ members.
  @noindent
  Similarly for the parser itself.
  
+@comment file: calc++-driver.hh
  @example
    // Handling the parser.
    void parse (const std::string& f);
@@ -7110,6 +7239,7 @@ dumping them on the standard error output, we will pass them to the
  compiler driver using the following two member functions.  Finally, we
  close the class declaration and CPP guard.
  
+@comment file: calc++-driver.hh
  @example
    // Error handling.
    void error (const yy::location& l, const std::string& m);
@@ -7123,6 +7253,7 @@ member function deserves some attention.  The @code{error} functions
  are simple stubs, they should actually register the located error
  messages and set error state.
  
+@comment file: calc++-driver.cc
  @example
  #include "calc++-driver.hh"
  #include "calc++-parser.hh"
@@ -7165,17 +7296,33 @@ calcxx_driver::error (const std::string& m)
  @node Calc++ Parser
  @subsection Calc++ Parser
  
-The parser definition file @file{calc++-parser.yy} starts by asking
-for the C++ skeleton, the creation of the parser header file, and
-specifies the name of the parser class.  It then includes the required
-headers.
+The parser definition file @file{calc++-parser.yy} starts by asking for
+the C++ LALR(1) skeleton, the creation of the parser header file, and
+specifies the name of the parser class.  Because the C++ skeleton
+changed several times, it is safer to require the version you designed
+the grammar for.
+
+@comment file: calc++-parser.yy
  @example
  %skeleton "lalr1.cc"                          /*  -*- C++ -*- */
-%define "parser_class_name" "calcxx_parser"
+%require "2.1a"
  %defines
+%define "parser_class_name" "calcxx_parser"
+@end example
+
+@noindent
+Then come the declarations/inclusions needed to define the
+@code{%union}.  Because the parser uses the parsing driver and
+reciprocally, they cannot each include the other's header.  Because the
+driver's header needs detailed knowledge about the parser class (in
+particular its inner types), it is the parser's header which will simply
+use a forward declaration of the driver.
+
+@comment file: calc++-parser.yy
+@example
  %@{
  # include <string>
-# include "calc++-driver.hh"
+class calcxx_driver;
  %@}
  @end example
  
@@ -7184,6 +7331,7 @@ The driver is passed by reference to the parser and to the scanner.
  This provides a simple but effective pure interface, not relying on
  global variables.
  
+@comment file: calc++-parser.yy
  @example
  // The parsing context.
  %parse-param @{ calcxx_driver& driver @}
@@ -7196,6 +7344,7 @@ first location's file name.  Afterwards new locations are computed
  relatively to the previous locations: the file name will be
  automatically propagated.
  
+@comment file: calc++-parser.yy
  @example
  %locations
  %initial-action
@@ -7209,6 +7358,7 @@ automatically propagated.
  Use the two following directives to enable parser tracing and verbose
  error messages.
  
+@comment file: calc++-parser.yy
  @example
  %debug
  %error-verbose
@@ -7218,6 +7368,7 @@ error messages.
  Semantic values cannot use ``real'' objects, but only pointers to
  them.
  
+@comment file: calc++-parser.yy
  @example
  // Symbols.
  %union
@@ -7227,6 +7378,19 @@ them.
  @};
  @end example
  
+@noindent
+The code between @samp{%@{} and @samp{%@}} after the introduction of the
+@samp{%union} is output in the @file{*.cc} file; it needs detailed
+knowledge about the driver.
+
+@comment file: calc++-parser.yy
+@example
+%@{
+# include "calc++-driver.hh"
+%@}
+@end example
+
+
  @noindent
  The token numbered as 0 corresponds to end of file; the following line
  allows for nicer error messages referring to ``end of file'' instead
@@ -7234,18 +7398,20 @@ of ``$end''.  Similarly user friendly named are provided for each
  symbol.  Note that the token names are prefixed by @code{TOKEN_} to
  avoid name clashes.
  
+@comment file: calc++-parser.yy
  @example
-%token        YYEOF          0 "end of file"
-%token        TOKEN_ASSIGN     ":="
-%token <sval> TOKEN_IDENTIFIER "identifier"
-%token <ival> TOKEN_NUMBER     "number"
-%type  <ival> exp              "expression"
+%token        END      0 "end of file"
+%token        ASSIGN     ":="
+%token <sval> IDENTIFIER "identifier"
+%token <ival> NUMBER     "number"
+%type  <ival> exp        "expression"
  @end example
  
  @noindent
  To enable memory deallocation during error recovery, use
  @code{%destructor}.
  
+@comment file: calc++-parser.yy
  @example
  %printer    @{ debug_stream () << *$$; @} "identifier"
  %destructor @{ delete $$; @} "identifier"
@@ -7256,6 +7422,7 @@ To enable memory deallocation during error recovery, use
  @noindent
  The grammar itself is straightforward.
  
+@comment file: calc++-parser.yy
  @example
  %%
  %start unit;
@@ -7264,7 +7431,7 @@ unit: assignments exp  @{ driver.result = $2; @};
  assignments: assignments assignment @{@}
             | /* Nothing. */         @{@};
  
-assignment: TOKEN_IDENTIFIER ":=" exp @{ driver.variables[*$1] = $3; @};
+assignment: "identifier" ":=" exp @{ driver.variables[*$1] = $3; @};
  
  %left '+' '-';
  %left '*' '/';
@@ -7272,8 +7439,8 @@ exp: exp '+' exp   @{ $$ = $1 + $3; @}
     | exp '-' exp   @{ $$ = $1 - $3; @}
     | exp '*' exp   @{ $$ = $1 * $3; @}
     | exp '/' exp   @{ $$ = $1 / $3; @}
-   | TOKEN_IDENTIFIER  @{ $$ = driver.variables[*$1]; @}
-   | TOKEN_NUMBER      @{ $$ = $1; @};
+   | "identifier"  @{ $$ = driver.variables[*$1]; @}
+   | "number"      @{ $$ = $1; @};
  %%
  @end example
  
@@ -7281,9 +7448,11 @@ exp: exp '+' exp   @{ $$ = $1 + $3; @}
  Finally the @code{error} member function registers the errors to the
  driver.
  
+@comment file: calc++-parser.yy
  @example
  void
-yy::calcxx_parser::error (const location_type& l, const std::string& m)
+yy::calcxx_parser::error (const yy::calcxx_parser::location_type& l,
+                          const std::string& m)
  @{
    driver.error (l, m);
  @}
@@ -7295,8 +7464,12 @@ yy::calcxx_parser::error (const location_type& l, const std::string& m)
  The Flex scanner first includes the driver declaration, then the
  parser's to get the set of defined tokens.
  
+@comment file: calc++-scanner.ll
  @example
  %@{                                            /* -*- C++ -*- */
+# include <cstdlib>
+# include <errno.h>
+# include <limits.h>
  # include <string>
  # include "calc++-driver.hh"
  # include "calc++-parser.hh"
@@ -7309,6 +7482,7 @@ Because there is no @code{#include}-like feature we don't need
  actual file, this is not an interactive session with the user.
  Finally we enable the scanner tracing features.
  
+@comment file: calc++-scanner.ll
  @example
  %option noyywrap nounput batch debug
  @end example
@@ -7316,6 +7490,7 @@ Finally we enable the scanner tracing features.
  @noindent
  Abbreviations allow for more readable rules.
  
+@comment file: calc++-scanner.ll
  @example
  id    [a-zA-Z][a-zA-Z_0-9]*
  int   [0-9]+
@@ -7331,25 +7506,42 @@ cursor is adjusted, and each time blanks are matched, the begin cursor
  is moved onto the end cursor to effectively ignore the blanks
  preceding tokens.  Comments would be treated equally.
  
+@comment file: calc++-scanner.ll
  @example
+%@{
+# define YY_USER_ACTION  yylloc->columns (yyleng);
+%@}
  %%
  %@{
    yylloc->step ();
-# define YY_USER_ACTION  yylloc->columns (yyleng);
  %@}
  @{blank@}+   yylloc->step ();
  [\n]+      yylloc->lines (yyleng); yylloc->step ();
  @end example
  
  @noindent
-The rules are simple, just note the use of the driver to report
-errors.
+The rules are simple, just note the use of the driver to report errors.
+It is convenient to use a typedef to shorten
+@code{yy::calcxx_parser::token::IDENTIFIER} into
+@code{token::IDENTIFIER} for instance.
  
+@comment file: calc++-scanner.ll
  @example
+%@{
+  typedef yy::calcxx_parser::token token;
+%@}
+
  [-+*/]     return yytext[0];
-":="       return TOKEN_ASSIGN;
-@{int@}      yylval->ival = atoi (yytext); return TOKEN_NUMBER;
-@{id@}       yylval->sval = new std::string (yytext); return TOKEN_IDENTIFIER;
+":="       return token::ASSIGN;
+@{int@}      @{
+  errno = 0;
+  long n = strtol (yytext, NULL, 10);
+  if (! (INT_MIN <= n && n <= INT_MAX && errno != ERANGE))
+    driver.error (*yylloc, "integer is out of range");
+  yylval->ival = n;
+  return token::NUMBER;
+@}
+@{id@}       yylval->sval = new std::string (yytext); return token::IDENTIFIER;
  .          driver.error (*yylloc, "invalid character");
  %%
  @end example
@@ -7358,6 +7550,7 @@ errors.
  Finally, because the scanner related driver's member functions depend
  on the scanner's data, it is simpler to implement them in this file.
  
+@comment file: calc++-scanner.ll
  @example
  void
  calcxx_driver::scan_begin ()
@@ -7379,12 +7572,13 @@ calcxx_driver::scan_end ()
  
  The top level file, @file{calc++.cc}, poses no problem.
  
+@comment file: calc++.cc
  @example
  #include <iostream>
  #include "calc++-driver.hh"
  
  int
-main (int argc, const char* argv[])
+main (int argc, char *argv[])
  @{
    calcxx_driver driver;
    for (++argv; argv[0]; ++argv)
@@ -7411,17 +7605,17 @@ Several questions about Bison come up occasionally.  Here some of them
  are addressed.
  
  @menu
-* Parser Stack Overflow::      Breaking the Stack Limits
+* Memory Exhausted::           Breaking the Stack Limits
  * How Can I Reset the Parser:: @code{yyparse} Keeps some State
  * Strings are Destroyed::      @code{yylval} Loses Track of Strings
  * Implementing Gotos/Loops::   Control Flow in the Calculator
  @end menu
  
-@node Parser Stack Overflow
-@section Parser Stack Overflow
+@node Memory Exhausted
+@section Memory Exhausted
  
  @display
-My parser returns with error with a @samp{parser stack overflow}
+My parser returns with error with a @samp{memory exhausted}
  message.  What can I do?
  @end display
  
@@ -7692,7 +7886,7 @@ Bison declaration to create a header file meant for the scanner.
  @end deffn
  
  @deffn {Directive} %destructor
-Specifying how the parser should reclaim the memory associated to
+Specify how the parser should reclaim the memory associated to
  discarded symbols.  @xref{Destructor Decl, , Freeing Discarded Symbols}.
  @end deffn
  
@@ -7777,7 +7971,7 @@ Bison declaration to assign non-associativity to token(s).
  @xref{Precedence Decl, ,Operator Precedence}.
  @end deffn
  
-@deffn {Directive} %output="@var{filename}"
+@deffn {Directive} %output="@var{file}"
  Bison declaration to set the name of the parser file.  @xref{Decl
  Summary}.
  @end deffn
@@ -7798,6 +7992,11 @@ Bison declaration to request a pure (reentrant) parser.
  @xref{Pure Decl, ,A Pure (Reentrant) Parser}.
  @end deffn
  
+@deffn {Directive} %require "@var{version}"
+Require version @var{version} or higher of Bison.  @xref{Require Decl, ,
+Require a Version of Bison}.
+@end deffn
+
  @deffn {Directive} %right
  Bison declaration to assign right associativity to token(s).
  @xref{Precedence Decl, ,Operator Precedence}.
@@ -7903,7 +8102,7 @@ use for @code{YYERROR_VERBOSE}, just whether you define it.  Using
  
  @deffn {Macro} YYINITDEPTH
  Macro for specifying the initial size of the parser stack.
-@xref{Stack Overflow}.
+@xref{Memory Management}.
  @end deffn
  
  @deffn {Function} yylex
@@ -7941,12 +8140,12 @@ variable within @code{yyparse}, and its address is passed to
  @end deffn
  
  @deffn {Macro} YYMAXDEPTH
-Macro for specifying the maximum size of the parser stack.  @xref{Stack
-Overflow}.
+Macro for specifying the maximum size of the parser stack.  @xref{Memory
+Management}.
  @end deffn
  
  @deffn {Variable} yynerrs
-Global variable which Bison increments each time there is a syntax error.
+Global variable which Bison increments each time it reports a syntax error.
  (In a pure parser, it is a local variable within @code{yyparse}.)
  @xref{Error Reporting, ,The Error Reporting Function @code{yyerror}}.
  @end deffn
@@ -7976,10 +8175,7 @@ the parser will use @code{malloc} to extend its stacks.  If defined to
  reserved for future Bison extensions.  If not defined,
  @code{YYSTACK_USE_ALLOCA} defaults to 0.
  
-If you define @code{YYSTACK_USE_ALLOCA} to 1, it is your
-responsibility to make sure that @code{alloca} is visible, e.g., by
-using @acronym{GCC} or by including @code{<stdlib.h>}.  Furthermore,
-in the all-too-common case where your code may run on a host with a
+In the all-too-common case where your code may run on a host with a
  limited stack and with unreliable stack-overflow checking, you should
  set @code{YYMAXDEPTH} to a value that cannot possibly result in
  unchecked stack overflow on any of your target hosts when