maint: credit Wojciech Polak

[bison.git] / doc / bison.texi
diff --git a/doc/bison.texi b/doc/bison.texi

index f2d3dbc52dcffd3e2a275e7b3f5fad582ee89bfb..a508b9c13c92f8330d246e657ec8afa6fa65f6d9 100644 (file)
--- a/doc/bison.texi
+++ b/doc/bison.texi
@@ -208,6 +208,12 @@ Defining Language Semantics
                        This says when, why and how to use the exceptional
                          action in the middle of a rule.
  
+Actions in Mid-Rule
+
+* Using Mid-Rule Actions::       Putting an action in the middle of a rule.
+* Mid-Rule Action Translation::  How mid-rule actions are actually processed.
+* Mid-Rule Conflicts::           Mid-rule actions can cause conflicts.
+
  Tracking Locations
  
  * Location Type::               Specifying a data type for locations.
@@ -2452,7 +2458,7 @@ function that initializes the symbol table.  Here it is, and
  void
  yyerror (char const *s)
  @{
-  printf ("%s\n", s);
+  fprintf (stderr, "%s\n", s);
  @}
  @end group
  
@@ -2722,6 +2728,9 @@ The Bison grammar file conventionally has a name ending in @samp{.y}.
  
  @node Grammar Outline
  @section Outline of a Bison Grammar
+@cindex comment
+@findex // @dots{}
+@findex /* @dots{} */
  
  A Bison grammar file has four main sections, shown here with the
  appropriate delimiters:
@@ -2741,8 +2750,8 @@ appropriate delimiters:
  @end example
  
  Comments enclosed in @samp{/* @dots{} */} may appear in any of the sections.
-As a GNU extension, @samp{//} introduces a comment that
-continues until end of line.
+As a GNU extension, @samp{//} introduces a comment that continues until end
+of line.
  
  @menu
  * Prologue::              Syntax and usage of the prologue.
@@ -3736,6 +3745,15 @@ Occasionally it is useful to put an action in the middle of a rule.
  These actions are written just like usual end-of-rule actions, but they
  are executed before the parser even recognizes the following components.
  
+@menu
+* Using Mid-Rule Actions::       Putting an action in the middle of a rule.
+* Mid-Rule Action Translation::  How mid-rule actions are actually processed.
+* Mid-Rule Conflicts::           Mid-rule actions can cause conflicts.
+@end menu
+
+@node Using Mid-Rule Actions
+@subsubsection Using Mid-Rule Actions
+
  A mid-rule action may refer to the components preceding it using
  @code{$@var{n}}, but it may not refer to subsequent components because
  it is run before they are parsed.
@@ -3768,10 +3786,16 @@ remove it afterward.  Here is how it is done:
  @example
  @group
  stmt:
-  LET '(' var ')'
-    @{ $<context>$ = push_context (); declare_variable ($3); @}
+  "let" '(' var ')'
+    @{
+      $<context>$ = push_context ();
+      declare_variable ($3);
+    @}
    stmt
-    @{ $$ = $6; pop_context ($<context>5); @}
+    @{
+      $$ = $6;
+      pop_context ($<context>5);
+    @}
  @end group
  @end example
  
@@ -3782,8 +3806,27 @@ list of accessible variables) as its semantic value, using alternative
  @code{context} in the data-type union.  Then it calls
  @code{declare_variable} to add the new variable to that list.  Once the
  first action is finished, the embedded statement @code{stmt} can be
-parsed.  Note that the mid-rule action is component number 5, so the
-@samp{stmt} is component number 6.
+parsed.
+
+Note that the mid-rule action is component number 5, so the @samp{stmt} is
+component number 6.  Named references can be used to improve the readability
+and maintainability (@pxref{Named References}):
+
+@example
+@group
+stmt:
+  "let" '(' var ')'
+    @{
+      $<context>let = push_context ();
+      declare_variable ($3);
+    @}[let]
+  stmt
+    @{
+      $$ = $6;
+      pop_context ($<context>let);
+    @}
+@end group
+@end example
  
  After the embedded statement is parsed, its semantic value becomes the
  value of the entire @code{let}-statement.  Then the semantic value from the
@@ -3817,13 +3860,13 @@ stmt:
    let stmt
      @{
        $$ = $2;
-      pop_context ($1);
+      pop_context ($let);
      @};
  
  let:
-  LET '(' var ')'
+  "let" '(' var ')'
      @{
-      $$ = push_context ();
+      $let = push_context ();
        declare_variable ($3);
      @};
  
@@ -3835,6 +3878,76 @@ Note that the action is now at the end of its rule.
  Any mid-rule action can be converted to an end-of-rule action in this way, and
  this is what Bison actually does to implement mid-rule actions.
  
+@node Mid-Rule Action Translation
+@subsubsection Mid-Rule Action Translation
+@vindex $@@@var{n}
+@vindex @@@var{n}
+
+As hinted earlier, mid-rule actions are actually transformed into regular
+rules and actions.  The various reports generated by Bison (textual,
+graphical, etc., see @ref{Understanding, , Understanding Your Parser})
+reveal this translation, best explained by means of an example.  The
+following rule:
+
+@example
+exp: @{ a(); @} "b" @{ c(); @} @{ d(); @} "e" @{ f(); @};
+@end example
+
+@noindent
+is translated into:
+
+@example
+$@@1: /* empty */ @{ a(); @};
+$@@2: /* empty */ @{ c(); @};
+$@@3: /* empty */ @{ d(); @};
+exp: $@@1 "b" $@@2 $@@3 "e" @{ f(); @};
+@end example
+
+@noindent
+with new nonterminal symbols @code{$@@@var{n}}, where @var{n} is a number.
+
+A mid-rule action is expected to generate a value if it uses @code{$$}, or
+the (final) action uses @code{$@var{n}} where @var{n} denotes the mid-rule
+action.  In that case its nonterminal is rather named @code{@@@var{n}}:
+
+@example
+exp: @{ a(); @} "b" @{ $$ = c(); @} @{ d(); @} "e" @{ f = $1; @};
+@end example
+
+@noindent
+is translated into:
+
+@example
+@@1: /* empty */ @{ a(); @};
+@@2: /* empty */ @{ $$ = c(); @};
+$@@3: /* empty */ @{ d(); @};
+exp: @@1 "b" @@2 $@@3 "e" @{ f = $1; @};
+@end example
+
+There are probably two errors in the above example: the first mid-rule
+action does not generate a value (it does not use @code{$$} although the
+final action uses it), and the value of the second one is not used (the
+final action does not use @code{$3}).  Bison reports these errors when the
+@code{midrule-value} warnings are enabled (@pxref{Invocation, ,Invoking
+Bison}):
+
+@example
+$ bison -fcaret -Wmidrule-value mid.y
+@group
+mid.y:2.6-13: warning: unset value: $$
+ exp: @{ a(); @} "b" @{ $$ = c(); @} @{ d(); @} "e" @{ f = $1; @};
+      ^^^^^^^^
+@end group
+@group
+mid.y:2.19-31: warning: unused value: $3
+ exp: @{ a(); @} "b" @{ $$ = c(); @} @{ d(); @} "e" @{ f = $1; @};
+                   ^^^^^^^^^^^^^
+@end group
+@end example
+
+
+@node Mid-Rule Conflicts
+@subsubsection Conflicts due to Mid-Rule Actions
  Taking action before a rule is completely recognized often leads to
  conflicts since the parser must commit to a parse in order to execute the
  action.  For example, the following two rules, without mid-rule actions,
@@ -3932,6 +4045,7 @@ compound:
  Now Bison can execute the action in the rule for @code{subroutine} without
  deciding which rule for @code{compound} it will eventually use.
  
+
  @node Tracking Locations
  @section Tracking Locations
  @cindex location
@@ -4885,7 +4999,7 @@ declaration @code{%define api.pure} says that you want the parser to be
  reentrant.  It looks like this:
  
  @example
-%define api.pure
+%define api.pure full
  @end example
  
  The result is that the communication variables @code{yylval} and
@@ -4935,7 +5049,7 @@ compatibility with the impure Yacc pull mode interface.  Unless you know
  what you are doing, your declarations should look like this:
  
  @example
-%define api.pure
+%define api.pure full
  %define api.push-pull push
  @end example
  
@@ -5008,8 +5122,8 @@ yypull_parse (ps); /* Will call the lexer */
  yypstate_delete (ps);
  @end example
  
-Adding the @code{%define api.pure} declaration does exactly the same thing to
-the generated parser with @code{%define api.push-pull both} as it did for
+Adding the @code{%define api.pure full} declaration does exactly the same thing
+to the generated parser with @code{%define api.push-pull both} as it did for
  @code{%define api.push-pull push}.
  
  @node Decl Summary
@@ -5170,8 +5284,6 @@ Specify the programming language for the generated parser.  Currently
  supported languages include C, C++, and Java.
  @var{language} is case-insensitive.
  
-This directive is experimental and its effect may be modified in future
-releases.
  @end deffn
  
  @deffn {Directive} %locations
@@ -5373,9 +5485,41 @@ Some of the accepted @var{variable}s are:
  @item Purpose: Request a pure (reentrant) parser program.
  @xref{Pure Decl, ,A Pure (Reentrant) Parser}.
  
-@item Accepted Values: Boolean
+@item Accepted Values: @code{true}, @code{false}, @code{full}
+
+The value may be omitted: this is equivalent to specifying @code{true}, as is
+the case for Boolean values.
+
+When @code{%define api.pure full} is used, the parser is made reentrant. This
+changes the signature for @code{yylex} (@pxref{Pure Calling}), and also that of
+@code{yyerror} when the tracking of locations has been activated, as shown
+below.
+
+The @code{true} value is very similar to the @code{full} value; the only
+difference is in the signature of @code{yyerror} on Yacc parsers without
+@code{%parse-param}, for historical reasons.
+
+I.e., if @samp{%locations %define api.pure} is passed then the prototypes for
+@code{yyerror} are:
+
+@example
+void yyerror (char const *msg);                 // Yacc parsers.
+void yyerror (YYLTYPE *locp, char const *msg);  // GLR parsers.
+@end example
+
+But if @samp{%locations %define api.pure %parse-param @{int *nastiness@}} is
+used, then both parsers have the same signature:
+
+@example
+void yyerror (YYLTYPE *llocp, int *nastiness, char const *msg);
+@end example
+
+(@pxref{Error Reporting, ,The Error
+Reporting Function @code{yyerror}})
  
  @item Default Value: @code{false}
+
+@item History: the @code{full} value was introduced in Bison 2.7
  @end itemize
  
  @c ================================================== api.push-pull
@@ -5820,6 +5964,27 @@ In the grammar actions, use expressions like this to refer to the data:
  exp: @dots{}    @{ @dots{}; *randomness += 1; @dots{} @}
  @end example
  
+@noindent
+Using the following:
+@example
+%parse-param @{int *randomness@}
+@end example
+
+Results in these signatures:
+@example
+void yyerror (int *randomness, const char *msg);
+int  yyparse (int *randomness);
+@end example
+
+@noindent
+Or, if both @code{%define api.pure full} (or just @code{%define api.pure})
+and @code{%locations} are used:
+
+@example
+void yyerror (YYLTYPE *llocp, int *randomness, const char *msg);
+int  yyparse (int *randomness);
+@end example
+
  @node Push Parser Function
  @section The Push Parser Function @code{yypush_parse}
  @findex yypush_parse
@@ -6071,7 +6236,7 @@ The data type of @code{yylloc} has the name @code{YYLTYPE}.
  @node Pure Calling
  @subsection Calling Conventions for Pure Parsers
  
-When you use the Bison declaration @code{%define api.pure} to request a
+When you use the Bison declaration @code{%define api.pure full} to request a
  pure, reentrant parser, the global communication variables @code{yylval}
  and @code{yylloc} cannot be used.  (@xref{Pure Decl, ,A Pure (Reentrant)
  Parser}.)  In such parsers the two global variables are replaced by
@@ -6106,35 +6271,25 @@ Declare that the braced-code @var{argument-declaration} is an
  additional @code{yylex} argument declaration.
  @end deffn
  
+@noindent
  For instance:
  
  @example
-%parse-param @{int *nastiness@}
  %lex-param   @{int *nastiness@}
-%parse-param @{int *randomness@}
  @end example
  
  @noindent
-results in the following signatures:
+results in the following signature:
  
  @example
-int yylex   (int *nastiness);
-int yyparse (int *nastiness, int *randomness);
-@end example
-
-If @code{%define api.pure} is added:
-
-@example
-int yylex   (YYSTYPE *lvalp, int *nastiness);
-int yyparse (int *nastiness, int *randomness);
+int yylex (int *nastiness);
  @end example
  
  @noindent
-and finally, if both @code{%define api.pure} and @code{%locations} are used:
+If @code{%define api.pure full} (or just @code{%define api.pure}) is added:
  
  @example
-int yylex   (YYSTYPE *lvalp, YYLTYPE *llocp, int *nastiness);
-int yyparse (int *nastiness, int *randomness);
+int yylex (YYSTYPE *lvalp, int *nastiness);
  @end example
  
  @node Error Reporting
@@ -6194,50 +6349,16 @@ error recovery if you have written suitable error recovery grammar rules
  immediately return 1.
  
  Obviously, in location tracking pure parsers, @code{yyerror} should have
-an access to the current location.
-This is indeed the case for the GLR
-parsers, but not for the Yacc parser, for historical reasons.  I.e., if
-@samp{%locations %define api.pure} is passed then the prototypes for
-@code{yyerror} are:
-
-@example
-void yyerror (char const *msg);                 /* Yacc parsers.  */
-void yyerror (YYLTYPE *locp, char const *msg);  /* GLR parsers.   */
-@end example
-
-If @samp{%parse-param @{int *nastiness@}} is used, then:
-
-@example
-void yyerror (int *nastiness, char const *msg);  /* Yacc parsers.  */
-void yyerror (int *nastiness, char const *msg);  /* GLR parsers.   */
-@end example
-
-Finally, GLR and Yacc parsers share the same @code{yyerror} calling
-convention for absolutely pure parsers, i.e., when the calling
-convention of @code{yylex} @emph{and} the calling convention of
-@code{%define api.pure} are pure.
-I.e.:
-
-@example
-/* Location tracking.  */
-%locations
-/* Pure yylex.  */
-%define api.pure
-%lex-param   @{int *nastiness@}
-/* Pure yyparse.  */
-%parse-param @{int *nastiness@}
-%parse-param @{int *randomness@}
-@end example
+access to the current location.  With @code{%define api.pure}, this is
+indeed the case for the GLR parsers, but not for the Yacc parser, for
+historical reasons, and this is why @code{%define api.pure full} should be
+preferred over @code{%define api.pure}.
  
-@noindent
-results in the following signatures for all the parser kinds:
+When @code{%locations %define api.pure full} is used, @code{yyerror} has the
+following signature:
  
  @example
-int yylex (YYSTYPE *lvalp, YYLTYPE *llocp, int *nastiness);
-int yyparse (int *nastiness, int *randomness);
-void yyerror (YYLTYPE *locp,
-              int *nastiness, int *randomness,
-              char const *msg);
+void yyerror (YYLTYPE *locp, char const *msg);
  @end example
  
  @noindent
@@ -6379,7 +6500,6 @@ Actions}).
  @end deffn
  
  @deffn {Value} @@$
-@findex @@$
  Acts like a structure variable containing information on the textual
  location of the grouping made by the current rule.  @xref{Tracking
  Locations}.
@@ -6438,7 +6558,7 @@ GNU Automake.
  @item
  @cindex bison-i18n.m4
  Into the directory containing the GNU Autoconf macros used
-by the package---often called @file{m4}---copy the
+by the package ---often called @file{m4}--- copy the
  @file{bison-i18n.m4} file installed by Bison under
  @samp{share/aclocal/bison-i18n.m4} in Bison's installation directory.
  For example:
@@ -7355,9 +7475,9 @@ mysterious behavior altogether.  You simply need to activate a more powerful
  parser table construction algorithm by using the @code{%define lr.type}
  directive.
  
-@deffn {Directive} {%define lr.type @var{TYPE}}
+@deffn {Directive} {%define lr.type} @var{type}
  Specify the type of parser tables within the LR(1) family.  The accepted
-values for @var{TYPE} are:
+values for @var{type} are:
  
  @itemize
  @item @code{lalr} (default)
@@ -7544,9 +7664,9 @@ split the parse instead.
  To adjust which states have default reductions enabled, use the
  @code{%define lr.default-reductions} directive.
  
-@deffn {Directive} {%define lr.default-reductions @var{WHERE}}
+@deffn {Directive} {%define lr.default-reductions} @var{where}
  Specify the kind of states that are permitted to contain default reductions.
-The accepted values of @var{WHERE} are:
+The accepted values of @var{where} are:
  @itemize
  @item @code{most} (default for LALR and IELR)
  @item @code{consistent}
@@ -7584,7 +7704,7 @@ that solves these problems for canonical LR, IELR, and LALR without
  sacrificing @code{%nonassoc}, default reductions, or state merging.  You can
  enable LAC with the @code{%define parse.lac} directive.
  
-@deffn {Directive} {%define parse.lac @var{VALUE}}
+@deffn {Directive} {%define parse.lac} @var{value}
  Enable LAC to improve syntax error handling.
  @itemize
  @item @code{none} (default)
@@ -7680,9 +7800,9 @@ resolution because they are useless in the generated parser.  However,
  keeping unreachable states is sometimes useful when trying to understand the
  relationship between the parser and the grammar.
  
-@deffn {Directive} {%define lr.keep-unreachable-states @var{VALUE}}
+@deffn {Directive} {%define lr.keep-unreachable-states} @var{value}
  Request that Bison allow unreachable states to remain in the parser tables.
-@var{VALUE} must be a Boolean.  The default is @code{false}.
+@var{value} must be a Boolean.  The default is @code{false}.
  @end deffn
  
  There are a few caveats to consider:
@@ -8184,8 +8304,26 @@ clear the flag.
  
  Developing a parser can be a challenge, especially if you don't understand
  the algorithm (@pxref{Algorithm, ,The Bison Parser Algorithm}).  This
-chapter explains how to generate and read the detailed description of the
-automaton, and how to enable and understand the parser run-time traces.
+chapter explains how to understand and debug a parser.
+
+The first sections focus on the static part of the parser: its structure.
+They explain how to generate and read the detailed description of the
+automaton.  There are several formats available:
+@itemize @minus
+@item
+as text, see @ref{Understanding, , Understanding Your Parser};
+
+@item
+as a graph, see @ref{Graphviz,, Visualizing Your Parser};
+
+@item
+or as a markup report that can be turned, for instance, into HTML, see
+@ref{Xml,, Visualizing your parser in multiple formats}.
+@end itemize
+
+The last section focuses on the dynamic part of the parser: how to enable
+and understand the parser run-time traces (@pxref{Tracing, ,Tracing Your
+Parser}).
  
  @menu
  * Understanding::     Understanding the structure of your parser.
@@ -8200,8 +8338,7 @@ automaton, and how to enable and understand the parser run-time traces.
  As documented elsewhere (@pxref{Algorithm, ,The Bison Parser Algorithm})
  Bison parsers are @dfn{shift/reduce automata}.  In some cases (much more
  frequent than one would hope), looking at this automaton is required to
-tune or simply fix a parser.  Bison provides two different
-representation of it, either textually or graphically (as a DOT file).
+tune or simply fix a parser.
  
  The textual file is generated when the options @option{--report} or
  @option{--verbose} are specified, see @ref{Invocation, , Invoking
@@ -8215,9 +8352,12 @@ The following grammar file, @file{calc.y}, will be used in the sequel:
  
  @example
  %token NUM STR
+@group
  %left '+' '-'
  %left '*'
+@end group
  %%
+@group
  exp:
    exp '+' exp
  | exp '-' exp
@@ -8225,6 +8365,7 @@ exp:
  | exp '/' exp
  | NUM
  ;
+@end group
  useless: STR;
  %%
  @end example
@@ -8234,8 +8375,8 @@ useless: STR;
  @example
  calc.y: warning: 1 nonterminal useless in grammar
  calc.y: warning: 1 rule useless in grammar
-calc.y:11.1-7: warning: nonterminal useless in grammar: useless
-calc.y:11.10-12: warning: rule useless in grammar: useless: STR
+calc.y:12.1-7: warning: nonterminal useless in grammar: useless
+calc.y:12.10-12: warning: rule useless in grammar: useless: STR
  calc.y: conflicts: 7 shift/reduce
  @end example
  
@@ -8329,7 +8470,7 @@ item is a production rule together with a point (@samp{.}) marking
  the location of the input cursor.
  
  @example
-state 0
+State 0
  
      0 $accept: . exp $end
  
@@ -8359,7 +8500,7 @@ you want to see more detail you can invoke @command{bison} with
  @option{--report=itemset} to list the derived items as well:
  
  @example
-state 0
+State 0
  
      0 $accept: . exp $end
      1 exp: . exp '+' exp
@@ -8377,7 +8518,7 @@ state 0
  In the state 1@dots{}
  
  @example
-state 1
+State 1
  
      5 exp: NUM .
  
@@ -8387,11 +8528,11 @@ state 1
  @noindent
  the rule 5, @samp{exp: NUM;}, is completed.  Whatever the lookahead token
  (@samp{$default}), the parser will reduce it.  If it was coming from
-state 0, then, after this reduction it will return to state 0, and will
+state 0, then, after this reduction it will return to state 0, and will
  jump to state 2 (@samp{exp: go to state 2}).
  
  @example
-state 2
+State 2
  
      0 $accept: exp . $end
      1 exp: exp . '+' exp
@@ -8419,7 +8560,7 @@ The state 3 is named the @dfn{final state}, or the @dfn{accepting
  state}:
  
  @example
-state 3
+State 3
  
      0 $accept: exp $end .
  
@@ -8434,7 +8575,7 @@ The interpretation of states 4 to 7 is straightforward, and is left to
  the reader.
  
  @example
-state 4
+State 4
  
      1 exp: exp '+' . exp
  
@@ -8443,7 +8584,7 @@ state 4
      exp  go to state 8
  
  
-state 5
+State 5
  
      2 exp: exp '-' . exp
  
@@ -8452,7 +8593,7 @@ state 5
      exp  go to state 9
  
  
-state 6
+State 6
  
      3 exp: exp '*' . exp
  
@@ -8461,7 +8602,7 @@ state 6
      exp  go to state 10
  
  
-state 7
+State 7
  
      4 exp: exp '/' . exp
  
@@ -8474,7 +8615,7 @@ As was announced in beginning of the report, @samp{State 8 conflicts:
  1 shift/reduce}:
  
  @example
-state 8
+State 8
  
      1 exp: exp . '+' exp
      1    | exp '+' exp .
@@ -8517,7 +8658,7 @@ with some set of possible lookahead tokens.  When run with
  @option{--report=lookahead}, Bison specifies these lookahead tokens:
  
  @example
-state 8
+State 8
  
      1 exp: exp . '+' exp
      1    | exp '+' exp .  [$end, '+', '-', '/']
@@ -8549,7 +8690,7 @@ The remaining states are similar:
  
  @example
  @group
-state 9
+State 9
  
      1 exp: exp . '+' exp
      2    | exp . '-' exp
@@ -8565,7 +8706,7 @@ state 9
  @end group
  
  @group
-state 10
+State 10
  
      1 exp: exp . '+' exp
      2    | exp . '-' exp
@@ -8580,7 +8721,7 @@ state 10
  @end group
  
  @group
-state 11
+State 11
  
      1 exp: exp . '+' exp
      2    | exp . '-' exp
@@ -8603,12 +8744,11 @@ state 11
  
  @noindent
  Observe that state 11 contains conflicts not only due to the lack of
-precedence of @samp{/} with respect to @samp{+}, @samp{-}, and
-@samp{*}, but also because the
-associativity of @samp{/} is not specified.
+precedence of @samp{/} with respect to @samp{+}, @samp{-}, and @samp{*}, but
+also because the associativity of @samp{/} is not specified.
  
-Note that Bison may also produce an HTML version of this output, via an XML
-file and XSLT processing (@pxref{Xml}).
+Bison may also produce an HTML version of this output, via an XML file and
+XSLT processing (@pxref{Xml,,Visualizing your parser in multiple formats}).
  
  @c ================================================= Graphical Representation
  
@@ -8628,7 +8768,10 @@ This file is generated when the @option{--graph} option is specified
  (@pxref{Invocation, , Invoking Bison}).  Its name is made by removing
  @samp{.tab.c} or @samp{.c} from the parser implementation file name, and
  adding @samp{.dot} instead.  If the grammar file is @file{foo.y}, the
-Graphviz output file is called @file{foo.dot}.
+Graphviz output file is called @file{foo.dot}.  A DOT file may also be
+produced via an XML file and XSLT processing (@pxref{Xml,,Visualizing your
+parser in multiple formats}).
+
  
  The following grammar file, @file{rr.y}, will be used in the sequel:
  
@@ -8641,10 +8784,20 @@ b: "0";
  @end group
  @end example
  
-The graphical output is very similar to the textual one, and as such it is
-easier understood by making direct comparisons between them. See
-@ref{Debugging, , Debugging Your Parser} for a detailled analysis of the
-textual report.
+The graphical output
+@ifnotinfo
+(see @ref{fig:graph})
+@end ifnotinfo
+is very similar to the textual one, and as such it is more easily understood
+by making direct comparisons between them.  @xref{Debugging, , Debugging Your
+Parser}, for a detailed analysis of the textual report.
+
+@ifnotinfo
+@float Figure,fig:graph
+@image{figs/example, 430pt}
+@caption{A graphical rendering of the parser.}
+@end float
+@end ifnotinfo
  
  @subheading Graphical Representation of States
  
@@ -8669,7 +8822,7 @@ shift. The following describes a reduction in the @file{rr.output} file:
  
  @example
  @group
-state 3
+State 3
  
      1 exp: a . ";"
  
@@ -8690,7 +8843,7 @@ action for the given state, there is no such label.
  
  This is how reductions are represented in the verbose file @file{rr.output}:
  @example
-state 1
+State 1
  
      3 a: "0" .  [";"]
      4 b: "0" .  ["."]
@@ -8709,17 +8862,14 @@ reduction, see @ref{Shift/Reduce, , Shift/Reduce Conflicts}.  Discarded actions
  are distinguished by a red filling color on these nodes, just like how they are
  reported between square brackets in the verbose file.
  
-The reduction corresponding to the rule number 0 is the acceptation state. It
-is shown as a blue diamond, labelled "Acc".
+The reduction corresponding to the rule number 0 is the accepting
+state. It is shown as a blue diamond, labelled ``Acc''.
  
  @subheading Graphical representation of go tos
  
  The @samp{go to} jump transitions are represented as dotted lines bearing
  the name of the rule being jumped to.
  
-Note that a DOT file may also be produced via an XML file and XSLT
-processing (@pxref{Xml}).
-
  @c ================================================= XML
  
  @node Xml
@@ -8727,8 +8877,10 @@ processing (@pxref{Xml}).
  @cindex xml
  
  Bison supports two major report formats: textual output
-(@pxref{Understanding}) when invoked with option @option{--verbose}, and DOT
-(@pxref{Graphviz}) when invoked with option @option{--graph}. However,
+(@pxref{Understanding, ,Understanding Your Parser}) when invoked
+with option @option{--verbose}, and DOT
+(@pxref{Graphviz,, Visualizing Your Parser}) when invoked with
+option @option{--graph}. However,
  another alternative is to output an XML file that may then be, with
  @command{xsltproc}, rendered as either a raw text format equivalent to the
  verbose file, or as an HTML version of the same file, with clickable
@@ -8736,7 +8888,7 @@ transitions, or even as a DOT. The @file{.output} and DOT files obtained via
  XSLT have no difference whatsoever with those obtained by invoking
  @command{bison} with options @option{--verbose} or @option{--graph}.
  
-The textual file is generated when the options @option{-x} or
+The XML file is generated when the options @option{-x} or
  @option{--xml[=FILE]} are specified, see @ref{Invocation,,Invoking Bison}.
  If not specified, its name is made by removing @samp{.tab.c} or @samp{.c}
  from the parser implementation file name, and adding @samp{.xml} instead.
@@ -8750,19 +8902,19 @@ files to apply to the XML file. Their names are non-ambiguous:
  @item xml2dot.xsl
  Used to output a copy of the DOT visualization of the automaton.
  @item xml2text.xsl
-Used to output a copy of the .output file.
+Used to output a copy of the @samp{.output} file.
  @item xml2xhtml.xsl
-Used to output an xhtml enhancement of the .output file.
+Used to output an xhtml enhancement of the @samp{.output} file.
  @end table
  
-Sample usage (requires @code{xsltproc}):
+Sample usage (requires @command{xsltproc}):
  @example
-$ bison -x input.y
+$ bison -x gr.y
  @group
  $ bison --print-datadir
  /usr/local/share/bison
  @end group
-$ xsltproc /usr/local/share/bison/xslt/xml2xhtml.xsl input.xml > input.html
+$ xsltproc /usr/local/share/bison/xslt/xml2xhtml.xsl gr.xml >gr.html
  @end example
  
  @c ================================================= Tracing
@@ -8953,7 +9105,7 @@ Entering state 24
  
  @noindent
  The previous reduction demonstrates the @code{%printer} directive for
-@code{<val>}: both the token @code{NUM} and the resulting non-terminal
+@code{<val>}: both the token @code{NUM} and the resulting nonterminal
  @code{exp} have @samp{1} as value.
  
  @example
@@ -9232,6 +9384,56 @@ Treat warnings as errors.
  A category can be turned off by prefixing its name with @samp{no-}.  For
  instance, @option{-Wno-yacc} will hide the warnings about
  POSIX Yacc incompatibilities.
+
+@item -f [@var{feature}]
+@itemx --feature[=@var{feature}]
+Activate miscellaneous @var{feature}. @var{feature} can be one of:
+@table @code
+@item caret
+@itemx diagnostics-show-caret
+Show caret errors, in a manner similar to GCC's
+@option{-fdiagnostics-show-caret}, or Clang's @option{-fcaret-diagnostics}. The
+location provided with the message is used to quote the corresponding line of
+the source file, underlining the important part of it with carets (^). Here is
+an example, using the following file @file{in.y}:
+
+@example
+%type <ival> exp
+%%
+exp: exp '+' exp @{ $exp = $1 + $2; @};
+@end example
+
+When invoked with @option{-fcaret}, Bison will report:
+
+@example
+@group
+in.y:3.20-23: error: ambiguous reference: '$exp'
+ exp: exp '+' exp @{ $exp = $1 + $2; @};
+                    ^^^^
+@end group
+@group
+in.y:3.1-3:       refers to: $exp at $$
+ exp: exp '+' exp @{ $exp = $1 + $2; @};
+ ^^^
+@end group
+@group
+in.y:3.6-8:       refers to: $exp at $1
+ exp: exp '+' exp @{ $exp = $1 + $2; @};
+      ^^^
+@end group
+@group
+in.y:3.14-16:     refers to: $exp at $3
+ exp: exp '+' exp @{ $exp = $1 + $2; @};
+              ^^^
+@end group
+@group
+in.y:3.32-33: error: $2 of 'exp' has no declared type
+ exp: exp '+' exp @{ $exp = $1 + $2; @};
+                                ^^
+@end group
+@end example
+
+@end table
  @end table
  
  @noindent
@@ -9280,9 +9482,6 @@ Specify the programming language for the generated parser, as if
  Summary}).  Currently supported languages include C, C++, and Java.
  @var{language} is case-insensitive.
  
-This option is experimental and its effect may be modified in future
-releases.
-
  @item --locations
  Pretend that @code{%locations} was specified.  @xref{Decl Summary}.
  
@@ -9790,7 +9989,7 @@ described by @var{m}.
  
  The parser invokes the scanner by calling @code{yylex}.  Contrary to C
  parsers, C++ parsers are always pure: there is no point in using the
-@code{%define api.pure} directive.  Therefore the interface is as follows.
+@code{%define api.pure full} directive.  Therefore the interface is as follows.
  
  @deftypemethod {parser} {int} yylex (semantic_type* @var{yylval}, location_type* @var{yylloc}, @var{type1} @var{arg1}, ...)
  Return the next token.  Its type is the return value, its semantic
@@ -10241,19 +10440,30 @@ It is convenient to use a typedef to shorten
  %@{
    typedef yy::calcxx_parser::token token;
  %@}
-           /* Convert ints to the actual type of tokens.  */
-[-+*/]     return yy::calcxx_parser::token_type (yytext[0]);
-":="       return token::ASSIGN;
-@{int@}      @{
-  errno = 0;
-  long n = strtol (yytext, NULL, 10);
-  if (! (INT_MIN <= n && n <= INT_MAX && errno != ERANGE))
-    driver.error (*yylloc, "integer is out of range");
-  yylval->ival = n;
-  return token::NUMBER;
-@}
-@{id@}       yylval->sval = new std::string (yytext); return token::IDENTIFIER;
-.          driver.error (*yylloc, "invalid character");
+         /* Convert ints to the actual type of tokens.  */
+[-+*/]   return yy::calcxx_parser::token_type (yytext[0]);
+
+":="     return token::ASSIGN;
+
+@group
+@{int@}    @{
+           errno = 0;
+           long n = strtol (yytext, NULL, 10);
+           if (! (INT_MIN <= n && n <= INT_MAX && errno != ERANGE))
+             driver.error (*yylloc, "integer is out of range");
+           yylval->ival = n;
+           return token::NUMBER;
+         @}
+@end group
+
+@group
+@{id@}     @{
+           yylval->sval = new std::string (yytext);
+           return token::IDENTIFIER;
+         @}
+@end group
+
+.        driver.error (*yylloc, "invalid character");
  %%
  @end example
  
@@ -10353,7 +10563,7 @@ You can create documentation for generated parsers using Javadoc.
  Contrary to C parsers, Java parsers do not use global variables; the
  state of the parser is always local to an instance of the parser class.
  Therefore, all Java parsers are ``pure'', and the @code{%pure-parser}
-and @code{%define api.pure} directives does not do anything when used in
+and @code{%define api.pure full} directives do not do anything when used in
  Java.
  
  Push parsers are currently unsupported in Java and @code{%define
@@ -10936,7 +11146,7 @@ or
  @quotation
  My parser includes support for an @samp{#include}-like feature, in
  which case I run @code{yyparse} from @code{yyparse}.  This fails
-although I did specify @samp{%define api.pure}.
+although I did specify @samp{%define api.pure full}.
  @end quotation
  
  These problems typically come not from Bison itself, but from
@@ -11299,18 +11509,23 @@ In an action, the location of the left-hand side of the rule.
  @end deffn
  
  @deffn {Variable} @@@var{n}
+@deffnx {Symbol} @@@var{n}
  In an action, the location of the @var{n}-th symbol of the right-hand side
  of the rule.  @xref{Tracking Locations}.
+
+In a grammar, the Bison-generated nonterminal symbol for a mid-rule action
+with a semantic value.  @xref{Mid-Rule Action Translation}.
  @end deffn
  
  @deffn {Variable} @@@var{name}
-In an action, the location of a symbol addressed by name.  @xref{Tracking
-Locations}.
+@deffnx {Variable} @@[@var{name}]
+In an action, the location of a symbol addressed by @var{name}.
+@xref{Tracking Locations}.
  @end deffn
  
-@deffn {Variable} @@[@var{name}]
-In an action, the location of a symbol addressed by name.  @xref{Tracking
-Locations}.
+@deffn {Symbol} $@@@var{n}
+In a grammar, the Bison-generated nonterminal symbol for a mid-rule action
+with no semantic value.  @xref{Mid-Rule Action Translation}.
  @end deffn
  
  @deffn {Variable} $$
@@ -11324,12 +11539,8 @@ right-hand side of the rule.  @xref{Actions}.
  @end deffn
  
  @deffn {Variable} $@var{name}
-In an action, the semantic value of a symbol addressed by name.
-@xref{Actions}.
-@end deffn
-
-@deffn {Variable} $[@var{name}]
-In an action, the semantic value of a symbol addressed by name.
+@deffnx {Variable} $[@var{name}]
+In an action, the semantic value of a symbol addressed by @var{name}.
  @xref{Actions}.
  @end deffn
  
@@ -11347,8 +11558,9 @@ the grammar file.  @xref{Grammar Outline, ,Outline of a Bison
  Grammar}.
  @end deffn
  
-@deffn {Construct} /*@dots{}*/
-Comment delimiters, as in C.
+@deffn {Construct} /* @dots{} */
+@deffnx {Construct} // @dots{}
+Comments, as in C/C++.
  @end deffn
  
  @deffn {Delimiter} :
@@ -11831,7 +12043,7 @@ Data type of semantic values; @code{int} by default.
  @item Accepting state
  A state whose only action is the accept action.
  The accepting state is thus a consistent state.
-@xref{Understanding,,}.
+@xref{Understanding, ,Understanding Your Parser}.
  
  @item Backus-Naur Form (BNF; also called ``Backus Normal Form'')
  Formal method of specifying context-free grammars originally proposed