tests: enhance existing tests with carets

[bison.git] / tests / conflicts.at
diff --git a/tests/conflicts.at b/tests/conflicts.at

index f455d1f5627cdd13446a8cdb7ec30e0013231c1d..5653b481f4f93248a176c332074385dcc4c45862 100644 (file)
--- a/tests/conflicts.at
+++ b/tests/conflicts.at
@@ -1,7 +1,7 @@
  # Exercising Bison on conflicts.                         -*- Autotest -*-
  
-# Copyright (C) 2002, 2003, 2004, 2005, 2007, 2009, 2010 Free
-# Software Foundation, Inc.
+# Copyright (C) 2002-2005, 2007, 2009-2012 Free Software Foundation,
+# Inc.
  
  # This program is free software: you can redistribute it and/or modify
  # it under the terms of the GNU General Public License as published by
@@ -41,6 +41,12 @@ AT_BISON_CHECK([-o input.c input.y], 0, [],
  [[input.y:4.9: warning: rule useless in parser due to conflicts: e: /* empty */
  ]])
  
+AT_BISON_CHECK([-fcaret -o input.c input.y], 0, [],
+[[input.y:4.9: warning: rule useless in parser due to conflicts
+ e: 'e' | /* Nothing. */;
+         ^
+]])
+
  AT_CLEANUP
  
  
@@ -50,20 +56,17 @@ AT_CLEANUP
  
  AT_SETUP([%nonassoc and eof])
  
+AT_BISON_OPTION_PUSHDEFS
  AT_DATA_GRAMMAR([input.y],
  [[
  %{
  #include <stdio.h>
  #include <stdlib.h>
  #include <string.h>
+#include <assert.h>
  
  #define YYERROR_VERBOSE 1
-static void
-yyerror (const char *msg)
-{
-  fprintf (stderr, "%s\n", msg);
-}
-
+]AT_YYERROR_DEFINE[
  /* The current argument. */
  static const char *input;
  
@@ -71,8 +74,7 @@ static int
  yylex (void)
  {
    static size_t toknum;
-  if (! (toknum <= strlen (input)))
-    abort ();
+  assert (toknum <= strlen (input));
    return input[toknum++];
  }
  
@@ -93,47 +95,54 @@ main (int argc, const char *argv[])
    return yyparse ();
  }
  ]])
+AT_BISON_OPTION_POPDEFS
  
-# Specify the output files to avoid problems on different file systems.
-AT_BISON_CHECK([-o input.c input.y])
+m4_pushdef([AT_NONASSOC_AND_EOF_CHECK],
+[AT_BISON_CHECK([$1[ -o input.c input.y]])
  AT_COMPILE([input])
  
+m4_pushdef([AT_EXPECTING], [m4_if($2, [correct], [[, expecting $end]])])
+
  AT_PARSER_CHECK([./input '0<0'])
  AT_PARSER_CHECK([./input '0<0<0'], [1], [],
-         [syntax error, unexpected '<'
+         [syntax error, unexpected '<'AT_EXPECTING
  ])
  
  AT_PARSER_CHECK([./input '0>0'])
  AT_PARSER_CHECK([./input '0>0>0'], [1], [],
-         [syntax error, unexpected '>'
+         [syntax error, unexpected '>'AT_EXPECTING
  ])
  
  AT_PARSER_CHECK([./input '0<0>0'], [1], [],
-         [syntax error, unexpected '>'
+         [syntax error, unexpected '>'AT_EXPECTING
  ])
  
-# We must disable default reductions in inconsistent states in order to
-# have an explicit list of all expected tokens.  (However, unless we use
-# canonical LR, lookahead sets are merged for different left contexts,
-# so it is still possible to have extra incorrect tokens in the expected
-# list.  That just doesn't happen to be a problem for this test case.)
-
-AT_BISON_CHECK([-Dlr.default-reductions=consistent -o input.c input.y])
-AT_COMPILE([input])
-
-AT_PARSER_CHECK([./input '0<0'])
-AT_PARSER_CHECK([./input '0<0<0'], [1], [],
-         [syntax error, unexpected '<', expecting $end
-])
+m4_popdef([AT_EXPECTING])])
  
-AT_PARSER_CHECK([./input '0>0'])
-AT_PARSER_CHECK([./input '0>0>0'], [1], [],
-         [syntax error, unexpected '>', expecting $end
-])
+# With no extra options, the expected token list is missing.
+AT_NONASSOC_AND_EOF_CHECK([], [[incorrect]])
  
-AT_PARSER_CHECK([./input '0<0>0'], [1], [],
-         [syntax error, unexpected '>', expecting $end
-])
+# We must disable default reductions in inconsistent states in order to
+# have an explicit list of all expected tokens.
+AT_NONASSOC_AND_EOF_CHECK([[-Dlr.default-reductions=consistent]],
+                          [[correct]])
+
+# lr.default-reductions=consistent happens to work for this test case.
+# However, for other grammars, lookahead sets can be merged for
+# different left contexts, so it is still possible to have an incorrect
+# expected list.  Canonical LR is almost a general solution (that is, it
+# can fail only when %nonassoc is used), so make sure it gives the same
+# result as above.
+AT_NONASSOC_AND_EOF_CHECK([[-Dlr.type=canonical-lr]], [[correct]])
+
+# parse.lac=full is a completely general solution that does not require
+# any of the above sacrifices.  Of course, it does not extend the
+# language-recognition power of LALR to (IE)LR, but it does ensure that
+# the reported list of expected tokens matches what the given parser
+# would have accepted in place of the unexpected token.
+AT_NONASSOC_AND_EOF_CHECK([[-Dparse.lac=full]], [[correct]])
+
+m4_popdef([AT_NONASSOC_AND_EOF_CHECK])
  
  AT_CLEANUP
  
@@ -165,7 +174,7 @@ AT_SKEL_JAVA_IF([AT_DATA], [AT_DATA_GRAMMAR])([input.y],
    #include <string>]], [[
    #include <assert.h>
    #include <stdio.h>
-  void yyerror (char const *msg);]])[
+  ]AT_YYERROR_DECLARE])[
    ]AT_YYLEX_PROTOTYPE[;
    #define USE(Var)
  }
@@ -206,31 +215,11 @@ public Object getLVal ()
    *lvalp = 1;
    return *input++;
  }]])[
-
-/*----------.
-| yyerror.  |
-`----------*/]AT_SKEL_JAVA_IF([[
-
-public void yyerror (String msg)
-{
-  System.err.println (msg);
-}
-
+]AT_YYERROR_DEFINE[
+]AT_SKEL_JAVA_IF([[
  };
  
-%%]], [AT_SKEL_CC_IF([[
-
-void
-yy::parser::error (const yy::location &, std::string const &msg)
-{
-  std::cerr << msg << std::endl;
-}]], [[
-
-void
-yyerror (char const *msg)
-{
-  fprintf (stderr, "%s\n", msg);
-}]])])[
+%%]])[
  
  /*-------.
  | main.  |
@@ -343,6 +332,18 @@ AT_CONSISTENT_ERRORS_CHECK([[%define lr.type canonical-lr]],
                             [AT_PREVIOUS_STATE_INPUT],
                             [[$end]], [[ab]])
  
+# Only LAC gets it right.
+AT_CONSISTENT_ERRORS_CHECK([[%define lr.type canonical-lr
+                             %define parse.lac full]],
+                           [AT_PREVIOUS_STATE_GRAMMAR],
+                           [AT_PREVIOUS_STATE_INPUT],
+                           [[$end]], [[b]])
+AT_CONSISTENT_ERRORS_CHECK([[%define lr.type ielr
+                             %define parse.lac full]],
+                           [AT_PREVIOUS_STATE_GRAMMAR],
+                           [AT_PREVIOUS_STATE_INPUT],
+                           [[$end]], [[b]])
+
  m4_popdef([AT_PREVIOUS_STATE_GRAMMAR])
  m4_popdef([AT_PREVIOUS_STATE_INPUT])
  
@@ -422,6 +423,16 @@ AT_CONSISTENT_ERRORS_CHECK([[%define lr.type canonical-lr]],
                             [AT_USER_ACTION_INPUT],
                             [[$end]], [[a]])
  
+AT_CONSISTENT_ERRORS_CHECK([[%define parse.lac full]],
+                           [AT_USER_ACTION_GRAMMAR],
+                           [AT_USER_ACTION_INPUT],
+                           [['b']], [[none]])
+AT_CONSISTENT_ERRORS_CHECK([[%define parse.lac full
+                             %define lr.default-reductions accepting]],
+                           [AT_USER_ACTION_GRAMMAR],
+                           [AT_USER_ACTION_INPUT],
+                           [[$end]], [[none]])
+
  m4_popdef([AT_USER_ACTION_GRAMMAR])
  m4_popdef([AT_USER_ACTION_INPUT])
  
@@ -431,6 +442,103 @@ AT_CLEANUP
  
  
  
+## ------------------------------------------------------- ##
+## LAC: %nonassoc requires splitting canonical LR states.  ##
+## ------------------------------------------------------- ##
+
+# This test case demonstrates that, when %nonassoc is used, canonical
+# LR(1) parser table construction followed by conflict resolution
+# without further state splitting is not always sufficient to produce a
+# parser that can detect all syntax errors as soon as possible on one
+# token of lookahead.  However, LAC solves the problem completely even
+# with minimal LR parser tables.
+
+AT_SETUP([[LAC: %nonassoc requires splitting canonical LR states]])
+AT_BISON_OPTION_PUSHDEFS
+AT_DATA_GRAMMAR([[input.y]],
+[[%code {
+  #include <stdio.h>
+  ]AT_YYERROR_DECLARE[
+  ]AT_YYLEX_DECLARE[
+}
+
+%error-verbose
+%nonassoc 'a'
+
+%%
+
+start:
+  'a' problem 'a' // First context.
+| 'b' problem 'b' // Second context.
+| 'c' reduce-nonassoc // Just makes reduce-nonassoc useful.
+;
+
+problem:
+  look reduce-nonassoc
+| look 'a'
+| look 'b'
+;
+
+// For the state reached after shifting the 'a' in these productions,
+// lookahead sets are the same in both the first and second contexts.
+// Thus, canonical LR reuses the same state for both contexts.  However,
+// the lookahead 'a' for the reduction "look: 'a'" later becomes an
+// error action only in the first context.  In order to immediately
+// detect the syntax error on 'a' here for only the first context, this
+// canonical LR state would have to be split into two states, and the
+// 'a' lookahead would have to be removed from only one of the states.
+look:
+  'a' // Reduction lookahead set is always ['a', 'b'].
+| 'a' 'b'
+| 'a' 'c' // 'c' is forgotten as an expected token.
+;
+
+reduce-nonassoc: %prec 'a';
+
+%%
+]AT_YYERROR_DEFINE[
+]AT_YYLEX_DEFINE(["aaa"])[
+
+int
+main (void)
+{
+  return yyparse ();
+}
+]])
+AT_BISON_OPTION_POPDEFS
+
+# Show canonical LR's failure.
+AT_BISON_CHECK([[-Dlr.type=canonical-lr -o input.c input.y]],
+               [[0]], [[]],
+[[input.y: conflicts: 2 shift/reduce
+]])
+AT_COMPILE([[input]])
+AT_PARSER_CHECK([[./input]], [[1]], [[]],
+[[syntax error, unexpected 'a', expecting 'b'
+]])
+
+# LAC corrects it: the expected token list now includes 'c'.
+AT_BISON_CHECK([[-Dlr.type=canonical-lr -Dparse.lac=full \
+                 -o input.c input.y]], [[0]], [[]],
+[[input.y: conflicts: 2 shift/reduce
+]])
+AT_COMPILE([[input]])
+AT_PARSER_CHECK([[./input]], [[1]], [[]],
+[[syntax error, unexpected 'a', expecting 'b' or 'c'
+]])
+
+# IELR is sufficient when LAC is used.
+AT_BISON_CHECK([[-Dlr.type=ielr -Dparse.lac=full -o input.c input.y]],
+               [[0]], [[]],
+[[input.y: conflicts: 2 shift/reduce
+]])
+AT_COMPILE([[input]])
+AT_PARSER_CHECK([[./input]], [[1]], [[]],
+[[syntax error, unexpected 'a', expecting 'b' or 'c'
+]])
+
+AT_CLEANUP
+
  ## ------------------------- ##
  ## Unresolved SR Conflicts.  ##
  ## ------------------------- ##
@@ -478,7 +586,7 @@ exp (6)
      on left: 1 2, on right: 0 1
  
  
-state 0
+State 0
  
      0 $accept: . exp $end
      1 exp: . exp OP exp
@@ -489,14 +597,14 @@ state 0
      exp  go to state 2
  
  
-state 1
+State 1
  
      2 exp: NUM .
  
      $default  reduce using rule 2 (exp)
  
  
-state 2
+State 2
  
      0 $accept: exp . $end
      1 exp: exp . OP exp
@@ -505,14 +613,14 @@ state 2
      OP    shift, and go to state 4
  
  
-state 3
+State 3
  
      0 $accept: exp $end .
  
      $default  accept
  
  
-state 4
+State 4
  
      1 exp: . exp OP exp
      1    | exp OP . exp
@@ -523,7 +631,7 @@ state 4
      exp  go to state 5
  
  
-state 5
+State 5
  
      1 exp: exp . OP exp
      1    | exp OP exp .  [$end, OP]
@@ -581,7 +689,7 @@ exp (6)
      on left: 1 2, on right: 0 1
  
  
-state 0
+State 0
  
      0 $accept: . exp $end
      1 exp: . exp OP exp
@@ -592,14 +700,14 @@ state 0
      exp  go to state 2
  
  
-state 1
+State 1
  
      2 exp: NUM .
  
      $default  reduce using rule 2 (exp)
  
  
-state 2
+State 2
  
      0 $accept: exp . $end
      1 exp: exp . OP exp
@@ -608,14 +716,14 @@ state 2
      OP    shift, and go to state 4
  
  
-state 3
+State 3
  
      0 $accept: exp $end .
  
      $default  accept
  
  
-state 4
+State 4
  
      1 exp: . exp OP exp
      1    | exp OP . exp
@@ -626,7 +734,7 @@ state 4
      exp  go to state 5
  
  
-state 5
+State 5
  
      1 exp: exp . OP exp
      1    | exp OP exp .  [$end, OP]
@@ -721,7 +829,7 @@ id (7)
      on left: 4, on right: 2
  
  
-state 0
+State 0
  
      0 $accept: . exp $end
      1 exp: . num
@@ -736,7 +844,7 @@ state 0
      id   go to state 4
  
  
-state 1
+State 1
  
      3 num: '0' .  [$end]
      4 id: '0' .  [$end]
@@ -746,28 +854,28 @@ state 1
      $default  reduce using rule 3 (num)
  
  
-state 2
+State 2
  
      0 $accept: exp . $end
  
      $end  shift, and go to state 5
  
  
-state 3
+State 3
  
      1 exp: num .
  
      $default  reduce using rule 1 (exp)
  
  
-state 4
+State 4
  
      2 exp: id .
  
      $default  reduce using rule 2 (exp)
  
  
-state 5
+State 5
  
      0 $accept: exp $end .
  
@@ -794,7 +902,7 @@ exp: exp OP exp | NUM;
  
  AT_BISON_CHECK([-o input.c input.y], 1, [],
  [input.y: conflicts: 1 shift/reduce
-input.y: expected 0 shift/reduce conflicts
+input.y: error: expected 0 shift/reduce conflicts
  ])
  AT_CLEANUP
  
@@ -831,7 +939,7 @@ exp: exp OP exp | NUM;
  
  AT_BISON_CHECK([-o input.c input.y], 1, [],
  [input.y: conflicts: 1 shift/reduce
-input.y: expected 2 shift/reduce conflicts
+input.y: error: expected 2 shift/reduce conflicts
  ])
  AT_CLEANUP
  
@@ -851,7 +959,7 @@ a: 'a';
  
  AT_BISON_CHECK([-o input.c input.y], 1, [],
  [input.y: conflicts: 1 reduce/reduce
-input.y: expected 0 reduce/reduce conflicts
+input.y: error: expected 0 reduce/reduce conflicts
  ])
  AT_CLEANUP
  
@@ -1068,7 +1176,7 @@ reported_conflicts (9)
      on left: 8 9 10, on right: 1
  
  
-state 0
+State 0
  
      0 $accept: . start $end
      1 start: . resolved_conflict 'a' reported_conflicts 'a'
@@ -1083,28 +1191,28 @@ state 0
      Conflict between rule 3 and token 'a' resolved as reduce (%left 'a').
  
  
-state 1
+State 1
  
      0 $accept: start . $end
  
      $end  shift, and go to state 3
  
  
-state 2
+State 2
  
      1 start: resolved_conflict . 'a' reported_conflicts 'a'
  
      'a'  shift, and go to state 4
  
  
-state 3
+State 3
  
      0 $accept: start $end .
  
      $default  accept
  
  
-state 4
+State 4
  
      1 start: resolved_conflict 'a' . reported_conflicts 'a'
      8 reported_conflicts: . 'a'
@@ -1118,7 +1226,7 @@ state 4
      reported_conflicts  go to state 6
  
  
-state 5
+State 5
  
      8 reported_conflicts: 'a' .  ['a']
      9                   | 'a' .  ['a']
@@ -1128,14 +1236,14 @@ state 5
      $default  reduce using rule 8 (reported_conflicts)
  
  
-state 6
+State 6
  
      1 start: resolved_conflict 'a' reported_conflicts . 'a'
  
      'a'  shift, and go to state 7
  
  
-state 7
+State 7
  
      1 start: resolved_conflict 'a' reported_conflicts 'a' .
  
@@ -1189,8 +1297,8 @@ empty_c2: %prec 'c' ;
  empty_c3: %prec 'd' ;
  ]])
  AT_BISON_CHECK([[--report=all -o input.c input.y]], 0, [], [ignore])
-AT_CHECK([[cat input.output | sed -n '/^state 0$/,/^state 1$/p']], 0,
-[[state 0
+AT_CHECK([[cat input.output | sed -n '/^State 0$/,/^State 1$/p']], 0,
+[[State 0
  
      0 $accept: . start $end
      1 start: . 'a'
@@ -1208,7 +1316,7 @@ AT_CHECK([[cat input.output | sed -n '/^state 0$/,/^state 1$/p']], 0,
     13 empty_c3: .  ['c']
  
      'b'  shift, and go to state 1
- 
+
      'c'       reduce using rule 13 (empty_c3)
      $default  reduce using rule 9 (empty_a)
  
@@ -1226,7 +1334,7 @@ AT_CHECK([[cat input.output | sed -n '/^state 0$/,/^state 1$/p']], 0,
      Conflict between rule 13 and token 'c' resolved as reduce ('c' < 'd').
  
  
-state 1
+State 1
  ]])
  
  AT_CLEANUP
@@ -1265,8 +1373,8 @@ empty_c3: %prec 'c' ;
  ]])
  
  AT_BISON_CHECK([[--report=all -o input.c input.y]], 0, [], [ignore])
-AT_CHECK([[cat input.output | sed -n '/^state 0$/,/^state 1$/p']], 0,
-[[state 0
+AT_CHECK([[cat input.output | sed -n '/^State 0$/,/^State 1$/p']], 0,
+[[State 0
  
      0 $accept: . start $end
      1 start: . 'a'
@@ -1302,6 +1410,107 @@ AT_CHECK([[cat input.output | sed -n '/^state 0$/,/^state 1$/p']], 0,
      Conflict between rule 11 and token 'c' resolved as an error (%nonassoc 'c').
  
  
-state 1
+State 1
  ]])
  AT_CLEANUP
+
+
+## --------------------------------- ##
+## -W versus %expect and %expect-rr  ##
+## --------------------------------- ##
+
+AT_SETUP([[-W versus %expect and %expect-rr]])
+
+AT_DATA([[sr-rr.y]],
+[[%glr-parser
+%%
+start: 'a' | A 'a' | B 'a' ;
+A: ;
+B: ;
+]])
+AT_DATA([[sr.y]],
+[[%glr-parser
+%%
+start: 'a' | A 'a' ;
+A: ;
+]])
+AT_DATA([[rr.y]],
+[[%glr-parser
+%%
+start: A | B ;
+A: ;
+B: ;
+]])
+
+AT_BISON_CHECK([[sr-rr.y]], [[0]], [[]],
+[[sr-rr.y: conflicts: 1 shift/reduce, 1 reduce/reduce
+]])
+AT_BISON_CHECK([[-Wno-conflicts-sr sr-rr.y]], [[0]], [[]],
+[[sr-rr.y: conflicts: 1 reduce/reduce
+]])
+AT_BISON_CHECK([[-Wno-conflicts-rr sr-rr.y]], [[0]], [[]],
+[[sr-rr.y: conflicts: 1 shift/reduce
+]])
+
+[for gram in sr-rr sr rr; do
+  for sr_exp_i in '' 0 1 2; do
+    for rr_exp_i in '' 0 1 2; do
+      test -z "$sr_exp_i" && test -z "$rr_exp_i" && continue
+
+      # Build grammar file.
+      sr_exp=0
+      rr_exp=0
+      file=$gram
+      directives=
+      if test -n "$sr_exp_i"; then
+        sr_exp=$sr_exp_i
+        file=$file-expect-$sr_exp
+        directives="%expect $sr_exp"
+      fi
+      if test -n "$rr_exp_i"; then
+        rr_exp=$rr_exp_i
+        file=$file-expect-rr-$rr_exp
+        directives="$directives %expect-rr $rr_exp"
+      fi
+      file=$file.y
+      echo "$directives" > $file
+      cat $gram.y >> $file
+
+      # Count actual conflicts.
+      conflicts=
+      sr_count=0
+      rr_count=0
+      if test $gram = sr || test $gram = sr-rr; then
+        conflicts="1 shift/reduce"
+        sr_count=1
+      fi
+      if test $gram = rr || test $gram = sr-rr; then
+        if test -n "$conflicts"; then
+          conflicts="$conflicts, "
+        fi
+        conflicts="${conflicts}1 reduce/reduce"
+        rr_count=1
+      fi
+
+      # Run tests.
+      if test $sr_count -eq $sr_exp && test $rr_count -eq $rr_exp; then
+        ]AT_BISON_CHECK([[-Wnone $file]])[
+        ]AT_BISON_CHECK([[-Werror $file]])[
+      else
+        echo "$file: conflicts: $conflicts" > experr
+        if test $sr_count -ne $sr_exp; then
+          if test $sr_exp -ne 1; then s=s; else s= ; fi
+          echo "$file: error: expected $sr_exp shift/reduce conflict$s" >> experr
+        fi
+        if test $rr_count -ne $rr_exp; then
+          if test $rr_exp -ne 1; then s=s; else s= ; fi
+          echo "$file: error: expected $rr_exp reduce/reduce conflict$s" >> experr
+        fi
+        ]AT_BISON_CHECK([[-Wnone $file]], [[1]], [[]], [[experr]])[
+        ]AT_BISON_CHECK([[-Werror $file]], [[1]], [[]], [[experr]])[
+      fi
+    done
+  done
+done]
+
+AT_CLEANUP