Remove the useless rules from the parser.

* src/gram.h, src/gram.c (rules_swap, rule_rhs_length): New. (ritem_longest_rhs): Use the latter. * src/gram.h (rule_t): `number' is a new member. * src/reader.c (packgram): Set it. * src/reduce.c (reduce_grammar_tables): Move the useless rules at the end of `rules', and count them out of `nrules'. (reduce_output, dump_grammar): Adjust. * src/print.c (print_grammar): It is no longer needed to check for the usefulness of a rule, as useless rules are beyond `nrules + 1'. * tests/reduce.at (Reduced Automaton): New test. Changes in version 1.49a: * False `Token not used' report fixed. On a grammar such as /* Allocate input grammar variables for bison, This file is part of Bison, the GNU Compiler Compiler. int error_token_number; /*------------------------. | Dump RITEM for traces. | `------------------------*/ size_t ritem_longest_rhs (void) { int i; return max; } typedef struct rule_s { short lhs; short *rhs; short prec; extern int error_token_number; /* Dump RITEM for traces. */ void ritem_print PARAMS ((FILE *out)); fprintf (out, "%snn", _("Grammar")); fprintf (out, " %sn", _("Number, Line, Rule")); for (i = 1; i < nrules + 1; i++) fputs ("nn", out); while (p) { bucket *ruleprec = p->ruleprec; rules[ruleno].lhs = p->sym->number; rules[ruleno].rhs = ritem + itemno; rules[ruleno].line = p->line; bitset_set (V1, rules[i].precsym); } static void reduce_grammar_tables (void) { if (nuseless_productions > 0) { int pn; for (pn = 1; pn < nrules + 1; pn++) rules[pn].useful = bitset_test (P, pn); } } { int i; fprintf (out, "%snn", _("Useless rules:")); fputs ("nn", out); } } fprintf (out, "nn"); fprintf (out, "Rulesn-----nn"); fprintf (out, "Num (Prec, Assoc, Useful, Ritem Range) Lhs -> Rhs (Ritem range) [Num]n"); { int rhs_count = 0; /* Find the last RHS index in ritems. */ } fprintf (out, "nn"); fprintf (out, "Rules interpretedn-----------------nn"); { fprintf (out, "%-5d %s :", i, symbols[rules[i].lhs]->tag); for (r = rules[i].rhs; *r >= 0; r++) ## ------------------- ## ## Underivable Rules. ## ## ------------------- ##
2026-07-27 09:40:33 +00:00 · 2002-04-07 16:28:39 +00:00
parent 4416fcdb02
commit 588db0a892
1 changed files with 448 additions and 0 deletions
@@ -1,3 +1,451 @@
+2002-04-07  Akim Demaille  <[email protected]>
+
+	Remove the useless rules from the parser.
+
+	* src/gram.h, src/gram.c (rules_swap, rule_rhs_length): New.
+	(ritem_longest_rhs): Use the latter.
+	* src/gram.h (rule_t): `number' is a new member.
+	* src/reader.c (packgram): Set it.
+	* src/reduce.c (reduce_grammar_tables): Move the useless rules at
+	the end of `rules', and count them out of `nrules'.
+	(reduce_output, dump_grammar): Adjust.
+	* src/print.c (print_grammar): It is no longer needed to check for
+	the usefulness of a rule, as useless rules are beyond `nrules + 1'.
+	* tests/reduce.at (Reduced Automaton): New test.
+
+diff -x *.po -ur -x testsuite bison-1.49a/NEWS bison/NEWS
+--- bison-1.49a/NEWS	Sun Apr  7 17:36:56 2002
+++ bison/NEWS	Sun Apr  7 18:19:39 2002
+@@ -3,6 +3,10 @@
+
+	Changes in version 1.49a:
+
+* Useless rules are actually removed.
+  Before, Bison reported the useless rules, but, although not used,
+  included them in the parsers.
+
+	* False `Token not used' report fixed.
+	On a grammar such as
+
+diff -x *.po -ur -x testsuite bison-1.49a/src/gram.c bison/src/gram.c
+--- bison-1.49a/src/gram.c	Sun Apr  7 17:36:56 2002
+++ bison/src/gram.c	Sun Apr  7 18:19:39 2002
+@@ -1,5 +1,5 @@
+	/* Allocate input grammar variables for bison,
+-   Copyright 1984, 1986, 1989, 2001 Free Software Foundation, Inc.
+   Copyright 1984, 1986, 1989, 2001, 2002 Free Software Foundation, Inc.
+
+	This file is part of Bison, the GNU Compiler Compiler.
+
+@@ -51,6 +51,51 @@
+	int error_token_number;
+
+
+/*----------------------------------.
+| Swap the rules number R1 and R2.  |
+`----------------------------------*/
+
+void
+rules_swap (int r1, int r2)
+{
+  /* The easy part: swap the immediate contents of the structures. */
+  {
+    rule_t rule = rules[r1];
+    rules[r1] = rules[r2];
+    rules[r2] = rule;
+  }
+
+  /* The first negative number in the RHS is the rule number.  */
+  {
+    short *rhsp;
+    for (rhsp = rules[r1].rhs; *rhsp >= 0; ++rhsp)
+      /* Nothing. */;
+    assert (*rhsp == -r2);
+    *rhsp = -r1;
+
+    for (rhsp = rules[r2].rhs; *rhsp >= 0; ++rhsp)
+      /* Nothing. */;
+    assert (*rhsp == -r1);
+    *rhsp = -r2;
+  }
+}
+
+
+/*--------------------------------------.
+| Return the number of symbols in RHS.  |
+`--------------------------------------*/
+
+int
+rule_rhs_length (rule_t *rule)
+{
+  int res = 0;
+  short *rhsp;
+  for (rhsp = rule->rhs; *rhsp >= 0; ++rhsp)
+    ++res;
+  return res;
+}
+
+
+	/*------------------------.
+	| Dump RITEM for traces.  |
+	`------------------------*/
+@@ -76,23 +121,15 @@
+	size_t
+	ritem_longest_rhs (void)
+	{
+-  int length;
+-  int max;
+  int max = 0;
+	int i;
+
+-  length = 0;
+-  max = 0;
+-  for (i = 0; i < nritems; ++i)
+-    if (ritem[i] >= 0)
+-      {
+-	length++;
+-      }
+-    else
+-      {
+-	if (length > max)
+-	  max = length;
+-	length = 0;
+-      }
+  for (i = 1; i < nrules + 1; ++i)
+    {
+      int length = rule_rhs_length (&rules[i]);
+      if (length > max)
+	max = length;
+    }
+
+	return max;
+	}
+diff -x *.po -ur -x testsuite bison-1.49a/src/gram.h bison/src/gram.h
+--- bison-1.49a/src/gram.h	Sun Apr  7 17:55:00 2002
+++ bison/src/gram.h	Sun Apr  7 18:19:39 2002
+@@ -124,6 +124,10 @@
+
+	typedef struct rule_s
+	{
+  /* The number of the rule in the source.  It is usually the index in
+     RULES too, except if there are useless rules.  */
+  short number;
+
+	short lhs;
+	short *rhs;
+	short prec;
+@@ -166,6 +170,11 @@
+
+	extern int error_token_number;
+
+/* Swap two rules. */
+void rules_swap PARAMS ((int r1, int r2));
+
+/* Report the length of the RHS. */
+int rule_rhs_length PARAMS ((rule_t *rule));
+
+	/* Dump RITEM for traces. */
+	void ritem_print PARAMS ((FILE *out));
+diff -x *.po -ur -x testsuite bison-1.49a/src/print.c bison/src/print.c
+--- bison-1.49a/src/print.c	Sun Apr  7 17:55:00 2002
+++ bison/src/print.c	Sun Apr  7 18:19:39 2002
+@@ -366,19 +366,17 @@
+	fprintf (out, "%s\n\n", _("Grammar"));
+	fprintf (out, "  %s\n", _("Number, Line, Rule"));
+	for (i = 1; i < nrules + 1; i++)
+-    /* Don't print rules disabled in reduce_grammar_tables.  */
+-    if (rules[i].useful)
+-      {
+-	fprintf (out, _("  %3d %3d %s ->"),
+-		 i - 1, rules[i].line, escape (symbols[rules[i].lhs]->tag));
+-	rule = rules[i].rhs;
+-	if (*rule >= 0)
+-	  while (*rule >= 0)
+-	    fprintf (out, " %s", escape (symbols[*rule++]->tag));
+-	else
+-	  fprintf (out, " /* %s */", _("empty"));
+-	fputc ('\n', out);
+-      }
+    {
+      fprintf (out, _("  %3d %3d %s ->"),
+	       i - 1, rules[i].line, escape (symbols[rules[i].lhs]->tag));
+      rule = rules[i].rhs;
+      if (*rule >= 0)
+	while (*rule >= 0)
+	  fprintf (out, " %s", escape (symbols[*rule++]->tag));
+      else
+	fprintf (out, " /* %s */", _("empty"));
+      fputc ('\n', out);
+    }
+	fputs ("\n\n", out);
+
+
+diff -x *.po -ur -x testsuite bison-1.49a/src/reader.c bison/src/reader.c
+--- bison-1.49a/src/reader.c	Sun Apr  7 17:56:13 2002
+++ bison/src/reader.c	Sun Apr  7 18:19:39 2002
+@@ -1687,6 +1687,7 @@
+	while (p)
+	{
+	bucket *ruleprec = p->ruleprec;
+      rules[ruleno].number = ruleno;
+	rules[ruleno].lhs = p->sym->number;
+	rules[ruleno].rhs = ritem + itemno;
+	rules[ruleno].line = p->line;
+diff -x *.po -ur -x testsuite bison-1.49a/src/reduce.c bison/src/reduce.c
+--- bison-1.49a/src/reduce.c	Sun Apr  7 17:55:00 2002
+++ bison/src/reduce.c	Sun Apr  7 18:19:39 2002
+@@ -220,70 +220,59 @@
+	bitset_set (V1, rules[i].precsym);
+	}
+
+
+/*-------------------------------------------------------------------.
+| Put the useless productions at the end of RULES, and adjust NRULES |
+| accordingly.                                                       |
+`-------------------------------------------------------------------*/
+
+	static void
+	reduce_grammar_tables (void)
+	{
+-  /* This is turned off because we would need to change the numbers in
+-     the case statements in the actions file.
+-
+-     We don't disable it via CPP so that it is still checked with the
+-     rest of the code, to avoid its becoming completely obsolete.
+-
+-     FIXME: I think the comment above demonstrates this code must be
+-     turned off for *semantic* parser, not in the general case.  Try
+-     to understand this better --akim.  */
+-
+-  if (0)
+-    /* remove useless productions */
+-    if (nuseless_productions > 0)
+-      {
+-	short np, pn, ni, pi;
+-
+-	np = 0;
+-	ni = 0;
+-	for (pn = 1; pn < nrules + 1; pn++)
+-	  if (bitset_test (P, pn))
+-	    {
+-	      np++;
+-	      if (pn != np)
+-		{
+-		  rules[np].lhs   = rules[pn].lhs;
+-		  rules[np].line  = rules[pn].line;
+-		  rules[np].prec  = rules[pn].prec;
+-		  rules[np].assoc = rules[pn].assoc;
+-		  rules[np].rhs   = rules[pn].rhs;
+-		  if (rules[np].rhs - ritem != ni)
+-		    {
+-		      pi = rules[np].rhs - ritem;
+-		      rules[np].rhs = ritem + ni;
+-		      while (ritem[pi] >= 0)
+-			ritem[ni++] = ritem[pi++];
+-		      ritem[ni++] = -np;
+-		    }
+-		}
+-	      else
+-		{
+-		  while (ritem[ni++] >= 0)
+-		    /* Nothing. */;
+-		}
+-	    }
+-
+-	ritem[ni] = 0;
+-	nrules -= nuseless_productions;
+-	nitems = ni;
+-	nritems = ni;
+-
+-	/* Is it worth it to reduce the amount of memory for the
+-	   grammar? Probably not.  */
+-      }
+-
+-  /* Disable useless productions. */
+  /* Flag useless productions.  */
+	if (nuseless_productions > 0)
+	{
+	int pn;
+	for (pn = 1; pn < nrules + 1; pn++)
+	rules[pn].useful = bitset_test (P, pn);
+	}
+
+  /* Map the nonterminals to their new index: useful first, useless
+     afterwards.  Kept for later report.  */
+  if (nuseless_productions > 0)
+    {
+      short *map = XCALLOC (short, nrules + 1) - 1;
+      int useful = 1;
+      int useless = nrules + 1 - nuseless_productions;
+      int i;
+      for (i = 1; i < nrules + 1; ++i)
+	map[i] = rules[i].useful ? useful++ : useless++;
+
+      /* Shuffle elements of tables indexed by symbol number.  */
+      for (i = 1; i < nrules + 1; ++i)
+	if (i != map[i])
+	  {
+	    int j = map[i];
+	    rules_swap (i, map[i]);
+	    map[i] = map[j];
+	    map[j] = j;
+	  }
+
+      free (map + 1);
+      nrules -= nuseless_productions;
+    }
+
+  /* Adjust NRITEMS and NITEMS.  */
+  {
+    int r;
+    int length;
+    for (r = nrules + 1; r < nrules + 1 + nuseless_productions; ++r)
+      {
+	length = rule_rhs_length (&rules[r]);
+	nritems -= length + 1;
+	nitems -= length + 1;
+      }
+  }
+	}
+
+
+@@ -378,16 +367,15 @@
+	{
+	int i;
+	fprintf (out, "%s\n\n", _("Useless rules:"));
+-      for (i = 1; i < nrules + 1; i++)
+-	if (!rules[i].useful)
+-	  {
+-	    rule r;
+-	    fprintf (out, "#%-4d  ", i - 1);
+-	    fprintf (out, "%s:", symbols[rules[i].lhs]->tag);
+-	    for (r = rules[i].rhs; *r >= 0; r++)
+-	      fprintf (out, " %s", symbols[*r]->tag);
+-	    fputs (";\n", out);
+-	  }
+      for (i = nrules + 1; i < nuseless_productions + nrules + 1; i++)
+	{
+	  rule r;
+	  fprintf (out, "#%-4d  ", rules[i].number - 1);
+	  fprintf (out, "%s:", symbols[rules[i].lhs]->tag);
+	  for (r = rules[i].rhs; *r >= 0; r++)
+	    fprintf (out, " %s", symbols[*r]->tag);
+	  fputs (";\n", out);
+	}
+	fputs ("\n\n", out);
+	}
+	}
+@@ -411,7 +399,7 @@
+	fprintf (out, "\n\n");
+	fprintf (out, "Rules\n-----\n\n");
+	fprintf (out, "Num (Prec, Assoc, Useful, Ritem Range) Lhs -> Rhs (Ritem range) [Num]\n");
+-  for (i = 1; i < nrules + 1; i++)
+  for (i = 1; i < nrules + nuseless_productions + 1; i++)
+	{
+	int rhs_count = 0;
+	/* Find the last RHS index in ritems. */
+@@ -429,7 +417,7 @@
+	}
+	fprintf (out, "\n\n");
+	fprintf (out, "Rules interpreted\n-----------------\n\n");
+-  for (i = 1; i < nrules + 1; i++)
+  for (i = 1; i < nrules + nuseless_productions + 1; i++)
+	{
+	fprintf (out, "%-5d  %s :", i, symbols[rules[i].lhs]->tag);
+	for (r = rules[i].rhs; *r >= 0; r++)
+diff -x *.po -ur -x testsuite bison-1.49a/tests/reduce.at bison/tests/reduce.at
+--- bison-1.49a/tests/reduce.at	Sun Apr  7 17:36:56 2002
+++ bison/tests/reduce.at	Sun Apr  7 18:19:39 2002
+@@ -174,6 +174,89 @@
+
+
+	## ------------------- ##
+## Reduced Automaton.  ##
+## ------------------- ##
+
+# Check that the automaton is that as the for the grammar reduced by
+# hand.
+
+AT_SETUP([Reduced Automaton])
+
+# The non reduced grammar.
+# ------------------------
+AT_DATA([[not-reduced.y]],
+[[/* A useless token. */
+%token useless_token
+/* A useful one. */
+%token useful
+%verbose
+%output="not-reduced.c"
+
+%%
+
+exp: useful            { /* A useful action. */ }
+   | non_productive    { /* A non productive action. */ }
+   ;
+
+not_reachable: useful  { /* A not reachable action. */ }
+             ;
+
+non_productive: non_productive useless_token
+                       { /* Another non productive action. */ }
+              ;
+]])
+
+AT_CHECK([[bison not-reduced.y]], 0, [],
+[[not-reduced.y contains 2 useless nonterminals and 3 useless rules
+]])
+
+AT_CHECK([[sed -n '/^Grammar/q;/^$/!p' not-reduced.output]], 0,
+[[Useless nonterminals:
+   not_reachable
+   non_productive
+Terminals which are not used:
+   useless_token
+Useless rules:
+#2     exp: non_productive;
+#3     not_reachable: useful;
+#4     non_productive: non_productive useless_token;
+]])
+
+# The reduced grammar.
+# --------------------
+AT_DATA([[reduced.y]],
+[[/* A useless token. */
+%token useless_token
+/* A useful one. */
+%token useful
+%verbose
+%output="reduced.c"
+
+%%
+
+exp: useful            { /* A useful action. */ }
+//   | non_productive    { /* A non productive action. */ } */
+   ;
+
+//not_reachable: useful  { /* A not reachable action. */ }
+//             ;
+
+//non_productive: non_productive useless_token
+//                       { /* Another non productive action. */ }
+//              ;
+]])
+
+AT_CHECK([[bison reduced.y]])
+
+# Comparing the parsers.
+cp reduced.c expout
+AT_CHECK([sed 's/not-reduced/reduced/g' not-reduced.c], 0, [expout])
+
+AT_CLEANUP
+
+
+
+## ------------------- ##
+	## Underivable Rules.  ##
+	## ------------------- ##
+
 2002-04-07  Akim Demaille  <[email protected]>

 	* src/reduce.c (inaccessable_symbols): Fix a buglet: because of a