* src/gram.h (item_number_t): New, the type of item numbers in

RITEM.  Note that it must be able to code symbol numbers as
positive numbers, and the negation of rule numbers as negative
numbers.
Adjust all dependencies (pretty many).
* src/reduce.c (rule): Remove this `short *' pointer: use
item_number_t.
* src/system.h (MINSHORT, MAXSHORT): Remove.
Include `limits.h'.
Adjust dependencies to using SHRT_MAX and SHRT_MIN.
(shortcpy): Remove.
(MAXTABLE): Move to...
* src/output.c (MAXTABLE): here.
(prepare_rules): Use output_int_table to output rhs.
* data/bison.simple, data/bison.c++: Adjust.
* tests/torture.at (Big triangle): Move the limit from 254 to
500.
* tests/regression.at (Web2c Actions): Adjust.
Trying with bigger grammars shows various phenomena: at 3000 (28Mb
of grammar file) bison is killed by my system; at 2000 (12Mb) bison
passes, but produces negative #line numbers; once that is fixed, GCC is
killed while compiling 14Mb; at 1500 (6.7 Mb of grammar, 8.2Mb of
C), it passes.
* src/state.h (state_h): Code input lines on ints, not shorts.
This commit is contained in:
Akim Demaille
2002-04-08 11:46:26 +00:00
parent 355e7c1cd1
commit 62a3e4f0c5
24 changed files with 269 additions and 117 deletions

View File

@@ -1,3 +1,31 @@
2002-04-08 Akim Demaille <akim@epita.fr>
* src/gram.h (item_number_t): New, the type of item numbers in
RITEM. Note that it must be able to code symbol numbers as
positive number, and the negation of rule numbers as negative
numbers.
Adjust all dependencies (pretty many).
* src/reduce.c (rule): Remove this `short *' pointer: use
item_number_t.
* src/system.h (MINSHORT, MAXSHORT): Remove.
Include `limits.h'.
Adjust dependencies to using SHRT_MAX and SHRT_MIN.
(shortcpy): Remove.
(MAXTABLE): Move to...
* src/output.c (MAXTABLE): here.
(prepare_rules): Use output_int_table to output rhs.
* data/bison.simple, data/bison.c++: Adjust.
* tests/torture.at (Big triangle): Move the limit from 254 to
500.
* tests/regression.at (Web2c Actions): Adjust.
Trying with bigger grammars shows various phenomena: at 3000 (28Mb
of grammar file) bison is killed by my system, at 2000 (12Mb) bison
passes, but produces negative #line number, once fixed, GCC is
killed while compiling 14Mb, at 1500 (6.7 Mb of grammar, 8.2Mb of
C), it passes.
* src/state.h (state_h): Code input lines on ints, not shorts.
2002-04-08 Akim Demaille <akim@epita.fr> 2002-04-08 Akim Demaille <akim@epita.fr>
* src/reduce.c (reduce_grammar): First reduce the nonterminals, * src/reduce.c (reduce_grammar): First reduce the nonterminals,

3
NEWS
View File

@@ -4,7 +4,8 @@ Bison News
Changes in version 1.49a: Changes in version 1.49a:
* Large grammars * Large grammars
Are now supported. Are now supported (large token numbers, large grammar size (= sum of
the LHS and RHS lengths)).
* The initial rule is explicit. * The initial rule is explicit.
Bison used to play hacks with the initial rule, which the user does Bison used to play hacks with the initial rule, which the user does

View File

@@ -168,6 +168,7 @@ namespace yy
struct Traits< b4_name > struct Traits< b4_name >
{ {
typedef typedef b4_uint_type(b4_token_number_max) TokenNumberType; typedef typedef b4_uint_type(b4_token_number_max) TokenNumberType;
typedef typedef b4_sint_type(b4_item_number_max) RhsNumberType;
typedef int StateType; typedef int StateType;
typedef yystype SemanticType; typedef yystype SemanticType;
typedef b4_ltype LocationType; typedef b4_ltype LocationType;
@@ -181,8 +182,9 @@ namespace yy
public: public:
typedef Traits< b4_name >::TokenNumberType TokenNumberType; typedef Traits< b4_name >::TokenNumberType TokenNumberType;
typedef Traits< b4_name >::RhsNumberType TokenNumberType;
typedef Traits< b4_name >::StateType StateType; typedef Traits< b4_name >::StateType StateType;
typedef Traits< b4_name >::SemanticType SemanticType; typedef Traits< b4_name >::SemanticType SemanticType;
typedef Traits< b4_name >::LocationType LocationType; typedef Traits< b4_name >::LocationType LocationType;
typedef Stack< StateType > StateStack; typedef Stack< StateType > StateStack;
@@ -684,7 +686,7 @@ const yy::b4_name::name_[[]] =
#if YYDEBUG #if YYDEBUG
/* YYRHS -- A `-1'-separated list of the rules' RHS. */ /* YYRHS -- A `-1'-separated list of the rules' RHS. */
const short const RhsNumberType
yy::b4_name::rhs_[[]] = yy::b4_name::rhs_[[]] =
{ {
b4_rhs b4_rhs

View File

@@ -286,7 +286,8 @@ static const short yyprhs[[]] =
}; };
/* YYRHS -- A `-1'-separated list of the rules' RHS. */ /* YYRHS -- A `-1'-separated list of the rules' RHS. */
static const short yyrhs[[]] = typedef b4_sint_type(b4_rhs_number_max) yyrhs_t;
static const yyrhs_t yyrhs[[]] =
{ {
b4_rhs b4_rhs
}; };

View File

@@ -56,9 +56,9 @@ static short *shift_symbol = NULL;
static short *redset = NULL; static short *redset = NULL;
static short *shiftset = NULL; static short *shiftset = NULL;
static short **kernel_base = NULL; static item_number_t **kernel_base = NULL;
static int *kernel_size = NULL; static int *kernel_size = NULL;
static short *kernel_items = NULL; static item_number_t *kernel_items = NULL;
/* hash table for states, to recognize equivalent ones. */ /* hash table for states, to recognize equivalent ones. */
@@ -70,7 +70,7 @@ static void
allocate_itemsets (void) allocate_itemsets (void)
{ {
int i, r; int i, r;
short *rhsp; item_number_t *rhsp;
/* Count the number of occurrences of all the symbols in RITEMS. /* Count the number of occurrences of all the symbols in RITEMS.
Note that useless productions (hence useless nonterminals) are Note that useless productions (hence useless nonterminals) are
@@ -92,9 +92,9 @@ allocate_itemsets (void)
appears as an item, which is symbol_count[symbol]. appears as an item, which is symbol_count[symbol].
We allocate that much space for each symbol. */ We allocate that much space for each symbol. */
kernel_base = XCALLOC (short *, nsyms); kernel_base = XCALLOC (item_number_t *, nsyms);
if (count) if (count)
kernel_items = XCALLOC (short, count); kernel_items = XCALLOC (item_number_t, count);
count = 0; count = 0;
for (i = 0; i < nsyms; i++) for (i = 0; i < nsyms; i++)
@@ -194,15 +194,16 @@ new_state (int symbol)
nstates, symbol, quotearg_style (escape_quoting_style, nstates, symbol, quotearg_style (escape_quoting_style,
symbols[symbol]->tag)); symbols[symbol]->tag));
if (nstates >= MAXSHORT) if (nstates >= SHRT_MAX)
fatal (_("too many states (max %d)"), MAXSHORT); fatal (_("too many states (max %d)"), SHRT_MAX);
p = STATE_ALLOC (kernel_size[symbol]); p = STATE_ALLOC (kernel_size[symbol]);
p->accessing_symbol = symbol; p->accessing_symbol = symbol;
p->number = nstates; p->number = nstates;
p->nitems = kernel_size[symbol]; p->nitems = kernel_size[symbol];
shortcpy (p->items, kernel_base[symbol], kernel_size[symbol]); memcpy (p->items, kernel_base[symbol],
kernel_size[symbol] * sizeof (kernel_base[symbol][0]));
/* If this is the eoftoken, and this is not the initial state, then /* If this is the eoftoken, and this is not the initial state, then
this is the final state. */ this is the final state. */
@@ -340,7 +341,7 @@ static void
save_shifts (void) save_shifts (void)
{ {
shifts *p = shifts_new (nshifts); shifts *p = shifts_new (nshifts);
shortcpy (p->shifts, shiftset, nshifts); memcpy (p->shifts, shiftset, nshifts * sizeof (shiftset[0]));
this_state->shifts = p; this_state->shifts = p;
} }
@@ -372,7 +373,7 @@ save_reductions (void)
/* Make a reductions structure and copy the data into it. */ /* Make a reductions structure and copy the data into it. */
this_state->reductions = reductions_new (count); this_state->reductions = reductions_new (count);
shortcpy (this_state->reductions->rules, redset, count); memcpy (this_state->reductions->rules, redset, count * sizeof (redset[0]));
} }

View File

@@ -30,7 +30,7 @@
#include "derives.h" #include "derives.h"
/* NITEMSET is the size of the array ITEMSET. */ /* NITEMSET is the size of the array ITEMSET. */
short *itemset; item_number_t *itemset;
int nritemset; int nritemset;
static bitset ruleset; static bitset ruleset;
@@ -49,13 +49,13 @@ static bitsetv firsts = NULL;
`-----------------*/ `-----------------*/
static void static void
print_closure (const char *title, short *array, size_t size) print_closure (const char *title, item_number_t *array, size_t size)
{ {
size_t i; size_t i;
fprintf (stderr, "Closure: %s\n", title); fprintf (stderr, "Closure: %s\n", title);
for (i = 0; i < size; ++i) for (i = 0; i < size; ++i)
{ {
short *rp; item_number_t *rp;
fprintf (stderr, " %2d: .", array[i]); fprintf (stderr, " %2d: .", array[i]);
for (rp = &ritem[array[i]]; *rp >= 0; ++rp) for (rp = &ritem[array[i]]; *rp >= 0; ++rp)
fprintf (stderr, " %s", fprintf (stderr, " %s",
@@ -100,7 +100,7 @@ print_fderives (void)
for (j = 0; j < nrules + 1; j++) for (j = 0; j < nrules + 1; j++)
if (bitset_test (FDERIVES (i), j)) if (bitset_test (FDERIVES (i), j))
{ {
short *rhsp; item_number_t *rhsp;
fprintf (stderr, "\t\t%d:", j - 1); fprintf (stderr, "\t\t%d:", j - 1);
for (rhsp = rules[j].rhs; *rhsp >= 0; ++rhsp) for (rhsp = rules[j].rhs; *rhsp >= 0; ++rhsp)
fprintf (stderr, " %s", fprintf (stderr, " %s",
@@ -231,7 +231,7 @@ set_fderives (void)
void void
new_closure (int n) new_closure (int n)
{ {
itemset = XCALLOC (short, n); itemset = XCALLOC (item_number_t, n);
ruleset = bitset_create (nrules + 1, BITSET_FIXED); ruleset = bitset_create (nrules + 1, BITSET_FIXED);
@@ -241,7 +241,7 @@ new_closure (int n)
void void
closure (short *core, int n) closure (item_number_t *core, int n)
{ {
/* Index over CORE. */ /* Index over CORE. */
int c; int c;
@@ -263,7 +263,7 @@ closure (short *core, int n)
for (ruleno = 0; ruleno < nrules + 1; ++ruleno) for (ruleno = 0; ruleno < nrules + 1; ++ruleno)
if (bitset_test (ruleset, ruleno)) if (bitset_test (ruleset, ruleno))
{ {
int itemno = rules[ruleno].rhs - ritem; item_number_t itemno = rules[ruleno].rhs - ritem;
while (c < n && core[c] < itemno) while (c < n && core[c] < itemno)
{ {
itemset[nritemset] = core[c]; itemset[nritemset] = core[c];

View File

@@ -42,14 +42,14 @@ void new_closure PARAMS ((int n));
significant). CLOSURE places there the indices of all items which significant). CLOSURE places there the indices of all items which
represent units of input that could arrive next. */ represent units of input that could arrive next. */
void closure PARAMS ((short *items, int n)); void closure PARAMS ((item_number_t *items, int n));
/* Frees ITEMSET, RULESET and internal data. */ /* Frees ITEMSET, RULESET and internal data. */
void free_closure PARAMS ((void)); void free_closure PARAMS ((void));
extern short *itemset; extern item_number_t *itemset;
extern int nritemset; extern int nritemset;
#endif /* !CLOSURE_H_ */ #endif /* !CLOSURE_H_ */

View File

@@ -42,7 +42,7 @@ print_derives (void)
fprintf (stderr, "\t%s derives\n", symbols[i]->tag); fprintf (stderr, "\t%s derives\n", symbols[i]->tag);
for (sp = derives[i]; *sp > 0; sp++) for (sp = derives[i]; *sp > 0; sp++)
{ {
short *rhsp; item_number_t *rhsp;
fprintf (stderr, "\t\t%d:", *sp); fprintf (stderr, "\t\t%d:", *sp);
for (rhsp = rules[*sp].rhs; *rhsp >= 0; ++rhsp) for (rhsp = rules[*sp].rhs; *rhsp >= 0; ++rhsp)
fprintf (stderr, " %s", symbols[*rhsp]->tag); fprintf (stderr, " %s", symbols[*rhsp]->tag);

View File

@@ -27,7 +27,7 @@
/* comments for these variables are in gram.h */ /* comments for these variables are in gram.h */
short *ritem = NULL; item_number_t *ritem = NULL;
int nritems = 0; int nritems = 0;
rule_t *rules = NULL; rule_t *rules = NULL;
@@ -59,7 +59,7 @@ int
rule_rhs_length (rule_t *rule) rule_rhs_length (rule_t *rule)
{ {
int res = 0; int res = 0;
short *rhsp; item_number_t *rhsp;
for (rhsp = rule->rhs; *rhsp >= 0; ++rhsp) for (rhsp = rule->rhs; *rhsp >= 0; ++rhsp)
++res; ++res;
return res; return res;

View File

@@ -109,11 +109,14 @@ extern int nsyms;
extern int ntokens; extern int ntokens;
extern int nvars; extern int nvars;
extern short *ritem; #define ITEM_NUMBER_MAX INT_MAX
typedef int item_number_t;
extern item_number_t *ritem;
extern int nritems; extern int nritems;
extern int start_symbol; extern int start_symbol;
typedef struct rule_s typedef struct rule_s
{ {
/* The number of the rule in the source. It is usually the index in /* The number of the rule in the source. It is usually the index in
@@ -125,7 +128,7 @@ typedef struct rule_s
short number; short number;
symbol_t *lhs; symbol_t *lhs;
short *rhs; item_number_t *rhs;
/* This symbol provides both the associativity, and the precedence. */ /* This symbol provides both the associativity, and the precedence. */
symbol_t *prec; symbol_t *prec;
@@ -133,14 +136,14 @@ typedef struct rule_s
/* This symbol was attached to the rule via %prec. */ /* This symbol was attached to the rule via %prec. */
symbol_t *precsym; symbol_t *precsym;
short line; int line;
bool useful; bool useful;
const char *action; const char *action;
short action_line; int action_line;
const char *guard; const char *guard;
short guard_line; int guard_line;
} rule_t; } rule_t;
extern struct rule_s *rules; extern struct rule_s *rules;

View File

@@ -28,11 +28,11 @@
#include "bitset.h" #include "bitset.h"
#include "bitsetv.h" #include "bitsetv.h"
#include "quotearg.h" #include "quotearg.h"
#include "symtab.h"
#include "gram.h"
#include "reader.h" #include "reader.h"
#include "types.h" #include "types.h"
#include "LR0.h" #include "LR0.h"
#include "symtab.h"
#include "gram.h"
#include "complain.h" #include "complain.h"
#include "lalr.h" #include "lalr.h"
#include "nullable.h" #include "nullable.h"
@@ -170,8 +170,8 @@ set_goto_map (void)
shifts *sp = states[state]->shifts; shifts *sp = states[state]->shifts;
for (i = sp->nshifts - 1; i >= 0 && SHIFT_IS_GOTO (sp, i); --i) for (i = sp->nshifts - 1; i >= 0 && SHIFT_IS_GOTO (sp, i); --i)
{ {
if (ngotos == MAXSHORT) if (ngotos == SHRT_MAX)
fatal (_("too many gotos (max %d)"), MAXSHORT); fatal (_("too many gotos (max %d)"), SHRT_MAX);
ngotos++; ngotos++;
goto_map[SHIFT_SYMBOL (sp, i)]++; goto_map[SHIFT_SYMBOL (sp, i)]++;
@@ -275,7 +275,7 @@ initialize_F (void)
if (nedges) if (nedges)
{ {
reads[i] = XCALLOC (short, nedges + 1); reads[i] = XCALLOC (short, nedges + 1);
shortcpy (reads[i], edge, nedges); memcpy (reads[i], edge, nedges * sizeof (edge[0]));
reads[i][nedges] = -1; reads[i][nedges] = -1;
nedges = 0; nedges = 0;
} }
@@ -415,7 +415,7 @@ build_relations (void)
{ {
int done; int done;
int length = 1; int length = 1;
short *rp; item_number_t *rp;
state_t *state = states[from_state[i]]; state_t *state = states[from_state[i]];
states1[0] = state->number; states1[0] = state->number;

View File

@@ -23,6 +23,8 @@
#include "system.h" #include "system.h"
#include "bitset.h" #include "bitset.h"
#include "getargs.h" #include "getargs.h"
#include "symtab.h"
#include "gram.h"
#include "files.h" #include "files.h"
#include "complain.h" #include "complain.h"
#include "derives.h" #include "derives.h"
@@ -36,7 +38,6 @@
#include "conflicts.h" #include "conflicts.h"
#include "print_graph.h" #include "print_graph.h"
#include "muscle_tab.h" #include "muscle_tab.h"
#include "symtab.h"
#include "lex.h" #include "lex.h"
/* The name this program was run with, for messages. */ /* The name this program was run with, for messages. */

View File

@@ -74,7 +74,7 @@ set_nullable (void)
if (rules[ruleno].rhs[0] >= 0) if (rules[ruleno].rhs[0] >= 0)
{ {
/* This rule has a non empty RHS. */ /* This rule has a non empty RHS. */
short *r; item_number_t *r;
int any_tokens = 0; int any_tokens = 0;
for (r = rules[ruleno].rhs; *r >= 0; ++r) for (r = rules[ruleno].rhs; *r >= 0; ++r)
if (ISTOKEN (*r)) if (ISTOKEN (*r))

View File

@@ -153,11 +153,47 @@ get_lines_number (const char *s)
`----------------------------------------------------------------*/ `----------------------------------------------------------------*/
static inline long int static inline long int
output_table_data (struct obstack *oout, output_short_table (struct obstack *oout,
short *table_data, short *table_data,
short first, short first,
int begin, int begin,
int end) int end)
{
long int max = first;
int i;
int j = 1;
obstack_fgrow1 (oout, "%6d", first);
for (i = begin; i < end; ++i)
{
obstack_1grow (oout, ',');
if (j >= 10)
{
obstack_sgrow (oout, "\n ");
j = 1;
}
else
++j;
obstack_fgrow1 (oout, "%6d", table_data[i]);
if (table_data[i] > max)
max = table_data[i];
}
obstack_1grow (oout, 0);
return max;
}
/*--------------------.
| Similar, for ints. |
`--------------------*/
static inline long int
output_int_table (struct obstack *oout,
int *table_data,
int first,
int begin,
int end)
{ {
long int max = first; long int max = first;
int i; int i;
@@ -192,7 +228,7 @@ output_table_data (struct obstack *oout,
static void static void
prepare_tokens (void) prepare_tokens (void)
{ {
long int max = output_table_data (&format_obstack, token_translations, long int max = output_short_table (&format_obstack, token_translations,
0, 1, max_user_token_number + 1); 0, 1, max_user_token_number + 1);
muscle_insert ("translate", obstack_finish (&format_obstack)); muscle_insert ("translate", obstack_finish (&format_obstack));
MUSCLE_INSERT_LONG_INT ("token_number_max", max); MUSCLE_INSERT_LONG_INT ("token_number_max", max);
@@ -237,7 +273,7 @@ prepare_tokens (void)
short *values = XCALLOC (short, ntokens + 1); short *values = XCALLOC (short, ntokens + 1);
for (i = 0; i < ntokens + 1; ++i) for (i = 0; i < ntokens + 1; ++i)
values[i] = symbols[i]->user_token_number; values[i] = symbols[i]->user_token_number;
output_table_data (&format_obstack, values, output_short_table (&format_obstack, values,
0, 1, ntokens + 1); 0, 1, ntokens + 1);
muscle_insert ("toknum", obstack_finish (&format_obstack)); muscle_insert ("toknum", obstack_finish (&format_obstack));
free (values); free (values);
@@ -253,10 +289,11 @@ prepare_tokens (void)
static void static void
prepare_rules (void) prepare_rules (void)
{ {
short *rhsp; long int max;
item_number_t *rhsp;
int r; int r;
int i = 0; int i = 0;
short *rhs = XMALLOC (short, nritems); item_number_t *rhs = XMALLOC (item_number_t, nritems);
short *prhs = XMALLOC (short, nrules + 1); short *prhs = XMALLOC (short, nrules + 1);
short *r1 = XMALLOC (short, nrules + 1); short *r1 = XMALLOC (short, nrules + 1);
short *r2 = XMALLOC (short, nrules + 1); short *r2 = XMALLOC (short, nrules + 1);
@@ -280,19 +317,20 @@ prepare_rules (void)
} }
assert (i == nritems); assert (i == nritems);
output_table_data (&format_obstack, rhs, ritem[0], 1, nritems); max = output_int_table (&format_obstack, rhs, ritem[0], 1, nritems);
muscle_insert ("rhs", obstack_finish (&format_obstack)); muscle_insert ("rhs", obstack_finish (&format_obstack));
MUSCLE_INSERT_LONG_INT ("rhs_number_max", max);
output_table_data (&format_obstack, prhs, 0, 1, nrules + 1); output_short_table (&format_obstack, prhs, 0, 1, nrules + 1);
muscle_insert ("prhs", obstack_finish (&format_obstack)); muscle_insert ("prhs", obstack_finish (&format_obstack));
output_table_data (&format_obstack, rline, 0, 1, nrules + 1); output_short_table (&format_obstack, rline, 0, 1, nrules + 1);
muscle_insert ("rline", obstack_finish (&format_obstack)); muscle_insert ("rline", obstack_finish (&format_obstack));
output_table_data (&format_obstack, r1, 0, 1, nrules + 1); output_short_table (&format_obstack, r1, 0, 1, nrules + 1);
muscle_insert ("r1", obstack_finish (&format_obstack)); muscle_insert ("r1", obstack_finish (&format_obstack));
output_table_data (&format_obstack, r2, 0, 1, nrules + 1); output_short_table (&format_obstack, r2, 0, 1, nrules + 1);
muscle_insert ("r2", obstack_finish (&format_obstack)); muscle_insert ("r2", obstack_finish (&format_obstack));
free (rhs); free (rhs);
@@ -311,7 +349,7 @@ prepare_states (void)
short *values = (short *) alloca (sizeof (short) * nstates); short *values = (short *) alloca (sizeof (short) * nstates);
for (i = 0; i < nstates; ++i) for (i = 0; i < nstates; ++i)
values[i] = states[i]->accessing_symbol; values[i] = states[i]->accessing_symbol;
output_table_data (&format_obstack, values, output_short_table (&format_obstack, values,
0, 1, nstates); 0, 1, nstates);
muscle_insert ("stos", obstack_finish (&format_obstack)); muscle_insert ("stos", obstack_finish (&format_obstack));
} }
@@ -323,7 +361,7 @@ prepare_states (void)
| default action (yydefact) for the state. In addition, actrow is | | default action (yydefact) for the state. In addition, actrow is |
| filled with what to do for each kind of token, index by symbol | | filled with what to do for each kind of token, index by symbol |
| number, with zero meaning do the default action. The value | | number, with zero meaning do the default action. The value |
| MINSHORT, a very negative number, means this situation is an | | SHRT_MIN, a very negative number, means this situation is an |
| error. The parser recognizes this value specially. | | error. The parser recognizes this value specially. |
| | | |
| This is where conflicts are resolved. The loop over lookahead | | This is where conflicts are resolved. The loop over lookahead |
@@ -384,11 +422,11 @@ action_row (state_t *state)
} }
/* See which tokens are an explicit error in this state (due to /* See which tokens are an explicit error in this state (due to
%nonassoc). For them, record MINSHORT as the action. */ %nonassoc). For them, record SHRT_MIN as the action. */
for (i = 0; i < errp->nerrs; i++) for (i = 0; i < errp->nerrs; i++)
{ {
int symbol = errp->errs[i]; int symbol = errp->errs[i];
actrow[symbol] = MINSHORT; actrow[symbol] = SHRT_MIN;
} }
/* Now find the most common reduction and make it the default action /* Now find the most common reduction and make it the default action
@@ -438,7 +476,7 @@ action_row (state_t *state)
if (default_rule == 0) if (default_rule == 0)
for (i = 0; i < ntokens; i++) for (i = 0; i < ntokens; i++)
if (actrow[i] == MINSHORT) if (actrow[i] == SHRT_MIN)
actrow[i] = 0; actrow[i] = 0;
return default_rule; return default_rule;
@@ -498,7 +536,7 @@ token_actions (void)
save_row (i); save_row (i);
} }
output_table_data (&format_obstack, yydefact, output_short_table (&format_obstack, yydefact,
yydefact[0], 1, nstates); yydefact[0], 1, nstates);
muscle_insert ("defact", obstack_finish (&format_obstack)); muscle_insert ("defact", obstack_finish (&format_obstack));
@@ -692,7 +730,7 @@ goto_actions (void)
yydefgoto[i - ntokens] = default_state; yydefgoto[i - ntokens] = default_state;
} }
output_table_data (&format_obstack, yydefgoto, output_short_table (&format_obstack, yydefgoto,
yydefgoto[0], 1, nsyms - ntokens); yydefgoto[0], 1, nsyms - ntokens);
muscle_insert ("defgoto", obstack_finish (&format_obstack)); muscle_insert ("defgoto", obstack_finish (&format_obstack));
@@ -769,6 +807,8 @@ matching_state (int vector)
return -1; return -1;
} }
/* FIXME: For the time being, best approximation... */
#define MAXTABLE SHRT_MAX
static int static int
pack_vector (int vector) pack_vector (int vector)
@@ -841,7 +881,7 @@ pack_table (void)
high = 0; high = 0;
for (i = 0; i < nvectors; i++) for (i = 0; i < nvectors; i++)
base[i] = MINSHORT; base[i] = SHRT_MIN;
for (i = 0; i < MAXTABLE; i++) for (i = 0; i < MAXTABLE; i++)
check[i] = -1; check[i] = -1;
@@ -877,12 +917,12 @@ static void
output_base (void) output_base (void)
{ {
/* Output pact. */ /* Output pact. */
output_table_data (&format_obstack, base, output_short_table (&format_obstack, base,
base[0], 1, nstates); base[0], 1, nstates);
muscle_insert ("pact", obstack_finish (&format_obstack)); muscle_insert ("pact", obstack_finish (&format_obstack));
/* Output pgoto. */ /* Output pgoto. */
output_table_data (&format_obstack, base, output_short_table (&format_obstack, base,
base[nstates], nstates + 1, nvectors); base[nstates], nstates + 1, nvectors);
muscle_insert ("pgoto", obstack_finish (&format_obstack)); muscle_insert ("pgoto", obstack_finish (&format_obstack));
@@ -893,7 +933,7 @@ output_base (void)
static void static void
output_table (void) output_table (void)
{ {
output_table_data (&format_obstack, table, output_short_table (&format_obstack, table,
table[0], 1, high + 1); table[0], 1, high + 1);
muscle_insert ("table", obstack_finish (&format_obstack)); muscle_insert ("table", obstack_finish (&format_obstack));
XFREE (table); XFREE (table);
@@ -903,7 +943,7 @@ output_table (void)
static void static void
output_check (void) output_check (void)
{ {
output_table_data (&format_obstack, check, output_short_table (&format_obstack, check,
check[0], 1, high + 1); check[0], 1, high + 1);
muscle_insert ("check", obstack_finish (&format_obstack)); muscle_insert ("check", obstack_finish (&format_obstack));
XFREE (check); XFREE (check);
@@ -1033,7 +1073,7 @@ static void
prepare (void) prepare (void)
{ {
MUSCLE_INSERT_INT ("last", high); MUSCLE_INSERT_INT ("last", high);
MUSCLE_INSERT_INT ("flag", MINSHORT); MUSCLE_INSERT_INT ("flag", SHRT_MIN);
MUSCLE_INSERT_INT ("pure", pure_parser); MUSCLE_INSERT_INT ("pure", pure_parser);
MUSCLE_INSERT_INT ("nsym", nsyms); MUSCLE_INSERT_INT ("nsym", nsyms);
MUSCLE_INSERT_INT ("debug", debug_flag); MUSCLE_INSERT_INT ("debug", debug_flag);

View File

@@ -69,7 +69,7 @@ static void
print_core (FILE *out, state_t *state) print_core (FILE *out, state_t *state)
{ {
int i; int i;
short *sitems = state->items; item_number_t *sitems = state->items;
int snritems = state->nitems; int snritems = state->nitems;
/* New experimental feature: if TRACE_FLAGS output all the items of /* New experimental feature: if TRACE_FLAGS output all the items of
@@ -85,8 +85,8 @@ print_core (FILE *out, state_t *state)
{ {
for (i = 0; i < snritems; i++) for (i = 0; i < snritems; i++)
{ {
short *sp; item_number_t *sp;
short *sp1; item_number_t *sp1;
int rule; int rule;
sp1 = sp = ritem + sitems[i]; sp1 = sp = ritem + sitems[i];
@@ -361,7 +361,7 @@ static void
print_grammar (FILE *out) print_grammar (FILE *out)
{ {
int i, j; int i, j;
short *rule; item_number_t *rule;
char buffer[90]; char buffer[90];
int column = 0; int column = 0;

View File

@@ -50,7 +50,7 @@ static void
print_core (state_t *state, struct obstack *node_obstack) print_core (state_t *state, struct obstack *node_obstack)
{ {
int i; int i;
short *sitems = state->items; item_number_t *sitems = state->items;
int snritems = state->nitems; int snritems = state->nitems;
/* Output all the items of a state, not only its kernel. */ /* Output all the items of a state, not only its kernel. */
@@ -64,8 +64,8 @@ print_core (state_t *state, struct obstack *node_obstack)
obstack_fgrow1 (node_obstack, "state %2d\n", state->number); obstack_fgrow1 (node_obstack, "state %2d\n", state->number);
for (i = 0; i < snritems; i++) for (i = 0; i < snritems; i++)
{ {
short *sp; item_number_t *sp;
short *sp1; item_number_t *sp1;
int rule; int rule;
sp1 = sp = ritem + sitems[i]; sp1 = sp = ritem + sitems[i];

View File

@@ -1637,9 +1637,9 @@ readgram (void)
grammar = p; grammar = p;
startval = axiom; startval = axiom;
if (nsyms > MAXSHORT) if (nsyms > SHRT_MAX)
fatal (_("too many symbols (tokens plus nonterminals); maximum %d"), fatal (_("too many symbols (tokens plus nonterminals); maximum %d"),
MAXSHORT); SHRT_MAX);
assert (nsyms == ntokens + nvars); assert (nsyms == ntokens + nvars);
} }
@@ -1741,11 +1741,7 @@ packgram (void)
int ruleno; int ruleno;
symbol_list *p; symbol_list *p;
/* We use short to index items. */ ritem = XCALLOC (item_number_t, nritems + 1);
if (nritems >= MAXSHORT)
fatal (_("too many items (max %d)"), MAXSHORT);
ritem = XCALLOC (short, nritems + 1);
rules = XCALLOC (rule_t, nrules) - 1; rules = XCALLOC (rule_t, nrules) - 1;
itemno = 0; itemno = 0;

View File

@@ -37,9 +37,6 @@
#include "getargs.h" #include "getargs.h"
#include "bitset.h" #include "bitset.h"
typedef short *rule;
/* Set of all nonterminals which are not useless. */ /* Set of all nonterminals which are not useless. */
static bitset N; static bitset N;
@@ -67,7 +64,7 @@ int nuseless_nonterminals;
static bool static bool
useful_production (int i, bitset N0) useful_production (int i, bitset N0)
{ {
rule r; item_number_t *r;
short n; short n;
/* A production is useful if all of the nonterminals in its appear /* A production is useful if all of the nonterminals in its appear
@@ -139,7 +136,7 @@ inaccessable_symbols (void)
bitset Vp, Vs, Pp; bitset Vp, Vs, Pp;
int i; int i;
short t; short t;
rule r; item_number_t *r;
/* Find out which productions are reachable and which symbols are /* Find out which productions are reachable and which symbols are
used. Starting with an empty set of productions and a set of used. Starting with an empty set of productions and a set of
@@ -252,7 +249,7 @@ reduce_grammar_tables (void)
/* Renumber the rules markers in RITEMS. */ /* Renumber the rules markers in RITEMS. */
for (i = 1; i < nrules + 1; ++i) for (i = 1; i < nrules + 1; ++i)
{ {
short *rhsp = rules[i].rhs; item_number_t *rhsp = rules[i].rhs;
for (/* Nothing. */; *rhsp >= 0; ++rhsp) for (/* Nothing. */; *rhsp >= 0; ++rhsp)
/* Nothing. */; /* Nothing. */;
*rhsp = -i; *rhsp = -i;
@@ -361,7 +358,7 @@ reduce_output (FILE *out)
fprintf (out, "%s\n\n", _("Useless rules:")); fprintf (out, "%s\n\n", _("Useless rules:"));
for (i = nrules + 1; i < nuseless_productions + nrules + 1; i++) for (i = nrules + 1; i < nuseless_productions + nrules + 1; i++)
{ {
rule r; item_number_t *r;
fprintf (out, "#%-4d ", rules[i].user_number - 1); fprintf (out, "#%-4d ", rules[i].user_number - 1);
fprintf (out, "%s:", quotearg_style (escape_quoting_style, fprintf (out, "%s:", quotearg_style (escape_quoting_style,
rules[i].lhs->tag)); rules[i].lhs->tag));
@@ -378,7 +375,7 @@ static void
dump_grammar (FILE *out) dump_grammar (FILE *out)
{ {
int i; int i;
rule r; item_number_t *r;
fprintf (out, "REDUCED GRAMMAR\n\n"); fprintf (out, "REDUCED GRAMMAR\n\n");
fprintf (out, fprintf (out,

View File

@@ -1,5 +1,5 @@
/* Type definitions for nondeterministic finite state machine for bison, /* Type definitions for nondeterministic finite state machine for bison,
Copyright 2001 Free Software Foundation, Inc. Copyright (C) 2001, 2002 Free Software Foundation, Inc.
This file is part of Bison, the GNU Compiler Compiler. This file is part of Bison, the GNU Compiler Compiler.
@@ -20,6 +20,7 @@
#include "system.h" #include "system.h"
#include "gram.h"
#include "state.h" #include "state.h"
/*---------------------------------. /*---------------------------------.

View File

@@ -186,11 +186,11 @@ typedef struct state_s
/* Its items. */ /* Its items. */
short nitems; short nitems;
short items[1]; item_number_t items[1];
} state_t; } state_t;
#define STATE_ALLOC(Nitems) \ #define STATE_ALLOC(Nitems) \
(state_t *) xcalloc ((unsigned) (sizeof (state_t) \ (state_t *) xcalloc ((unsigned) (sizeof (state_t) \
+ (Nitems - 1) * sizeof (short)), 1) + (Nitems - 1) * sizeof (item_number_t)), 1)
#endif /* !STATE_H_ */ #endif /* !STATE_H_ */

View File

@@ -53,7 +53,7 @@ struct symbol_s
short number; short number;
short prec; short prec;
associativity assoc; associativity assoc;
short user_token_number; int user_token_number;
/* Points to the other in the identifier-symbol pair for an /* Points to the other in the identifier-symbol pair for an
alias. Special value SALIAS in the identifier half of the alias. Special value SALIAS in the identifier half of the

View File

@@ -89,6 +89,9 @@ char *alloca ();
# endif # endif
#endif #endif
/* FIXME: Autoconfiscate. */
#include <limits.h>
# include "xalloc.h" # include "xalloc.h"
/* From xstrndup.c. */ /* From xstrndup.c. */
@@ -219,23 +222,6 @@ do { \
} while (0) } while (0)
/*---------------------------------.
| Machine-dependencies for Bison. |
`---------------------------------*/
#ifdef eta10
# define MAXSHORT 2147483647
# define MINSHORT -2147483648
#else
# define MAXSHORT 32767
# define MINSHORT -32768
#endif
#if defined (MSDOS) && !defined (__GO32__)
# define MAXTABLE 16383
#else
# define MAXTABLE 32767
#endif
/*-----------------------------------------. /*-----------------------------------------.
| Extensions to use for the output files. | | Extensions to use for the output files. |
@@ -269,13 +255,6 @@ do { \
/*----------------------------.
| As memcpy, but for shorts. |
`----------------------------*/
#define shortcpy(Dest, Src, Num) \
memcpy (Dest, Src, Num * sizeof (short))
/*---------------------. /*---------------------.
| Free a linked list. | | Free a linked list. |
`---------------------*/ `---------------------*/

View File

@@ -467,7 +467,7 @@ static const short yyprhs[] =
{ {
0, 0, 3, 5, 6, 9, 14 0, 0, 3, 5, 6, 9, 14
}; };
static const short yyrhs[] = static const yyrhs_t yyrhs[] =
{ {
8, 0, -1, 9, -1, -1, 10, 11, -1, 3, 8, 0, -1, 9, -1, -1, 10, 11, -1, 3,
4, 5, 8, -1, 6, 8, -1 4, 5, 8, -1, 6, 8, -1

View File

@@ -140,6 +140,108 @@ AT_CLEANUP
# AT_DATA_HORIZONTAL_GRAMMAR(FILE-NAME, SIZE)
# -------------------------------------------
# Create FILE-NAME, containing a self checking parser for a huge
# horizontal grammar.
# FIXME: The `10 *' below are there to avoid clashes with predefined
# tokens. These clashes should be exercised, I'm afraid something
# is broken wrt previous Bisons.
m4_define([AT_DATA_HORIZONTAL_GRAMMAR],
[AT_DATA([[gengram.pl]],
[[#! /usr/bin/perl -w
use strict;
my $max = $ARGV[0] || 10;
print <<EOF;
%{
#include <stdio.h>
#include <stdlib.h>
#include <assert.h>
#define YYERROR_VERBOSE 1
#define YYDEBUG 1
static int yylex (void);
static void yyerror (const char *msg);
%}
EOF
for my $size (1 .. $max)
{
print "%token \"$size\" ", $size * 10, "\n";
};
print <<EOF;
%%
EOF
use Text::Wrap;
print
wrap ("exp: ", " ",
(map { "\"$_\"" } (1 .. $max)), ";"),
"\n";
print <<EOF;
%%
static int
yylex (void)
{
static int counter = 1;
if (counter > $max)
return 0;
else
return counter++ * 10;
}
static void
yyerror (const char *msg)
{
fprintf (stderr, "%s\\n", msg);
}
int
main (void)
{
yydebug = !!getenv ("YYDEBUG");
return yyparse ();
}
EOF
]])
AT_CHECK([perl -w ./gengram.pl $2 || exit 77], 0, [stdout])
mv stdout $1
])
## ---------------- ##
## Big horizontal. ##
## ---------------- ##
AT_SETUP([Big horizontal])
# I have been able to go up to 10000 on my machine, but I had to
# increase the maximum stack size (* 100). It gave:
#
# input.y 263k
# input.tab.c 1.3M
# input 453k
#
# gengram.pl 10000 0.70s user 0.01s sys 99% cpu 0.711 total
# bison input.y 730.56s user 0.53s sys 99% cpu 12:12.34 total
# gcc -Wall input.tab.c -o input 5.81s user 0.20s sys 100% cpu 6.01 total
# ./input 0.00s user 0.01s sys 108% cpu 0.01 total
#
AT_DATA_HORIZONTAL_GRAMMAR([input.y], [1000])
AT_CHECK([bison input.y -v -o input.c])
AT_CHECK([$CC $CFLAGS $CPPFLAGS input.c -o input], 0, [], [ignore])
AT_CHECK([./input])
AT_CLEANUP
# AT_DATA_STACK_TORTURE(C-PROLOGUE) # AT_DATA_STACK_TORTURE(C-PROLOGUE)
# --------------------------------- # ---------------------------------
# A parser specialized in torturing the stack size. # A parser specialized in torturing the stack size.