mirror of
https://git.savannah.gnu.org/git/bison.git
synced 2026-03-10 04:43:03 +00:00
612 lines
16 KiB
C
612 lines
16 KiB
C
/* Generate the nondeterministic finite state machine for bison,
|
||
Copyright 1984, 1986, 1989, 2000, 2001 Free Software Foundation, Inc.
|
||
|
||
This file is part of Bison, the GNU Compiler Compiler.
|
||
|
||
Bison is free software; you can redistribute it and/or modify
|
||
it under the terms of the GNU General Public License as published by
|
||
the Free Software Foundation; either version 2, or (at your option)
|
||
any later version.
|
||
|
||
Bison is distributed in the hope that it will be useful,
|
||
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
GNU General Public License for more details.
|
||
|
||
You should have received a copy of the GNU General Public License
|
||
along with Bison; see the file COPYING. If not, write to
|
||
the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
||
Boston, MA 02111-1307, USA. */
|
||
|
||
|
||
/* See comments in state.h for the data structures that represent it.
|
||
The entry point is generate_states. */
|
||
|
||
#include "system.h"
|
||
#include "getargs.h"
|
||
#include "reader.h"
|
||
#include "gram.h"
|
||
#include "state.h"
|
||
#include "complain.h"
|
||
#include "closure.h"
|
||
#include "LR0.h"
|
||
#include "lalr.h"
|
||
#include "reduce.h"
|
||
|
||
int nstates;
|
||
int final_state;
|
||
static state_t *first_state = NULL;
|
||
|
||
static state_t *this_state = NULL;
|
||
static state_t *last_state = NULL;
|
||
|
||
static int nshifts;
|
||
static short *shift_symbol = NULL;
|
||
|
||
static short *redset = NULL;
|
||
static short *shiftset = NULL;
|
||
|
||
static short **kernel_base = NULL;
|
||
static int *kernel_size = NULL;
|
||
static short *kernel_items = NULL;
|
||
|
||
/* hash table for states, to recognize equivalent ones. */
|
||
|
||
#define STATE_HASH_SIZE 1009
|
||
static state_t **state_hash = NULL;
|
||
|
||
|
||
static void
|
||
allocate_itemsets (void)
|
||
{
|
||
int i;
|
||
|
||
/* Count the number of occurrences of all the symbols in RITEMS.
|
||
Note that useless productions (hence useless nonterminals) are
|
||
browsed too, hence we need to allocate room for _all_ the
|
||
symbols. */
|
||
int count = 0;
|
||
short *symbol_count = XCALLOC (short, nsyms + nuseless_nonterminals);
|
||
|
||
for (i = 0; ritem[i]; ++i)
|
||
if (ritem[i] > 0)
|
||
{
|
||
count++;
|
||
symbol_count[ritem[i]]++;
|
||
}
|
||
|
||
/* See comments before new_itemsets. All the vectors of items
|
||
live inside KERNEL_ITEMS. The number of active items after
|
||
some symbol cannot be more than the number of times that symbol
|
||
appears as an item, which is symbol_count[symbol].
|
||
We allocate that much space for each symbol. */
|
||
|
||
kernel_base = XCALLOC (short *, nsyms);
|
||
if (count)
|
||
kernel_items = XCALLOC (short, count);
|
||
|
||
count = 0;
|
||
for (i = 0; i < nsyms; i++)
|
||
{
|
||
kernel_base[i] = kernel_items + count;
|
||
count += symbol_count[i];
|
||
}
|
||
|
||
free (symbol_count);
|
||
kernel_size = XCALLOC (int, nsyms);
|
||
}
|
||
|
||
|
||
static void
|
||
allocate_storage (void)
|
||
{
|
||
allocate_itemsets ();
|
||
|
||
shiftset = XCALLOC (short, nsyms);
|
||
redset = XCALLOC (short, nrules + 1);
|
||
state_hash = XCALLOC (state_t *, STATE_HASH_SIZE);
|
||
}
|
||
|
||
|
||
static void
|
||
free_storage (void)
|
||
{
|
||
free (shift_symbol);
|
||
free (redset);
|
||
free (shiftset);
|
||
free (kernel_base);
|
||
free (kernel_size);
|
||
XFREE (kernel_items);
|
||
free (state_hash);
|
||
}
|
||
|
||
|
||
|
||
|
||
/*----------------------------------------------------------------.
|
||
| Find which symbols can be shifted in the current state, and for |
|
||
| each one record which items would be active after that shift. |
|
||
| Uses the contents of itemset. |
|
||
| |
|
||
| shift_symbol is set to a vector of the symbols that can be |
|
||
| shifted. For each symbol in the grammar, kernel_base[symbol] |
|
||
| points to a vector of item numbers activated if that symbol is |
|
||
| shifted, and kernel_size[symbol] is their numbers. |
|
||
`----------------------------------------------------------------*/
|
||
|
||
static void
|
||
new_itemsets (void)
|
||
{
|
||
int i;
|
||
|
||
if (trace_flag)
|
||
fprintf (stderr, "Entering new_itemsets, state = %d\n",
|
||
this_state->number);
|
||
|
||
for (i = 0; i < nsyms; i++)
|
||
kernel_size[i] = 0;
|
||
|
||
shift_symbol = XCALLOC (short, nsyms);
|
||
nshifts = 0;
|
||
|
||
for (i = 0; i < nitemset; ++i)
|
||
{
|
||
int symbol = ritem[itemset[i]];
|
||
if (symbol > 0)
|
||
{
|
||
if (!kernel_size[symbol])
|
||
{
|
||
shift_symbol[nshifts] = symbol;
|
||
nshifts++;
|
||
}
|
||
|
||
kernel_base[symbol][kernel_size[symbol]] = itemset[i] + 1;
|
||
kernel_size[symbol]++;
|
||
}
|
||
}
|
||
}
|
||
|
||
|
||
|
||
/*-----------------------------------------------------------------.
|
||
| Subroutine of get_state. Create a new state for those items, if |
|
||
| necessary. |
|
||
`-----------------------------------------------------------------*/
|
||
|
||
static state_t *
|
||
new_state (int symbol)
|
||
{
|
||
state_t *p;
|
||
|
||
if (trace_flag)
|
||
fprintf (stderr, "Entering new_state, state = %d, symbol = %d (%s)\n",
|
||
this_state->number, symbol, tags[symbol]);
|
||
|
||
if (nstates >= MAXSHORT)
|
||
fatal (_("too many states (max %d)"), MAXSHORT);
|
||
|
||
p = STATE_ALLOC (kernel_size[symbol]);
|
||
p->accessing_symbol = symbol;
|
||
p->number = nstates;
|
||
p->nitems = kernel_size[symbol];
|
||
|
||
shortcpy (p->items, kernel_base[symbol], kernel_size[symbol]);
|
||
|
||
last_state->next = p;
|
||
last_state = p;
|
||
nstates++;
|
||
|
||
return p;
|
||
}
|
||
|
||
|
||
/*--------------------------------------------------------------.
|
||
| Find the state number for the state we would get to (from the |
|
||
| current state) by shifting symbol. Create a new state if no |
|
||
| equivalent one exists already. Used by append_states. |
|
||
`--------------------------------------------------------------*/
|
||
|
||
static int
|
||
get_state (int symbol)
|
||
{
|
||
int key;
|
||
int i;
|
||
state_t *sp;
|
||
|
||
if (trace_flag)
|
||
fprintf (stderr, "Entering get_state, state = %d, symbol = %d (%s)\n",
|
||
this_state->number, symbol, tags[symbol]);
|
||
|
||
/* Add up the target state's active item numbers to get a hash key.
|
||
*/
|
||
key = 0;
|
||
for (i = 0; i < kernel_size[symbol]; ++i)
|
||
key += kernel_base[symbol][i];
|
||
key = key % STATE_HASH_SIZE;
|
||
sp = state_hash[key];
|
||
|
||
if (sp)
|
||
{
|
||
int found = 0;
|
||
while (!found)
|
||
{
|
||
if (sp->nitems == kernel_size[symbol])
|
||
{
|
||
found = 1;
|
||
for (i = 0; i < kernel_size[symbol]; ++i)
|
||
if (kernel_base[symbol][i] != sp->items[i])
|
||
found = 0;
|
||
}
|
||
|
||
if (!found)
|
||
{
|
||
if (sp->link)
|
||
{
|
||
sp = sp->link;
|
||
}
|
||
else /* bucket exhausted and no match */
|
||
{
|
||
sp = sp->link = new_state (symbol);
|
||
found = 1;
|
||
}
|
||
}
|
||
}
|
||
}
|
||
else /* bucket is empty */
|
||
{
|
||
state_hash[key] = sp = new_state (symbol);
|
||
}
|
||
|
||
if (trace_flag)
|
||
fprintf (stderr, "Exiting get_state => %d\n", sp->number);
|
||
|
||
return sp->number;
|
||
}
|
||
|
||
/*------------------------------------------------------------------.
|
||
| Use the information computed by new_itemsets to find the state |
|
||
| numbers reached by each shift transition from the current state. |
|
||
| |
|
||
| shiftset is set up as a vector of state numbers of those states. |
|
||
`------------------------------------------------------------------*/
|
||
|
||
static void
|
||
append_states (void)
|
||
{
|
||
int i;
|
||
int j;
|
||
int symbol;
|
||
|
||
if (trace_flag)
|
||
fprintf (stderr, "Entering append_states, state = %d\n",
|
||
this_state->number);
|
||
|
||
/* first sort shift_symbol into increasing order */
|
||
|
||
for (i = 1; i < nshifts; i++)
|
||
{
|
||
symbol = shift_symbol[i];
|
||
j = i;
|
||
while (j > 0 && shift_symbol[j - 1] > symbol)
|
||
{
|
||
shift_symbol[j] = shift_symbol[j - 1];
|
||
j--;
|
||
}
|
||
shift_symbol[j] = symbol;
|
||
}
|
||
|
||
for (i = 0; i < nshifts; i++)
|
||
shiftset[i] = get_state (shift_symbol[i]);
|
||
}
|
||
|
||
|
||
static void
|
||
new_states (void)
|
||
{
|
||
first_state = last_state = this_state = STATE_ALLOC (0);
|
||
nstates = 1;
|
||
}
|
||
|
||
|
||
/*------------------------------------------------------------.
|
||
| Save the NSHIFTS of SHIFTSET into the current linked list. |
|
||
`------------------------------------------------------------*/
|
||
|
||
static void
|
||
save_shifts (void)
|
||
{
|
||
shifts *p = shifts_new (nshifts);
|
||
shortcpy (p->shifts, shiftset, nshifts);
|
||
this_state->shifts = p;
|
||
}
|
||
|
||
|
||
/*------------------------------------------------------------------.
|
||
| Subroutine of augment_automaton. Create the next-to-final state, |
|
||
| to which a shift has already been made in the initial state. |
|
||
| |
|
||
| The task of this state consists in shifting (actually, it's a |
|
||
| goto, but shifts and gotos are both stored in SHIFTS) the start |
|
||
| symbols, hence the name. |
|
||
`------------------------------------------------------------------*/
|
||
|
||
static void
|
||
insert_start_shifting_state (void)
|
||
{
|
||
state_t *statep;
|
||
shifts *sp;
|
||
|
||
statep = STATE_ALLOC (0);
|
||
statep->number = nstates++;
|
||
|
||
/* The distinctive feature of this state from the
|
||
eof_shifting_state, is that it is labeled as post-start-symbol
|
||
shifting. I fail to understand why this state, and the
|
||
post-start-start can't be merged into one. But it does fail if
|
||
you try. --akim */
|
||
statep->accessing_symbol = start_symbol;
|
||
|
||
last_state->next = statep;
|
||
last_state = statep;
|
||
|
||
/* Make a shift from this state to (what will be) the final state. */
|
||
sp = shifts_new (1);
|
||
statep->shifts = sp;
|
||
sp->shifts[0] = nstates;
|
||
}
|
||
|
||
|
||
/*-----------------------------------------------------------------.
|
||
| Subroutine of augment_automaton. Create the final state, which |
|
||
| shifts `0', the end of file. The initial state shifts the start |
|
||
| symbol, and goes to here. |
|
||
`-----------------------------------------------------------------*/
|
||
|
||
static void
|
||
insert_eof_shifting_state (void)
|
||
{
|
||
state_t *statep;
|
||
shifts *sp;
|
||
|
||
/* Make the final state--the one that follows a shift from the
|
||
next-to-final state.
|
||
The symbol for that shift is 0 (end-of-file). */
|
||
statep = STATE_ALLOC (0);
|
||
statep->number = nstates++;
|
||
|
||
last_state->next = statep;
|
||
last_state = statep;
|
||
|
||
/* Make the shift from the final state to the termination state. */
|
||
sp = shifts_new (1);
|
||
statep->shifts = sp;
|
||
sp->shifts[0] = nstates;
|
||
}
|
||
|
||
|
||
/*---------------------------------------------------------------.
|
||
| Subroutine of augment_automaton. Create the accepting state. |
|
||
`---------------------------------------------------------------*/
|
||
|
||
static void
|
||
insert_accepting_state (void)
|
||
{
|
||
state_t *statep;
|
||
|
||
/* Note that the variable `final_state' refers to what we sometimes
|
||
call the termination state. */
|
||
final_state = nstates;
|
||
|
||
/* Make the termination state. */
|
||
statep = STATE_ALLOC (0);
|
||
statep->number = nstates++;
|
||
last_state->next = statep;
|
||
last_state = statep;
|
||
}
|
||
|
||
|
||
|
||
|
||
|
||
/*------------------------------------------------------------------.
|
||
| Make sure that the initial state has a shift that accepts the |
|
||
| grammar's start symbol and goes to the next-to-final state, which |
|
||
| has a shift going to the final state, which has a shift to the |
|
||
| termination state. Create such states and shifts if they don't |
|
||
| happen to exist already. |
|
||
`------------------------------------------------------------------*/
|
||
|
||
static void
|
||
augment_automaton (void)
|
||
{
|
||
if (!first_state->shifts->nshifts)
|
||
{
|
||
/* The first state has no shifts. Make one shift, from the
|
||
initial state to the next-to-final state. */
|
||
|
||
shifts *sp = shifts_new (1);
|
||
first_state->shifts = sp;
|
||
sp->shifts[0] = nstates;
|
||
|
||
/* Create the next-to-final state, with shift to
|
||
what will be the final state. */
|
||
insert_start_shifting_state ();
|
||
}
|
||
else
|
||
{
|
||
state_t *statep = first_state->next;
|
||
/* The states reached by shifts from FIRST_STATE are numbered
|
||
1..(SP->NSHIFTS). Look for one reached by START_SYMBOL.
|
||
This is typical of `start: start ... ;': there is a state
|
||
with the item `start: start . ...'. We want to add a `shift
|
||
on EOF to eof-shifting state here. */
|
||
while (statep->accessing_symbol != start_symbol
|
||
&& statep->number < first_state->shifts->nshifts)
|
||
statep = statep->next;
|
||
|
||
if (statep->accessing_symbol == start_symbol)
|
||
{
|
||
/* We already have STATEP, a next-to-final state for `start:
|
||
start . ...'. Make sure it has a shift to what will be
|
||
the final state. */
|
||
int i;
|
||
|
||
/* Find the shift of the inital state that leads to STATEP. */
|
||
shifts *sp = statep->shifts;
|
||
|
||
shifts *sp1 = shifts_new (sp->nshifts + 1);
|
||
statep->shifts = sp1;
|
||
sp1->shifts[0] = nstates;
|
||
for (i = sp->nshifts; i > 0; i--)
|
||
sp1->shifts[i] = sp->shifts[i - 1];
|
||
|
||
XFREE (sp);
|
||
|
||
insert_eof_shifting_state ();
|
||
}
|
||
else
|
||
{
|
||
/* There is no state for `start: start . ...'. */
|
||
int i, k;
|
||
shifts *sp = first_state->shifts;
|
||
shifts *sp1 = NULL;
|
||
|
||
/* Add one more shift to the initial state, going to the
|
||
next-to-final state (yet to be made). */
|
||
sp1 = shifts_new (sp->nshifts + 1);
|
||
first_state->shifts = sp1;
|
||
/* Stick this shift into the vector at the proper place. */
|
||
statep = first_state->next;
|
||
for (k = 0, i = 0; i < sp->nshifts; k++, i++)
|
||
{
|
||
if (statep->accessing_symbol > start_symbol && i == k)
|
||
sp1->shifts[k++] = nstates;
|
||
sp1->shifts[k] = sp->shifts[i];
|
||
statep = statep->next;
|
||
}
|
||
if (i == k)
|
||
sp1->shifts[k++] = nstates;
|
||
|
||
XFREE (sp);
|
||
|
||
/* Create the next-to-final state, with shift to what will
|
||
be the final state. Corresponds to `start: start . ...'. */
|
||
insert_start_shifting_state ();
|
||
}
|
||
}
|
||
|
||
insert_accepting_state ();
|
||
}
|
||
|
||
|
||
/*----------------------------------------------------------------.
|
||
| Find which rules can be used for reduction transitions from the |
|
||
| current state and make a reductions structure for the state to |
|
||
| record their rule numbers. |
|
||
`----------------------------------------------------------------*/
|
||
|
||
static void
|
||
save_reductions (void)
|
||
{
|
||
int count;
|
||
int i;
|
||
|
||
/* Find and count the active items that represent ends of rules. */
|
||
|
||
count = 0;
|
||
for (i = 0; i < nitemset; ++i)
|
||
{
|
||
int item = ritem[itemset[i]];
|
||
if (item < 0)
|
||
redset[count++] = -item;
|
||
}
|
||
|
||
/* Make a reductions structure and copy the data into it. */
|
||
|
||
if (count)
|
||
{
|
||
reductions *p = REDUCTIONS_ALLOC (count);
|
||
p->nreds = count;
|
||
shortcpy (p->rules, redset, count);
|
||
|
||
this_state->reductions = p;
|
||
}
|
||
}
|
||
|
||
|
||
/*--------------------.
|
||
| Build STATE_TABLE. |
|
||
`--------------------*/
|
||
|
||
static void
|
||
set_state_table (void)
|
||
{
|
||
/* NSTATES + 1 because lookahead for the pseudo state number NSTATES
|
||
might be used (see conflicts.c). It is too opaque for me to
|
||
provide a probably less hacky implementation. --akim */
|
||
state_table = XCALLOC (state_t *, nstates + 1);
|
||
|
||
{
|
||
state_t *sp;
|
||
for (sp = first_state; sp; sp = sp->next)
|
||
state_table[sp->number] = sp;
|
||
}
|
||
|
||
/* Pessimization, but simplification of the code: make sure all the
|
||
states have a shifts, even if reduced to 0 shifts. */
|
||
{
|
||
int i;
|
||
for (i = 0; i < nstates; i++)
|
||
if (!state_table[i]->shifts)
|
||
state_table[i]->shifts = shifts_new (0);
|
||
}
|
||
}
|
||
|
||
/*-------------------------------------------------------------------.
|
||
| Compute the nondeterministic finite state machine (see state.h for |
|
||
| details) from the grammar. |
|
||
`-------------------------------------------------------------------*/
|
||
|
||
void
|
||
generate_states (void)
|
||
{
|
||
allocate_storage ();
|
||
new_closure (nitems);
|
||
new_states ();
|
||
|
||
while (this_state)
|
||
{
|
||
if (trace_flag)
|
||
fprintf (stderr, "Processing state %d (reached by %s)\n",
|
||
this_state->number, tags[this_state->accessing_symbol]);
|
||
/* Set up ruleset and itemset for the transitions out of this
|
||
state. ruleset gets a 1 bit for each rule that could reduce
|
||
now. itemset gets a vector of all the items that could be
|
||
accepted next. */
|
||
closure (this_state->items, this_state->nitems);
|
||
/* record the reductions allowed out of this state */
|
||
save_reductions ();
|
||
/* find the itemsets of the states that shifts can reach */
|
||
new_itemsets ();
|
||
/* find or create the core structures for those states */
|
||
append_states ();
|
||
|
||
/* create the shifts structures for the shifts to those states,
|
||
now that the state numbers transitioning to are known */
|
||
save_shifts ();
|
||
|
||
/* states are queued when they are created; process them all */
|
||
this_state = this_state->next;
|
||
}
|
||
|
||
/* discard various storage */
|
||
free_closure ();
|
||
free_storage ();
|
||
|
||
/* set up initial and final states as parser wants them */
|
||
augment_automaton ();
|
||
|
||
/* Set up STATE_TABLE. */
|
||
set_state_table ();
|
||
}
|