123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745 |
- /* Compute look-ahead criteria for bison,
- Copyright (C) 1984, 1986 Bob Corbett and Free Software Foundation, Inc.
- BISON is distributed in the hope that it will be useful, but WITHOUT ANY
- WARRANTY. No author or distributor accepts responsibility to anyone
- for the consequences of using it or for whether it serves any
- particular purpose or works at all, unless he says so in writing.
- Refer to the BISON General Public License for full details.
- Everyone is granted permission to copy, modify and redistribute BISON,
- but only under the conditions described in the BISON General Public
- License. A copy of this license is supposed to have been given to you
- along with BISON so you can know your rights and responsibilities. It
- should be in a file named COPYING. Among other things, the copyright
- notice and this notice must be preserved on all copies.
- In other words, you are welcome to use, share and improve this program.
- You are forbidden to forbid anyone else to use, share and improve
- what you give them. Help stamp out software-hoarding! */
- /* Compute how to make the finite state machine deterministic;
- find which rules need lookahead in each state, and which lookahead tokens they accept.
- lalr(), the entry point, builds these data structures:
- goto_map, from_state and to_state
- record each shift transition which accepts a variable (a nonterminal).
- ngotos is the number of such transitions.
- from_state[t] is the state number which a transition leads from
- and to_state[t] is the state number it leads to.
- All the transitions that accept a particular variable are grouped together and
- goto_map[i - ntokens] is the index in from_state and to_state of the first of them.
- consistent[s] is nonzero if no lookahead is needed to decide what to do in state s.
- LAruleno is a vector which records the rules that need lookahead in various states.
- The elements of LAruleno that apply to state s are those from
- lookaheads[s] through lookaheads[s+1]-1.
- Each element of LAruleno is a rule number.
- If lr is the length of LAruleno, then a number from 0 to lr-1
- can specify both a rule and a state where the rule might be applied.
- LA is a lr by ntokens matrix of bits.
- LA[l, i] is 1 if the rule LAruleno[l] is applicable in the appropriate state
- when the next token is symbol i.
- If LA[l, i] and LA[l, j] are both 1 for i != j, it is a conflict.
- */
- #include <stdio.h>
- #include "machine.h"
- #include "types.h"
- #include "state.h"
- #include "new.h"
- #include "gram.h"
- extern short **derives;
- extern char *nullable;
- int tokensetsize;
- short *lookaheads;
- short *LAruleno;
- unsigned *LA;
- short *accessing_symbol;
- char *consistent;
- core **state_table;
- shifts **shift_table;
- reductions **reduction_table;
- short *goto_map;
- short *from_state;
- short *to_state;
- short **transpose();
- static int infinity;
- static int maxrhs;
- static int ngotos;
- static unsigned *F;
- static short **includes;
- static shorts **lookback;
- static short **R;
- static short *INDEX;
- static short *VERTICES;
- static int top;
- lalr()
- {
- tokensetsize = WORDSIZE(ntokens);
- set_state_table();
- set_accessing_symbol();
- set_shift_table();
- set_reduction_table();
- set_maxrhs();
- initialize_LA();
- set_goto_map();
- initialize_F();
- build_relations();
- compute_FOLLOWS();
- compute_lookaheads();
- }
- set_state_table()
- {
- register core *sp;
- state_table = NEW2(nstates, core *);
- for (sp = first_state; sp; sp = sp->next)
- state_table[sp->number] = sp;
- }
- set_accessing_symbol()
- {
- register core *sp;
- accessing_symbol = NEW2(nstates, short);
- for (sp = first_state; sp; sp = sp->next)
- accessing_symbol[sp->number] = sp->accessing_symbol;
- }
- set_shift_table()
- {
- register shifts *sp;
- shift_table = NEW2(nstates, shifts *);
- for (sp = first_shift; sp; sp = sp->next)
- shift_table[sp->number] = sp;
- }
- set_reduction_table()
- {
- register reductions *rp;
- reduction_table = NEW2(nstates, reductions *);
- for (rp = first_reduction; rp; rp = rp->next)
- reduction_table[rp->number] = rp;
- }
- set_maxrhs()
- {
- register short *itemp;
- register int length;
- register int max;
- length = 0;
- max = 0;
- for (itemp = ritem; *itemp; itemp++)
- {
- if (*itemp > 0)
- {
- length++;
- }
- else
- {
- if (length > max) max = length;
- length = 0;
- }
- }
- maxrhs = max;
- }
- initialize_LA()
- {
- register int i;
- register int j;
- register int count;
- register reductions *rp;
- register shifts *sp;
- register short *np;
- consistent = NEW2(nstates, char);
- lookaheads = NEW2(nstates + 1, short);
- count = 0;
- for (i = 0; i < nstates; i++)
- {
- register int j;
- lookaheads[i] = count;
- rp = reduction_table[i];
- sp = shift_table[i];
- if (rp && (rp->nreds > 1
- || (sp && ! ISVAR(accessing_symbol[sp->shifts[0]]))))
- count += rp->nreds;
- else
- consistent[i] = 1;
- if (sp)
- for (j = 0; j < sp->nshifts; j++)
- {
- if (accessing_symbol[sp->shifts[j]] == error_token_number)
- {
- consistent[i] = 0;
- break;
- }
- }
- }
- lookaheads[nstates] = count;
- LA = NEW2(count * tokensetsize, unsigned);
- LAruleno = NEW2(count, short);
- lookback = NEW2(count, shorts *);
- np = LAruleno;
- for (i = 0; i < nstates; i++)
- {
- if (!consistent[i])
- {
- if (rp = reduction_table[i])
- for (j = 0; j < rp->nreds; j++)
- *np++ = rp->rules[j];
- }
- }
- }
- set_goto_map()
- {
- register shifts *sp;
- register int i;
- register int symbol;
- register int k;
- register short *temp_map;
- register int state2;
- register int state1;
- goto_map = NEW2(nvars + 1, short) - ntokens;
- temp_map = NEW2(nvars + 1, short) - ntokens;
- ngotos = 0;
- for (sp = first_shift; sp; sp = sp->next)
- {
- for (i = sp->nshifts - 1; i >= 0; i--)
- {
- symbol = accessing_symbol[sp->shifts[i]];
- if (ISTOKEN(symbol)) break;
- if (ngotos == MAXSHORT)
- toomany("gotos");
- ngotos++;
- goto_map[symbol]++;
- }
- }
- k = 0;
- for (i = ntokens; i < nsyms; i++)
- {
- temp_map[i] = k;
- k += goto_map[i];
- }
- for (i = ntokens; i < nsyms; i++)
- goto_map[i] = temp_map[i];
- goto_map[nsyms] = ngotos;
- temp_map[nsyms] = ngotos;
- from_state = NEW2(ngotos, short);
- to_state = NEW2(ngotos, short);
- for (sp = first_shift; sp; sp = sp->next)
- {
- state1 = sp->number;
- for (i = sp->nshifts - 1; i >= 0; i--)
- {
- state2 = sp->shifts[i];
- symbol = accessing_symbol[state2];
- if (ISTOKEN(symbol)) break;
- k = temp_map[symbol]++;
- from_state[k] = state1;
- to_state[k] = state2;
- }
- }
- FREE(temp_map + ntokens);
- }
- /* Map_goto maps a state/symbol pair into its numeric representation. */
- int
- map_goto(state, symbol)
- int state;
- int symbol;
- {
- register int high;
- register int low;
- register int middle;
- register int s;
- low = goto_map[symbol];
- high = goto_map[symbol + 1];
- while (low <= high)
- {
- middle = (low + high) / 2;
- s = from_state[middle];
- if (s == state)
- return (middle);
- else if (s < state)
- low = middle + 1;
- else
- high = middle - 1;
- }
- berror("map_goto");
- /* NOTREACHED */
- }
- initialize_F()
- {
- register int i;
- register int j;
- register int k;
- register shifts *sp;
- register short *edge;
- register unsigned *rowp;
- register short *rp;
- register short **reads;
- register int nedges;
- register int stateno;
- register int symbol;
- register int nwords;
- nwords = ngotos * tokensetsize;
- F = NEW2(nwords, unsigned);
- reads = NEW2(ngotos, short *);
- edge = NEW2(ngotos + 1, short);
- nedges = 0;
- rowp = F;
- for (i = 0; i < ngotos; i++)
- {
- stateno = to_state[i];
- sp = shift_table[stateno];
- if (sp)
- {
- k = sp->nshifts;
- for (j = 0; j < k; j++)
- {
- symbol = accessing_symbol[sp->shifts[j]];
- if (ISVAR(symbol))
- break;
- SETBIT(rowp, symbol);
- }
- for (; j < k; j++)
- {
- symbol = accessing_symbol[sp->shifts[j]];
- if (nullable[symbol])
- edge[nedges++] = map_goto(stateno, symbol);
- }
-
- if (nedges)
- {
- reads[i] = rp = NEW2(nedges + 1, short);
- for (j = 0; j < nedges; j++)
- rp[j] = edge[j];
- rp[nedges] = -1;
- nedges = 0;
- }
- }
- rowp += tokensetsize;
- }
- digraph(reads);
- for (i = 0; i < ngotos; i++)
- {
- if (reads[i])
- FREE(reads[i]);
- }
- FREE(reads);
- FREE(edge);
- }
- build_relations()
- {
- register int i;
- register int j;
- register int k;
- register short *rulep;
- register short *rp;
- register shifts *sp;
- register int length;
- register int nedges;
- register int done;
- register int state1;
- register int stateno;
- register int symbol1;
- register int symbol2;
- register short *shortp;
- register short *edge;
- register short *states;
- register short **new_includes;
- includes = NEW2(ngotos, short *);
- edge = NEW2(ngotos + 1, short);
- states = NEW2(maxrhs + 1, short);
- for (i = 0; i < ngotos; i++)
- {
- nedges = 0;
- state1 = from_state[i];
- symbol1 = accessing_symbol[to_state[i]];
- for (rulep = derives[symbol1]; *rulep > 0; rulep++)
- {
- length = 1;
- states[0] = state1;
- stateno = state1;
- for (rp = ritem + rrhs[*rulep]; *rp > 0; rp++)
- {
- symbol2 = *rp;
- sp = shift_table[stateno];
- k = sp->nshifts;
- for (j = 0; j < k; j++)
- {
- stateno = sp->shifts[j];
- if (accessing_symbol[stateno] == symbol2) break;
- }
- states[length++] = stateno;
- }
- if (!consistent[stateno])
- add_lookback_edge(stateno, *rulep, i);
- length--;
- done = 0;
- while (!done)
- {
- done = 1;
- rp--;
- /* JF added rp>=ritem && I hope to god its right! */
- if (rp>=ritem && ISVAR(*rp))
- {
- stateno = states[--length];
- edge[nedges++] = map_goto(stateno, *rp);
- if (nullable[*rp]) done = 0;
- }
- }
- }
- if (nedges)
- {
- includes[i] = shortp = NEW2(nedges + 1, short);
- for (j = 0; j < nedges; j++)
- shortp[j] = edge[j];
- shortp[nedges] = -1;
- }
- }
- new_includes = transpose(includes, ngotos);
- for (i = 0; i < ngotos; i++)
- if (includes[i])
- FREE(includes[i]);
- FREE(includes);
- includes = new_includes;
- FREE(edge);
- FREE(states);
- }
- add_lookback_edge(stateno, ruleno, gotono)
- int stateno;
- int ruleno;
- int gotono;
- {
- register int i;
- register int k;
- register int found;
- register shorts *sp;
- i = lookaheads[stateno];
- k = lookaheads[stateno + 1];
- found = 0;
- while (!found && i < k)
- {
- if (LAruleno[i] == ruleno)
- found = 1;
- else
- i++;
- }
- if (found == 0)
- berror("add_lookback_edge");
- sp = NEW(shorts);
- sp->next = lookback[i];
- sp->value = gotono;
- lookback[i] = sp;
- }
- short **
- transpose(R, n)
- short **R;
- int n;
- {
- register short **new_R;
- register short **temp_R;
- register short *nedges;
- register short *sp;
- register int i;
- register int k;
- nedges = NEW2(n, short);
- for (i = 0; i < n; i++)
- {
- sp = R[i];
- if (sp)
- {
- while (*sp >= 0)
- nedges[*sp++]++;
- }
- }
- new_R = NEW2(n, short *);
- temp_R = NEW2(n, short *);
- for (i = 0; i < n; i++)
- {
- k = nedges[i];
- if (k > 0)
- {
- sp = NEW2(k + 1, short);
- new_R[i] = sp;
- temp_R[i] = sp;
- sp[k] = -1;
- }
- }
- FREE(nedges);
- for (i = 0; i < n; i++)
- {
- sp = R[i];
- if (sp)
- {
- while (*sp >= 0)
- *temp_R[*sp++]++ = i;
- }
- }
- FREE(temp_R);
- return (new_R);
- }
- compute_FOLLOWS()
- {
- register int i;
- digraph(includes);
- for (i = 0; i < ngotos; i++)
- {
- if (includes[i]) FREE(includes[i]);
- }
- FREE(includes);
- }
- compute_lookaheads()
- {
- register int i;
- register int n;
- register unsigned *fp1;
- register unsigned *fp2;
- register unsigned *fp3;
- register shorts *sp;
- register unsigned *rowp;
- /* register short *rulep; JF unused */
- /* register int count; JF unused */
- register shorts *sptmp;/* JF */
- rowp = LA;
- n = lookaheads[nstates];
- for (i = 0; i < n; i++)
- {
- fp3 = rowp + tokensetsize;
- for (sp = lookback[i]; sp; sp = sp->next)
- {
- fp1 = rowp;
- fp2 = F + tokensetsize * sp->value;
- while (fp1 < fp3)
- *fp1++ |= *fp2++;
- }
- rowp = fp3;
- }
- for (i = 0; i < n; i++)
- {/* JF removed ref to freed storage */
- for (sp = lookback[i]; sp; sp = sptmp) {
- sptmp=sp->next;
- FREE(sp);
- }
- }
- FREE(lookback);
- FREE(F);
- }
- digraph(relation)
- short **relation;
- {
- register int i;
- infinity = ngotos + 2;
- INDEX = NEW2(ngotos + 1, short);
- VERTICES = NEW2(ngotos + 1, short);
- top = 0;
- R = relation;
- for (i = 0; i < ngotos; i++)
- INDEX[i] = 0;
- for (i = 0; i < ngotos; i++)
- {
- if (INDEX[i] == 0 && R[i])
- traverse(i);
- }
- FREE(INDEX);
- FREE(VERTICES);
- }
- traverse(i)
- register int i;
- {
- register unsigned *fp1;
- register unsigned *fp2;
- register unsigned *fp3;
- register int j;
- register short *rp;
- int height;
- unsigned *base;
- VERTICES[++top] = i;
- INDEX[i] = height = top;
- base = F + i * tokensetsize;
- fp3 = base + tokensetsize;
- rp = R[i];
- if (rp)
- {
- while ((j = *rp++) >= 0)
- {
- if (INDEX[j] == 0)
- traverse(j);
- if (INDEX[i] > INDEX[j])
- INDEX[i] = INDEX[j];
- fp1 = base;
- fp2 = F + j * tokensetsize;
- while (fp1 < fp3)
- *fp1++ |= *fp2++;
- }
- }
- if (INDEX[i] == height)
- {
- for (;;)
- {
- j = VERTICES[top--];
- INDEX[j] = infinity;
- if (i == j)
- break;
- fp1 = base;
- fp2 = F + j * tokensetsize;
- while (fp1 < fp3)
- *fp2++ = *fp1++;
- }
- }
- }
|