| /*********************************************************** |
| Copyright 1991-1995 by Stichting Mathematisch Centrum, Amsterdam, |
| The Netherlands. |
| |
| All Rights Reserved |
| |
| Permission to use, copy, modify, and distribute this software and its |
| documentation for any purpose and without fee is hereby granted, |
| provided that the above copyright notice appear in all copies and that |
| both that copyright notice and this permission notice appear in |
| supporting documentation, and that the names of Stichting Mathematisch |
| Centrum or CWI or Corporation for National Research Initiatives or |
| CNRI not be used in advertising or publicity pertaining to |
| distribution of the software without specific, written prior |
| permission. |
| |
| While CWI is the initial source for this software, a modified version |
| is made available by the Corporation for National Research Initiatives |
| (CNRI) at the Internet address ftp://ftp.python.org. |
| |
| STICHTING MATHEMATISCH CENTRUM AND CNRI DISCLAIM ALL WARRANTIES WITH |
| REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF |
| MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL STICHTING MATHEMATISCH |
| CENTRUM OR CNRI BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL |
| DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR |
| PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER |
| TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR |
| PERFORMANCE OF THIS SOFTWARE. |
| |
| ******************************************************************/ |
| |
| /* Grammar implementation */ |
| |
| #include "pgenheaders.h" |
| |
| #include <ctype.h> |
| |
| #include "assert.h" |
| #include "token.h" |
| #include "grammar.h" |
| |
| extern int Py_DebugFlag; |
| |
| grammar * |
| newgrammar(start) |
| int start; |
| { |
| grammar *g; |
| |
| g = PyMem_NEW(grammar, 1); |
| if (g == NULL) |
| Py_FatalError("no mem for new grammar"); |
| g->g_ndfas = 0; |
| g->g_dfa = NULL; |
| g->g_start = start; |
| g->g_ll.ll_nlabels = 0; |
| g->g_ll.ll_label = NULL; |
| g->g_accel = 0; |
| return g; |
| } |
| |
| dfa * |
| adddfa(g, type, name) |
| grammar *g; |
| int type; |
| char *name; |
| { |
| dfa *d; |
| |
| PyMem_RESIZE(g->g_dfa, dfa, g->g_ndfas + 1); |
| if (g->g_dfa == NULL) |
| Py_FatalError("no mem to resize dfa in adddfa"); |
| d = &g->g_dfa[g->g_ndfas++]; |
| d->d_type = type; |
| d->d_name = name; |
| d->d_nstates = 0; |
| d->d_state = NULL; |
| d->d_initial = -1; |
| d->d_first = NULL; |
| return d; /* Only use while fresh! */ |
| } |
| |
| int |
| addstate(d) |
| dfa *d; |
| { |
| state *s; |
| |
| PyMem_RESIZE(d->d_state, state, d->d_nstates + 1); |
| if (d->d_state == NULL) |
| Py_FatalError("no mem to resize state in addstate"); |
| s = &d->d_state[d->d_nstates++]; |
| s->s_narcs = 0; |
| s->s_arc = NULL; |
| s->s_lower = 0; |
| s->s_upper = 0; |
| s->s_accel = NULL; |
| s->s_accept = 0; |
| return s - d->d_state; |
| } |
| |
| void |
| addarc(d, from, to, lbl) |
| dfa *d; |
| int lbl; |
| { |
| state *s; |
| arc *a; |
| |
| assert(0 <= from && from < d->d_nstates); |
| assert(0 <= to && to < d->d_nstates); |
| |
| s = &d->d_state[from]; |
| PyMem_RESIZE(s->s_arc, arc, s->s_narcs + 1); |
| if (s->s_arc == NULL) |
| Py_FatalError("no mem to resize arc list in addarc"); |
| a = &s->s_arc[s->s_narcs++]; |
| a->a_lbl = lbl; |
| a->a_arrow = to; |
| } |
| |
| int |
| addlabel(ll, type, str) |
| labellist *ll; |
| int type; |
| char *str; |
| { |
| int i; |
| label *lb; |
| |
| for (i = 0; i < ll->ll_nlabels; i++) { |
| if (ll->ll_label[i].lb_type == type && |
| strcmp(ll->ll_label[i].lb_str, str) == 0) |
| return i; |
| } |
| PyMem_RESIZE(ll->ll_label, label, ll->ll_nlabels + 1); |
| if (ll->ll_label == NULL) |
| Py_FatalError("no mem to resize labellist in addlabel"); |
| lb = &ll->ll_label[ll->ll_nlabels++]; |
| lb->lb_type = type; |
| lb->lb_str = str; /* XXX strdup(str) ??? */ |
| return lb - ll->ll_label; |
| } |
| |
| /* Same, but rather dies than adds */ |
| |
| int |
| findlabel(ll, type, str) |
| labellist *ll; |
| int type; |
| char *str; |
| { |
| int i; |
| |
| for (i = 0; i < ll->ll_nlabels; i++) { |
| if (ll->ll_label[i].lb_type == type /*&& |
| strcmp(ll->ll_label[i].lb_str, str) == 0*/) |
| return i; |
| } |
| fprintf(stderr, "Label %d/'%s' not found\n", type, str); |
| Py_FatalError("grammar.c:findlabel()"); |
| return 0; /* Make gcc -Wall happy */ |
| } |
| |
| /* Forward */ |
| static void translabel Py_PROTO((grammar *, label *)); |
| |
| void |
| translatelabels(g) |
| grammar *g; |
| { |
| int i; |
| |
| #ifdef Py_DEBUG |
| printf("Translating labels ...\n"); |
| #endif |
| /* Don't translate EMPTY */ |
| for (i = EMPTY+1; i < g->g_ll.ll_nlabels; i++) |
| translabel(g, &g->g_ll.ll_label[i]); |
| } |
| |
| static void |
| translabel(g, lb) |
| grammar *g; |
| label *lb; |
| { |
| int i; |
| |
| if (Py_DebugFlag) |
| printf("Translating label %s ...\n", PyGrammar_LabelRepr(lb)); |
| |
| if (lb->lb_type == NAME) { |
| for (i = 0; i < g->g_ndfas; i++) { |
| if (strcmp(lb->lb_str, g->g_dfa[i].d_name) == 0) { |
| if (Py_DebugFlag) |
| printf( |
| "Label %s is non-terminal %d.\n", |
| lb->lb_str, |
| g->g_dfa[i].d_type); |
| lb->lb_type = g->g_dfa[i].d_type; |
| lb->lb_str = NULL; |
| return; |
| } |
| } |
| for (i = 0; i < (int)N_TOKENS; i++) { |
| if (strcmp(lb->lb_str, _PyParser_TokenNames[i]) == 0) { |
| if (Py_DebugFlag) |
| printf("Label %s is terminal %d.\n", |
| lb->lb_str, i); |
| lb->lb_type = i; |
| lb->lb_str = NULL; |
| return; |
| } |
| } |
| printf("Can't translate NAME label '%s'\n", lb->lb_str); |
| return; |
| } |
| |
| if (lb->lb_type == STRING) { |
| if (isalpha(lb->lb_str[1]) || lb->lb_str[1] == '_') { |
| char *p; |
| if (Py_DebugFlag) |
| printf("Label %s is a keyword\n", lb->lb_str); |
| lb->lb_type = NAME; |
| lb->lb_str++; |
| p = strchr(lb->lb_str, '\''); |
| if (p) |
| *p = '\0'; |
| } |
| else if (lb->lb_str[2] == lb->lb_str[0]) { |
| int type = (int) PyToken_OneChar(lb->lb_str[1]); |
| if (type != OP) { |
| lb->lb_type = type; |
| lb->lb_str = NULL; |
| } |
| else |
| printf("Unknown OP label %s\n", |
| lb->lb_str); |
| } |
| else if (lb->lb_str[2] && lb->lb_str[3] == lb->lb_str[0]) { |
| int type = (int) PyToken_TwoChars(lb->lb_str[1], |
| lb->lb_str[2]); |
| if (type != OP) { |
| lb->lb_type = type; |
| lb->lb_str = NULL; |
| } |
| else |
| printf("Unknown OP label %s\n", |
| lb->lb_str); |
| } |
| else |
| printf("Can't translate STRING label %s\n", |
| lb->lb_str); |
| } |
| else |
| printf("Can't translate label '%s'\n", |
| PyGrammar_LabelRepr(lb)); |
| } |