| |
| /* Grammar implementation */ |
| |
| #include "Python.h" |
| #include "pgenheaders.h" |
| |
| #include <ctype.h> |
| |
| #include "token.h" |
| #include "grammar.h" |
| |
| #ifdef RISCOS |
| #include <unixlib.h> |
| #endif |
| |
| extern int Py_DebugFlag; |
| |
| grammar * |
| newgrammar(int start) |
| { |
| grammar *g; |
| |
| g = PyMem_NEW(grammar, 1); |
| if (g == NULL) |
| Py_FatalError("no mem for new grammar"); |
| g->g_ndfas = 0; |
| g->g_dfa = NULL; |
| g->g_start = start; |
| g->g_ll.ll_nlabels = 0; |
| g->g_ll.ll_label = NULL; |
| g->g_accel = 0; |
| return g; |
| } |
| |
| dfa * |
| adddfa(grammar *g, int type, char *name) |
| { |
| dfa *d; |
| |
| PyMem_RESIZE(g->g_dfa, dfa, g->g_ndfas + 1); |
| if (g->g_dfa == NULL) |
| Py_FatalError("no mem to resize dfa in adddfa"); |
| d = &g->g_dfa[g->g_ndfas++]; |
| d->d_type = type; |
| d->d_name = strdup(name); |
| d->d_nstates = 0; |
| d->d_state = NULL; |
| d->d_initial = -1; |
| d->d_first = NULL; |
| return d; /* Only use while fresh! */ |
| } |
| |
| int |
| addstate(dfa *d) |
| { |
| state *s; |
| |
| PyMem_RESIZE(d->d_state, state, d->d_nstates + 1); |
| if (d->d_state == NULL) |
| Py_FatalError("no mem to resize state in addstate"); |
| s = &d->d_state[d->d_nstates++]; |
| s->s_narcs = 0; |
| s->s_arc = NULL; |
| s->s_lower = 0; |
| s->s_upper = 0; |
| s->s_accel = NULL; |
| s->s_accept = 0; |
| return s - d->d_state; |
| } |
| |
| void |
| addarc(dfa *d, int from, int to, int lbl) |
| { |
| state *s; |
| arc *a; |
| |
| assert(0 <= from && from < d->d_nstates); |
| assert(0 <= to && to < d->d_nstates); |
| |
| s = &d->d_state[from]; |
| PyMem_RESIZE(s->s_arc, arc, s->s_narcs + 1); |
| if (s->s_arc == NULL) |
| Py_FatalError("no mem to resize arc list in addarc"); |
| a = &s->s_arc[s->s_narcs++]; |
| a->a_lbl = lbl; |
| a->a_arrow = to; |
| } |
| |
| int |
| addlabel(labellist *ll, int type, char *str) |
| { |
| int i; |
| label *lb; |
| |
| for (i = 0; i < ll->ll_nlabels; i++) { |
| if (ll->ll_label[i].lb_type == type && |
| strcmp(ll->ll_label[i].lb_str, str) == 0) |
| return i; |
| } |
| PyMem_RESIZE(ll->ll_label, label, ll->ll_nlabels + 1); |
| if (ll->ll_label == NULL) |
| Py_FatalError("no mem to resize labellist in addlabel"); |
| lb = &ll->ll_label[ll->ll_nlabels++]; |
| lb->lb_type = type; |
| lb->lb_str = strdup(str); |
| if (Py_DebugFlag) |
| printf("Label @ %8p, %d: %s\n", ll, ll->ll_nlabels, |
| PyGrammar_LabelRepr(lb)); |
| return lb - ll->ll_label; |
| } |
| |
| /* Same, but rather dies than adds */ |
| |
| int |
| findlabel(labellist *ll, int type, char *str) |
| { |
| int i; |
| |
| for (i = 0; i < ll->ll_nlabels; i++) { |
| if (ll->ll_label[i].lb_type == type /*&& |
| strcmp(ll->ll_label[i].lb_str, str) == 0*/) |
| return i; |
| } |
| fprintf(stderr, "Label %d/'%s' not found\n", type, str); |
| Py_FatalError("grammar.c:findlabel()"); |
| return 0; /* Make gcc -Wall happy */ |
| } |
| |
| /* Forward */ |
| static void translabel(grammar *, label *); |
| |
| void |
| translatelabels(grammar *g) |
| { |
| int i; |
| |
| #ifdef Py_DEBUG |
| printf("Translating labels ...\n"); |
| #endif |
| /* Don't translate EMPTY */ |
| for (i = EMPTY+1; i < g->g_ll.ll_nlabels; i++) |
| translabel(g, &g->g_ll.ll_label[i]); |
| } |
| |
| static void |
| translabel(grammar *g, label *lb) |
| { |
| int i; |
| |
| if (Py_DebugFlag) |
| printf("Translating label %s ...\n", PyGrammar_LabelRepr(lb)); |
| |
| if (lb->lb_type == NAME) { |
| for (i = 0; i < g->g_ndfas; i++) { |
| if (strcmp(lb->lb_str, g->g_dfa[i].d_name) == 0) { |
| if (Py_DebugFlag) |
| printf( |
| "Label %s is non-terminal %d.\n", |
| lb->lb_str, |
| g->g_dfa[i].d_type); |
| lb->lb_type = g->g_dfa[i].d_type; |
| free(lb->lb_str); |
| lb->lb_str = NULL; |
| return; |
| } |
| } |
| for (i = 0; i < (int)N_TOKENS; i++) { |
| if (strcmp(lb->lb_str, _PyParser_TokenNames[i]) == 0) { |
| if (Py_DebugFlag) |
| printf("Label %s is terminal %d.\n", |
| lb->lb_str, i); |
| lb->lb_type = i; |
| free(lb->lb_str); |
| lb->lb_str = NULL; |
| return; |
| } |
| } |
| printf("Can't translate NAME label '%s'\n", lb->lb_str); |
| return; |
| } |
| |
| if (lb->lb_type == STRING) { |
| if (isalpha(Py_CHARMASK(lb->lb_str[1])) || |
| lb->lb_str[1] == '_') { |
| char *p; |
| char *src; |
| char *dest; |
| size_t name_len; |
| if (Py_DebugFlag) |
| printf("Label %s is a keyword\n", lb->lb_str); |
| lb->lb_type = NAME; |
| src = lb->lb_str + 1; |
| p = strchr(src, '\''); |
| if (p) |
| name_len = p - src; |
| else |
| name_len = strlen(src); |
| dest = malloc(name_len + 1); |
| strncpy(dest, src, name_len); |
| dest[name_len] = '\0'; |
| free(lb->lb_str); |
| lb->lb_str = dest; |
| } |
| else if (lb->lb_str[2] == lb->lb_str[0]) { |
| int type = (int) PyToken_OneChar(lb->lb_str[1]); |
| if (type != OP) { |
| lb->lb_type = type; |
| free(lb->lb_str); |
| lb->lb_str = NULL; |
| } |
| else |
| printf("Unknown OP label %s\n", |
| lb->lb_str); |
| } |
| else if (lb->lb_str[2] && lb->lb_str[3] == lb->lb_str[0]) { |
| int type = (int) PyToken_TwoChars(lb->lb_str[1], |
| lb->lb_str[2]); |
| if (type != OP) { |
| lb->lb_type = type; |
| free(lb->lb_str); |
| lb->lb_str = NULL; |
| } |
| else |
| printf("Unknown OP label %s\n", |
| lb->lb_str); |
| } |
| else if (lb->lb_str[2] && lb->lb_str[3] && lb->lb_str[4] == lb->lb_str[0]) { |
| int type = (int) PyToken_ThreeChars(lb->lb_str[1], |
| lb->lb_str[2], |
| lb->lb_str[3]); |
| if (type != OP) { |
| lb->lb_type = type; |
| free(lb->lb_str); |
| lb->lb_str = NULL; |
| } |
| else |
| printf("Unknown OP label %s\n", |
| lb->lb_str); |
| } |
| else |
| printf("Can't translate STRING label %s\n", |
| lb->lb_str); |
| } |
| else |
| printf("Can't translate label '%s'\n", |
| PyGrammar_LabelRepr(lb)); |
| } |