blob: c4efce76906161355225832edd241230bcd8227d [file] [log] [blame]
Guido van Rossumf70e43a1991-02-19 12:39:46 +00001/***********************************************************
Guido van Rossumfd71b9e2000-06-30 23:50:40 +00002Copyright (c) 2000, BeOpen.com.
3Copyright (c) 1995-2000, Corporation for National Research Initiatives.
4Copyright (c) 1990-1995, Stichting Mathematisch Centrum.
5All rights reserved.
Guido van Rossumf70e43a1991-02-19 12:39:46 +00006
Guido van Rossumfd71b9e2000-06-30 23:50:40 +00007See the file "Misc/COPYRIGHT" for information on usage and
8redistribution of this file, and for a DISCLAIMER OF ALL WARRANTIES.
Guido van Rossumf70e43a1991-02-19 12:39:46 +00009******************************************************************/
10
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000011/* Grammar implementation */
12
Guido van Rossum3f5da241990-12-20 15:06:42 +000013#include "pgenheaders.h"
14
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000015#include <ctype.h>
16
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000017#include "assert.h"
18#include "token.h"
19#include "grammar.h"
20
Guido van Rossum86bea461997-04-29 21:03:06 +000021extern int Py_DebugFlag;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000022
23grammar *
Thomas Wouters23c9e002000-07-22 19:20:54 +000024newgrammar(int start)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000025{
26 grammar *g;
27
Guido van Rossum86bea461997-04-29 21:03:06 +000028 g = PyMem_NEW(grammar, 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000029 if (g == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000030 Py_FatalError("no mem for new grammar");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000031 g->g_ndfas = 0;
32 g->g_dfa = NULL;
33 g->g_start = start;
34 g->g_ll.ll_nlabels = 0;
35 g->g_ll.ll_label = NULL;
Guido van Rossum588633d1994-12-30 15:46:02 +000036 g->g_accel = 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000037 return g;
38}
39
40dfa *
Thomas Wouters23c9e002000-07-22 19:20:54 +000041adddfa(grammar *g, int type, char *name)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000042{
43 dfa *d;
44
Guido van Rossum86bea461997-04-29 21:03:06 +000045 PyMem_RESIZE(g->g_dfa, dfa, g->g_ndfas + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000046 if (g->g_dfa == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000047 Py_FatalError("no mem to resize dfa in adddfa");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000048 d = &g->g_dfa[g->g_ndfas++];
49 d->d_type = type;
50 d->d_name = name;
51 d->d_nstates = 0;
52 d->d_state = NULL;
53 d->d_initial = -1;
54 d->d_first = NULL;
55 return d; /* Only use while fresh! */
56}
57
58int
Thomas Wouters23c9e002000-07-22 19:20:54 +000059addstate(dfa *d)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000060{
61 state *s;
62
Guido van Rossum86bea461997-04-29 21:03:06 +000063 PyMem_RESIZE(d->d_state, state, d->d_nstates + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000064 if (d->d_state == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000065 Py_FatalError("no mem to resize state in addstate");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000066 s = &d->d_state[d->d_nstates++];
67 s->s_narcs = 0;
68 s->s_arc = NULL;
Guido van Rossum588633d1994-12-30 15:46:02 +000069 s->s_lower = 0;
70 s->s_upper = 0;
71 s->s_accel = NULL;
72 s->s_accept = 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000073 return s - d->d_state;
74}
75
76void
Thomas Wouters23c9e002000-07-22 19:20:54 +000077addarc(dfa *d, int from, int to, int lbl)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000078{
79 state *s;
80 arc *a;
81
82 assert(0 <= from && from < d->d_nstates);
83 assert(0 <= to && to < d->d_nstates);
84
85 s = &d->d_state[from];
Guido van Rossum86bea461997-04-29 21:03:06 +000086 PyMem_RESIZE(s->s_arc, arc, s->s_narcs + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000087 if (s->s_arc == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000088 Py_FatalError("no mem to resize arc list in addarc");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000089 a = &s->s_arc[s->s_narcs++];
90 a->a_lbl = lbl;
91 a->a_arrow = to;
92}
93
94int
Thomas Wouters23c9e002000-07-22 19:20:54 +000095addlabel(labellist *ll, int type, char *str)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000096{
97 int i;
98 label *lb;
99
100 for (i = 0; i < ll->ll_nlabels; i++) {
101 if (ll->ll_label[i].lb_type == type &&
102 strcmp(ll->ll_label[i].lb_str, str) == 0)
103 return i;
104 }
Guido van Rossum86bea461997-04-29 21:03:06 +0000105 PyMem_RESIZE(ll->ll_label, label, ll->ll_nlabels + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000106 if (ll->ll_label == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +0000107 Py_FatalError("no mem to resize labellist in addlabel");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000108 lb = &ll->ll_label[ll->ll_nlabels++];
109 lb->lb_type = type;
110 lb->lb_str = str; /* XXX strdup(str) ??? */
111 return lb - ll->ll_label;
112}
113
/* Like addlabel(), but dies instead of adding when no matching label exists */
115
116int
Thomas Wouters23c9e002000-07-22 19:20:54 +0000117findlabel(labellist *ll, int type, char *str)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000118{
119 int i;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000120
121 for (i = 0; i < ll->ll_nlabels; i++) {
122 if (ll->ll_label[i].lb_type == type /*&&
123 strcmp(ll->ll_label[i].lb_str, str) == 0*/)
124 return i;
125 }
126 fprintf(stderr, "Label %d/'%s' not found\n", type, str);
Guido van Rossum86bea461997-04-29 21:03:06 +0000127 Py_FatalError("grammar.c:findlabel()");
Guido van Rossumfd8a3931996-12-02 18:27:33 +0000128 return 0; /* Make gcc -Wall happy */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000129}
130
Guido van Rossum3f5da241990-12-20 15:06:42 +0000131/* Forward */
Tim Petersdbd9ba62000-07-09 03:09:57 +0000132static void translabel(grammar *, label *);
Guido van Rossum3f5da241990-12-20 15:06:42 +0000133
134void
Thomas Wouters23c9e002000-07-22 19:20:54 +0000135translatelabels(grammar *g)
Guido van Rossum3f5da241990-12-20 15:06:42 +0000136{
137 int i;
Guido van Rossum588633d1994-12-30 15:46:02 +0000138
Guido van Rossum408027e1996-12-30 16:17:54 +0000139#ifdef Py_DEBUG
Guido van Rossum3f5da241990-12-20 15:06:42 +0000140 printf("Translating labels ...\n");
Guido van Rossum588633d1994-12-30 15:46:02 +0000141#endif
Guido van Rossum3f5da241990-12-20 15:06:42 +0000142 /* Don't translate EMPTY */
143 for (i = EMPTY+1; i < g->g_ll.ll_nlabels; i++)
144 translabel(g, &g->g_ll.ll_label[i]);
145}
146
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000147static void
Thomas Wouters23c9e002000-07-22 19:20:54 +0000148translabel(grammar *g, label *lb)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000149{
150 int i;
151
Guido van Rossum86bea461997-04-29 21:03:06 +0000152 if (Py_DebugFlag)
153 printf("Translating label %s ...\n", PyGrammar_LabelRepr(lb));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000154
155 if (lb->lb_type == NAME) {
156 for (i = 0; i < g->g_ndfas; i++) {
157 if (strcmp(lb->lb_str, g->g_dfa[i].d_name) == 0) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000158 if (Py_DebugFlag)
159 printf(
160 "Label %s is non-terminal %d.\n",
161 lb->lb_str,
162 g->g_dfa[i].d_type);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000163 lb->lb_type = g->g_dfa[i].d_type;
164 lb->lb_str = NULL;
165 return;
166 }
167 }
168 for (i = 0; i < (int)N_TOKENS; i++) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000169 if (strcmp(lb->lb_str, _PyParser_TokenNames[i]) == 0) {
170 if (Py_DebugFlag)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000171 printf("Label %s is terminal %d.\n",
172 lb->lb_str, i);
173 lb->lb_type = i;
174 lb->lb_str = NULL;
175 return;
176 }
177 }
178 printf("Can't translate NAME label '%s'\n", lb->lb_str);
179 return;
180 }
181
182 if (lb->lb_type == STRING) {
Guido van Rossumbb3649e1998-04-10 22:09:39 +0000183 if (isalpha((int)(lb->lb_str[1])) || lb->lb_str[1] == '_') {
Guido van Rossum1d5735e1994-08-30 08:27:36 +0000184 char *p;
Guido van Rossum86bea461997-04-29 21:03:06 +0000185 if (Py_DebugFlag)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000186 printf("Label %s is a keyword\n", lb->lb_str);
187 lb->lb_type = NAME;
188 lb->lb_str++;
189 p = strchr(lb->lb_str, '\'');
190 if (p)
191 *p = '\0';
192 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000193 else if (lb->lb_str[2] == lb->lb_str[0]) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000194 int type = (int) PyToken_OneChar(lb->lb_str[1]);
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000195 if (type != OP) {
196 lb->lb_type = type;
197 lb->lb_str = NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000198 }
199 else
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000200 printf("Unknown OP label %s\n",
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000201 lb->lb_str);
202 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000203 else if (lb->lb_str[2] && lb->lb_str[3] == lb->lb_str[0]) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000204 int type = (int) PyToken_TwoChars(lb->lb_str[1],
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000205 lb->lb_str[2]);
206 if (type != OP) {
207 lb->lb_type = type;
208 lb->lb_str = NULL;
209 }
210 else
211 printf("Unknown OP label %s\n",
212 lb->lb_str);
213 }
Thomas Wouters434d0822000-08-24 20:11:32 +0000214 else if (lb->lb_str[2] && lb->lb_str[3] && lb->lb_str[4] == lb->lb_str[0]) {
215 int type = (int) PyToken_ThreeChars(lb->lb_str[1],
216 lb->lb_str[2],
217 lb->lb_str[3]);
218 if (type != OP) {
219 lb->lb_type = type;
220 lb->lb_str = NULL;
221 }
222 else
223 printf("Unknown OP label %s\n",
224 lb->lb_str);
225 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000226 else
227 printf("Can't translate STRING label %s\n",
228 lb->lb_str);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000229 }
230 else
Guido van Rossum86bea461997-04-29 21:03:06 +0000231 printf("Can't translate label '%s'\n",
232 PyGrammar_LabelRepr(lb));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000233}