blob: 880bf84b421acc5e7847e0ccba0ef0271d09ac98 [file] [log] [blame]
Guido van Rossumf70e43a1991-02-19 12:39:46 +00001
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002/* Grammar implementation */
3
Tim Peters1ca12962001-12-04 03:18:48 +00004#include "Python.h"
Guido van Rossum3f5da241990-12-20 15:06:42 +00005#include "pgenheaders.h"
6
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00007#include <ctype.h>
8
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00009#include "token.h"
10#include "grammar.h"
11
Martin v. Löwisa94568a2003-05-10 07:36:56 +000012#ifdef RISCOS
13#include <unixlib.h>
14#endif
15
Guido van Rossum86bea461997-04-29 21:03:06 +000016extern int Py_DebugFlag;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000017
18grammar *
Thomas Wouters23c9e002000-07-22 19:20:54 +000019newgrammar(int start)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000020{
21 grammar *g;
22
Neal Norwitz2c4e4f92006-04-10 06:42:25 +000023 g = PyObject_MALLOC(sizeof(grammar));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000024 if (g == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000025 Py_FatalError("no mem for new grammar");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000026 g->g_ndfas = 0;
27 g->g_dfa = NULL;
28 g->g_start = start;
29 g->g_ll.ll_nlabels = 0;
30 g->g_ll.ll_label = NULL;
Guido van Rossum588633d1994-12-30 15:46:02 +000031 g->g_accel = 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000032 return g;
33}
34
35dfa *
Thomas Wouters23c9e002000-07-22 19:20:54 +000036adddfa(grammar *g, int type, char *name)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000037{
38 dfa *d;
39
Neal Norwitz2c4e4f92006-04-10 06:42:25 +000040 g->g_dfa = PyObject_REALLOC(g->g_dfa, sizeof(dfa) * (g->g_ndfas + 1));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000041 if (g->g_dfa == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000042 Py_FatalError("no mem to resize dfa in adddfa");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000043 d = &g->g_dfa[g->g_ndfas++];
44 d->d_type = type;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +000045 d->d_name = strdup(name);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000046 d->d_nstates = 0;
47 d->d_state = NULL;
48 d->d_initial = -1;
49 d->d_first = NULL;
50 return d; /* Only use while fresh! */
51}
52
53int
Thomas Wouters23c9e002000-07-22 19:20:54 +000054addstate(dfa *d)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000055{
56 state *s;
57
Neal Norwitz2c4e4f92006-04-10 06:42:25 +000058 d->d_state = PyObject_REALLOC(d->d_state,
59 sizeof(state) * (d->d_nstates + 1));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000060 if (d->d_state == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000061 Py_FatalError("no mem to resize state in addstate");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000062 s = &d->d_state[d->d_nstates++];
63 s->s_narcs = 0;
64 s->s_arc = NULL;
Guido van Rossum588633d1994-12-30 15:46:02 +000065 s->s_lower = 0;
66 s->s_upper = 0;
67 s->s_accel = NULL;
68 s->s_accept = 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000069 return s - d->d_state;
70}
71
72void
Thomas Wouters23c9e002000-07-22 19:20:54 +000073addarc(dfa *d, int from, int to, int lbl)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000074{
75 state *s;
76 arc *a;
77
78 assert(0 <= from && from < d->d_nstates);
79 assert(0 <= to && to < d->d_nstates);
80
81 s = &d->d_state[from];
Neal Norwitz2c4e4f92006-04-10 06:42:25 +000082 s->s_arc = PyObject_REALLOC(s->s_arc, sizeof(arc) * (s->s_narcs + 1));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000083 if (s->s_arc == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000084 Py_FatalError("no mem to resize arc list in addarc");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000085 a = &s->s_arc[s->s_narcs++];
86 a->a_lbl = lbl;
87 a->a_arrow = to;
88}
89
90int
Thomas Wouters23c9e002000-07-22 19:20:54 +000091addlabel(labellist *ll, int type, char *str)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000092{
93 int i;
94 label *lb;
95
96 for (i = 0; i < ll->ll_nlabels; i++) {
97 if (ll->ll_label[i].lb_type == type &&
98 strcmp(ll->ll_label[i].lb_str, str) == 0)
99 return i;
100 }
Neal Norwitz2c4e4f92006-04-10 06:42:25 +0000101 ll->ll_label = PyObject_REALLOC(ll->ll_label,
102 sizeof(label) * (ll->ll_nlabels + 1));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000103 if (ll->ll_label == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +0000104 Py_FatalError("no mem to resize labellist in addlabel");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000105 lb = &ll->ll_label[ll->ll_nlabels++];
106 lb->lb_type = type;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000107 lb->lb_str = strdup(str);
108 if (Py_DebugFlag)
Guido van Rossumc6966172004-03-20 22:34:14 +0000109 printf("Label @ %8p, %d: %s\n", ll, ll->ll_nlabels,
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000110 PyGrammar_LabelRepr(lb));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000111 return lb - ll->ll_label;
112}
113
114/* Same, but rather dies than adds */
115
116int
Thomas Wouters23c9e002000-07-22 19:20:54 +0000117findlabel(labellist *ll, int type, char *str)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000118{
119 int i;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000120
121 for (i = 0; i < ll->ll_nlabels; i++) {
122 if (ll->ll_label[i].lb_type == type /*&&
123 strcmp(ll->ll_label[i].lb_str, str) == 0*/)
124 return i;
125 }
126 fprintf(stderr, "Label %d/'%s' not found\n", type, str);
Guido van Rossum86bea461997-04-29 21:03:06 +0000127 Py_FatalError("grammar.c:findlabel()");
Guido van Rossumfd8a3931996-12-02 18:27:33 +0000128 return 0; /* Make gcc -Wall happy */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000129}
130
Guido van Rossum3f5da241990-12-20 15:06:42 +0000131/* Forward */
Tim Petersdbd9ba62000-07-09 03:09:57 +0000132static void translabel(grammar *, label *);
Guido van Rossum3f5da241990-12-20 15:06:42 +0000133
134void
Thomas Wouters23c9e002000-07-22 19:20:54 +0000135translatelabels(grammar *g)
Guido van Rossum3f5da241990-12-20 15:06:42 +0000136{
137 int i;
Guido van Rossum588633d1994-12-30 15:46:02 +0000138
Guido van Rossum408027e1996-12-30 16:17:54 +0000139#ifdef Py_DEBUG
Guido van Rossum3f5da241990-12-20 15:06:42 +0000140 printf("Translating labels ...\n");
Guido van Rossum588633d1994-12-30 15:46:02 +0000141#endif
Guido van Rossum3f5da241990-12-20 15:06:42 +0000142 /* Don't translate EMPTY */
143 for (i = EMPTY+1; i < g->g_ll.ll_nlabels; i++)
144 translabel(g, &g->g_ll.ll_label[i]);
145}
146
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000147static void
Thomas Wouters23c9e002000-07-22 19:20:54 +0000148translabel(grammar *g, label *lb)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000149{
150 int i;
151
Guido van Rossum86bea461997-04-29 21:03:06 +0000152 if (Py_DebugFlag)
153 printf("Translating label %s ...\n", PyGrammar_LabelRepr(lb));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000154
155 if (lb->lb_type == NAME) {
156 for (i = 0; i < g->g_ndfas; i++) {
157 if (strcmp(lb->lb_str, g->g_dfa[i].d_name) == 0) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000158 if (Py_DebugFlag)
159 printf(
160 "Label %s is non-terminal %d.\n",
161 lb->lb_str,
162 g->g_dfa[i].d_type);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000163 lb->lb_type = g->g_dfa[i].d_type;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000164 free(lb->lb_str);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000165 lb->lb_str = NULL;
166 return;
167 }
168 }
169 for (i = 0; i < (int)N_TOKENS; i++) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000170 if (strcmp(lb->lb_str, _PyParser_TokenNames[i]) == 0) {
171 if (Py_DebugFlag)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000172 printf("Label %s is terminal %d.\n",
173 lb->lb_str, i);
174 lb->lb_type = i;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000175 free(lb->lb_str);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000176 lb->lb_str = NULL;
177 return;
178 }
179 }
180 printf("Can't translate NAME label '%s'\n", lb->lb_str);
181 return;
182 }
183
184 if (lb->lb_type == STRING) {
Neal Norwitz30b5c5d2005-12-19 06:05:18 +0000185 if (isalpha(Py_CHARMASK(lb->lb_str[1])) ||
186 lb->lb_str[1] == '_') {
Guido van Rossum1d5735e1994-08-30 08:27:36 +0000187 char *p;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000188 char *src;
189 char *dest;
190 size_t name_len;
Guido van Rossum86bea461997-04-29 21:03:06 +0000191 if (Py_DebugFlag)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000192 printf("Label %s is a keyword\n", lb->lb_str);
193 lb->lb_type = NAME;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000194 src = lb->lb_str + 1;
195 p = strchr(src, '\'');
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000196 if (p)
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000197 name_len = p - src;
198 else
199 name_len = strlen(src);
200 dest = malloc(name_len + 1);
201 strncpy(dest, src, name_len);
202 dest[name_len] = '\0';
203 free(lb->lb_str);
204 lb->lb_str = dest;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000205 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000206 else if (lb->lb_str[2] == lb->lb_str[0]) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000207 int type = (int) PyToken_OneChar(lb->lb_str[1]);
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000208 if (type != OP) {
209 lb->lb_type = type;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000210 free(lb->lb_str);
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000211 lb->lb_str = NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000212 }
213 else
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000214 printf("Unknown OP label %s\n",
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000215 lb->lb_str);
216 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000217 else if (lb->lb_str[2] && lb->lb_str[3] == lb->lb_str[0]) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000218 int type = (int) PyToken_TwoChars(lb->lb_str[1],
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000219 lb->lb_str[2]);
220 if (type != OP) {
221 lb->lb_type = type;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000222 free(lb->lb_str);
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000223 lb->lb_str = NULL;
224 }
225 else
226 printf("Unknown OP label %s\n",
227 lb->lb_str);
228 }
Thomas Wouters434d0822000-08-24 20:11:32 +0000229 else if (lb->lb_str[2] && lb->lb_str[3] && lb->lb_str[4] == lb->lb_str[0]) {
230 int type = (int) PyToken_ThreeChars(lb->lb_str[1],
231 lb->lb_str[2],
232 lb->lb_str[3]);
233 if (type != OP) {
234 lb->lb_type = type;
Guido van Rossumd3ab37f2003-04-17 14:55:42 +0000235 free(lb->lb_str);
Thomas Wouters434d0822000-08-24 20:11:32 +0000236 lb->lb_str = NULL;
237 }
238 else
239 printf("Unknown OP label %s\n",
240 lb->lb_str);
241 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000242 else
243 printf("Can't translate STRING label %s\n",
244 lb->lb_str);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000245 }
246 else
Guido van Rossum86bea461997-04-29 21:03:06 +0000247 printf("Can't translate label '%s'\n",
248 PyGrammar_LabelRepr(lb));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000249}