blob: 2a0574da9e8adece77b9749c89a4166f366a23b2 [file] [log] [blame]
Guido van Rossumf70e43a1991-02-19 12:39:46 +00001
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00002/* Grammar implementation */
3
Guido van Rossum3f5da241990-12-20 15:06:42 +00004#include "pgenheaders.h"
5
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00006#include <ctype.h>
7
Guido van Rossum85a5fbb1990-10-14 12:07:46 +00008#include "assert.h"
9#include "token.h"
10#include "grammar.h"
11
Guido van Rossum86bea461997-04-29 21:03:06 +000012extern int Py_DebugFlag;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000013
14grammar *
Thomas Wouters23c9e002000-07-22 19:20:54 +000015newgrammar(int start)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000016{
17 grammar *g;
18
Guido van Rossum86bea461997-04-29 21:03:06 +000019 g = PyMem_NEW(grammar, 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000020 if (g == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000021 Py_FatalError("no mem for new grammar");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000022 g->g_ndfas = 0;
23 g->g_dfa = NULL;
24 g->g_start = start;
25 g->g_ll.ll_nlabels = 0;
26 g->g_ll.ll_label = NULL;
Guido van Rossum588633d1994-12-30 15:46:02 +000027 g->g_accel = 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000028 return g;
29}
30
31dfa *
Thomas Wouters23c9e002000-07-22 19:20:54 +000032adddfa(grammar *g, int type, char *name)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000033{
34 dfa *d;
35
Guido van Rossum86bea461997-04-29 21:03:06 +000036 PyMem_RESIZE(g->g_dfa, dfa, g->g_ndfas + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000037 if (g->g_dfa == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000038 Py_FatalError("no mem to resize dfa in adddfa");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000039 d = &g->g_dfa[g->g_ndfas++];
40 d->d_type = type;
41 d->d_name = name;
42 d->d_nstates = 0;
43 d->d_state = NULL;
44 d->d_initial = -1;
45 d->d_first = NULL;
46 return d; /* Only use while fresh! */
47}
48
49int
Thomas Wouters23c9e002000-07-22 19:20:54 +000050addstate(dfa *d)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000051{
52 state *s;
53
Guido van Rossum86bea461997-04-29 21:03:06 +000054 PyMem_RESIZE(d->d_state, state, d->d_nstates + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000055 if (d->d_state == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000056 Py_FatalError("no mem to resize state in addstate");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000057 s = &d->d_state[d->d_nstates++];
58 s->s_narcs = 0;
59 s->s_arc = NULL;
Guido van Rossum588633d1994-12-30 15:46:02 +000060 s->s_lower = 0;
61 s->s_upper = 0;
62 s->s_accel = NULL;
63 s->s_accept = 0;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000064 return s - d->d_state;
65}
66
67void
Thomas Wouters23c9e002000-07-22 19:20:54 +000068addarc(dfa *d, int from, int to, int lbl)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000069{
70 state *s;
71 arc *a;
72
73 assert(0 <= from && from < d->d_nstates);
74 assert(0 <= to && to < d->d_nstates);
75
76 s = &d->d_state[from];
Guido van Rossum86bea461997-04-29 21:03:06 +000077 PyMem_RESIZE(s->s_arc, arc, s->s_narcs + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000078 if (s->s_arc == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000079 Py_FatalError("no mem to resize arc list in addarc");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000080 a = &s->s_arc[s->s_narcs++];
81 a->a_lbl = lbl;
82 a->a_arrow = to;
83}
84
85int
Thomas Wouters23c9e002000-07-22 19:20:54 +000086addlabel(labellist *ll, int type, char *str)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000087{
88 int i;
89 label *lb;
90
91 for (i = 0; i < ll->ll_nlabels; i++) {
92 if (ll->ll_label[i].lb_type == type &&
93 strcmp(ll->ll_label[i].lb_str, str) == 0)
94 return i;
95 }
Guido van Rossum86bea461997-04-29 21:03:06 +000096 PyMem_RESIZE(ll->ll_label, label, ll->ll_nlabels + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000097 if (ll->ll_label == NULL)
Guido van Rossum86bea461997-04-29 21:03:06 +000098 Py_FatalError("no mem to resize labellist in addlabel");
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000099 lb = &ll->ll_label[ll->ll_nlabels++];
100 lb->lb_type = type;
101 lb->lb_str = str; /* XXX strdup(str) ??? */
102 return lb - ll->ll_label;
103}
104
/* Like addlabel, but dies instead of adding when no label is found */
106
107int
Thomas Wouters23c9e002000-07-22 19:20:54 +0000108findlabel(labellist *ll, int type, char *str)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000109{
110 int i;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000111
112 for (i = 0; i < ll->ll_nlabels; i++) {
113 if (ll->ll_label[i].lb_type == type /*&&
114 strcmp(ll->ll_label[i].lb_str, str) == 0*/)
115 return i;
116 }
117 fprintf(stderr, "Label %d/'%s' not found\n", type, str);
Guido van Rossum86bea461997-04-29 21:03:06 +0000118 Py_FatalError("grammar.c:findlabel()");
Guido van Rossumfd8a3931996-12-02 18:27:33 +0000119 return 0; /* Make gcc -Wall happy */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000120}
121
Guido van Rossum3f5da241990-12-20 15:06:42 +0000122/* Forward */
Tim Petersdbd9ba62000-07-09 03:09:57 +0000123static void translabel(grammar *, label *);
Guido van Rossum3f5da241990-12-20 15:06:42 +0000124
125void
Thomas Wouters23c9e002000-07-22 19:20:54 +0000126translatelabels(grammar *g)
Guido van Rossum3f5da241990-12-20 15:06:42 +0000127{
128 int i;
Guido van Rossum588633d1994-12-30 15:46:02 +0000129
Guido van Rossum408027e1996-12-30 16:17:54 +0000130#ifdef Py_DEBUG
Guido van Rossum3f5da241990-12-20 15:06:42 +0000131 printf("Translating labels ...\n");
Guido van Rossum588633d1994-12-30 15:46:02 +0000132#endif
Guido van Rossum3f5da241990-12-20 15:06:42 +0000133 /* Don't translate EMPTY */
134 for (i = EMPTY+1; i < g->g_ll.ll_nlabels; i++)
135 translabel(g, &g->g_ll.ll_label[i]);
136}
137
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000138static void
Thomas Wouters23c9e002000-07-22 19:20:54 +0000139translabel(grammar *g, label *lb)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000140{
141 int i;
142
Guido van Rossum86bea461997-04-29 21:03:06 +0000143 if (Py_DebugFlag)
144 printf("Translating label %s ...\n", PyGrammar_LabelRepr(lb));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000145
146 if (lb->lb_type == NAME) {
147 for (i = 0; i < g->g_ndfas; i++) {
148 if (strcmp(lb->lb_str, g->g_dfa[i].d_name) == 0) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000149 if (Py_DebugFlag)
150 printf(
151 "Label %s is non-terminal %d.\n",
152 lb->lb_str,
153 g->g_dfa[i].d_type);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000154 lb->lb_type = g->g_dfa[i].d_type;
155 lb->lb_str = NULL;
156 return;
157 }
158 }
159 for (i = 0; i < (int)N_TOKENS; i++) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000160 if (strcmp(lb->lb_str, _PyParser_TokenNames[i]) == 0) {
161 if (Py_DebugFlag)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000162 printf("Label %s is terminal %d.\n",
163 lb->lb_str, i);
164 lb->lb_type = i;
165 lb->lb_str = NULL;
166 return;
167 }
168 }
169 printf("Can't translate NAME label '%s'\n", lb->lb_str);
170 return;
171 }
172
173 if (lb->lb_type == STRING) {
Guido van Rossumbb3649e1998-04-10 22:09:39 +0000174 if (isalpha((int)(lb->lb_str[1])) || lb->lb_str[1] == '_') {
Guido van Rossum1d5735e1994-08-30 08:27:36 +0000175 char *p;
Guido van Rossum86bea461997-04-29 21:03:06 +0000176 if (Py_DebugFlag)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000177 printf("Label %s is a keyword\n", lb->lb_str);
178 lb->lb_type = NAME;
179 lb->lb_str++;
180 p = strchr(lb->lb_str, '\'');
181 if (p)
182 *p = '\0';
183 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000184 else if (lb->lb_str[2] == lb->lb_str[0]) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000185 int type = (int) PyToken_OneChar(lb->lb_str[1]);
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000186 if (type != OP) {
187 lb->lb_type = type;
188 lb->lb_str = NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000189 }
190 else
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000191 printf("Unknown OP label %s\n",
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000192 lb->lb_str);
193 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000194 else if (lb->lb_str[2] && lb->lb_str[3] == lb->lb_str[0]) {
Guido van Rossum86bea461997-04-29 21:03:06 +0000195 int type = (int) PyToken_TwoChars(lb->lb_str[1],
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000196 lb->lb_str[2]);
197 if (type != OP) {
198 lb->lb_type = type;
199 lb->lb_str = NULL;
200 }
201 else
202 printf("Unknown OP label %s\n",
203 lb->lb_str);
204 }
Thomas Wouters434d0822000-08-24 20:11:32 +0000205 else if (lb->lb_str[2] && lb->lb_str[3] && lb->lb_str[4] == lb->lb_str[0]) {
206 int type = (int) PyToken_ThreeChars(lb->lb_str[1],
207 lb->lb_str[2],
208 lb->lb_str[3]);
209 if (type != OP) {
210 lb->lb_type = type;
211 lb->lb_str = NULL;
212 }
213 else
214 printf("Unknown OP label %s\n",
215 lb->lb_str);
216 }
Guido van Rossumc64d04d1991-10-20 20:20:00 +0000217 else
218 printf("Can't translate STRING label %s\n",
219 lb->lb_str);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000220 }
221 else
Guido van Rossum86bea461997-04-29 21:03:06 +0000222 printf("Can't translate label '%s'\n",
223 PyGrammar_LabelRepr(lb));
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000224}