blob: 5b0d99050fcc709994e98d7e9b91bf0971d76790 [file] [log] [blame]
Guido van Rossumf70e43a1991-02-19 12:39:46 +00001/***********************************************************
Guido van Rossumb9f8d6e1995-01-04 19:08:09 +00002Copyright 1991-1995 by Stichting Mathematisch Centrum, Amsterdam,
3The Netherlands.
Guido van Rossumf70e43a1991-02-19 12:39:46 +00004
5 All Rights Reserved
6
Guido van Rossumd266eb41996-10-25 14:44:06 +00007Permission to use, copy, modify, and distribute this software and its
8documentation for any purpose and without fee is hereby granted,
Guido van Rossumf70e43a1991-02-19 12:39:46 +00009provided that the above copyright notice appear in all copies and that
Guido van Rossumd266eb41996-10-25 14:44:06 +000010both that copyright notice and this permission notice appear in
Guido van Rossumf70e43a1991-02-19 12:39:46 +000011supporting documentation, and that the names of Stichting Mathematisch
Guido van Rossumd266eb41996-10-25 14:44:06 +000012Centrum or CWI or Corporation for National Research Initiatives or
13CNRI not be used in advertising or publicity pertaining to
14distribution of the software without specific, written prior
15permission.
Guido van Rossumf70e43a1991-02-19 12:39:46 +000016
Guido van Rossumd266eb41996-10-25 14:44:06 +000017While CWI is the initial source for this software, a modified version
18is made available by the Corporation for National Research Initiatives
19(CNRI) at the Internet address ftp://ftp.python.org.
20
21STICHTING MATHEMATISCH CENTRUM AND CNRI DISCLAIM ALL WARRANTIES WITH
22REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF
23MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL STICHTING MATHEMATISCH
24CENTRUM OR CNRI BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
25DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
26PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
27TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
28PERFORMANCE OF THIS SOFTWARE.
Guido van Rossumf70e43a1991-02-19 12:39:46 +000029
30******************************************************************/
31
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000032/* Parser-tokenizer link implementation */
33
Guido van Rossum3f5da241990-12-20 15:06:42 +000034#include "pgenheaders.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000035#include "tokenizer.h"
36#include "node.h"
37#include "grammar.h"
38#include "parser.h"
Guido van Rossum3f5da241990-12-20 15:06:42 +000039#include "parsetok.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000040#include "errcode.h"
41
/* Global flag read by PyParser_ParseString() and PyParser_ParseFile().
   When it (or Py_VerboseFlag) is nonzero, those functions record a file
   name on the tokenizer and set its altwarning field; a value of 2 or
   more additionally increments the tokenizer's alterror field.
   NOTE(review): presumably this selects warning vs. error treatment of
   inconsistent tab usage -- confirm against the tokenizer. */
Guido van Rossum6135df61998-04-10 19:35:06 +000042int Py_TabcheckFlag;
43
Guido van Rossum3f5da241990-12-20 15:06:42 +000044
45/* Forward */
Guido van Rossum86bea461997-04-29 21:03:06 +000046static node *parsetok Py_PROTO((struct tok_state *, grammar *, int,
Guido van Rossumbd0389d1994-08-29 12:25:45 +000047 perrdetail *));
Guido van Rossum3f5da241990-12-20 15:06:42 +000048
49/* Parse input coming from a string. Return error code, print some errors. */
50
Guido van Rossumbd0389d1994-08-29 12:25:45 +000051node *
Guido van Rossum86bea461997-04-29 21:03:06 +000052PyParser_ParseString(s, g, start, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000053 char *s;
54 grammar *g;
55 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000056 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000057{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000058 struct tok_state *tok;
59
60 err_ret->error = E_OK;
61 err_ret->filename = NULL;
62 err_ret->lineno = 0;
63 err_ret->offset = 0;
64 err_ret->text = NULL;
65
Guido van Rossum86bea461997-04-29 21:03:06 +000066 if ((tok = PyTokenizer_FromString(s)) == NULL) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +000067 err_ret->error = E_NOMEM;
68 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +000069 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +000070
Guido van Rossum89ce4541998-12-21 18:32:40 +000071 if (Py_TabcheckFlag || Py_VerboseFlag) {
72 tok->filename = "<string>";
73 tok->altwarning = (tok->filename != NULL);
74 if (Py_TabcheckFlag >= 2)
75 tok->alterror++;
76 }
77
Guido van Rossumbd0389d1994-08-29 12:25:45 +000078 return parsetok(tok, g, start, err_ret);
Guido van Rossum3f5da241990-12-20 15:06:42 +000079}
80
81
82/* Parse input coming from a file. Return error code, print some errors. */
83
Guido van Rossumbd0389d1994-08-29 12:25:45 +000084node *
Guido van Rossum86bea461997-04-29 21:03:06 +000085PyParser_ParseFile(fp, filename, g, start, ps1, ps2, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000086 FILE *fp;
87 char *filename;
88 grammar *g;
89 int start;
90 char *ps1, *ps2;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000091 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000092{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000093 struct tok_state *tok;
94
95 err_ret->error = E_OK;
96 err_ret->filename = filename;
97 err_ret->lineno = 0;
98 err_ret->offset = 0;
99 err_ret->text = NULL;
100
Guido van Rossum86bea461997-04-29 21:03:06 +0000101 if ((tok = PyTokenizer_FromFile(fp, ps1, ps2)) == NULL) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000102 err_ret->error = E_NOMEM;
103 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +0000104 }
Guido van Rossum6135df61998-04-10 19:35:06 +0000105 if (Py_TabcheckFlag || Py_VerboseFlag) {
106 tok->filename = filename;
107 tok->altwarning = (filename != NULL);
108 if (Py_TabcheckFlag >= 2)
109 tok->alterror++;
110 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000111
Guido van Rossum91ece421992-03-25 22:32:00 +0000112#ifdef macintosh
113 {
114 int tabsize = guesstabsize(filename);
115 if (tabsize > 0)
116 tok->tabsize = tabsize;
117 }
118#endif
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000119
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000120 return parsetok(tok, g, start, err_ret);
121}
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000122
123/* Parse input coming from the given tokenizer structure.
124 Return error code. */
125
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000126static node *
127parsetok(tok, g, start, err_ret)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000128 struct tok_state *tok;
129 grammar *g;
130 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000131 perrdetail *err_ret;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000132{
133 parser_state *ps;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000134 node *n;
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000135 int started = 0;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000136
Guido van Rossum86bea461997-04-29 21:03:06 +0000137 if ((ps = PyParser_New(g, start)) == NULL) {
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000138 fprintf(stderr, "no mem for new parser\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000139 err_ret->error = E_NOMEM;
140 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000141 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000142
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000143 for (;;) {
144 char *a, *b;
145 int type;
146 int len;
147 char *str;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000148
Guido van Rossum86bea461997-04-29 21:03:06 +0000149 type = PyTokenizer_Get(tok, &a, &b);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000150 if (type == ERRORTOKEN) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000151 err_ret->error = tok->done;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000152 break;
153 }
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000154 if (type == ENDMARKER && started) {
155 type = NEWLINE; /* Add an extra newline */
156 started = 0;
157 }
158 else
159 started = 1;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000160 len = b - a; /* XXX this may compute NULL - NULL */
Guido van Rossum86bea461997-04-29 21:03:06 +0000161 str = PyMem_NEW(char, len + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000162 if (str == NULL) {
163 fprintf(stderr, "no mem for next token\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000164 err_ret->error = E_NOMEM;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000165 break;
166 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000167 if (len > 0)
168 strncpy(str, a, len);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000169 str[len] = '\0';
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000170 if ((err_ret->error =
Guido van Rossum86bea461997-04-29 21:03:06 +0000171 PyParser_AddToken(ps, (int)type, str,
Guido van Rossumff0ec521997-07-27 01:52:50 +0000172 tok->lineno)) != E_OK) {
173 if (err_ret->error != E_DONE)
174 PyMem_DEL(str);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000175 break;
Guido van Rossumff0ec521997-07-27 01:52:50 +0000176 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000177 }
178
179 if (err_ret->error == E_DONE) {
180 n = ps->p_tree;
181 ps->p_tree = NULL;
182 }
183 else
184 n = NULL;
185
Guido van Rossum86bea461997-04-29 21:03:06 +0000186 PyParser_Delete(ps);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000187
188 if (n == NULL) {
189 if (tok->lineno <= 1 && tok->done == E_EOF)
190 err_ret->error = E_EOF;
191 err_ret->lineno = tok->lineno;
192 err_ret->offset = tok->cur - tok->buf;
193 if (tok->buf != NULL) {
194 int len = tok->inp - tok->buf;
195 err_ret->text = malloc(len + 1);
196 if (err_ret->text != NULL) {
Guido van Rossumec498271995-01-20 16:59:12 +0000197 if (len > 0)
198 strncpy(err_ret->text, tok->buf, len);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000199 err_ret->text[len] = '\0';
200 }
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000201 }
202 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000203
Guido van Rossum86bea461997-04-29 21:03:06 +0000204 PyTokenizer_Free(tok);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000205
206 return n;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000207}