blob: 251e5074dda78da4f467cecf219faabab9e9fa7d [file] [log] [blame]
Guido van Rossumf70e43a1991-02-19 12:39:46 +00001/***********************************************************
Guido van Rossumb9f8d6e1995-01-04 19:08:09 +00002Copyright 1991-1995 by Stichting Mathematisch Centrum, Amsterdam,
3The Netherlands.
Guido van Rossumf70e43a1991-02-19 12:39:46 +00004
5 All Rights Reserved
6
Guido van Rossumd266eb41996-10-25 14:44:06 +00007Permission to use, copy, modify, and distribute this software and its
8documentation for any purpose and without fee is hereby granted,
Guido van Rossumf70e43a1991-02-19 12:39:46 +00009provided that the above copyright notice appear in all copies and that
Guido van Rossumd266eb41996-10-25 14:44:06 +000010both that copyright notice and this permission notice appear in
Guido van Rossumf70e43a1991-02-19 12:39:46 +000011supporting documentation, and that the names of Stichting Mathematisch
Guido van Rossumd266eb41996-10-25 14:44:06 +000012Centrum or CWI or Corporation for National Research Initiatives or
13CNRI not be used in advertising or publicity pertaining to
14distribution of the software without specific, written prior
15permission.
Guido van Rossumf70e43a1991-02-19 12:39:46 +000016
Guido van Rossumd266eb41996-10-25 14:44:06 +000017While CWI is the initial source for this software, a modified version
18is made available by the Corporation for National Research Initiatives
19(CNRI) at the Internet address ftp://ftp.python.org.
20
21STICHTING MATHEMATISCH CENTRUM AND CNRI DISCLAIM ALL WARRANTIES WITH
22REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF
23MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL STICHTING MATHEMATISCH
24CENTRUM OR CNRI BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
25DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
26PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
27TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
28PERFORMANCE OF THIS SOFTWARE.
Guido van Rossumf70e43a1991-02-19 12:39:46 +000029
30******************************************************************/
31
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000032/* Parser-tokenizer link implementation */
33
Guido van Rossum3f5da241990-12-20 15:06:42 +000034#include "pgenheaders.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000035#include "tokenizer.h"
36#include "node.h"
37#include "grammar.h"
38#include "parser.h"
Guido van Rossum3f5da241990-12-20 15:06:42 +000039#include "parsetok.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000040#include "errcode.h"
41
Guido van Rossum3f5da241990-12-20 15:06:42 +000042
43/* Forward */
Guido van Rossum86bea461997-04-29 21:03:06 +000044static node *parsetok Py_PROTO((struct tok_state *, grammar *, int,
Guido van Rossumbd0389d1994-08-29 12:25:45 +000045 perrdetail *));
Guido van Rossum3f5da241990-12-20 15:06:42 +000046
47/* Parse input coming from a string. Return error code, print some errors. */
48
Guido van Rossumbd0389d1994-08-29 12:25:45 +000049node *
Guido van Rossum86bea461997-04-29 21:03:06 +000050PyParser_ParseString(s, g, start, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000051 char *s;
52 grammar *g;
53 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000054 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000055{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000056 struct tok_state *tok;
57
58 err_ret->error = E_OK;
59 err_ret->filename = NULL;
60 err_ret->lineno = 0;
61 err_ret->offset = 0;
62 err_ret->text = NULL;
63
Guido van Rossum86bea461997-04-29 21:03:06 +000064 if ((tok = PyTokenizer_FromString(s)) == NULL) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +000065 err_ret->error = E_NOMEM;
66 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +000067 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +000068
69 return parsetok(tok, g, start, err_ret);
Guido van Rossum3f5da241990-12-20 15:06:42 +000070}
71
72
73/* Parse input coming from a file. Return error code, print some errors. */
74
Guido van Rossumbd0389d1994-08-29 12:25:45 +000075node *
Guido van Rossum86bea461997-04-29 21:03:06 +000076PyParser_ParseFile(fp, filename, g, start, ps1, ps2, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000077 FILE *fp;
78 char *filename;
79 grammar *g;
80 int start;
81 char *ps1, *ps2;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000082 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000083{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000084 struct tok_state *tok;
85
86 err_ret->error = E_OK;
87 err_ret->filename = filename;
88 err_ret->lineno = 0;
89 err_ret->offset = 0;
90 err_ret->text = NULL;
91
Guido van Rossum86bea461997-04-29 21:03:06 +000092 if ((tok = PyTokenizer_FromFile(fp, ps1, ps2)) == NULL) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +000093 err_ret->error = E_NOMEM;
94 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +000095 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +000096
Guido van Rossum91ece421992-03-25 22:32:00 +000097#ifdef macintosh
98 {
99 int tabsize = guesstabsize(filename);
100 if (tabsize > 0)
101 tok->tabsize = tabsize;
102 }
103#endif
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000104
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000105 return parsetok(tok, g, start, err_ret);
106}
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000107
108/* Parse input coming from the given tokenizer structure.
109 Return error code. */
110
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000111static node *
112parsetok(tok, g, start, err_ret)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000113 struct tok_state *tok;
114 grammar *g;
115 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000116 perrdetail *err_ret;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000117{
118 parser_state *ps;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000119 node *n;
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000120 int started = 0;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000121
Guido van Rossum86bea461997-04-29 21:03:06 +0000122 if ((ps = PyParser_New(g, start)) == NULL) {
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000123 fprintf(stderr, "no mem for new parser\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000124 err_ret->error = E_NOMEM;
125 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000126 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000127
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000128 for (;;) {
129 char *a, *b;
130 int type;
131 int len;
132 char *str;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000133
Guido van Rossum86bea461997-04-29 21:03:06 +0000134 type = PyTokenizer_Get(tok, &a, &b);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000135 if (type == ERRORTOKEN) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000136 err_ret->error = tok->done;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000137 break;
138 }
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000139 if (type == ENDMARKER && started) {
140 type = NEWLINE; /* Add an extra newline */
141 started = 0;
142 }
143 else
144 started = 1;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000145 len = b - a; /* XXX this may compute NULL - NULL */
Guido van Rossum86bea461997-04-29 21:03:06 +0000146 str = PyMem_NEW(char, len + 1);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000147 if (str == NULL) {
148 fprintf(stderr, "no mem for next token\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000149 err_ret->error = E_NOMEM;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000150 break;
151 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000152 if (len > 0)
153 strncpy(str, a, len);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000154 str[len] = '\0';
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000155 if ((err_ret->error =
Guido van Rossum86bea461997-04-29 21:03:06 +0000156 PyParser_AddToken(ps, (int)type, str,
157 tok->lineno)) != E_OK)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000158 break;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000159 }
160
161 if (err_ret->error == E_DONE) {
162 n = ps->p_tree;
163 ps->p_tree = NULL;
164 }
165 else
166 n = NULL;
167
Guido van Rossum86bea461997-04-29 21:03:06 +0000168 PyParser_Delete(ps);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000169
170 if (n == NULL) {
171 if (tok->lineno <= 1 && tok->done == E_EOF)
172 err_ret->error = E_EOF;
173 err_ret->lineno = tok->lineno;
174 err_ret->offset = tok->cur - tok->buf;
175 if (tok->buf != NULL) {
176 int len = tok->inp - tok->buf;
177 err_ret->text = malloc(len + 1);
178 if (err_ret->text != NULL) {
Guido van Rossumec498271995-01-20 16:59:12 +0000179 if (len > 0)
180 strncpy(err_ret->text, tok->buf, len);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000181 err_ret->text[len] = '\0';
182 }
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000183 }
184 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000185
Guido van Rossum86bea461997-04-29 21:03:06 +0000186 PyTokenizer_Free(tok);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000187
188 return n;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000189}