blob: 7bccd350cd780219dcecf408ffb7d1e92c3ffe9e [file] [log] [blame]
Guido van Rossumf70e43a1991-02-19 12:39:46 +00001/***********************************************************
Guido van Rossumb9f8d6e1995-01-04 19:08:09 +00002Copyright 1991-1995 by Stichting Mathematisch Centrum, Amsterdam,
3The Netherlands.
Guido van Rossumf70e43a1991-02-19 12:39:46 +00004
5 All Rights Reserved
6
Guido van Rossumd266eb41996-10-25 14:44:06 +00007Permission to use, copy, modify, and distribute this software and its
8documentation for any purpose and without fee is hereby granted,
Guido van Rossumf70e43a1991-02-19 12:39:46 +00009provided that the above copyright notice appear in all copies and that
Guido van Rossumd266eb41996-10-25 14:44:06 +000010both that copyright notice and this permission notice appear in
Guido van Rossumf70e43a1991-02-19 12:39:46 +000011supporting documentation, and that the names of Stichting Mathematisch
Guido van Rossumd266eb41996-10-25 14:44:06 +000012Centrum or CWI or Corporation for National Research Initiatives or
13CNRI not be used in advertising or publicity pertaining to
14distribution of the software without specific, written prior
15permission.
Guido van Rossumf70e43a1991-02-19 12:39:46 +000016
Guido van Rossumd266eb41996-10-25 14:44:06 +000017While CWI is the initial source for this software, a modified version
18is made available by the Corporation for National Research Initiatives
19(CNRI) at the Internet address ftp://ftp.python.org.
20
21STICHTING MATHEMATISCH CENTRUM AND CNRI DISCLAIM ALL WARRANTIES WITH
22REGARD TO THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF
23MERCHANTABILITY AND FITNESS, IN NO EVENT SHALL STICHTING MATHEMATISCH
24CENTRUM OR CNRI BE LIABLE FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL
25DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR
26PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER
27TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR
28PERFORMANCE OF THIS SOFTWARE.
Guido van Rossumf70e43a1991-02-19 12:39:46 +000029
30******************************************************************/
31
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000032/* Parser-tokenizer link implementation */
33
Guido van Rossum3f5da241990-12-20 15:06:42 +000034#include "pgenheaders.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000035#include "tokenizer.h"
36#include "node.h"
37#include "grammar.h"
38#include "parser.h"
Guido van Rossum3f5da241990-12-20 15:06:42 +000039#include "parsetok.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000040#include "errcode.h"
41
Guido van Rossum3f5da241990-12-20 15:06:42 +000042
43/* Forward */
Guido van Rossumbd0389d1994-08-29 12:25:45 +000044static node *parsetok PROTO((struct tok_state *, grammar *, int,
45 perrdetail *));
Guido van Rossum3f5da241990-12-20 15:06:42 +000046
47/* Parse input coming from a string. Return error code, print some errors. */
48
Guido van Rossumbd0389d1994-08-29 12:25:45 +000049node *
50parsestring(s, g, start, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000051 char *s;
52 grammar *g;
53 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000054 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000055{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000056 struct tok_state *tok;
57
58 err_ret->error = E_OK;
59 err_ret->filename = NULL;
60 err_ret->lineno = 0;
61 err_ret->offset = 0;
62 err_ret->text = NULL;
63
64 if ((tok = tok_setups(s)) == NULL) {
65 err_ret->error = E_NOMEM;
66 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +000067 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +000068
69 return parsetok(tok, g, start, err_ret);
Guido van Rossum3f5da241990-12-20 15:06:42 +000070}
71
72
73/* Parse input coming from a file. Return error code, print some errors. */
74
Guido van Rossumbd0389d1994-08-29 12:25:45 +000075node *
76parsefile(fp, filename, g, start, ps1, ps2, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000077 FILE *fp;
78 char *filename;
79 grammar *g;
80 int start;
81 char *ps1, *ps2;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000082 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000083{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000084 struct tok_state *tok;
85
86 err_ret->error = E_OK;
87 err_ret->filename = filename;
88 err_ret->lineno = 0;
89 err_ret->offset = 0;
90 err_ret->text = NULL;
91
92 if ((tok = tok_setupf(fp, ps1, ps2)) == NULL) {
93 err_ret->error = E_NOMEM;
94 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +000095 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +000096
Guido van Rossum91ece421992-03-25 22:32:00 +000097#ifdef macintosh
98 {
99 int tabsize = guesstabsize(filename);
100 if (tabsize > 0)
101 tok->tabsize = tabsize;
102 }
103#endif
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000104
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000105 return parsetok(tok, g, start, err_ret);
106}
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000107
108/* Parse input coming from the given tokenizer structure.
109 Return error code. */
110
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000111static node *
112parsetok(tok, g, start, err_ret)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000113 struct tok_state *tok;
114 grammar *g;
115 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000116 perrdetail *err_ret;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000117{
118 parser_state *ps;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000119 node *n;
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000120 int started = 0;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000121
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000122 if ((ps = newparser(g, start)) == NULL) {
123 fprintf(stderr, "no mem for new parser\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000124 err_ret->error = E_NOMEM;
125 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000126 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000127
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000128 for (;;) {
129 char *a, *b;
130 int type;
131 int len;
132 char *str;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000133
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000134 type = tok_get(tok, &a, &b);
135 if (type == ERRORTOKEN) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000136 err_ret->error = tok->done;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000137 break;
138 }
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000139 if (type == ENDMARKER && started) {
140 type = NEWLINE; /* Add an extra newline */
141 started = 0;
142 }
143 else
144 started = 1;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000145 len = b - a; /* XXX this may compute NULL - NULL */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000146 str = NEW(char, len + 1);
147 if (str == NULL) {
148 fprintf(stderr, "no mem for next token\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000149 err_ret->error = E_NOMEM;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000150 break;
151 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000152 if (len > 0)
153 strncpy(str, a, len);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000154 str[len] = '\0';
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000155 if ((err_ret->error =
156 addtoken(ps, (int)type, str, tok->lineno)) != E_OK)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000157 break;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000158 }
159
160 if (err_ret->error == E_DONE) {
161 n = ps->p_tree;
162 ps->p_tree = NULL;
163 }
164 else
165 n = NULL;
166
167 delparser(ps);
168
169 if (n == NULL) {
170 if (tok->lineno <= 1 && tok->done == E_EOF)
171 err_ret->error = E_EOF;
172 err_ret->lineno = tok->lineno;
173 err_ret->offset = tok->cur - tok->buf;
174 if (tok->buf != NULL) {
175 int len = tok->inp - tok->buf;
176 err_ret->text = malloc(len + 1);
177 if (err_ret->text != NULL) {
Guido van Rossumec498271995-01-20 16:59:12 +0000178 if (len > 0)
179 strncpy(err_ret->text, tok->buf, len);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000180 err_ret->text[len] = '\0';
181 }
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000182 }
183 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000184
185 tok_free(tok);
186
187 return n;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000188}