blob: 5e7957e29953f8c604913961140f11bf9a148a6e [file] [log] [blame]
Guido van Rossumf70e43a1991-02-19 12:39:46 +00001/***********************************************************
Guido van Rossumb9f8d6e1995-01-04 19:08:09 +00002Copyright 1991-1995 by Stichting Mathematisch Centrum, Amsterdam,
3The Netherlands.
Guido van Rossumf70e43a1991-02-19 12:39:46 +00004
5 All Rights Reserved
6
7Permission to use, copy, modify, and distribute this software and its
8documentation for any purpose and without fee is hereby granted,
9provided that the above copyright notice appear in all copies and that
10both that copyright notice and this permission notice appear in
11supporting documentation, and that the names of Stichting Mathematisch
12Centrum or CWI not be used in advertising or publicity pertaining to
13distribution of the software without specific, written prior permission.
14
15STICHTING MATHEMATISCH CENTRUM DISCLAIMS ALL WARRANTIES WITH REGARD TO
16THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND
17FITNESS, IN NO EVENT SHALL STICHTING MATHEMATISCH CENTRUM BE LIABLE
18FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
19WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
20ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT
21OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
22
23******************************************************************/
24
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000025/* Parser-tokenizer link implementation */
26
Guido van Rossum3f5da241990-12-20 15:06:42 +000027#include "pgenheaders.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000028#include "tokenizer.h"
29#include "node.h"
30#include "grammar.h"
31#include "parser.h"
Guido van Rossum3f5da241990-12-20 15:06:42 +000032#include "parsetok.h"
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000033#include "errcode.h"
34
Guido van Rossum3f5da241990-12-20 15:06:42 +000035
36/* Forward */
Guido van Rossumbd0389d1994-08-29 12:25:45 +000037static node *parsetok PROTO((struct tok_state *, grammar *, int,
38 perrdetail *));
Guido van Rossum3f5da241990-12-20 15:06:42 +000039
40/* Parse input coming from a string. Return error code, print some errors. */
41
Guido van Rossumbd0389d1994-08-29 12:25:45 +000042node *
43parsestring(s, g, start, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000044 char *s;
45 grammar *g;
46 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000047 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000048{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000049 struct tok_state *tok;
50
51 err_ret->error = E_OK;
52 err_ret->filename = NULL;
53 err_ret->lineno = 0;
54 err_ret->offset = 0;
55 err_ret->text = NULL;
56
57 if ((tok = tok_setups(s)) == NULL) {
58 err_ret->error = E_NOMEM;
59 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +000060 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +000061
62 return parsetok(tok, g, start, err_ret);
Guido van Rossum3f5da241990-12-20 15:06:42 +000063}
64
65
66/* Parse input coming from a file. Return error code, print some errors. */
67
Guido van Rossumbd0389d1994-08-29 12:25:45 +000068node *
69parsefile(fp, filename, g, start, ps1, ps2, err_ret)
Guido van Rossum3f5da241990-12-20 15:06:42 +000070 FILE *fp;
71 char *filename;
72 grammar *g;
73 int start;
74 char *ps1, *ps2;
Guido van Rossumbd0389d1994-08-29 12:25:45 +000075 perrdetail *err_ret;
Guido van Rossum3f5da241990-12-20 15:06:42 +000076{
Guido van Rossumbd0389d1994-08-29 12:25:45 +000077 struct tok_state *tok;
78
79 err_ret->error = E_OK;
80 err_ret->filename = filename;
81 err_ret->lineno = 0;
82 err_ret->offset = 0;
83 err_ret->text = NULL;
84
85 if ((tok = tok_setupf(fp, ps1, ps2)) == NULL) {
86 err_ret->error = E_NOMEM;
87 return NULL;
Guido van Rossum3f5da241990-12-20 15:06:42 +000088 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +000089
Guido van Rossum91ece421992-03-25 22:32:00 +000090#ifdef macintosh
91 {
92 int tabsize = guesstabsize(filename);
93 if (tabsize > 0)
94 tok->tabsize = tabsize;
95 }
96#endif
Guido van Rossum85a5fbb1990-10-14 12:07:46 +000097
Guido van Rossumbd0389d1994-08-29 12:25:45 +000098 return parsetok(tok, g, start, err_ret);
99}
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000100
101/* Parse input coming from the given tokenizer structure.
102 Return error code. */
103
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000104static node *
105parsetok(tok, g, start, err_ret)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000106 struct tok_state *tok;
107 grammar *g;
108 int start;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000109 perrdetail *err_ret;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000110{
111 parser_state *ps;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000112 node *n;
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000113 int started = 0;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000114
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000115 if ((ps = newparser(g, start)) == NULL) {
116 fprintf(stderr, "no mem for new parser\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000117 err_ret->error = E_NOMEM;
118 return NULL;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000119 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000120
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000121 for (;;) {
122 char *a, *b;
123 int type;
124 int len;
125 char *str;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000126
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000127 type = tok_get(tok, &a, &b);
128 if (type == ERRORTOKEN) {
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000129 err_ret->error = tok->done;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000130 break;
131 }
Guido van Rossumd8b1d371992-03-04 16:40:44 +0000132 if (type == ENDMARKER && started) {
133 type = NEWLINE; /* Add an extra newline */
134 started = 0;
135 }
136 else
137 started = 1;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000138 len = b - a; /* XXX this may compute NULL - NULL */
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000139 str = NEW(char, len + 1);
140 if (str == NULL) {
141 fprintf(stderr, "no mem for next token\n");
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000142 err_ret->error = E_NOMEM;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000143 break;
144 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000145 if (len > 0)
146 strncpy(str, a, len);
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000147 str[len] = '\0';
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000148 if ((err_ret->error =
149 addtoken(ps, (int)type, str, tok->lineno)) != E_OK)
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000150 break;
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000151 }
152
153 if (err_ret->error == E_DONE) {
154 n = ps->p_tree;
155 ps->p_tree = NULL;
156 }
157 else
158 n = NULL;
159
160 delparser(ps);
161
162 if (n == NULL) {
163 if (tok->lineno <= 1 && tok->done == E_EOF)
164 err_ret->error = E_EOF;
165 err_ret->lineno = tok->lineno;
166 err_ret->offset = tok->cur - tok->buf;
167 if (tok->buf != NULL) {
168 int len = tok->inp - tok->buf;
169 err_ret->text = malloc(len + 1);
170 if (err_ret->text != NULL) {
Guido van Rossumec498271995-01-20 16:59:12 +0000171 if (len > 0)
172 strncpy(err_ret->text, tok->buf, len);
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000173 err_ret->text[len] = '\0';
174 }
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000175 }
176 }
Guido van Rossumbd0389d1994-08-29 12:25:45 +0000177
178 tok_free(tok);
179
180 return n;
Guido van Rossum85a5fbb1990-10-14 12:07:46 +0000181}