Guido van Rossum | f70e43a | 1991-02-19 12:39:46 +0000 | [diff] [blame] | 1 | /*********************************************************** |
Guido van Rossum | b9f8d6e | 1995-01-04 19:08:09 +0000 | [diff] [blame] | 2 | Copyright 1991-1995 by Stichting Mathematisch Centrum, Amsterdam, |
| 3 | The Netherlands. |
Guido van Rossum | f70e43a | 1991-02-19 12:39:46 +0000 | [diff] [blame] | 4 | |
| 5 | All Rights Reserved |
| 6 | |
| 7 | Permission to use, copy, modify, and distribute this software and its |
| 8 | documentation for any purpose and without fee is hereby granted, |
| 9 | provided that the above copyright notice appear in all copies and that |
| 10 | both that copyright notice and this permission notice appear in |
| 11 | supporting documentation, and that the names of Stichting Mathematisch |
| 12 | Centrum or CWI not be used in advertising or publicity pertaining to |
| 13 | distribution of the software without specific, written prior permission. |
| 14 | |
| 15 | STICHTING MATHEMATISCH CENTRUM DISCLAIMS ALL WARRANTIES WITH REGARD TO |
| 16 | THIS SOFTWARE, INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND |
| 17 | FITNESS, IN NO EVENT SHALL STICHTING MATHEMATISCH CENTRUM BE LIABLE |
| 18 | FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES |
| 19 | WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN |
| 20 | ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT |
| 21 | OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. |
| 22 | |
| 23 | ******************************************************************/ |
| 24 | |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 25 | /* Parser-tokenizer link implementation */ |
| 26 | |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 27 | #include "pgenheaders.h" |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 28 | #include "tokenizer.h" |
| 29 | #include "node.h" |
| 30 | #include "grammar.h" |
| 31 | #include "parser.h" |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 32 | #include "parsetok.h" |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 33 | #include "errcode.h" |
| 34 | |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 35 | |
| 36 | /* Forward */ |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 37 | static node *parsetok PROTO((struct tok_state *, grammar *, int, |
| 38 | perrdetail *)); |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 39 | |
| 40 | /* Parse input coming from a string. Return error code, print some errors. */ |
| 41 | |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 42 | node * |
| 43 | parsestring(s, g, start, err_ret) |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 44 | char *s; |
| 45 | grammar *g; |
| 46 | int start; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 47 | perrdetail *err_ret; |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 48 | { |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 49 | struct tok_state *tok; |
| 50 | |
| 51 | err_ret->error = E_OK; |
| 52 | err_ret->filename = NULL; |
| 53 | err_ret->lineno = 0; |
| 54 | err_ret->offset = 0; |
| 55 | err_ret->text = NULL; |
| 56 | |
| 57 | if ((tok = tok_setups(s)) == NULL) { |
| 58 | err_ret->error = E_NOMEM; |
| 59 | return NULL; |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 60 | } |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 61 | |
| 62 | return parsetok(tok, g, start, err_ret); |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 63 | } |
| 64 | |
| 65 | |
| 66 | /* Parse input coming from a file. Return error code, print some errors. */ |
| 67 | |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 68 | node * |
| 69 | parsefile(fp, filename, g, start, ps1, ps2, err_ret) |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 70 | FILE *fp; |
| 71 | char *filename; |
| 72 | grammar *g; |
| 73 | int start; |
| 74 | char *ps1, *ps2; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 75 | perrdetail *err_ret; |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 76 | { |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 77 | struct tok_state *tok; |
| 78 | |
| 79 | err_ret->error = E_OK; |
| 80 | err_ret->filename = filename; |
| 81 | err_ret->lineno = 0; |
| 82 | err_ret->offset = 0; |
| 83 | err_ret->text = NULL; |
| 84 | |
| 85 | if ((tok = tok_setupf(fp, ps1, ps2)) == NULL) { |
| 86 | err_ret->error = E_NOMEM; |
| 87 | return NULL; |
Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 88 | } |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 89 | |
Guido van Rossum | 91ece42 | 1992-03-25 22:32:00 +0000 | [diff] [blame] | 90 | #ifdef macintosh |
| 91 | { |
| 92 | int tabsize = guesstabsize(filename); |
| 93 | if (tabsize > 0) |
| 94 | tok->tabsize = tabsize; |
| 95 | } |
| 96 | #endif |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 97 | |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 98 | return parsetok(tok, g, start, err_ret); |
| 99 | } |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 100 | |
| 101 | /* Parse input coming from the given tokenizer structure. |
| 102 | Return error code. */ |
| 103 | |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 104 | static node * |
| 105 | parsetok(tok, g, start, err_ret) |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 106 | struct tok_state *tok; |
| 107 | grammar *g; |
| 108 | int start; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 109 | perrdetail *err_ret; |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 110 | { |
| 111 | parser_state *ps; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 112 | node *n; |
Guido van Rossum | d8b1d37 | 1992-03-04 16:40:44 +0000 | [diff] [blame] | 113 | int started = 0; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 114 | |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 115 | if ((ps = newparser(g, start)) == NULL) { |
| 116 | fprintf(stderr, "no mem for new parser\n"); |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 117 | err_ret->error = E_NOMEM; |
| 118 | return NULL; |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 119 | } |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 120 | |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 121 | for (;;) { |
| 122 | char *a, *b; |
| 123 | int type; |
| 124 | int len; |
| 125 | char *str; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 126 | |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 127 | type = tok_get(tok, &a, &b); |
| 128 | if (type == ERRORTOKEN) { |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 129 | err_ret->error = tok->done; |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 130 | break; |
| 131 | } |
Guido van Rossum | d8b1d37 | 1992-03-04 16:40:44 +0000 | [diff] [blame] | 132 | if (type == ENDMARKER && started) { |
| 133 | type = NEWLINE; /* Add an extra newline */ |
| 134 | started = 0; |
| 135 | } |
| 136 | else |
| 137 | started = 1; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 138 | len = b - a; /* XXX this may compute NULL - NULL */ |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 139 | str = NEW(char, len + 1); |
| 140 | if (str == NULL) { |
| 141 | fprintf(stderr, "no mem for next token\n"); |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 142 | err_ret->error = E_NOMEM; |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 143 | break; |
| 144 | } |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 145 | if (len > 0) |
| 146 | strncpy(str, a, len); |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 147 | str[len] = '\0'; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 148 | if ((err_ret->error = |
| 149 | addtoken(ps, (int)type, str, tok->lineno)) != E_OK) |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 150 | break; |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 151 | } |
| 152 | |
| 153 | if (err_ret->error == E_DONE) { |
| 154 | n = ps->p_tree; |
| 155 | ps->p_tree = NULL; |
| 156 | } |
| 157 | else |
| 158 | n = NULL; |
| 159 | |
| 160 | delparser(ps); |
| 161 | |
| 162 | if (n == NULL) { |
| 163 | if (tok->lineno <= 1 && tok->done == E_EOF) |
| 164 | err_ret->error = E_EOF; |
| 165 | err_ret->lineno = tok->lineno; |
| 166 | err_ret->offset = tok->cur - tok->buf; |
| 167 | if (tok->buf != NULL) { |
| 168 | int len = tok->inp - tok->buf; |
| 169 | err_ret->text = malloc(len + 1); |
| 170 | if (err_ret->text != NULL) { |
| 171 | strncpy(err_ret->text, tok->buf, len+1); |
| 172 | err_ret->text[len] = '\0'; |
| 173 | } |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 174 | } |
| 175 | } |
Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 176 | |
| 177 | tok_free(tok); |
| 178 | |
| 179 | return n; |
Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 180 | } |