| Guido van Rossum | f70e43a | 1991-02-19 12:39:46 +0000 | [diff] [blame] | 1 |  | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 2 | /* Parser-tokenizer link implementation */ | 
 | 3 |  | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 4 | #include "pgenheaders.h" | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 5 | #include "tokenizer.h" | 
 | 6 | #include "node.h" | 
 | 7 | #include "grammar.h" | 
 | 8 | #include "parser.h" | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 9 | #include "parsetok.h" | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 10 | #include "errcode.h" | 
 | 11 |  | 
| Guido van Rossum | 6135df6 | 1998-04-10 19:35:06 +0000 | [diff] [blame] | 12 | int Py_TabcheckFlag; | 
 | 13 |  | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 14 |  | 
 | 15 | /* Forward */ | 
| Tim Peters | dbd9ba6 | 2000-07-09 03:09:57 +0000 | [diff] [blame] | 16 | static node *parsetok(struct tok_state *, grammar *, int, perrdetail *); | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 17 |  | 
 | 18 | /* Parse input coming from a string.  Return error code, print some errors. */ | 
 | 19 |  | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 20 | node * | 
| Thomas Wouters | 23c9e00 | 2000-07-22 19:20:54 +0000 | [diff] [blame] | 21 | PyParser_ParseString(char *s, grammar *g, int start, perrdetail *err_ret) | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 22 | { | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 23 | 	struct tok_state *tok; | 
 | 24 |  | 
 | 25 | 	err_ret->error = E_OK; | 
 | 26 | 	err_ret->filename = NULL; | 
 | 27 | 	err_ret->lineno = 0; | 
 | 28 | 	err_ret->offset = 0; | 
 | 29 | 	err_ret->text = NULL; | 
| Barry Warsaw | 38aa14a | 2000-08-18 05:04:08 +0000 | [diff] [blame] | 30 | 	err_ret->token = -1; | 
 | 31 | 	err_ret->expected = -1; | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 32 |  | 
| Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 33 | 	if ((tok = PyTokenizer_FromString(s)) == NULL) { | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 34 | 		err_ret->error = E_NOMEM; | 
 | 35 | 		return NULL; | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 36 | 	} | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 37 |  | 
| Guido van Rossum | 89ce454 | 1998-12-21 18:32:40 +0000 | [diff] [blame] | 38 | 	if (Py_TabcheckFlag || Py_VerboseFlag) { | 
 | 39 | 		tok->filename = "<string>"; | 
 | 40 | 		tok->altwarning = (tok->filename != NULL); | 
 | 41 | 		if (Py_TabcheckFlag >= 2) | 
 | 42 | 			tok->alterror++; | 
 | 43 | 	} | 
 | 44 |  | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 45 | 	return parsetok(tok, g, start, err_ret); | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 46 | } | 
 | 47 |  | 
 | 48 |  | 
 | 49 | /* Parse input coming from a file.  Return error code, print some errors. */ | 
 | 50 |  | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 51 | node * | 
| Thomas Wouters | 23c9e00 | 2000-07-22 19:20:54 +0000 | [diff] [blame] | 52 | PyParser_ParseFile(FILE *fp, char *filename, grammar *g, int start, | 
 | 53 | 		   char *ps1, char *ps2, perrdetail *err_ret) | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 54 | { | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 55 | 	struct tok_state *tok; | 
 | 56 |  | 
 | 57 | 	err_ret->error = E_OK; | 
 | 58 | 	err_ret->filename = filename; | 
 | 59 | 	err_ret->lineno = 0; | 
 | 60 | 	err_ret->offset = 0; | 
 | 61 | 	err_ret->text = NULL; | 
 | 62 |  | 
| Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 63 | 	if ((tok = PyTokenizer_FromFile(fp, ps1, ps2)) == NULL) { | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 64 | 		err_ret->error = E_NOMEM; | 
 | 65 | 		return NULL; | 
| Guido van Rossum | 3f5da24 | 1990-12-20 15:06:42 +0000 | [diff] [blame] | 66 | 	} | 
| Guido van Rossum | 6135df6 | 1998-04-10 19:35:06 +0000 | [diff] [blame] | 67 | 	if (Py_TabcheckFlag || Py_VerboseFlag) { | 
 | 68 | 		tok->filename = filename; | 
 | 69 | 		tok->altwarning = (filename != NULL); | 
 | 70 | 		if (Py_TabcheckFlag >= 2) | 
 | 71 | 			tok->alterror++; | 
 | 72 | 	} | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 73 |  | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 74 |  | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 75 | 	return parsetok(tok, g, start, err_ret); | 
 | 76 | } | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 77 |  | 
 | 78 | /* Parse input coming from the given tokenizer structure. | 
 | 79 |    Return error code. */ | 
 | 80 |  | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 81 | static node * | 
| Thomas Wouters | 23c9e00 | 2000-07-22 19:20:54 +0000 | [diff] [blame] | 82 | parsetok(struct tok_state *tok, grammar *g, int start, perrdetail *err_ret) | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 83 | { | 
 | 84 | 	parser_state *ps; | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 85 | 	node *n; | 
| Guido van Rossum | d8b1d37 | 1992-03-04 16:40:44 +0000 | [diff] [blame] | 86 | 	int started = 0; | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 87 |  | 
| Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 88 | 	if ((ps = PyParser_New(g, start)) == NULL) { | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 89 | 		fprintf(stderr, "no mem for new parser\n"); | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 90 | 		err_ret->error = E_NOMEM; | 
 | 91 | 		return NULL; | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 92 | 	} | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 93 |  | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 94 | 	for (;;) { | 
 | 95 | 		char *a, *b; | 
 | 96 | 		int type; | 
| Guido van Rossum | 6da3434 | 2000-06-28 22:00:02 +0000 | [diff] [blame] | 97 | 		size_t len; | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 98 | 		char *str; | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 99 |  | 
| Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 100 | 		type = PyTokenizer_Get(tok, &a, &b); | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 101 | 		if (type == ERRORTOKEN) { | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 102 | 			err_ret->error = tok->done; | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 103 | 			break; | 
 | 104 | 		} | 
| Guido van Rossum | d8b1d37 | 1992-03-04 16:40:44 +0000 | [diff] [blame] | 105 | 		if (type == ENDMARKER && started) { | 
 | 106 | 			type = NEWLINE; /* Add an extra newline */ | 
 | 107 | 			started = 0; | 
 | 108 | 		} | 
 | 109 | 		else | 
 | 110 | 			started = 1; | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 111 | 		len = b - a; /* XXX this may compute NULL - NULL */ | 
| Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 112 | 		str = PyMem_NEW(char, len + 1); | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 113 | 		if (str == NULL) { | 
 | 114 | 			fprintf(stderr, "no mem for next token\n"); | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 115 | 			err_ret->error = E_NOMEM; | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 116 | 			break; | 
 | 117 | 		} | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 118 | 		if (len > 0) | 
 | 119 | 			strncpy(str, a, len); | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 120 | 		str[len] = '\0'; | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 121 | 		if ((err_ret->error = | 
| Fred Drake | 85f3639 | 2000-07-11 17:53:00 +0000 | [diff] [blame] | 122 | 		     PyParser_AddToken(ps, (int)type, str, tok->lineno, | 
 | 123 | 				       &(err_ret->expected))) != E_OK) { | 
| Guido van Rossum | ff0ec52 | 1997-07-27 01:52:50 +0000 | [diff] [blame] | 124 | 			if (err_ret->error != E_DONE) | 
 | 125 | 				PyMem_DEL(str); | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 126 | 			break; | 
| Guido van Rossum | ff0ec52 | 1997-07-27 01:52:50 +0000 | [diff] [blame] | 127 | 		} | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 128 | 	} | 
 | 129 |  | 
 | 130 | 	if (err_ret->error == E_DONE) { | 
 | 131 | 		n = ps->p_tree; | 
 | 132 | 		ps->p_tree = NULL; | 
 | 133 | 	} | 
 | 134 | 	else | 
 | 135 | 		n = NULL; | 
 | 136 |  | 
| Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 137 | 	PyParser_Delete(ps); | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 138 |  | 
 | 139 | 	if (n == NULL) { | 
 | 140 | 		if (tok->lineno <= 1 && tok->done == E_EOF) | 
 | 141 | 			err_ret->error = E_EOF; | 
 | 142 | 		err_ret->lineno = tok->lineno; | 
 | 143 | 		err_ret->offset = tok->cur - tok->buf; | 
 | 144 | 		if (tok->buf != NULL) { | 
| Guido van Rossum | 6da3434 | 2000-06-28 22:00:02 +0000 | [diff] [blame] | 145 | 			size_t len = tok->inp - tok->buf; | 
| Guido van Rossum | b18618d | 2000-05-03 23:44:39 +0000 | [diff] [blame] | 146 | 			err_ret->text = PyMem_NEW(char, len + 1); | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 147 | 			if (err_ret->text != NULL) { | 
| Guido van Rossum | ec49827 | 1995-01-20 16:59:12 +0000 | [diff] [blame] | 148 | 				if (len > 0) | 
 | 149 | 					strncpy(err_ret->text, tok->buf, len); | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 150 | 				err_ret->text[len] = '\0'; | 
 | 151 | 			} | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 152 | 		} | 
 | 153 | 	} | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 154 |  | 
| Guido van Rossum | 86bea46 | 1997-04-29 21:03:06 +0000 | [diff] [blame] | 155 | 	PyTokenizer_Free(tok); | 
| Guido van Rossum | bd0389d | 1994-08-29 12:25:45 +0000 | [diff] [blame] | 156 |  | 
 | 157 | 	return n; | 
| Guido van Rossum | 85a5fbb | 1990-10-14 12:07:46 +0000 | [diff] [blame] | 158 | } |