/*
 * This file exposes the _PyAST_Validate() interface to check the integrity
 * of the given abstract syntax tree (potentially constructed manually).
 */
| 5 | #include "Python.h" |
Victor Stinner | 94faa07 | 2021-03-23 20:47:40 +0100 | [diff] [blame] | 6 | #include "pycore_ast.h" // asdl_stmt_seq |
Jeremy Hylton | 3e0055f | 2005-10-20 19:59:25 +0000 | [diff] [blame] | 7 | |
| 8 | #include <assert.h> |
Serhiy Storchaka | 58159ef | 2019-01-12 09:46:50 +0200 | [diff] [blame] | 9 | |
/* Forward declarations: these validators are called before their
 * definitions appear further down in this file. */
static int validate_stmts(asdl_stmt_seq *);
static int validate_exprs(asdl_expr_seq*, expr_context_ty, int);
static int _validate_nonempty_seq(asdl_seq *, const char *, const char *);
static int validate_stmt(stmt_ty);
static int validate_expr(expr_ty, expr_context_ty);
| 15 | |
| 16 | static int |
Batuhan Taskaya | 68874a8 | 2020-06-06 15:44:16 +0300 | [diff] [blame] | 17 | validate_name(PyObject *name) |
| 18 | { |
| 19 | assert(PyUnicode_Check(name)); |
| 20 | static const char * const forbidden[] = { |
| 21 | "None", |
| 22 | "True", |
| 23 | "False", |
| 24 | NULL |
| 25 | }; |
| 26 | for (int i = 0; forbidden[i] != NULL; i++) { |
| 27 | if (_PyUnicode_EqualToASCIIString(name, forbidden[i])) { |
| 28 | PyErr_Format(PyExc_ValueError, "Name node can't be used with '%s' constant", forbidden[i]); |
| 29 | return 0; |
| 30 | } |
| 31 | } |
| 32 | return 1; |
| 33 | } |
| 34 | |
| 35 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 36 | validate_comprehension(asdl_comprehension_seq *gens) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 37 | { |
Victor Stinner | 4d73ae7 | 2018-11-22 14:45:16 +0100 | [diff] [blame] | 38 | Py_ssize_t i; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 39 | if (!asdl_seq_LEN(gens)) { |
| 40 | PyErr_SetString(PyExc_ValueError, "comprehension with no generators"); |
| 41 | return 0; |
| 42 | } |
| 43 | for (i = 0; i < asdl_seq_LEN(gens); i++) { |
| 44 | comprehension_ty comp = asdl_seq_GET(gens, i); |
| 45 | if (!validate_expr(comp->target, Store) || |
| 46 | !validate_expr(comp->iter, Load) || |
| 47 | !validate_exprs(comp->ifs, Load, 0)) |
| 48 | return 0; |
| 49 | } |
| 50 | return 1; |
| 51 | } |
| 52 | |
| 53 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 54 | validate_keywords(asdl_keyword_seq *keywords) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 55 | { |
Victor Stinner | 4d73ae7 | 2018-11-22 14:45:16 +0100 | [diff] [blame] | 56 | Py_ssize_t i; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 57 | for (i = 0; i < asdl_seq_LEN(keywords); i++) |
Batuhan Taskaya | 02a1603 | 2020-10-10 20:14:59 +0300 | [diff] [blame] | 58 | if (!validate_expr((asdl_seq_GET(keywords, i))->value, Load)) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 59 | return 0; |
| 60 | return 1; |
| 61 | } |
| 62 | |
| 63 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 64 | validate_args(asdl_arg_seq *args) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 65 | { |
Victor Stinner | 4d73ae7 | 2018-11-22 14:45:16 +0100 | [diff] [blame] | 66 | Py_ssize_t i; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 67 | for (i = 0; i < asdl_seq_LEN(args); i++) { |
| 68 | arg_ty arg = asdl_seq_GET(args, i); |
| 69 | if (arg->annotation && !validate_expr(arg->annotation, Load)) |
| 70 | return 0; |
| 71 | } |
| 72 | return 1; |
| 73 | } |
| 74 | |
| 75 | static const char * |
| 76 | expr_context_name(expr_context_ty ctx) |
| 77 | { |
| 78 | switch (ctx) { |
| 79 | case Load: |
| 80 | return "Load"; |
| 81 | case Store: |
| 82 | return "Store"; |
| 83 | case Del: |
| 84 | return "Del"; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 85 | default: |
Barry Warsaw | b2e5794 | 2017-09-14 18:13:16 -0700 | [diff] [blame] | 86 | Py_UNREACHABLE(); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 87 | } |
| 88 | } |
| 89 | |
| 90 | static int |
| 91 | validate_arguments(arguments_ty args) |
| 92 | { |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 93 | if (!validate_args(args->posonlyargs) || !validate_args(args->args)) { |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 94 | return 0; |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 95 | } |
Benjamin Peterson | cda75be | 2013-03-18 10:48:58 -0700 | [diff] [blame] | 96 | if (args->vararg && args->vararg->annotation |
| 97 | && !validate_expr(args->vararg->annotation, Load)) { |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 98 | return 0; |
| 99 | } |
| 100 | if (!validate_args(args->kwonlyargs)) |
| 101 | return 0; |
Victor Stinner | 0c39b1b | 2015-03-18 15:02:06 +0100 | [diff] [blame] | 102 | if (args->kwarg && args->kwarg->annotation |
Benjamin Peterson | cda75be | 2013-03-18 10:48:58 -0700 | [diff] [blame] | 103 | && !validate_expr(args->kwarg->annotation, Load)) { |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 104 | return 0; |
| 105 | } |
Pablo Galindo | 2f58a84 | 2019-05-31 14:09:49 +0100 | [diff] [blame] | 106 | if (asdl_seq_LEN(args->defaults) > asdl_seq_LEN(args->posonlyargs) + asdl_seq_LEN(args->args)) { |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 107 | PyErr_SetString(PyExc_ValueError, "more positional defaults than args on arguments"); |
| 108 | return 0; |
| 109 | } |
| 110 | if (asdl_seq_LEN(args->kw_defaults) != asdl_seq_LEN(args->kwonlyargs)) { |
| 111 | PyErr_SetString(PyExc_ValueError, "length of kwonlyargs is not the same as " |
| 112 | "kw_defaults on arguments"); |
| 113 | return 0; |
| 114 | } |
| 115 | return validate_exprs(args->defaults, Load, 0) && validate_exprs(args->kw_defaults, Load, 1); |
| 116 | } |
| 117 | |
| 118 | static int |
Victor Stinner | f2c1aa1 | 2016-01-26 00:40:57 +0100 | [diff] [blame] | 119 | validate_constant(PyObject *value) |
| 120 | { |
| 121 | if (value == Py_None || value == Py_Ellipsis) |
| 122 | return 1; |
| 123 | |
| 124 | if (PyLong_CheckExact(value) |
| 125 | || PyFloat_CheckExact(value) |
| 126 | || PyComplex_CheckExact(value) |
| 127 | || PyBool_Check(value) |
| 128 | || PyUnicode_CheckExact(value) |
| 129 | || PyBytes_CheckExact(value)) |
| 130 | return 1; |
| 131 | |
| 132 | if (PyTuple_CheckExact(value) || PyFrozenSet_CheckExact(value)) { |
| 133 | PyObject *it; |
| 134 | |
| 135 | it = PyObject_GetIter(value); |
| 136 | if (it == NULL) |
| 137 | return 0; |
| 138 | |
| 139 | while (1) { |
| 140 | PyObject *item = PyIter_Next(it); |
| 141 | if (item == NULL) { |
| 142 | if (PyErr_Occurred()) { |
| 143 | Py_DECREF(it); |
| 144 | return 0; |
| 145 | } |
| 146 | break; |
| 147 | } |
| 148 | |
| 149 | if (!validate_constant(item)) { |
| 150 | Py_DECREF(it); |
Victor Stinner | 726f690 | 2016-01-27 00:11:47 +0100 | [diff] [blame] | 151 | Py_DECREF(item); |
Victor Stinner | f2c1aa1 | 2016-01-26 00:40:57 +0100 | [diff] [blame] | 152 | return 0; |
| 153 | } |
Victor Stinner | 726f690 | 2016-01-27 00:11:47 +0100 | [diff] [blame] | 154 | Py_DECREF(item); |
Victor Stinner | f2c1aa1 | 2016-01-26 00:40:57 +0100 | [diff] [blame] | 155 | } |
| 156 | |
| 157 | Py_DECREF(it); |
| 158 | return 1; |
| 159 | } |
| 160 | |
Batuhan TaÅŸkaya | 0ac59f9 | 2020-03-19 14:32:28 +0300 | [diff] [blame] | 161 | if (!PyErr_Occurred()) { |
| 162 | PyErr_Format(PyExc_TypeError, |
| 163 | "got an invalid type in Constant: %s", |
| 164 | _PyType_Name(Py_TYPE(value))); |
| 165 | } |
Victor Stinner | f2c1aa1 | 2016-01-26 00:40:57 +0100 | [diff] [blame] | 166 | return 0; |
| 167 | } |
| 168 | |
| 169 | static int |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 170 | validate_expr(expr_ty exp, expr_context_ty ctx) |
| 171 | { |
| 172 | int check_ctx = 1; |
| 173 | expr_context_ty actual_ctx; |
| 174 | |
| 175 | /* First check expression context. */ |
| 176 | switch (exp->kind) { |
| 177 | case Attribute_kind: |
| 178 | actual_ctx = exp->v.Attribute.ctx; |
| 179 | break; |
| 180 | case Subscript_kind: |
| 181 | actual_ctx = exp->v.Subscript.ctx; |
| 182 | break; |
| 183 | case Starred_kind: |
| 184 | actual_ctx = exp->v.Starred.ctx; |
| 185 | break; |
| 186 | case Name_kind: |
Batuhan Taskaya | 68874a8 | 2020-06-06 15:44:16 +0300 | [diff] [blame] | 187 | if (!validate_name(exp->v.Name.id)) { |
| 188 | return 0; |
| 189 | } |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 190 | actual_ctx = exp->v.Name.ctx; |
| 191 | break; |
| 192 | case List_kind: |
| 193 | actual_ctx = exp->v.List.ctx; |
| 194 | break; |
| 195 | case Tuple_kind: |
| 196 | actual_ctx = exp->v.Tuple.ctx; |
| 197 | break; |
| 198 | default: |
| 199 | if (ctx != Load) { |
| 200 | PyErr_Format(PyExc_ValueError, "expression which can't be " |
| 201 | "assigned to in %s context", expr_context_name(ctx)); |
| 202 | return 0; |
| 203 | } |
| 204 | check_ctx = 0; |
Victor Stinner | 0c39b1b | 2015-03-18 15:02:06 +0100 | [diff] [blame] | 205 | /* set actual_ctx to prevent gcc warning */ |
| 206 | actual_ctx = 0; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 207 | } |
| 208 | if (check_ctx && actual_ctx != ctx) { |
| 209 | PyErr_Format(PyExc_ValueError, "expression must have %s context but has %s instead", |
| 210 | expr_context_name(ctx), expr_context_name(actual_ctx)); |
| 211 | return 0; |
| 212 | } |
| 213 | |
| 214 | /* Now validate expression. */ |
| 215 | switch (exp->kind) { |
| 216 | case BoolOp_kind: |
| 217 | if (asdl_seq_LEN(exp->v.BoolOp.values) < 2) { |
| 218 | PyErr_SetString(PyExc_ValueError, "BoolOp with less than 2 values"); |
| 219 | return 0; |
| 220 | } |
| 221 | return validate_exprs(exp->v.BoolOp.values, Load, 0); |
| 222 | case BinOp_kind: |
| 223 | return validate_expr(exp->v.BinOp.left, Load) && |
| 224 | validate_expr(exp->v.BinOp.right, Load); |
| 225 | case UnaryOp_kind: |
| 226 | return validate_expr(exp->v.UnaryOp.operand, Load); |
| 227 | case Lambda_kind: |
| 228 | return validate_arguments(exp->v.Lambda.args) && |
| 229 | validate_expr(exp->v.Lambda.body, Load); |
| 230 | case IfExp_kind: |
| 231 | return validate_expr(exp->v.IfExp.test, Load) && |
| 232 | validate_expr(exp->v.IfExp.body, Load) && |
| 233 | validate_expr(exp->v.IfExp.orelse, Load); |
| 234 | case Dict_kind: |
| 235 | if (asdl_seq_LEN(exp->v.Dict.keys) != asdl_seq_LEN(exp->v.Dict.values)) { |
| 236 | PyErr_SetString(PyExc_ValueError, |
| 237 | "Dict doesn't have the same number of keys as values"); |
| 238 | return 0; |
| 239 | } |
Yury Selivanov | b3d5313 | 2015-09-01 16:10:49 -0400 | [diff] [blame] | 240 | /* null_ok=1 for keys expressions to allow dict unpacking to work in |
| 241 | dict literals, i.e. ``{**{a:b}}`` */ |
| 242 | return validate_exprs(exp->v.Dict.keys, Load, /*null_ok=*/ 1) && |
| 243 | validate_exprs(exp->v.Dict.values, Load, /*null_ok=*/ 0); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 244 | case Set_kind: |
| 245 | return validate_exprs(exp->v.Set.elts, Load, 0); |
| 246 | #define COMP(NAME) \ |
| 247 | case NAME ## _kind: \ |
| 248 | return validate_comprehension(exp->v.NAME.generators) && \ |
| 249 | validate_expr(exp->v.NAME.elt, Load); |
| 250 | COMP(ListComp) |
| 251 | COMP(SetComp) |
| 252 | COMP(GeneratorExp) |
| 253 | #undef COMP |
| 254 | case DictComp_kind: |
| 255 | return validate_comprehension(exp->v.DictComp.generators) && |
| 256 | validate_expr(exp->v.DictComp.key, Load) && |
| 257 | validate_expr(exp->v.DictComp.value, Load); |
| 258 | case Yield_kind: |
| 259 | return !exp->v.Yield.value || validate_expr(exp->v.Yield.value, Load); |
Benjamin Peterson | 527c622 | 2012-01-14 08:58:23 -0500 | [diff] [blame] | 260 | case YieldFrom_kind: |
Mark Dickinson | ded35ae | 2012-11-25 14:36:26 +0000 | [diff] [blame] | 261 | return validate_expr(exp->v.YieldFrom.value, Load); |
Yury Selivanov | 7544508 | 2015-05-11 22:57:16 -0400 | [diff] [blame] | 262 | case Await_kind: |
| 263 | return validate_expr(exp->v.Await.value, Load); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 264 | case Compare_kind: |
| 265 | if (!asdl_seq_LEN(exp->v.Compare.comparators)) { |
| 266 | PyErr_SetString(PyExc_ValueError, "Compare with no comparators"); |
| 267 | return 0; |
| 268 | } |
| 269 | if (asdl_seq_LEN(exp->v.Compare.comparators) != |
| 270 | asdl_seq_LEN(exp->v.Compare.ops)) { |
| 271 | PyErr_SetString(PyExc_ValueError, "Compare has a different number " |
| 272 | "of comparators and operands"); |
| 273 | return 0; |
| 274 | } |
| 275 | return validate_exprs(exp->v.Compare.comparators, Load, 0) && |
| 276 | validate_expr(exp->v.Compare.left, Load); |
| 277 | case Call_kind: |
| 278 | return validate_expr(exp->v.Call.func, Load) && |
| 279 | validate_exprs(exp->v.Call.args, Load, 0) && |
Benjamin Peterson | 025e9eb | 2015-05-05 20:16:41 -0400 | [diff] [blame] | 280 | validate_keywords(exp->v.Call.keywords); |
Victor Stinner | f2c1aa1 | 2016-01-26 00:40:57 +0100 | [diff] [blame] | 281 | case Constant_kind: |
| 282 | if (!validate_constant(exp->v.Constant.value)) { |
Victor Stinner | f2c1aa1 | 2016-01-26 00:40:57 +0100 | [diff] [blame] | 283 | return 0; |
| 284 | } |
| 285 | return 1; |
Eric V. Smith | 235a6f0 | 2015-09-19 14:51:32 -0400 | [diff] [blame] | 286 | case JoinedStr_kind: |
| 287 | return validate_exprs(exp->v.JoinedStr.values, Load, 0); |
| 288 | case FormattedValue_kind: |
| 289 | if (validate_expr(exp->v.FormattedValue.value, Load) == 0) |
| 290 | return 0; |
| 291 | if (exp->v.FormattedValue.format_spec) |
| 292 | return validate_expr(exp->v.FormattedValue.format_spec, Load); |
| 293 | return 1; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 294 | case Attribute_kind: |
| 295 | return validate_expr(exp->v.Attribute.value, Load); |
| 296 | case Subscript_kind: |
Serhiy Storchaka | 13d52c2 | 2020-03-10 18:52:34 +0200 | [diff] [blame] | 297 | return validate_expr(exp->v.Subscript.slice, Load) && |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 298 | validate_expr(exp->v.Subscript.value, Load); |
| 299 | case Starred_kind: |
| 300 | return validate_expr(exp->v.Starred.value, ctx); |
Serhiy Storchaka | 13d52c2 | 2020-03-10 18:52:34 +0200 | [diff] [blame] | 301 | case Slice_kind: |
| 302 | return (!exp->v.Slice.lower || validate_expr(exp->v.Slice.lower, Load)) && |
| 303 | (!exp->v.Slice.upper || validate_expr(exp->v.Slice.upper, Load)) && |
| 304 | (!exp->v.Slice.step || validate_expr(exp->v.Slice.step, Load)); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 305 | case List_kind: |
| 306 | return validate_exprs(exp->v.List.elts, ctx, 0); |
| 307 | case Tuple_kind: |
| 308 | return validate_exprs(exp->v.Tuple.elts, ctx, 0); |
Pablo Galindo | 0c9258a | 2019-03-18 13:51:53 +0000 | [diff] [blame] | 309 | case NamedExpr_kind: |
| 310 | return validate_expr(exp->v.NamedExpr.value, Load); |
Brandt Bucher | 145bf26 | 2021-02-26 14:51:55 -0800 | [diff] [blame] | 311 | case MatchAs_kind: |
| 312 | PyErr_SetString(PyExc_ValueError, |
| 313 | "MatchAs is only valid in match_case patterns"); |
| 314 | return 0; |
| 315 | case MatchOr_kind: |
| 316 | PyErr_SetString(PyExc_ValueError, |
| 317 | "MatchOr is only valid in match_case patterns"); |
| 318 | return 0; |
Serhiy Storchaka | 3f22811 | 2018-09-27 17:42:37 +0300 | [diff] [blame] | 319 | /* This last case doesn't have any checking. */ |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 320 | case Name_kind: |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 321 | return 1; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 322 | } |
Pablo Galindo | 0c9258a | 2019-03-18 13:51:53 +0000 | [diff] [blame] | 323 | PyErr_SetString(PyExc_SystemError, "unexpected expression"); |
| 324 | return 0; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 325 | } |
| 326 | |
| 327 | static int |
Brandt Bucher | 145bf26 | 2021-02-26 14:51:55 -0800 | [diff] [blame] | 328 | validate_pattern(expr_ty p) |
| 329 | { |
| 330 | // Coming soon (thanks Batuhan)! |
| 331 | return 1; |
| 332 | } |
| 333 | |
| 334 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 335 | _validate_nonempty_seq(asdl_seq *seq, const char *what, const char *owner) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 336 | { |
| 337 | if (asdl_seq_LEN(seq)) |
| 338 | return 1; |
| 339 | PyErr_Format(PyExc_ValueError, "empty %s on %s", what, owner); |
| 340 | return 0; |
| 341 | } |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 342 | #define validate_nonempty_seq(seq, what, owner) _validate_nonempty_seq((asdl_seq*)seq, what, owner) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 343 | |
| 344 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 345 | validate_assignlist(asdl_expr_seq *targets, expr_context_ty ctx) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 346 | { |
| 347 | return validate_nonempty_seq(targets, "targets", ctx == Del ? "Delete" : "Assign") && |
| 348 | validate_exprs(targets, ctx, 0); |
| 349 | } |
| 350 | |
| 351 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 352 | validate_body(asdl_stmt_seq *body, const char *owner) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 353 | { |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 354 | return validate_nonempty_seq(body, "body", owner) && validate_stmts(body); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 355 | } |
| 356 | |
| 357 | static int |
| 358 | validate_stmt(stmt_ty stmt) |
| 359 | { |
Victor Stinner | 4d73ae7 | 2018-11-22 14:45:16 +0100 | [diff] [blame] | 360 | Py_ssize_t i; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 361 | switch (stmt->kind) { |
| 362 | case FunctionDef_kind: |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 363 | return validate_body(stmt->v.FunctionDef.body, "FunctionDef") && |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 364 | validate_arguments(stmt->v.FunctionDef.args) && |
| 365 | validate_exprs(stmt->v.FunctionDef.decorator_list, Load, 0) && |
| 366 | (!stmt->v.FunctionDef.returns || |
| 367 | validate_expr(stmt->v.FunctionDef.returns, Load)); |
| 368 | case ClassDef_kind: |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 369 | return validate_body(stmt->v.ClassDef.body, "ClassDef") && |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 370 | validate_exprs(stmt->v.ClassDef.bases, Load, 0) && |
| 371 | validate_keywords(stmt->v.ClassDef.keywords) && |
Benjamin Peterson | 025e9eb | 2015-05-05 20:16:41 -0400 | [diff] [blame] | 372 | validate_exprs(stmt->v.ClassDef.decorator_list, Load, 0); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 373 | case Return_kind: |
| 374 | return !stmt->v.Return.value || validate_expr(stmt->v.Return.value, Load); |
| 375 | case Delete_kind: |
| 376 | return validate_assignlist(stmt->v.Delete.targets, Del); |
| 377 | case Assign_kind: |
| 378 | return validate_assignlist(stmt->v.Assign.targets, Store) && |
| 379 | validate_expr(stmt->v.Assign.value, Load); |
| 380 | case AugAssign_kind: |
| 381 | return validate_expr(stmt->v.AugAssign.target, Store) && |
| 382 | validate_expr(stmt->v.AugAssign.value, Load); |
Yury Selivanov | f8cb8a1 | 2016-09-08 20:50:03 -0700 | [diff] [blame] | 383 | case AnnAssign_kind: |
| 384 | if (stmt->v.AnnAssign.target->kind != Name_kind && |
| 385 | stmt->v.AnnAssign.simple) { |
| 386 | PyErr_SetString(PyExc_TypeError, |
| 387 | "AnnAssign with simple non-Name target"); |
| 388 | return 0; |
| 389 | } |
| 390 | return validate_expr(stmt->v.AnnAssign.target, Store) && |
| 391 | (!stmt->v.AnnAssign.value || |
| 392 | validate_expr(stmt->v.AnnAssign.value, Load)) && |
| 393 | validate_expr(stmt->v.AnnAssign.annotation, Load); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 394 | case For_kind: |
| 395 | return validate_expr(stmt->v.For.target, Store) && |
| 396 | validate_expr(stmt->v.For.iter, Load) && |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 397 | validate_body(stmt->v.For.body, "For") && |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 398 | validate_stmts(stmt->v.For.orelse); |
Yury Selivanov | 7544508 | 2015-05-11 22:57:16 -0400 | [diff] [blame] | 399 | case AsyncFor_kind: |
| 400 | return validate_expr(stmt->v.AsyncFor.target, Store) && |
| 401 | validate_expr(stmt->v.AsyncFor.iter, Load) && |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 402 | validate_body(stmt->v.AsyncFor.body, "AsyncFor") && |
Yury Selivanov | 7544508 | 2015-05-11 22:57:16 -0400 | [diff] [blame] | 403 | validate_stmts(stmt->v.AsyncFor.orelse); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 404 | case While_kind: |
| 405 | return validate_expr(stmt->v.While.test, Load) && |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 406 | validate_body(stmt->v.While.body, "While") && |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 407 | validate_stmts(stmt->v.While.orelse); |
| 408 | case If_kind: |
| 409 | return validate_expr(stmt->v.If.test, Load) && |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 410 | validate_body(stmt->v.If.body, "If") && |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 411 | validate_stmts(stmt->v.If.orelse); |
| 412 | case With_kind: |
| 413 | if (!validate_nonempty_seq(stmt->v.With.items, "items", "With")) |
| 414 | return 0; |
| 415 | for (i = 0; i < asdl_seq_LEN(stmt->v.With.items); i++) { |
| 416 | withitem_ty item = asdl_seq_GET(stmt->v.With.items, i); |
| 417 | if (!validate_expr(item->context_expr, Load) || |
| 418 | (item->optional_vars && !validate_expr(item->optional_vars, Store))) |
| 419 | return 0; |
| 420 | } |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 421 | return validate_body(stmt->v.With.body, "With"); |
Yury Selivanov | 7544508 | 2015-05-11 22:57:16 -0400 | [diff] [blame] | 422 | case AsyncWith_kind: |
| 423 | if (!validate_nonempty_seq(stmt->v.AsyncWith.items, "items", "AsyncWith")) |
| 424 | return 0; |
| 425 | for (i = 0; i < asdl_seq_LEN(stmt->v.AsyncWith.items); i++) { |
| 426 | withitem_ty item = asdl_seq_GET(stmt->v.AsyncWith.items, i); |
| 427 | if (!validate_expr(item->context_expr, Load) || |
| 428 | (item->optional_vars && !validate_expr(item->optional_vars, Store))) |
| 429 | return 0; |
| 430 | } |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 431 | return validate_body(stmt->v.AsyncWith.body, "AsyncWith"); |
Brandt Bucher | 145bf26 | 2021-02-26 14:51:55 -0800 | [diff] [blame] | 432 | case Match_kind: |
| 433 | if (!validate_expr(stmt->v.Match.subject, Load) |
| 434 | || !validate_nonempty_seq(stmt->v.Match.cases, "cases", "Match")) { |
| 435 | return 0; |
| 436 | } |
| 437 | for (i = 0; i < asdl_seq_LEN(stmt->v.Match.cases); i++) { |
| 438 | match_case_ty m = asdl_seq_GET(stmt->v.Match.cases, i); |
| 439 | if (!validate_pattern(m->pattern) |
| 440 | || (m->guard && !validate_expr(m->guard, Load)) |
| 441 | || !validate_body(m->body, "match_case")) { |
| 442 | return 0; |
| 443 | } |
| 444 | } |
| 445 | return 1; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 446 | case Raise_kind: |
| 447 | if (stmt->v.Raise.exc) { |
| 448 | return validate_expr(stmt->v.Raise.exc, Load) && |
| 449 | (!stmt->v.Raise.cause || validate_expr(stmt->v.Raise.cause, Load)); |
| 450 | } |
| 451 | if (stmt->v.Raise.cause) { |
| 452 | PyErr_SetString(PyExc_ValueError, "Raise with cause but no exception"); |
| 453 | return 0; |
| 454 | } |
| 455 | return 1; |
| 456 | case Try_kind: |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 457 | if (!validate_body(stmt->v.Try.body, "Try")) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 458 | return 0; |
| 459 | if (!asdl_seq_LEN(stmt->v.Try.handlers) && |
| 460 | !asdl_seq_LEN(stmt->v.Try.finalbody)) { |
| 461 | PyErr_SetString(PyExc_ValueError, "Try has neither except handlers nor finalbody"); |
| 462 | return 0; |
| 463 | } |
| 464 | if (!asdl_seq_LEN(stmt->v.Try.handlers) && |
| 465 | asdl_seq_LEN(stmt->v.Try.orelse)) { |
| 466 | PyErr_SetString(PyExc_ValueError, "Try has orelse but no except handlers"); |
| 467 | return 0; |
| 468 | } |
| 469 | for (i = 0; i < asdl_seq_LEN(stmt->v.Try.handlers); i++) { |
| 470 | excepthandler_ty handler = asdl_seq_GET(stmt->v.Try.handlers, i); |
| 471 | if ((handler->v.ExceptHandler.type && |
| 472 | !validate_expr(handler->v.ExceptHandler.type, Load)) || |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 473 | !validate_body(handler->v.ExceptHandler.body, "ExceptHandler")) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 474 | return 0; |
| 475 | } |
| 476 | return (!asdl_seq_LEN(stmt->v.Try.finalbody) || |
| 477 | validate_stmts(stmt->v.Try.finalbody)) && |
| 478 | (!asdl_seq_LEN(stmt->v.Try.orelse) || |
| 479 | validate_stmts(stmt->v.Try.orelse)); |
| 480 | case Assert_kind: |
| 481 | return validate_expr(stmt->v.Assert.test, Load) && |
| 482 | (!stmt->v.Assert.msg || validate_expr(stmt->v.Assert.msg, Load)); |
| 483 | case Import_kind: |
| 484 | return validate_nonempty_seq(stmt->v.Import.names, "names", "Import"); |
| 485 | case ImportFrom_kind: |
Serhiy Storchaka | fbd1523 | 2016-06-27 21:39:12 +0300 | [diff] [blame] | 486 | if (stmt->v.ImportFrom.level < 0) { |
| 487 | PyErr_SetString(PyExc_ValueError, "Negative ImportFrom level"); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 488 | return 0; |
| 489 | } |
| 490 | return validate_nonempty_seq(stmt->v.ImportFrom.names, "names", "ImportFrom"); |
| 491 | case Global_kind: |
| 492 | return validate_nonempty_seq(stmt->v.Global.names, "names", "Global"); |
| 493 | case Nonlocal_kind: |
| 494 | return validate_nonempty_seq(stmt->v.Nonlocal.names, "names", "Nonlocal"); |
| 495 | case Expr_kind: |
| 496 | return validate_expr(stmt->v.Expr.value, Load); |
Yury Selivanov | 7544508 | 2015-05-11 22:57:16 -0400 | [diff] [blame] | 497 | case AsyncFunctionDef_kind: |
Serhiy Storchaka | 73cbe7a | 2018-05-29 12:04:55 +0300 | [diff] [blame] | 498 | return validate_body(stmt->v.AsyncFunctionDef.body, "AsyncFunctionDef") && |
Yury Selivanov | 7544508 | 2015-05-11 22:57:16 -0400 | [diff] [blame] | 499 | validate_arguments(stmt->v.AsyncFunctionDef.args) && |
| 500 | validate_exprs(stmt->v.AsyncFunctionDef.decorator_list, Load, 0) && |
| 501 | (!stmt->v.AsyncFunctionDef.returns || |
| 502 | validate_expr(stmt->v.AsyncFunctionDef.returns, Load)); |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 503 | case Pass_kind: |
| 504 | case Break_kind: |
| 505 | case Continue_kind: |
| 506 | return 1; |
| 507 | default: |
| 508 | PyErr_SetString(PyExc_SystemError, "unexpected statement"); |
| 509 | return 0; |
| 510 | } |
| 511 | } |
| 512 | |
| 513 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 514 | validate_stmts(asdl_stmt_seq *seq) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 515 | { |
Victor Stinner | 4d73ae7 | 2018-11-22 14:45:16 +0100 | [diff] [blame] | 516 | Py_ssize_t i; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 517 | for (i = 0; i < asdl_seq_LEN(seq); i++) { |
| 518 | stmt_ty stmt = asdl_seq_GET(seq, i); |
| 519 | if (stmt) { |
| 520 | if (!validate_stmt(stmt)) |
| 521 | return 0; |
| 522 | } |
| 523 | else { |
| 524 | PyErr_SetString(PyExc_ValueError, |
| 525 | "None disallowed in statement list"); |
| 526 | return 0; |
| 527 | } |
| 528 | } |
| 529 | return 1; |
| 530 | } |
| 531 | |
| 532 | static int |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 533 | validate_exprs(asdl_expr_seq *exprs, expr_context_ty ctx, int null_ok) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 534 | { |
Victor Stinner | 4d73ae7 | 2018-11-22 14:45:16 +0100 | [diff] [blame] | 535 | Py_ssize_t i; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 536 | for (i = 0; i < asdl_seq_LEN(exprs); i++) { |
| 537 | expr_ty expr = asdl_seq_GET(exprs, i); |
| 538 | if (expr) { |
| 539 | if (!validate_expr(expr, ctx)) |
| 540 | return 0; |
| 541 | } |
| 542 | else if (!null_ok) { |
| 543 | PyErr_SetString(PyExc_ValueError, |
| 544 | "None disallowed in expression list"); |
| 545 | return 0; |
| 546 | } |
Victor Stinner | 0c39b1b | 2015-03-18 15:02:06 +0100 | [diff] [blame] | 547 | |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 548 | } |
| 549 | return 1; |
| 550 | } |
| 551 | |
| 552 | int |
Victor Stinner | eec8e61 | 2021-03-18 14:57:49 +0100 | [diff] [blame] | 553 | _PyAST_Validate(mod_ty mod) |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 554 | { |
| 555 | int res = 0; |
| 556 | |
| 557 | switch (mod->kind) { |
| 558 | case Module_kind: |
| 559 | res = validate_stmts(mod->v.Module.body); |
| 560 | break; |
| 561 | case Interactive_kind: |
| 562 | res = validate_stmts(mod->v.Interactive.body); |
| 563 | break; |
| 564 | case Expression_kind: |
| 565 | res = validate_expr(mod->v.Expression.body, Load); |
| 566 | break; |
Benjamin Peterson | 832bfe2 | 2011-08-09 16:15:04 -0500 | [diff] [blame] | 567 | default: |
| 568 | PyErr_SetString(PyExc_SystemError, "impossible module node"); |
| 569 | res = 0; |
| 570 | break; |
| 571 | } |
| 572 | return res; |
| 573 | } |
| 574 | |
Serhiy Storchaka | 143ce5c | 2018-05-30 10:56:16 +0300 | [diff] [blame] | 575 | PyObject * |
Pablo Galindo | a5634c4 | 2020-09-16 19:42:00 +0100 | [diff] [blame] | 576 | _PyAST_GetDocString(asdl_stmt_seq *body) |
Serhiy Storchaka | 143ce5c | 2018-05-30 10:56:16 +0300 | [diff] [blame] | 577 | { |
| 578 | if (!asdl_seq_LEN(body)) { |
| 579 | return NULL; |
| 580 | } |
Batuhan Taskaya | 02a1603 | 2020-10-10 20:14:59 +0300 | [diff] [blame] | 581 | stmt_ty st = asdl_seq_GET(body, 0); |
Serhiy Storchaka | 143ce5c | 2018-05-30 10:56:16 +0300 | [diff] [blame] | 582 | if (st->kind != Expr_kind) { |
| 583 | return NULL; |
| 584 | } |
| 585 | expr_ty e = st->v.Expr.value; |
Serhiy Storchaka | 143ce5c | 2018-05-30 10:56:16 +0300 | [diff] [blame] | 586 | if (e->kind == Constant_kind && PyUnicode_CheckExact(e->v.Constant.value)) { |
| 587 | return e->v.Constant.value; |
| 588 | } |
| 589 | return NULL; |
| 590 | } |