Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1 | |
| 2 | /* Write Python objects to files and read them back. |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 3 | This is primarily intended for writing and reading compiled Python code, |
| 4 | even though dicts, lists, sets and frozensets, not commonly seen in |
| 5 | code objects, are supported. |
| 6 | Version 3 of this protocol properly supports circular links |
| 7 | and sharing. */ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 8 | |
Thomas Wouters | 695934a | 2006-03-01 23:49:13 +0000 | [diff] [blame] | 9 | #define PY_SSIZE_T_CLEAN |
| 10 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 11 | #include "Python.h" |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 12 | #include "longintrepr.h" |
Jeremy Hylton | 3e0055f | 2005-10-20 19:59:25 +0000 | [diff] [blame] | 13 | #include "code.h" |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 14 | #include "marshal.h" |
Victor Stinner | b617993 | 2020-05-12 02:42:19 +0200 | [diff] [blame] | 15 | #include "pycore_hashtable.h" |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 16 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 17 | /*[clinic input] |
| 18 | module marshal |
| 19 | [clinic start generated code]*/ |
| 20 | /*[clinic end generated code: output=da39a3ee5e6b4b0d input=c982b7930dee17db]*/ |
| 21 | |
| 22 | #include "clinic/marshal.c.h" |
| 23 | |
/* High water mark to determine when the marshalled object is dangerously deep
 * and risks coring the interpreter.  When the object stack gets this deep,
 * raise an exception instead of continuing.
 *
 * The limit is reduced on every Windows build, not only on debug builds.
 *
 * BUG: https://bugs.python.org/issue33720
 * On Windows PGO builds, the r_object function overallocates its stack and
 * can cause a stack overflow.  We reduce the maximum depth for all Windows
 * releases to protect against this.
 *
 * NOTE(review): the guard below apparently used to be debug-only; the old
 * condition is kept here for reference -- confirm against history:
 *     #if defined(MS_WINDOWS) && defined(_DEBUG)
 */
#if defined(MS_WINDOWS)
#define MAX_MARSHAL_STACK_DEPTH 1000
#else
#define MAX_MARSHAL_STACK_DEPTH 2000
#endif
Fred Drake | 6da0b91 | 2000-06-28 18:47:56 +0000 | [diff] [blame] | 40 | |
/* One-byte type codes.  The writer emits one of these (through w_byte() or
   W_TYPE()) in front of every marshalled value. */
#define TYPE_NULL               '0'
#define TYPE_NONE               'N'
#define TYPE_FALSE              'F'
#define TYPE_TRUE               'T'
#define TYPE_STOPITER           'S'
#define TYPE_ELLIPSIS           '.'
#define TYPE_INT                'i'
/* TYPE_INT64 is not generated anymore.
   Supported for backward compatibility only. */
#define TYPE_INT64              'I'
#define TYPE_FLOAT              'f'
#define TYPE_BINARY_FLOAT       'g'
#define TYPE_COMPLEX            'x'
#define TYPE_BINARY_COMPLEX     'y'
#define TYPE_LONG               'l'
#define TYPE_STRING             's'
#define TYPE_INTERNED           't'
#define TYPE_REF                'r'
#define TYPE_TUPLE              '('
#define TYPE_LIST               '['
#define TYPE_DICT               '{'
#define TYPE_CODE               'c'
#define TYPE_UNICODE            'u'
#define TYPE_UNKNOWN            '?'
#define TYPE_SET                '<'
#define TYPE_FROZENSET          '>'
/* Bit OR-ed into a type code (see W_TYPE) to mark that the object is also
   added to the reference index. */
#define FLAG_REF                '\x80' /* with a type, add obj to index */

/* Compact codes; the writer only emits these when the marshal version
   is >= 4. */
#define TYPE_ASCII              'a'
#define TYPE_ASCII_INTERNED     'A'
#define TYPE_SMALL_TUPLE        ')'
#define TYPE_SHORT_ASCII        'z'
#define TYPE_SHORT_ASCII_INTERNED 'Z'
| 74 | |
/* Writer status codes stored in WFILE.error. */
#define WFERR_OK 0                /* no error recorded */
#define WFERR_UNMARSHALLABLE 1    /* object (or its size) cannot be written */
#define WFERR_NESTEDTOODEEP 2     /* exceeded MAX_MARSHAL_STACK_DEPTH */
#define WFERR_NOMEMORY 3          /* buffer growth or allocation failed */
| 79 | |
/* State of one marshal write operation.  Output goes either to a stdio
   stream (fp != NULL) or into a growing bytes object (str). */
typedef struct {
    FILE *fp;       /* destination stream, or NULL when writing to str */
    int error;      /* see WFERR_* values */
    int depth;      /* current w_object() nesting depth */
    PyObject *str;  /* bytes object used as the buffer when fp is NULL */
    char *ptr;      /* next write position; NULL after a failed resize */
    const char *end; /* one past the last usable byte of buf */
    char *buf;      /* start of the current buffer */
    _Py_hashtable_t *hashtable; /* object -> reference index (see w_ref) */
    int version;    /* marshal format version being written */
} WFILE;
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 91 | |
/* Append the single byte `c` to writer `p`.  When the buffer is full
   (ptr == end), w_reserve() is asked for one more byte first; if that
   fails the byte is silently dropped. */
#define w_byte(c, p) do {                               \
        if ((p)->ptr != (p)->end || w_reserve((p), 1))  \
            *(p)->ptr++ = (c);                          \
    } while(0)
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 96 | |
| 97 | static void |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 98 | w_flush(WFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 99 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 100 | assert(p->fp != NULL); |
| 101 | fwrite(p->buf, 1, p->ptr - p->buf, p->fp); |
| 102 | p->ptr = p->buf; |
| 103 | } |
| 104 | |
| 105 | static int |
| 106 | w_reserve(WFILE *p, Py_ssize_t needed) |
| 107 | { |
| 108 | Py_ssize_t pos, size, delta; |
| 109 | if (p->ptr == NULL) |
| 110 | return 0; /* An error already occurred */ |
| 111 | if (p->fp != NULL) { |
| 112 | w_flush(p); |
| 113 | return needed <= p->end - p->ptr; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 114 | } |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 115 | assert(p->str != NULL); |
| 116 | pos = p->ptr - p->buf; |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 117 | size = PyBytes_GET_SIZE(p->str); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 118 | if (size > 16*1024*1024) |
| 119 | delta = (size >> 3); /* 12.5% overallocation */ |
| 120 | else |
| 121 | delta = size + 1024; |
| 122 | delta = Py_MAX(delta, needed); |
| 123 | if (delta > PY_SSIZE_T_MAX - size) { |
| 124 | p->error = WFERR_NOMEMORY; |
| 125 | return 0; |
| 126 | } |
| 127 | size += delta; |
| 128 | if (_PyBytes_Resize(&p->str, size) != 0) { |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 129 | p->end = p->ptr = p->buf = NULL; |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 130 | return 0; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 131 | } |
| 132 | else { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 133 | p->buf = PyBytes_AS_STRING(p->str); |
| 134 | p->ptr = p->buf + pos; |
| 135 | p->end = p->buf + size; |
| 136 | return 1; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 137 | } |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 138 | } |
| 139 | |
| 140 | static void |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 141 | w_string(const void *s, Py_ssize_t n, WFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 142 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 143 | Py_ssize_t m; |
| 144 | if (!n || p->ptr == NULL) |
| 145 | return; |
| 146 | m = p->end - p->ptr; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 147 | if (p->fp != NULL) { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 148 | if (n <= m) { |
Christian Heimes | f051e43 | 2016-09-13 20:22:02 +0200 | [diff] [blame] | 149 | memcpy(p->ptr, s, n); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 150 | p->ptr += n; |
| 151 | } |
| 152 | else { |
| 153 | w_flush(p); |
| 154 | fwrite(s, 1, n, p->fp); |
| 155 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 156 | } |
| 157 | else { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 158 | if (n <= m || w_reserve(p, n - m)) { |
Christian Heimes | f051e43 | 2016-09-13 20:22:02 +0200 | [diff] [blame] | 159 | memcpy(p->ptr, s, n); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 160 | p->ptr += n; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 161 | } |
| 162 | } |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 163 | } |
| 164 | |
| 165 | static void |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 166 | w_short(int x, WFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 167 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 168 | w_byte((char)( x & 0xff), p); |
| 169 | w_byte((char)((x>> 8) & 0xff), p); |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 170 | } |
| 171 | |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 172 | static void |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 173 | w_long(long x, WFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 174 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 175 | w_byte((char)( x & 0xff), p); |
| 176 | w_byte((char)((x>> 8) & 0xff), p); |
| 177 | w_byte((char)((x>>16) & 0xff), p); |
| 178 | w_byte((char)((x>>24) & 0xff), p); |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 179 | } |
| 180 | |
/* Largest size that can be written: sizes are stored as a 32-bit value. */
#define SIZE32_MAX  0x7FFFFFFF

/* W_SIZE(n, p): write the size `n` through w_long().
   Where size_t is wider than 4 bytes, a size above SIZE32_MAX is rejected
   instead: the writer is marked WFERR_UNMARSHALLABLE, its depth is
   decremented, and the macro RETURNS FROM THE ENCLOSING FUNCTION -- so it
   may only be used inside functions returning void. */
#if SIZEOF_SIZE_T > 4
# define W_SIZE(n, p)  do {                     \
        if ((n) > SIZE32_MAX) {                 \
            (p)->depth--;                       \
            (p)->error = WFERR_UNMARSHALLABLE;  \
            return;                             \
        }                                       \
        w_long((long)(n), p);                   \
    } while(0)
#else
# define W_SIZE  w_long
#endif
| 195 | |
/* Write a length-prefixed byte string: the size `n` first (via W_SIZE),
   then the `n` bytes at `s`.  If W_SIZE rejects the size it returns from
   this function early, so no payload is written in that case. */
static void
w_pstring(const void *s, Py_ssize_t n, WFILE *p)
{
    W_SIZE(n, p);   /* may return from w_pstring on oversize */
    w_string(s, n, p);
}
| 202 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 203 | static void |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 204 | w_short_pstring(const void *s, Py_ssize_t n, WFILE *p) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 205 | { |
Antoine Pitrou | b30f271 | 2013-10-12 23:14:47 +0200 | [diff] [blame] | 206 | w_byte(Py_SAFE_DOWNCAST(n, Py_ssize_t, unsigned char), p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 207 | w_string(s, n, p); |
| 208 | } |
| 209 | |
/* We assume that Python ints are stored internally in a base that is some
   power of 2**15; for the sake of portability we always read and write
   them in base exactly 2**15. */

#define PyLong_MARSHAL_SHIFT 15
#define PyLong_MARSHAL_BASE ((short)1 << PyLong_MARSHAL_SHIFT)
#define PyLong_MARSHAL_MASK (PyLong_MARSHAL_BASE - 1)
#if PyLong_SHIFT % PyLong_MARSHAL_SHIFT != 0
#error "PyLong_SHIFT must be a multiple of PyLong_MARSHAL_SHIFT"
#endif
/* Number of 15-bit marshal digits held by one internal digit. */
#define PyLong_MARSHAL_RATIO (PyLong_SHIFT / PyLong_MARSHAL_SHIFT)
| 221 | |
/* Write type code `t` OR-ed with `flag`.  `flag` is not a macro argument:
   it is picked up from the scope of the calling function, which must
   therefore have a variable of that name. */
#define W_TYPE(t, p) do { \
    w_byte((t) | flag, (p)); \
} while(0)
| 225 | |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 226 | static void |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 227 | w_PyLong(const PyLongObject *ob, char flag, WFILE *p) |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 228 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 229 | Py_ssize_t i, j, n, l; |
| 230 | digit d; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 231 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 232 | W_TYPE(TYPE_LONG, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 233 | if (Py_SIZE(ob) == 0) { |
| 234 | w_long((long)0, p); |
| 235 | return; |
| 236 | } |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 237 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 238 | /* set l to number of base PyLong_MARSHAL_BASE digits */ |
Victor Stinner | 45e8e2f | 2014-05-14 17:24:35 +0200 | [diff] [blame] | 239 | n = Py_ABS(Py_SIZE(ob)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 240 | l = (n-1) * PyLong_MARSHAL_RATIO; |
| 241 | d = ob->ob_digit[n-1]; |
| 242 | assert(d != 0); /* a PyLong is always normalized */ |
| 243 | do { |
| 244 | d >>= PyLong_MARSHAL_SHIFT; |
| 245 | l++; |
| 246 | } while (d != 0); |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 247 | if (l > SIZE32_MAX) { |
| 248 | p->depth--; |
| 249 | p->error = WFERR_UNMARSHALLABLE; |
| 250 | return; |
| 251 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 252 | w_long((long)(Py_SIZE(ob) > 0 ? l : -l), p); |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 253 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 254 | for (i=0; i < n-1; i++) { |
| 255 | d = ob->ob_digit[i]; |
| 256 | for (j=0; j < PyLong_MARSHAL_RATIO; j++) { |
| 257 | w_short(d & PyLong_MARSHAL_MASK, p); |
| 258 | d >>= PyLong_MARSHAL_SHIFT; |
| 259 | } |
| 260 | assert (d == 0); |
| 261 | } |
| 262 | d = ob->ob_digit[n-1]; |
| 263 | do { |
| 264 | w_short(d & PyLong_MARSHAL_MASK, p); |
| 265 | d >>= PyLong_MARSHAL_SHIFT; |
| 266 | } while (d != 0); |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 267 | } |
| 268 | |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 269 | static void |
| 270 | w_float_bin(double v, WFILE *p) |
| 271 | { |
| 272 | unsigned char buf[8]; |
| 273 | if (_PyFloat_Pack8(v, buf, 1) < 0) { |
| 274 | p->error = WFERR_UNMARSHALLABLE; |
| 275 | return; |
| 276 | } |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 277 | w_string(buf, 8, p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 278 | } |
| 279 | |
| 280 | static void |
| 281 | w_float_str(double v, WFILE *p) |
| 282 | { |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 283 | char *buf = PyOS_double_to_string(v, 'g', 17, 0, NULL); |
| 284 | if (!buf) { |
| 285 | p->error = WFERR_NOMEMORY; |
| 286 | return; |
| 287 | } |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 288 | w_short_pstring(buf, strlen(buf), p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 289 | PyMem_Free(buf); |
| 290 | } |
| 291 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 292 | static int |
| 293 | w_ref(PyObject *v, char *flag, WFILE *p) |
| 294 | { |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 295 | _Py_hashtable_entry_t *entry; |
| 296 | int w; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 297 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 298 | if (p->version < 3 || p->hashtable == NULL) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 299 | return 0; /* not writing object references */ |
| 300 | |
| 301 | /* if it has only one reference, it definitely isn't shared */ |
| 302 | if (Py_REFCNT(v) == 1) |
| 303 | return 0; |
| 304 | |
Victor Stinner | 285cf0a | 2016-03-21 22:00:58 +0100 | [diff] [blame] | 305 | entry = _Py_HASHTABLE_GET_ENTRY(p->hashtable, v); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 306 | if (entry != NULL) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 307 | /* write the reference index to the stream */ |
Victor Stinner | e8c6b2f | 2016-03-23 09:25:01 +0100 | [diff] [blame] | 308 | _Py_HASHTABLE_ENTRY_READ_DATA(p->hashtable, entry, w); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 309 | /* we don't store "long" indices in the dict */ |
| 310 | assert(0 <= w && w <= 0x7fffffff); |
| 311 | w_byte(TYPE_REF, p); |
| 312 | w_long(w, p); |
| 313 | return 1; |
| 314 | } else { |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 315 | size_t s = p->hashtable->entries; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 316 | /* we don't support long indices */ |
| 317 | if (s >= 0x7fffffff) { |
| 318 | PyErr_SetString(PyExc_ValueError, "too many objects"); |
| 319 | goto err; |
| 320 | } |
Serhiy Storchaka | 26861b0 | 2015-02-16 20:52:17 +0200 | [diff] [blame] | 321 | w = (int)s; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 322 | Py_INCREF(v); |
| 323 | if (_Py_HASHTABLE_SET(p->hashtable, v, w) < 0) { |
| 324 | Py_DECREF(v); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 325 | goto err; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 326 | } |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 327 | *flag |= FLAG_REF; |
| 328 | return 0; |
| 329 | } |
| 330 | err: |
| 331 | p->error = WFERR_UNMARSHALLABLE; |
| 332 | return 1; |
| 333 | } |
| 334 | |
| 335 | static void |
| 336 | w_complex_object(PyObject *v, char flag, WFILE *p); |
| 337 | |
Guido van Rossum | b0c168c | 1996-12-05 23:15:02 +0000 | [diff] [blame] | 338 | static void |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 339 | w_object(PyObject *v, WFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 340 | { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 341 | char flag = '\0'; |
Fred Drake | 6da0b91 | 2000-06-28 18:47:56 +0000 | [diff] [blame] | 342 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 343 | p->depth++; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 344 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 345 | if (p->depth > MAX_MARSHAL_STACK_DEPTH) { |
| 346 | p->error = WFERR_NESTEDTOODEEP; |
| 347 | } |
| 348 | else if (v == NULL) { |
| 349 | w_byte(TYPE_NULL, p); |
| 350 | } |
| 351 | else if (v == Py_None) { |
| 352 | w_byte(TYPE_NONE, p); |
| 353 | } |
| 354 | else if (v == PyExc_StopIteration) { |
| 355 | w_byte(TYPE_STOPITER, p); |
| 356 | } |
| 357 | else if (v == Py_Ellipsis) { |
| 358 | w_byte(TYPE_ELLIPSIS, p); |
| 359 | } |
| 360 | else if (v == Py_False) { |
| 361 | w_byte(TYPE_FALSE, p); |
| 362 | } |
| 363 | else if (v == Py_True) { |
| 364 | w_byte(TYPE_TRUE, p); |
| 365 | } |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 366 | else if (!w_ref(v, &flag, p)) |
| 367 | w_complex_object(v, flag, p); |
| 368 | |
| 369 | p->depth--; |
| 370 | } |
| 371 | |
/* Write an object that is not NULL or one of the singletons that
   w_object() handles itself.  `flag` is OR-ed into the type byte by W_TYPE
   (w_ref() may have set FLAG_REF in it).

   Dispatches on the exact type of `v`: int, float, complex, bytes, str,
   tuple, list, dict, set/frozenset, code object, then any object that
   supports the buffer protocol.  Anything else is written as TYPE_UNKNOWN
   and the writer is marked WFERR_UNMARSHALLABLE.

   Beware: W_SIZE can return from this function (see its definition), so a
   container whose size is rejected is abandoned right after its type byte.

   NOTE(review): the early-return error paths here (and W_SIZE) decrement
   p->depth, and w_object() decrements it again after this function
   returns -- that looks like a double decrement on error; confirm. */
static void
w_complex_object(PyObject *v, char flag, WFILE *p)
{
    Py_ssize_t i, n;

    if (PyLong_CheckExact(v)) {
        int overflow;
        long x = PyLong_AsLongAndOverflow(v, &overflow);
        if (overflow) {
            /* Does not fit in a C long: use the multi-digit format. */
            w_PyLong((PyLongObject *)v, flag, p);
        }
        else {
#if SIZEOF_LONG > 4
            /* y is 0 or -1 exactly when x fits in a signed 32-bit value. */
            long y = Py_ARITHMETIC_RIGHT_SHIFT(long, x, 31);
            if (y && y != -1) {
                /* Too large for TYPE_INT */
                w_PyLong((PyLongObject*)v, flag, p);
            }
            else
#endif
            {
                W_TYPE(TYPE_INT, p);
                w_long(x, p);
            }
        }
    }
    else if (PyFloat_CheckExact(v)) {
        /* Packed binary form for version > 1, text form otherwise. */
        if (p->version > 1) {
            W_TYPE(TYPE_BINARY_FLOAT, p);
            w_float_bin(PyFloat_AS_DOUBLE(v), p);
        }
        else {
            W_TYPE(TYPE_FLOAT, p);
            w_float_str(PyFloat_AS_DOUBLE(v), p);
        }
    }
    else if (PyComplex_CheckExact(v)) {
        /* Real part first, then imaginary part; same binary/text split
           as for floats. */
        if (p->version > 1) {
            W_TYPE(TYPE_BINARY_COMPLEX, p);
            w_float_bin(PyComplex_RealAsDouble(v), p);
            w_float_bin(PyComplex_ImagAsDouble(v), p);
        }
        else {
            W_TYPE(TYPE_COMPLEX, p);
            w_float_str(PyComplex_RealAsDouble(v), p);
            w_float_str(PyComplex_ImagAsDouble(v), p);
        }
    }
    else if (PyBytes_CheckExact(v)) {
        W_TYPE(TYPE_STRING, p);
        w_pstring(PyBytes_AS_STRING(v), PyBytes_GET_SIZE(v), p);
    }
    else if (PyUnicode_CheckExact(v)) {
        if (p->version >= 4 && PyUnicode_IS_ASCII(v)) {
            /* ASCII strings are written from their 1-byte data; lengths
               below 256 get the one-byte-length form. */
            int is_short = PyUnicode_GET_LENGTH(v) < 256;
            if (is_short) {
                if (PyUnicode_CHECK_INTERNED(v))
                    W_TYPE(TYPE_SHORT_ASCII_INTERNED, p);
                else
                    W_TYPE(TYPE_SHORT_ASCII, p);
                w_short_pstring(PyUnicode_1BYTE_DATA(v),
                                PyUnicode_GET_LENGTH(v), p);
            }
            else {
                if (PyUnicode_CHECK_INTERNED(v))
                    W_TYPE(TYPE_ASCII_INTERNED, p);
                else
                    W_TYPE(TYPE_ASCII, p);
                w_pstring(PyUnicode_1BYTE_DATA(v),
                          PyUnicode_GET_LENGTH(v), p);
            }
        }
        else {
            /* Everything else is encoded with "utf8"/"surrogatepass" and
               written as a length-prefixed byte string. */
            PyObject *utf8;
            utf8 = PyUnicode_AsEncodedString(v, "utf8", "surrogatepass");
            if (utf8 == NULL) {
                p->depth--;
                p->error = WFERR_UNMARSHALLABLE;
                return;
            }
            if (p->version >= 3 && PyUnicode_CHECK_INTERNED(v))
                W_TYPE(TYPE_INTERNED, p);
            else
                W_TYPE(TYPE_UNICODE, p);
            w_pstring(PyBytes_AS_STRING(utf8), PyBytes_GET_SIZE(utf8), p);
            Py_DECREF(utf8);
        }
    }
    else if (PyTuple_CheckExact(v)) {
        n = PyTuple_GET_SIZE(v);
        /* Tuples shorter than 256 items get a one-byte count from
           version 4 on; otherwise a full 32-bit size is written. */
        if (p->version >= 4 && n < 256) {
            W_TYPE(TYPE_SMALL_TUPLE, p);
            w_byte((unsigned char)n, p);
        }
        else {
            W_TYPE(TYPE_TUPLE, p);
            W_SIZE(n, p);
        }
        for (i = 0; i < n; i++) {
            w_object(PyTuple_GET_ITEM(v, i), p);
        }
    }
    else if (PyList_CheckExact(v)) {
        W_TYPE(TYPE_LIST, p);
        n = PyList_GET_SIZE(v);
        W_SIZE(n, p);
        for (i = 0; i < n; i++) {
            w_object(PyList_GET_ITEM(v, i), p);
        }
    }
    else if (PyDict_CheckExact(v)) {
        Py_ssize_t pos;
        PyObject *key, *value;
        W_TYPE(TYPE_DICT, p);
        /* This one is NULL object terminated! */
        pos = 0;
        while (PyDict_Next(v, &pos, &key, &value)) {
            w_object(key, p);
            w_object(value, p);
        }
        /* The terminator: a NULL object is written as TYPE_NULL. */
        w_object((PyObject *)NULL, p);
    }
    else if (PyAnySet_CheckExact(v)) {
        PyObject *value;
        Py_ssize_t pos = 0;
        Py_hash_t hash;

        if (PyFrozenSet_CheckExact(v))
            W_TYPE(TYPE_FROZENSET, p);
        else
            W_TYPE(TYPE_SET, p);
        n = PySet_GET_SIZE(v);
        W_SIZE(n, p);
        /* Elements are written in the set's own iteration order. */
        while (_PySet_NextEntry(v, &pos, &value, &hash)) {
            w_object(value, p);
        }
    }
    else if (PyCode_Check(v)) {
        /* Code object: integer fields via w_long(), object fields via
           w_object(), in the fixed order below. */
        PyCodeObject *co = (PyCodeObject *)v;
        W_TYPE(TYPE_CODE, p);
        w_long(co->co_argcount, p);
        w_long(co->co_posonlyargcount, p);
        w_long(co->co_kwonlyargcount, p);
        w_long(co->co_nlocals, p);
        w_long(co->co_stacksize, p);
        w_long(co->co_flags, p);
        w_object(co->co_code, p);
        w_object(co->co_consts, p);
        w_object(co->co_names, p);
        w_object(co->co_varnames, p);
        w_object(co->co_freevars, p);
        w_object(co->co_cellvars, p);
        w_object(co->co_filename, p);
        w_object(co->co_name, p);
        w_long(co->co_firstlineno, p);
        w_object(co->co_lnotab, p);
    }
    else if (PyObject_CheckBuffer(v)) {
        /* Write unknown bytes-like objects as a bytes object */
        Py_buffer view;
        if (PyObject_GetBuffer(v, &view, PyBUF_SIMPLE) != 0) {
            /* Note: this TYPE_UNKNOWN byte is written without `flag`. */
            w_byte(TYPE_UNKNOWN, p);
            p->depth--;
            p->error = WFERR_UNMARSHALLABLE;
            return;
        }
        W_TYPE(TYPE_STRING, p);
        w_pstring(view.buf, view.len, p);
        PyBuffer_Release(&view);
    }
    else {
        W_TYPE(TYPE_UNKNOWN, p);
        p->error = WFERR_UNMARSHALLABLE;
    }
}
| 547 | |
Victor Stinner | 2d0a3d6 | 2020-05-13 02:50:18 +0200 | [diff] [blame^] | 548 | static void |
| 549 | w_decref_entry(void *key) |
| 550 | { |
| 551 | PyObject *entry_key = (PyObject *)key; |
| 552 | Py_XDECREF(entry_key); |
| 553 | } |
| 554 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 555 | static int |
| 556 | w_init_refs(WFILE *wf, int version) |
| 557 | { |
| 558 | if (version >= 3) { |
Victor Stinner | 2d0a3d6 | 2020-05-13 02:50:18 +0200 | [diff] [blame^] | 559 | wf->hashtable = _Py_hashtable_new_full(sizeof(int), 0, |
| 560 | _Py_hashtable_hash_ptr, |
| 561 | _Py_hashtable_compare_direct, |
| 562 | w_decref_entry, NULL, NULL); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 563 | if (wf->hashtable == NULL) { |
| 564 | PyErr_NoMemory(); |
| 565 | return -1; |
| 566 | } |
| 567 | } |
| 568 | return 0; |
| 569 | } |
| 570 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 571 | static void |
| 572 | w_clear_refs(WFILE *wf) |
| 573 | { |
| 574 | if (wf->hashtable != NULL) { |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 575 | _Py_hashtable_destroy(wf->hashtable); |
| 576 | } |
| 577 | } |
| 578 | |
Serhiy Storchaka | 9594942 | 2013-08-27 19:40:23 +0300 | [diff] [blame] | 579 | /* version currently has no effect for writing ints. */ |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 580 | void |
Martin v. Löwis | ef82d2f | 2004-06-27 16:51:46 +0000 | [diff] [blame] | 581 | PyMarshal_WriteLongToFile(long x, FILE *fp, int version) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 582 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 583 | char buf[4]; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 584 | WFILE wf; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 585 | memset(&wf, 0, sizeof(wf)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 586 | wf.fp = fp; |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 587 | wf.ptr = wf.buf = buf; |
| 588 | wf.end = wf.ptr + sizeof(buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 589 | wf.error = WFERR_OK; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 590 | wf.version = version; |
| 591 | w_long(x, &wf); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 592 | w_flush(&wf); |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 593 | } |
| 594 | |
| 595 | void |
Martin v. Löwis | ef82d2f | 2004-06-27 16:51:46 +0000 | [diff] [blame] | 596 | PyMarshal_WriteObjectToFile(PyObject *x, FILE *fp, int version) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 597 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 598 | char buf[BUFSIZ]; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 599 | WFILE wf; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 600 | memset(&wf, 0, sizeof(wf)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 601 | wf.fp = fp; |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 602 | wf.ptr = wf.buf = buf; |
| 603 | wf.end = wf.ptr + sizeof(buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 604 | wf.error = WFERR_OK; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 605 | wf.version = version; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 606 | if (w_init_refs(&wf, version)) |
| 607 | return; /* caller mush check PyErr_Occurred() */ |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 608 | w_object(x, &wf); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 609 | w_clear_refs(&wf); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 610 | w_flush(&wf); |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 611 | } |
| 612 | |
Serhiy Storchaka | c07422c | 2015-02-11 16:18:09 +0200 | [diff] [blame] | 613 | typedef struct { |
| 614 | FILE *fp; |
| 615 | int depth; |
| 616 | PyObject *readable; /* Stream-like object being read from */ |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 617 | const char *ptr; |
| 618 | const char *end; |
Serhiy Storchaka | c07422c | 2015-02-11 16:18:09 +0200 | [diff] [blame] | 619 | char *buf; |
| 620 | Py_ssize_t buf_size; |
| 621 | PyObject *refs; /* a list */ |
| 622 | } RFILE; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 623 | |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 624 | static const char * |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 625 | r_string(Py_ssize_t n, RFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 626 | { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 627 | Py_ssize_t read = -1; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 628 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 629 | if (p->ptr != NULL) { |
| 630 | /* Fast path for loads() */ |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 631 | const char *res = p->ptr; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 632 | Py_ssize_t left = p->end - p->ptr; |
| 633 | if (left < n) { |
| 634 | PyErr_SetString(PyExc_EOFError, |
| 635 | "marshal data too short"); |
| 636 | return NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 637 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 638 | p->ptr += n; |
| 639 | return res; |
| 640 | } |
| 641 | if (p->buf == NULL) { |
| 642 | p->buf = PyMem_MALLOC(n); |
| 643 | if (p->buf == NULL) { |
| 644 | PyErr_NoMemory(); |
| 645 | return NULL; |
| 646 | } |
| 647 | p->buf_size = n; |
| 648 | } |
| 649 | else if (p->buf_size < n) { |
Zackery Spytz | 4c49da0 | 2018-12-07 03:11:30 -0700 | [diff] [blame] | 650 | char *tmp = PyMem_REALLOC(p->buf, n); |
| 651 | if (tmp == NULL) { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 652 | PyErr_NoMemory(); |
| 653 | return NULL; |
| 654 | } |
Zackery Spytz | 4c49da0 | 2018-12-07 03:11:30 -0700 | [diff] [blame] | 655 | p->buf = tmp; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 656 | p->buf_size = n; |
| 657 | } |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 658 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 659 | if (!p->readable) { |
| 660 | assert(p->fp != NULL); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 661 | read = fread(p->buf, 1, n, p->fp); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 662 | } |
| 663 | else { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 664 | _Py_IDENTIFIER(readinto); |
| 665 | PyObject *res, *mview; |
| 666 | Py_buffer buf; |
Martin v. Löwis | afe55bb | 2011-10-09 10:38:36 +0200 | [diff] [blame] | 667 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 668 | if (PyBuffer_FillInfo(&buf, NULL, p->buf, n, 0, PyBUF_CONTIG) == -1) |
| 669 | return NULL; |
| 670 | mview = PyMemoryView_FromBuffer(&buf); |
| 671 | if (mview == NULL) |
| 672 | return NULL; |
| 673 | |
| 674 | res = _PyObject_CallMethodId(p->readable, &PyId_readinto, "N", mview); |
| 675 | if (res != NULL) { |
| 676 | read = PyNumber_AsSsize_t(res, PyExc_ValueError); |
| 677 | Py_DECREF(res); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 678 | } |
| 679 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 680 | if (read != n) { |
| 681 | if (!PyErr_Occurred()) { |
| 682 | if (read > n) |
| 683 | PyErr_Format(PyExc_ValueError, |
| 684 | "read() returned too much data: " |
| 685 | "%zd bytes requested, %zd returned", |
| 686 | n, read); |
| 687 | else |
| 688 | PyErr_SetString(PyExc_EOFError, |
| 689 | "EOF read where not expected"); |
| 690 | } |
| 691 | return NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 692 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 693 | return p->buf; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 694 | } |
| 695 | |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 696 | static int |
| 697 | r_byte(RFILE *p) |
| 698 | { |
| 699 | int c = EOF; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 700 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 701 | if (p->ptr != NULL) { |
| 702 | if (p->ptr < p->end) |
| 703 | c = (unsigned char) *p->ptr++; |
| 704 | return c; |
| 705 | } |
| 706 | if (!p->readable) { |
| 707 | assert(p->fp); |
| 708 | c = getc(p->fp); |
| 709 | } |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 710 | else { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 711 | const char *ptr = r_string(1, p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 712 | if (ptr != NULL) |
Andy Lester | e6be9b5 | 2020-02-11 20:28:35 -0600 | [diff] [blame] | 713 | c = *(const unsigned char *) ptr; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 714 | } |
| 715 | return c; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 716 | } |
| 717 | |
| 718 | static int |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 719 | r_short(RFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 720 | { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 721 | short x = -1; |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 722 | const unsigned char *buffer; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 723 | |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 724 | buffer = (const unsigned char *) r_string(2, p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 725 | if (buffer != NULL) { |
| 726 | x = buffer[0]; |
| 727 | x |= buffer[1] << 8; |
| 728 | /* Sign-extension, in case short greater than 16 bits */ |
| 729 | x |= -(x & 0x8000); |
| 730 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 731 | return x; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 732 | } |
| 733 | |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 734 | static long |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 735 | r_long(RFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 736 | { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 737 | long x = -1; |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 738 | const unsigned char *buffer; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 739 | |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 740 | buffer = (const unsigned char *) r_string(4, p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 741 | if (buffer != NULL) { |
| 742 | x = buffer[0]; |
| 743 | x |= (long)buffer[1] << 8; |
| 744 | x |= (long)buffer[2] << 16; |
| 745 | x |= (long)buffer[3] << 24; |
Guido van Rossum | c1547d9 | 1996-12-10 15:39:04 +0000 | [diff] [blame] | 746 | #if SIZEOF_LONG > 4 |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 747 | /* Sign extension for 64-bit machines */ |
| 748 | x |= -(x & 0x80000000L); |
Guido van Rossum | c1547d9 | 1996-12-10 15:39:04 +0000 | [diff] [blame] | 749 | #endif |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 750 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 751 | return x; |
Guido van Rossum | b0c168c | 1996-12-05 23:15:02 +0000 | [diff] [blame] | 752 | } |
| 753 | |
Serhiy Storchaka | 00987f6 | 2017-11-15 17:41:05 +0200 | [diff] [blame] | 754 | /* r_long64 deals with the TYPE_INT64 code. */ |
| 755 | static PyObject * |
| 756 | r_long64(RFILE *p) |
| 757 | { |
| 758 | const unsigned char *buffer = (const unsigned char *) r_string(8, p); |
| 759 | if (buffer == NULL) { |
| 760 | return NULL; |
| 761 | } |
| 762 | return _PyLong_FromByteArray(buffer, 8, |
| 763 | 1 /* little endian */, |
| 764 | 1 /* signed */); |
| 765 | } |
| 766 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 767 | static PyObject * |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 768 | r_PyLong(RFILE *p) |
| 769 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 770 | PyLongObject *ob; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 771 | long n, size, i; |
| 772 | int j, md, shorts_in_top_digit; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 773 | digit d; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 774 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 775 | n = r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 776 | if (PyErr_Occurred()) |
| 777 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 778 | if (n == 0) |
| 779 | return (PyObject *)_PyLong_New(0); |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 780 | if (n < -SIZE32_MAX || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 781 | PyErr_SetString(PyExc_ValueError, |
| 782 | "bad marshal data (long size out of range)"); |
| 783 | return NULL; |
| 784 | } |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 785 | |
Victor Stinner | 45e8e2f | 2014-05-14 17:24:35 +0200 | [diff] [blame] | 786 | size = 1 + (Py_ABS(n) - 1) / PyLong_MARSHAL_RATIO; |
| 787 | shorts_in_top_digit = 1 + (Py_ABS(n) - 1) % PyLong_MARSHAL_RATIO; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 788 | ob = _PyLong_New(size); |
| 789 | if (ob == NULL) |
| 790 | return NULL; |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 791 | |
Victor Stinner | 60ac6ed | 2020-02-07 23:18:08 +0100 | [diff] [blame] | 792 | Py_SET_SIZE(ob, n > 0 ? size : -size); |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 793 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 794 | for (i = 0; i < size-1; i++) { |
| 795 | d = 0; |
| 796 | for (j=0; j < PyLong_MARSHAL_RATIO; j++) { |
| 797 | md = r_short(p); |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 798 | if (PyErr_Occurred()) { |
| 799 | Py_DECREF(ob); |
| 800 | return NULL; |
| 801 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 802 | if (md < 0 || md > PyLong_MARSHAL_BASE) |
| 803 | goto bad_digit; |
| 804 | d += (digit)md << j*PyLong_MARSHAL_SHIFT; |
| 805 | } |
| 806 | ob->ob_digit[i] = d; |
| 807 | } |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 808 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 809 | d = 0; |
| 810 | for (j=0; j < shorts_in_top_digit; j++) { |
| 811 | md = r_short(p); |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 812 | if (PyErr_Occurred()) { |
| 813 | Py_DECREF(ob); |
| 814 | return NULL; |
| 815 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 816 | if (md < 0 || md > PyLong_MARSHAL_BASE) |
| 817 | goto bad_digit; |
| 818 | /* topmost marshal digit should be nonzero */ |
| 819 | if (md == 0 && j == shorts_in_top_digit - 1) { |
| 820 | Py_DECREF(ob); |
| 821 | PyErr_SetString(PyExc_ValueError, |
| 822 | "bad marshal data (unnormalized long data)"); |
| 823 | return NULL; |
| 824 | } |
| 825 | d += (digit)md << j*PyLong_MARSHAL_SHIFT; |
| 826 | } |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 827 | if (PyErr_Occurred()) { |
| 828 | Py_DECREF(ob); |
| 829 | return NULL; |
| 830 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 831 | /* top digit should be nonzero, else the resulting PyLong won't be |
| 832 | normalized */ |
| 833 | ob->ob_digit[size-1] = d; |
| 834 | return (PyObject *)ob; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 835 | bad_digit: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 836 | Py_DECREF(ob); |
| 837 | PyErr_SetString(PyExc_ValueError, |
| 838 | "bad marshal data (digit out of range in long)"); |
| 839 | return NULL; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 840 | } |
| 841 | |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 842 | static double |
| 843 | r_float_bin(RFILE *p) |
| 844 | { |
| 845 | const unsigned char *buf = (const unsigned char *) r_string(8, p); |
| 846 | if (buf == NULL) |
| 847 | return -1; |
| 848 | return _PyFloat_Unpack8(buf, 1); |
| 849 | } |
| 850 | |
| 851 | /* Issue #33720: Disable inlining for reducing the C stack consumption |
| 852 | on PGO builds. */ |
| 853 | _Py_NO_INLINE static double |
| 854 | r_float_str(RFILE *p) |
| 855 | { |
| 856 | int n; |
| 857 | char buf[256]; |
| 858 | const char *ptr; |
| 859 | n = r_byte(p); |
| 860 | if (n == EOF) { |
| 861 | PyErr_SetString(PyExc_EOFError, |
| 862 | "EOF read where object expected"); |
| 863 | return -1; |
| 864 | } |
| 865 | ptr = r_string(n, p); |
| 866 | if (ptr == NULL) { |
| 867 | return -1; |
| 868 | } |
| 869 | memcpy(buf, ptr, n); |
| 870 | buf[n] = '\0'; |
| 871 | return PyOS_string_to_double(buf, NULL, NULL); |
| 872 | } |
| 873 | |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 874 | /* allocate the reflist index for a new object. Return -1 on failure */ |
| 875 | static Py_ssize_t |
| 876 | r_ref_reserve(int flag, RFILE *p) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 877 | { |
| 878 | if (flag) { /* currently only FLAG_REF is defined */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 879 | Py_ssize_t idx = PyList_GET_SIZE(p->refs); |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 880 | if (idx >= 0x7ffffffe) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 881 | PyErr_SetString(PyExc_ValueError, "bad marshal data (index list too large)"); |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 882 | return -1; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 883 | } |
| 884 | if (PyList_Append(p->refs, Py_None) < 0) |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 885 | return -1; |
| 886 | return idx; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 887 | } else |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 888 | return 0; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 889 | } |
| 890 | |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 891 | /* insert the new object 'o' to the reflist at previously |
| 892 | * allocated index 'idx'. |
| 893 | * 'o' can be NULL, in which case nothing is done. |
| 894 | * if 'o' was non-NULL, and the function succeeds, 'o' is returned. |
| 895 | * if 'o' was non-NULL, and the function fails, 'o' is released and |
| 896 | * NULL returned. This simplifies error checking at the call site since |
| 897 | * a single test for NULL for the function result is enough. |
| 898 | */ |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 899 | static PyObject * |
| 900 | r_ref_insert(PyObject *o, Py_ssize_t idx, int flag, RFILE *p) |
| 901 | { |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 902 | if (o != NULL && flag) { /* currently only FLAG_REF is defined */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 903 | PyObject *tmp = PyList_GET_ITEM(p->refs, idx); |
| 904 | Py_INCREF(o); |
| 905 | PyList_SET_ITEM(p->refs, idx, o); |
| 906 | Py_DECREF(tmp); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 907 | } |
| 908 | return o; |
| 909 | } |
| 910 | |
| 911 | /* combination of both above, used when an object can be |
| 912 | * created whenever it is seen in the file, as opposed to |
| 913 | * after having loaded its sub-objects. |
| 914 | */ |
| 915 | static PyObject * |
| 916 | r_ref(PyObject *o, int flag, RFILE *p) |
| 917 | { |
Victor Stinner | 359fabc | 2013-10-31 17:09:01 +0100 | [diff] [blame] | 918 | assert(flag & FLAG_REF); |
| 919 | if (o == NULL) |
| 920 | return NULL; |
| 921 | if (PyList_Append(p->refs, o) < 0) { |
| 922 | Py_DECREF(o); /* release the new object */ |
| 923 | return NULL; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 924 | } |
| 925 | return o; |
| 926 | } |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 927 | |
| 928 | static PyObject * |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 929 | r_object(RFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 930 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 931 | /* NULL is a valid return value, it does not necessarily means that |
| 932 | an exception is set. */ |
| 933 | PyObject *v, *v2; |
Benjamin Peterson | eddb0a7 | 2013-03-20 00:40:07 -0500 | [diff] [blame] | 934 | Py_ssize_t idx = 0; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 935 | long i, n; |
Kristján Valur Jónsson | 6168362 | 2013-03-20 14:26:33 -0700 | [diff] [blame] | 936 | int type, code = r_byte(p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 937 | int flag, is_interned = 0; |
Christian Heimes | 3572842 | 2013-10-13 02:29:06 +0200 | [diff] [blame] | 938 | PyObject *retval = NULL; |
Guido van Rossum | d59da4b | 2007-05-22 18:11:13 +0000 | [diff] [blame] | 939 | |
Kristján Valur Jónsson | 6168362 | 2013-03-20 14:26:33 -0700 | [diff] [blame] | 940 | if (code == EOF) { |
| 941 | PyErr_SetString(PyExc_EOFError, |
| 942 | "EOF read where object expected"); |
| 943 | return NULL; |
| 944 | } |
| 945 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 946 | p->depth++; |
Guido van Rossum | d59da4b | 2007-05-22 18:11:13 +0000 | [diff] [blame] | 947 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 948 | if (p->depth > MAX_MARSHAL_STACK_DEPTH) { |
| 949 | p->depth--; |
| 950 | PyErr_SetString(PyExc_ValueError, "recursion limit exceeded"); |
| 951 | return NULL; |
| 952 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 953 | |
Kristján Valur Jónsson | 6168362 | 2013-03-20 14:26:33 -0700 | [diff] [blame] | 954 | flag = code & FLAG_REF; |
| 955 | type = code & ~FLAG_REF; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 956 | |
| 957 | #define R_REF(O) do{\ |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 958 | if (flag) \ |
| 959 | O = r_ref(O, flag, p);\ |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 960 | } while (0) |
| 961 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 962 | switch (type) { |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 963 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 964 | case TYPE_NULL: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 965 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 966 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 967 | case TYPE_NONE: |
| 968 | Py_INCREF(Py_None); |
| 969 | retval = Py_None; |
| 970 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 971 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 972 | case TYPE_STOPITER: |
| 973 | Py_INCREF(PyExc_StopIteration); |
| 974 | retval = PyExc_StopIteration; |
| 975 | break; |
Tim Peters | 5ca576e | 2001-06-18 22:08:13 +0000 | [diff] [blame] | 976 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 977 | case TYPE_ELLIPSIS: |
| 978 | Py_INCREF(Py_Ellipsis); |
| 979 | retval = Py_Ellipsis; |
| 980 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 981 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 982 | case TYPE_FALSE: |
| 983 | Py_INCREF(Py_False); |
| 984 | retval = Py_False; |
| 985 | break; |
Guido van Rossum | 77f6a65 | 2002-04-03 22:41:51 +0000 | [diff] [blame] | 986 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 987 | case TYPE_TRUE: |
| 988 | Py_INCREF(Py_True); |
| 989 | retval = Py_True; |
| 990 | break; |
Guido van Rossum | 77f6a65 | 2002-04-03 22:41:51 +0000 | [diff] [blame] | 991 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 992 | case TYPE_INT: |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 993 | n = r_long(p); |
| 994 | retval = PyErr_Occurred() ? NULL : PyLong_FromLong(n); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 995 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 996 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 997 | |
Serhiy Storchaka | 00987f6 | 2017-11-15 17:41:05 +0200 | [diff] [blame] | 998 | case TYPE_INT64: |
| 999 | retval = r_long64(p); |
| 1000 | R_REF(retval); |
| 1001 | break; |
| 1002 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1003 | case TYPE_LONG: |
| 1004 | retval = r_PyLong(p); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1005 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1006 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1007 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1008 | case TYPE_FLOAT: |
| 1009 | { |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1010 | double x = r_float_str(p); |
| 1011 | if (x == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1012 | break; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1013 | retval = PyFloat_FromDouble(x); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1014 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1015 | break; |
| 1016 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1017 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1018 | case TYPE_BINARY_FLOAT: |
| 1019 | { |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1020 | double x = r_float_bin(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1021 | if (x == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1022 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1023 | retval = PyFloat_FromDouble(x); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1024 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1025 | break; |
| 1026 | } |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1027 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1028 | case TYPE_COMPLEX: |
| 1029 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1030 | Py_complex c; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1031 | c.real = r_float_str(p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1032 | if (c.real == -1.0 && PyErr_Occurred()) |
| 1033 | break; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1034 | c.imag = r_float_str(p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1035 | if (c.imag == -1.0 && PyErr_Occurred()) |
| 1036 | break; |
| 1037 | retval = PyComplex_FromCComplex(c); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1038 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1039 | break; |
| 1040 | } |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1041 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1042 | case TYPE_BINARY_COMPLEX: |
| 1043 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1044 | Py_complex c; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1045 | c.real = r_float_bin(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1046 | if (c.real == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1047 | break; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1048 | c.imag = r_float_bin(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1049 | if (c.imag == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1050 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1051 | retval = PyComplex_FromCComplex(c); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1052 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1053 | break; |
| 1054 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1055 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1056 | case TYPE_STRING: |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1057 | { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 1058 | const char *ptr; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1059 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1060 | if (PyErr_Occurred()) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1061 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1062 | if (n < 0 || n > SIZE32_MAX) { |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1063 | PyErr_SetString(PyExc_ValueError, "bad marshal data (bytes object size out of range)"); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1064 | break; |
| 1065 | } |
| 1066 | v = PyBytes_FromStringAndSize((char *)NULL, n); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1067 | if (v == NULL) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1068 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1069 | ptr = r_string(n, p); |
| 1070 | if (ptr == NULL) { |
| 1071 | Py_DECREF(v); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1072 | break; |
| 1073 | } |
| 1074 | memcpy(PyBytes_AS_STRING(v), ptr, n); |
| 1075 | retval = v; |
| 1076 | R_REF(retval); |
| 1077 | break; |
| 1078 | } |
| 1079 | |
| 1080 | case TYPE_ASCII_INTERNED: |
| 1081 | is_interned = 1; |
Stefan Krah | f432a32 | 2017-08-21 13:09:59 +0200 | [diff] [blame] | 1082 | /* fall through */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1083 | case TYPE_ASCII: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1084 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1085 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1086 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1087 | if (n < 0 || n > SIZE32_MAX) { |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1088 | PyErr_SetString(PyExc_ValueError, "bad marshal data (string size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1089 | break; |
| 1090 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1091 | goto _read_ascii; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1092 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1093 | case TYPE_SHORT_ASCII_INTERNED: |
| 1094 | is_interned = 1; |
Stefan Krah | f432a32 | 2017-08-21 13:09:59 +0200 | [diff] [blame] | 1095 | /* fall through */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1096 | case TYPE_SHORT_ASCII: |
| 1097 | n = r_byte(p); |
| 1098 | if (n == EOF) { |
| 1099 | PyErr_SetString(PyExc_EOFError, |
| 1100 | "EOF read where object expected"); |
| 1101 | break; |
| 1102 | } |
| 1103 | _read_ascii: |
| 1104 | { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 1105 | const char *ptr; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1106 | ptr = r_string(n, p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1107 | if (ptr == NULL) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1108 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1109 | v = PyUnicode_FromKindAndData(PyUnicode_1BYTE_KIND, ptr, n); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1110 | if (v == NULL) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1111 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1112 | if (is_interned) |
| 1113 | PyUnicode_InternInPlace(&v); |
| 1114 | retval = v; |
| 1115 | R_REF(retval); |
| 1116 | break; |
| 1117 | } |
| 1118 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1119 | case TYPE_INTERNED: |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1120 | is_interned = 1; |
Stefan Krah | f432a32 | 2017-08-21 13:09:59 +0200 | [diff] [blame] | 1121 | /* fall through */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1122 | case TYPE_UNICODE: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1123 | { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 1124 | const char *buffer; |
Guido van Rossum | c279b53 | 2000-03-10 23:03:02 +0000 | [diff] [blame] | 1125 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1126 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1127 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1128 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1129 | if (n < 0 || n > SIZE32_MAX) { |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1130 | PyErr_SetString(PyExc_ValueError, "bad marshal data (string size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1131 | break; |
| 1132 | } |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1133 | if (n != 0) { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1134 | buffer = r_string(n, p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1135 | if (buffer == NULL) |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1136 | break; |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1137 | v = PyUnicode_DecodeUTF8(buffer, n, "surrogatepass"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1138 | } |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1139 | else { |
| 1140 | v = PyUnicode_New(0, 0); |
| 1141 | } |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1142 | if (v == NULL) |
Victor Stinner | 3a8b79d | 2013-07-08 22:23:32 +0200 | [diff] [blame] | 1143 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1144 | if (is_interned) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1145 | PyUnicode_InternInPlace(&v); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1146 | retval = v; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1147 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1148 | break; |
| 1149 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1150 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1151 | case TYPE_SMALL_TUPLE: |
| 1152 | n = (unsigned char) r_byte(p); |
Victor Stinner | b1b7b18 | 2013-10-31 17:07:08 +0100 | [diff] [blame] | 1153 | if (PyErr_Occurred()) |
| 1154 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1155 | goto _read_tuple; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1156 | case TYPE_TUPLE: |
| 1157 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1158 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1159 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1160 | if (n < 0 || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1161 | PyErr_SetString(PyExc_ValueError, "bad marshal data (tuple size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1162 | break; |
| 1163 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1164 | _read_tuple: |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1165 | v = PyTuple_New(n); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1166 | R_REF(v); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1167 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1168 | break; |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1169 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1170 | for (i = 0; i < n; i++) { |
| 1171 | v2 = r_object(p); |
| 1172 | if ( v2 == NULL ) { |
| 1173 | if (!PyErr_Occurred()) |
| 1174 | PyErr_SetString(PyExc_TypeError, |
| 1175 | "NULL object in marshal data for tuple"); |
| 1176 | Py_DECREF(v); |
| 1177 | v = NULL; |
| 1178 | break; |
| 1179 | } |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1180 | PyTuple_SET_ITEM(v, i, v2); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1181 | } |
| 1182 | retval = v; |
| 1183 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1184 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1185 | case TYPE_LIST: |
| 1186 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1187 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1188 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1189 | if (n < 0 || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1190 | PyErr_SetString(PyExc_ValueError, "bad marshal data (list size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1191 | break; |
| 1192 | } |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1193 | v = PyList_New(n); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1194 | R_REF(v); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1195 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1196 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1197 | for (i = 0; i < n; i++) { |
| 1198 | v2 = r_object(p); |
| 1199 | if ( v2 == NULL ) { |
| 1200 | if (!PyErr_Occurred()) |
| 1201 | PyErr_SetString(PyExc_TypeError, |
| 1202 | "NULL object in marshal data for list"); |
| 1203 | Py_DECREF(v); |
| 1204 | v = NULL; |
| 1205 | break; |
| 1206 | } |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1207 | PyList_SET_ITEM(v, i, v2); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1208 | } |
| 1209 | retval = v; |
| 1210 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1211 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1212 | case TYPE_DICT: |
| 1213 | v = PyDict_New(); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1214 | R_REF(v); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1215 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1216 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1217 | for (;;) { |
| 1218 | PyObject *key, *val; |
| 1219 | key = r_object(p); |
| 1220 | if (key == NULL) |
| 1221 | break; |
| 1222 | val = r_object(p); |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1223 | if (val == NULL) { |
| 1224 | Py_DECREF(key); |
| 1225 | break; |
| 1226 | } |
| 1227 | if (PyDict_SetItem(v, key, val) < 0) { |
| 1228 | Py_DECREF(key); |
| 1229 | Py_DECREF(val); |
| 1230 | break; |
| 1231 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1232 | Py_DECREF(key); |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1233 | Py_DECREF(val); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1234 | } |
| 1235 | if (PyErr_Occurred()) { |
| 1236 | Py_DECREF(v); |
| 1237 | v = NULL; |
| 1238 | } |
| 1239 | retval = v; |
| 1240 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1241 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1242 | case TYPE_SET: |
| 1243 | case TYPE_FROZENSET: |
| 1244 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1245 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1246 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1247 | if (n < 0 || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1248 | PyErr_SetString(PyExc_ValueError, "bad marshal data (set size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1249 | break; |
| 1250 | } |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1251 | |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1252 | if (n == 0 && type == TYPE_FROZENSET) { |
| 1253 | /* call frozenset() to get the empty frozenset singleton */ |
Victor Stinner | 4778eab | 2016-12-01 14:51:04 +0100 | [diff] [blame] | 1254 | v = _PyObject_CallNoArg((PyObject*)&PyFrozenSet_Type); |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1255 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1256 | break; |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1257 | R_REF(v); |
| 1258 | retval = v; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1259 | } |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1260 | else { |
| 1261 | v = (type == TYPE_SET) ? PySet_New(NULL) : PyFrozenSet_New(NULL); |
| 1262 | if (type == TYPE_SET) { |
| 1263 | R_REF(v); |
| 1264 | } else { |
| 1265 | /* must use delayed registration of frozensets because they must |
| 1266 | * be init with a refcount of 1 |
| 1267 | */ |
| 1268 | idx = r_ref_reserve(flag, p); |
| 1269 | if (idx < 0) |
| 1270 | Py_CLEAR(v); /* signal error */ |
| 1271 | } |
| 1272 | if (v == NULL) |
| 1273 | break; |
| 1274 | |
| 1275 | for (i = 0; i < n; i++) { |
| 1276 | v2 = r_object(p); |
| 1277 | if ( v2 == NULL ) { |
| 1278 | if (!PyErr_Occurred()) |
| 1279 | PyErr_SetString(PyExc_TypeError, |
| 1280 | "NULL object in marshal data for set"); |
| 1281 | Py_DECREF(v); |
| 1282 | v = NULL; |
| 1283 | break; |
| 1284 | } |
| 1285 | if (PySet_Add(v, v2) == -1) { |
| 1286 | Py_DECREF(v); |
| 1287 | Py_DECREF(v2); |
| 1288 | v = NULL; |
| 1289 | break; |
| 1290 | } |
| 1291 | Py_DECREF(v2); |
| 1292 | } |
| 1293 | if (type != TYPE_SET) |
| 1294 | v = r_ref_insert(v, idx, flag, p); |
| 1295 | retval = v; |
| 1296 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1297 | break; |
Raymond Hettinger | a422c34 | 2005-01-11 03:03:27 +0000 | [diff] [blame] | 1298 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1299 | case TYPE_CODE: |
| 1300 | { |
| 1301 | int argcount; |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 1302 | int posonlyargcount; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1303 | int kwonlyargcount; |
| 1304 | int nlocals; |
| 1305 | int stacksize; |
| 1306 | int flags; |
| 1307 | PyObject *code = NULL; |
| 1308 | PyObject *consts = NULL; |
| 1309 | PyObject *names = NULL; |
| 1310 | PyObject *varnames = NULL; |
| 1311 | PyObject *freevars = NULL; |
| 1312 | PyObject *cellvars = NULL; |
| 1313 | PyObject *filename = NULL; |
| 1314 | PyObject *name = NULL; |
| 1315 | int firstlineno; |
| 1316 | PyObject *lnotab = NULL; |
Antoine Pitrou | e9bbe8b | 2013-04-13 22:41:09 +0200 | [diff] [blame] | 1317 | |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 1318 | idx = r_ref_reserve(flag, p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1319 | if (idx < 0) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1320 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1321 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1322 | v = NULL; |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1323 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1324 | /* XXX ignore long->int overflows for now */ |
| 1325 | argcount = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1326 | if (PyErr_Occurred()) |
| 1327 | goto code_error; |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 1328 | posonlyargcount = (int)r_long(p); |
| 1329 | if (PyErr_Occurred()) { |
| 1330 | goto code_error; |
| 1331 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1332 | kwonlyargcount = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1333 | if (PyErr_Occurred()) |
| 1334 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1335 | nlocals = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1336 | if (PyErr_Occurred()) |
| 1337 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1338 | stacksize = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1339 | if (PyErr_Occurred()) |
| 1340 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1341 | flags = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1342 | if (PyErr_Occurred()) |
| 1343 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1344 | code = r_object(p); |
| 1345 | if (code == NULL) |
| 1346 | goto code_error; |
| 1347 | consts = r_object(p); |
| 1348 | if (consts == NULL) |
| 1349 | goto code_error; |
| 1350 | names = r_object(p); |
| 1351 | if (names == NULL) |
| 1352 | goto code_error; |
| 1353 | varnames = r_object(p); |
| 1354 | if (varnames == NULL) |
| 1355 | goto code_error; |
| 1356 | freevars = r_object(p); |
| 1357 | if (freevars == NULL) |
| 1358 | goto code_error; |
| 1359 | cellvars = r_object(p); |
| 1360 | if (cellvars == NULL) |
| 1361 | goto code_error; |
| 1362 | filename = r_object(p); |
| 1363 | if (filename == NULL) |
| 1364 | goto code_error; |
| 1365 | name = r_object(p); |
| 1366 | if (name == NULL) |
| 1367 | goto code_error; |
| 1368 | firstlineno = (int)r_long(p); |
Kristján Valur Jónsson | 0a7697b | 2013-10-13 15:19:56 +0000 | [diff] [blame] | 1369 | if (firstlineno == -1 && PyErr_Occurred()) |
| 1370 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1371 | lnotab = r_object(p); |
| 1372 | if (lnotab == NULL) |
| 1373 | goto code_error; |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1374 | |
Pablo Galindo | 4a2edc3 | 2019-07-01 11:35:05 +0100 | [diff] [blame] | 1375 | v = (PyObject *) PyCode_NewWithPosOnlyArgs( |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 1376 | argcount, posonlyargcount, kwonlyargcount, |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1377 | nlocals, stacksize, flags, |
| 1378 | code, consts, names, varnames, |
| 1379 | freevars, cellvars, filename, name, |
| 1380 | firstlineno, lnotab); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1381 | v = r_ref_insert(v, idx, flag, p); |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1382 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1383 | code_error: |
| 1384 | Py_XDECREF(code); |
| 1385 | Py_XDECREF(consts); |
| 1386 | Py_XDECREF(names); |
| 1387 | Py_XDECREF(varnames); |
| 1388 | Py_XDECREF(freevars); |
| 1389 | Py_XDECREF(cellvars); |
| 1390 | Py_XDECREF(filename); |
| 1391 | Py_XDECREF(name); |
| 1392 | Py_XDECREF(lnotab); |
| 1393 | } |
| 1394 | retval = v; |
| 1395 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1396 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1397 | case TYPE_REF: |
| 1398 | n = r_long(p); |
| 1399 | if (n < 0 || n >= PyList_GET_SIZE(p->refs)) { |
Kristján Valur Jónsson | 0a7697b | 2013-10-13 15:19:56 +0000 | [diff] [blame] | 1400 | if (n == -1 && PyErr_Occurred()) |
| 1401 | break; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1402 | PyErr_SetString(PyExc_ValueError, "bad marshal data (invalid reference)"); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1403 | break; |
| 1404 | } |
| 1405 | v = PyList_GET_ITEM(p->refs, n); |
| 1406 | if (v == Py_None) { |
| 1407 | PyErr_SetString(PyExc_ValueError, "bad marshal data (invalid reference)"); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1408 | break; |
| 1409 | } |
| 1410 | Py_INCREF(v); |
| 1411 | retval = v; |
| 1412 | break; |
| 1413 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1414 | default: |
| 1415 | /* Bogus data got written, which isn't ideal. |
| 1416 | This will let you keep working and recover. */ |
| 1417 | PyErr_SetString(PyExc_ValueError, "bad marshal data (unknown type code)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1418 | break; |
| 1419 | |
| 1420 | } |
| 1421 | p->depth--; |
| 1422 | return retval; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1423 | } |
| 1424 | |
Neal Norwitz | d85c452 | 2004-06-13 20:31:49 +0000 | [diff] [blame] | 1425 | static PyObject * |
Armin Rigo | 01ab279 | 2004-03-26 15:09:27 +0000 | [diff] [blame] | 1426 | read_object(RFILE *p) |
| 1427 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1428 | PyObject *v; |
| 1429 | if (PyErr_Occurred()) { |
| 1430 | fprintf(stderr, "XXX readobject called with exception set\n"); |
| 1431 | return NULL; |
| 1432 | } |
| 1433 | v = r_object(p); |
| 1434 | if (v == NULL && !PyErr_Occurred()) |
| 1435 | PyErr_SetString(PyExc_TypeError, "NULL object in marshal data for object"); |
| 1436 | return v; |
Armin Rigo | 01ab279 | 2004-03-26 15:09:27 +0000 | [diff] [blame] | 1437 | } |
| 1438 | |
Guido van Rossum | b8cf3e6 | 2001-10-19 01:46:21 +0000 | [diff] [blame] | 1439 | int |
| 1440 | PyMarshal_ReadShortFromFile(FILE *fp) |
| 1441 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1442 | RFILE rf; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1443 | int res; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1444 | assert(fp); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1445 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1446 | rf.fp = fp; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1447 | rf.end = rf.ptr = NULL; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1448 | rf.buf = NULL; |
| 1449 | res = r_short(&rf); |
| 1450 | if (rf.buf != NULL) |
| 1451 | PyMem_FREE(rf.buf); |
| 1452 | return res; |
Guido van Rossum | b8cf3e6 | 2001-10-19 01:46:21 +0000 | [diff] [blame] | 1453 | } |
| 1454 | |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1455 | long |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 1456 | PyMarshal_ReadLongFromFile(FILE *fp) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1457 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1458 | RFILE rf; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1459 | long res; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1460 | rf.fp = fp; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1461 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1462 | rf.ptr = rf.end = NULL; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1463 | rf.buf = NULL; |
| 1464 | res = r_long(&rf); |
| 1465 | if (rf.buf != NULL) |
| 1466 | PyMem_FREE(rf.buf); |
| 1467 | return res; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1468 | } |
| 1469 | |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1470 | /* Return size of file in bytes; < 0 if unknown or INT_MAX if too big */ |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1471 | static off_t |
| 1472 | getfilesize(FILE *fp) |
| 1473 | { |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1474 | struct _Py_stat_struct st; |
Victor Stinner | e134a7f | 2015-03-30 10:09:31 +0200 | [diff] [blame] | 1475 | if (_Py_fstat_noraise(fileno(fp), &st) != 0) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1476 | return -1; |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1477 | #if SIZEOF_OFF_T == 4 |
| 1478 | else if (st.st_size >= INT_MAX) |
| 1479 | return (off_t)INT_MAX; |
| 1480 | #endif |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1481 | else |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1482 | return (off_t)st.st_size; |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1483 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1484 | |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1485 | /* If we can get the size of the file up-front, and it's reasonably small, |
| 1486 | * read it in one gulp and delegate to ...FromString() instead. Much quicker |
| 1487 | * than reading a byte at a time from file; speeds .pyc imports. |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1488 | * CAUTION: since this may read the entire remainder of the file, don't |
| 1489 | * call it unless you know you're done with the file. |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1490 | */ |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1491 | PyObject * |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1492 | PyMarshal_ReadLastObjectFromFile(FILE *fp) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1493 | { |
Antoine Pitrou | 5bc7ec9 | 2010-04-21 22:56:22 +0000 | [diff] [blame] | 1494 | /* REASONABLE_FILE_LIMIT is by defn something big enough for Tkinter.pyc. */ |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1495 | #define REASONABLE_FILE_LIMIT (1L << 18) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1496 | off_t filesize; |
| 1497 | filesize = getfilesize(fp); |
| 1498 | if (filesize > 0 && filesize <= REASONABLE_FILE_LIMIT) { |
| 1499 | char* pBuf = (char *)PyMem_MALLOC(filesize); |
| 1500 | if (pBuf != NULL) { |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1501 | size_t n = fread(pBuf, 1, (size_t)filesize, fp); |
| 1502 | PyObject* v = PyMarshal_ReadObjectFromString(pBuf, n); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1503 | PyMem_FREE(pBuf); |
| 1504 | return v; |
| 1505 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1506 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1507 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1508 | /* We don't have fstat, or we do but the file is larger than |
| 1509 | * REASONABLE_FILE_LIMIT or malloc failed -- read a byte at a time. |
| 1510 | */ |
| 1511 | return PyMarshal_ReadObjectFromFile(fp); |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1512 | |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1513 | #undef REASONABLE_FILE_LIMIT |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1514 | } |
| 1515 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1516 | PyObject * |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1517 | PyMarshal_ReadObjectFromFile(FILE *fp) |
| 1518 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1519 | RFILE rf; |
| 1520 | PyObject *result; |
| 1521 | rf.fp = fp; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1522 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1523 | rf.depth = 0; |
| 1524 | rf.ptr = rf.end = NULL; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1525 | rf.buf = NULL; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1526 | rf.refs = PyList_New(0); |
| 1527 | if (rf.refs == NULL) |
| 1528 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1529 | result = r_object(&rf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1530 | Py_DECREF(rf.refs); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1531 | if (rf.buf != NULL) |
| 1532 | PyMem_FREE(rf.buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1533 | return result; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1534 | } |
| 1535 | |
| 1536 | PyObject * |
Serhiy Storchaka | c679227 | 2013-10-19 21:03:34 +0300 | [diff] [blame] | 1537 | PyMarshal_ReadObjectFromString(const char *str, Py_ssize_t len) |
Guido van Rossum | f56e3db | 1993-04-01 20:59:32 +0000 | [diff] [blame] | 1538 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1539 | RFILE rf; |
| 1540 | PyObject *result; |
| 1541 | rf.fp = NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1542 | rf.readable = NULL; |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 1543 | rf.ptr = str; |
| 1544 | rf.end = str + len; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1545 | rf.buf = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1546 | rf.depth = 0; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1547 | rf.refs = PyList_New(0); |
| 1548 | if (rf.refs == NULL) |
| 1549 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1550 | result = r_object(&rf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1551 | Py_DECREF(rf.refs); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1552 | if (rf.buf != NULL) |
| 1553 | PyMem_FREE(rf.buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1554 | return result; |
Guido van Rossum | f56e3db | 1993-04-01 20:59:32 +0000 | [diff] [blame] | 1555 | } |
| 1556 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1557 | PyObject * |
Martin v. Löwis | ef82d2f | 2004-06-27 16:51:46 +0000 | [diff] [blame] | 1558 | PyMarshal_WriteObjectToString(PyObject *x, int version) |
Guido van Rossum | 3f3bb3d | 1996-08-19 22:07:17 +0000 | [diff] [blame] | 1559 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1560 | WFILE wf; |
Guido van Rossum | e6d3904 | 2007-05-09 00:01:30 +0000 | [diff] [blame] | 1561 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 1562 | memset(&wf, 0, sizeof(wf)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1563 | wf.str = PyBytes_FromStringAndSize((char *)NULL, 50); |
| 1564 | if (wf.str == NULL) |
| 1565 | return NULL; |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 1566 | wf.ptr = wf.buf = PyBytes_AS_STRING(wf.str); |
| 1567 | wf.end = wf.ptr + PyBytes_GET_SIZE(wf.str); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1568 | wf.error = WFERR_OK; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1569 | wf.version = version; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 1570 | if (w_init_refs(&wf, version)) { |
| 1571 | Py_DECREF(wf.str); |
| 1572 | return NULL; |
| 1573 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1574 | w_object(x, &wf); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 1575 | w_clear_refs(&wf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1576 | if (wf.str != NULL) { |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 1577 | const char *base = PyBytes_AS_STRING(wf.str); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1578 | if (_PyBytes_Resize(&wf.str, (Py_ssize_t)(wf.ptr - base)) < 0) |
| 1579 | return NULL; |
| 1580 | } |
| 1581 | if (wf.error != WFERR_OK) { |
| 1582 | Py_XDECREF(wf.str); |
| 1583 | if (wf.error == WFERR_NOMEMORY) |
| 1584 | PyErr_NoMemory(); |
| 1585 | else |
| 1586 | PyErr_SetString(PyExc_ValueError, |
| 1587 | (wf.error==WFERR_UNMARSHALLABLE)?"unmarshallable object" |
| 1588 | :"object too deeply nested to marshal"); |
| 1589 | return NULL; |
| 1590 | } |
Antoine Pitrou | 1c13f84 | 2012-03-02 18:22:23 +0100 | [diff] [blame] | 1591 | return wf.str; |
Guido van Rossum | 3f3bb3d | 1996-08-19 22:07:17 +0000 | [diff] [blame] | 1592 | } |
| 1593 | |
Guido van Rossum | 64b4552 | 1991-06-07 13:58:22 +0000 | [diff] [blame] | 1594 | /* And an interface for Python programs... */ |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1595 | /*[clinic input] |
| 1596 | marshal.dump |
| 1597 | |
| 1598 | value: object |
| 1599 | Must be a supported type. |
| 1600 | file: object |
| 1601 | Must be a writeable binary file. |
| 1602 | version: int(c_default="Py_MARSHAL_VERSION") = version |
| 1603 | Indicates the data format that dump should use. |
| 1604 | / |
| 1605 | |
| 1606 | Write the value on the open file. |
| 1607 | |
| 1608 | If the value has (or contains an object that has) an unsupported type, a |
| 1609 | ValueError exception is raised - but garbage data will also be written |
| 1610 | to the file. The object will not be properly read back by load(). |
| 1611 | [clinic start generated code]*/ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1612 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1613 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1614 | marshal_dump_impl(PyObject *module, PyObject *value, PyObject *file, |
| 1615 | int version) |
| 1616 | /*[clinic end generated code: output=aaee62c7028a7cb2 input=6c7a3c23c6fef556]*/ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1617 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1618 | /* XXX Quick hack -- need to do this differently */ |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1619 | PyObject *s; |
| 1620 | PyObject *res; |
Martin v. Löwis | bd928fe | 2011-10-14 10:20:37 +0200 | [diff] [blame] | 1621 | _Py_IDENTIFIER(write); |
Martin v. Löwis | afe55bb | 2011-10-09 10:38:36 +0200 | [diff] [blame] | 1622 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1623 | s = PyMarshal_WriteObjectToString(value, version); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1624 | if (s == NULL) |
| 1625 | return NULL; |
Jeroen Demeyer | 59ad110 | 2019-07-11 10:59:05 +0200 | [diff] [blame] | 1626 | res = _PyObject_CallMethodIdOneArg(file, &PyId_write, s); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1627 | Py_DECREF(s); |
| 1628 | return res; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1629 | } |
| 1630 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1631 | /*[clinic input] |
| 1632 | marshal.load |
| 1633 | |
| 1634 | file: object |
| 1635 | Must be readable binary file. |
| 1636 | / |
| 1637 | |
| 1638 | Read one value from the open file and return it. |
| 1639 | |
| 1640 | If no valid value is read (e.g. because the data has a different Python |
| 1641 | version's incompatible marshal format), raise EOFError, ValueError or |
| 1642 | TypeError. |
| 1643 | |
| 1644 | Note: If an object containing an unsupported type was marshalled with |
| 1645 | dump(), load() will substitute None for the unmarshallable type. |
| 1646 | [clinic start generated code]*/ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1647 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1648 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1649 | marshal_load(PyObject *module, PyObject *file) |
| 1650 | /*[clinic end generated code: output=f8e5c33233566344 input=c85c2b594cd8124a]*/ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1651 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1652 | PyObject *data, *result; |
Martin v. Löwis | bd928fe | 2011-10-14 10:20:37 +0200 | [diff] [blame] | 1653 | _Py_IDENTIFIER(read); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1654 | RFILE rf; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1655 | |
| 1656 | /* |
| 1657 | * Make a call to the read method, but read zero bytes. |
| 1658 | * This is to ensure that the object passed in at least |
| 1659 | * has a read method which returns bytes. |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1660 | * This can be removed if we guarantee good error handling |
| 1661 | * for r_string() |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1662 | */ |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1663 | data = _PyObject_CallMethodId(file, &PyId_read, "i", 0); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1664 | if (data == NULL) |
| 1665 | return NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1666 | if (!PyBytes_Check(data)) { |
| 1667 | PyErr_Format(PyExc_TypeError, |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1668 | "file.read() returned not bytes but %.100s", |
Victor Stinner | a102ed7 | 2020-02-07 02:24:48 +0100 | [diff] [blame] | 1669 | Py_TYPE(data)->tp_name); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1670 | result = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1671 | } |
| 1672 | else { |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1673 | rf.depth = 0; |
| 1674 | rf.fp = NULL; |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1675 | rf.readable = file; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1676 | rf.ptr = rf.end = NULL; |
| 1677 | rf.buf = NULL; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1678 | if ((rf.refs = PyList_New(0)) != NULL) { |
| 1679 | result = read_object(&rf); |
| 1680 | Py_DECREF(rf.refs); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1681 | if (rf.buf != NULL) |
| 1682 | PyMem_FREE(rf.buf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1683 | } else |
| 1684 | result = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1685 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1686 | Py_DECREF(data); |
| 1687 | return result; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1688 | } |
| 1689 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1690 | /*[clinic input] |
| 1691 | marshal.dumps |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1692 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1693 | value: object |
| 1694 | Must be a supported type. |
| 1695 | version: int(c_default="Py_MARSHAL_VERSION") = version |
| 1696 | Indicates the data format that dumps should use. |
| 1697 | / |
| 1698 | |
| 1699 | Return the bytes object that would be written to a file by dump(value, file). |
| 1700 | |
| 1701 | Raise a ValueError exception if value has (or contains an object that has) an |
| 1702 | unsupported type. |
| 1703 | [clinic start generated code]*/ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1704 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1705 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1706 | marshal_dumps_impl(PyObject *module, PyObject *value, int version) |
| 1707 | /*[clinic end generated code: output=9c200f98d7256cad input=a2139ea8608e9b27]*/ |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1708 | { |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1709 | return PyMarshal_WriteObjectToString(value, version); |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1710 | } |
| 1711 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1712 | /*[clinic input] |
| 1713 | marshal.loads |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1714 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1715 | bytes: Py_buffer |
| 1716 | / |
| 1717 | |
| 1718 | Convert the bytes-like object to a value. |
| 1719 | |
| 1720 | If no valid value is found, raise EOFError, ValueError or TypeError. Extra |
| 1721 | bytes in the input are ignored. |
| 1722 | [clinic start generated code]*/ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1723 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1724 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1725 | marshal_loads_impl(PyObject *module, Py_buffer *bytes) |
| 1726 | /*[clinic end generated code: output=9fc65985c93d1bb1 input=6f426518459c8495]*/ |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1727 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1728 | RFILE rf; |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1729 | char *s = bytes->buf; |
| 1730 | Py_ssize_t n = bytes->len; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1731 | PyObject* result; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1732 | rf.fp = NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1733 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1734 | rf.ptr = s; |
| 1735 | rf.end = s + n; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1736 | rf.depth = 0; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1737 | if ((rf.refs = PyList_New(0)) == NULL) |
| 1738 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1739 | result = read_object(&rf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1740 | Py_DECREF(rf.refs); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1741 | return result; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1742 | } |
| 1743 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1744 | static PyMethodDef marshal_methods[] = { |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1745 | MARSHAL_DUMP_METHODDEF |
| 1746 | MARSHAL_LOAD_METHODDEF |
| 1747 | MARSHAL_DUMPS_METHODDEF |
| 1748 | MARSHAL_LOADS_METHODDEF |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1749 | {NULL, NULL} /* sentinel */ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1750 | }; |
| 1751 | |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1752 | |
| 1753 | PyDoc_STRVAR(module_doc, |
| 1754 | "This module contains functions that can read and write Python values in\n\ |
| 1755 | a binary format. The format is specific to Python, but independent of\n\ |
| 1756 | machine architecture issues.\n\ |
| 1757 | \n\ |
| 1758 | Not all Python object types are supported; in general, only objects\n\ |
| 1759 | whose value is independent from a particular invocation of Python can be\n\ |
| 1760 | written and read by this module. The following types are supported:\n\ |
| 1761 | None, integers, floating point numbers, strings, bytes, bytearrays,\n\ |
| 1762 | tuples, lists, sets, dictionaries, and code objects, where it\n\ |
| 1763 | should be understood that tuples, lists and dictionaries are only\n\ |
| 1764 | supported as long as the values contained therein are themselves\n\ |
| 1765 | supported; and recursive lists and dictionaries should not be written\n\ |
| 1766 | (they will cause infinite loops).\n\ |
| 1767 | \n\ |
| 1768 | Variables:\n\ |
| 1769 | \n\ |
| 1770 | version -- indicates the format that the module uses. Version 0 is the\n\ |
| 1771 | historical format, version 1 shares interned strings and version 2\n\ |
| 1772 | uses a binary format for floating point numbers.\n\ |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1773 | Version 3 shares common object references (New in version 3.4).\n\ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1774 | \n\ |
| 1775 | Functions:\n\ |
| 1776 | \n\ |
| 1777 | dump() -- write value to a file\n\ |
| 1778 | load() -- read value from a file\n\ |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1779 | dumps() -- marshal value as a bytes object\n\ |
| 1780 | loads() -- read value from a bytes-like object"); |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1781 | |
| 1782 | |
| 1783 | |
Brett Cannon | 429ef65 | 2008-06-27 00:35:35 +0000 | [diff] [blame] | 1784 | static struct PyModuleDef marshalmodule = { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1785 | PyModuleDef_HEAD_INIT, |
| 1786 | "marshal", |
| 1787 | module_doc, |
| 1788 | 0, |
| 1789 | marshal_methods, |
| 1790 | NULL, |
| 1791 | NULL, |
| 1792 | NULL, |
| 1793 | NULL |
Martin v. Löwis | 1a21451 | 2008-06-11 05:26:20 +0000 | [diff] [blame] | 1794 | }; |
| 1795 | |
Jason Tishler | 6bc06ec | 2003-09-04 11:59:50 +0000 | [diff] [blame] | 1796 | PyMODINIT_FUNC |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 1797 | PyMarshal_Init(void) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1798 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1799 | PyObject *mod = PyModule_Create(&marshalmodule); |
| 1800 | if (mod == NULL) |
| 1801 | return NULL; |
Brandt Bucher | 33b671e | 2019-11-19 16:59:32 -0800 | [diff] [blame] | 1802 | if (PyModule_AddIntConstant(mod, "version", Py_MARSHAL_VERSION) < 0) { |
| 1803 | Py_DECREF(mod); |
| 1804 | return NULL; |
| 1805 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1806 | return mod; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1807 | } |