Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1 | |
| 2 | /* Write Python objects to files and read them back. |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 3 | This is primarily intended for writing and reading compiled Python code, |
| 4 | even though dicts, lists, sets and frozensets, not commonly seen in |
| 5 | code objects, are supported. |
| 6 | Version 3 of this protocol properly supports circular links |
| 7 | and sharing. */ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 8 | |
Thomas Wouters | 695934a | 2006-03-01 23:49:13 +0000 | [diff] [blame] | 9 | #define PY_SSIZE_T_CLEAN |
| 10 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 11 | #include "Python.h" |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 12 | #include "longintrepr.h" |
Jeremy Hylton | 3e0055f | 2005-10-20 19:59:25 +0000 | [diff] [blame] | 13 | #include "code.h" |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 14 | #include "marshal.h" |
Victor Stinner | b617993 | 2020-05-12 02:42:19 +0200 | [diff] [blame] | 15 | #include "pycore_hashtable.h" |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 16 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 17 | /*[clinic input] |
| 18 | module marshal |
| 19 | [clinic start generated code]*/ |
| 20 | /*[clinic end generated code: output=da39a3ee5e6b4b0d input=c982b7930dee17db]*/ |
| 21 | |
| 22 | #include "clinic/marshal.c.h" |
| 23 | |
/* Upper bound on how deeply nested an object may be while it is being
 * marshalled.  Once the object stack grows past this bound an exception is
 * raised instead of recursing further and risking a crash of the interpreter.
 *
 * The lower bound applies to every Windows build.  It used to be selected
 * for Windows debug builds only (MS_WINDOWS && _DEBUG), but on Windows PGO
 * builds the r_object function overallocates its stack and can overflow it,
 * so all Windows releases now use the reduced depth.
 * See https://bugs.python.org/issue33720
 */
#ifdef MS_WINDOWS
#  define MAX_MARSHAL_STACK_DEPTH 1000
#else
#  define MAX_MARSHAL_STACK_DEPTH 2000
#endif
Fred Drake | 6da0b91 | 2000-06-28 18:47:56 +0000 | [diff] [blame] | 40 | |
/* One-byte type codes that introduce every value in the marshal stream. */

/* Singletons and markers */
#define TYPE_NULL               '0'
#define TYPE_NONE               'N'
#define TYPE_FALSE              'F'
#define TYPE_TRUE               'T'
#define TYPE_STOPITER           'S'
#define TYPE_ELLIPSIS           '.'
#define TYPE_UNKNOWN            '?'

/* Numbers */
#define TYPE_INT                'i'
/* TYPE_INT64 is no longer generated; it is kept only so that old data
   can still be handled (backward compatibility). */
#define TYPE_INT64              'I'
#define TYPE_FLOAT              'f'
#define TYPE_BINARY_FLOAT       'g'
#define TYPE_COMPLEX            'x'
#define TYPE_BINARY_COMPLEX     'y'
#define TYPE_LONG               'l'

/* Byte strings and text */
#define TYPE_STRING             's'
#define TYPE_INTERNED           't'
#define TYPE_UNICODE            'u'
#define TYPE_ASCII              'a'
#define TYPE_ASCII_INTERNED     'A'
#define TYPE_SHORT_ASCII        'z'
#define TYPE_SHORT_ASCII_INTERNED 'Z'

/* Containers and code */
#define TYPE_TUPLE              '('
#define TYPE_SMALL_TUPLE        ')'
#define TYPE_LIST               '['
#define TYPE_DICT               '{'
#define TYPE_SET                '<'
#define TYPE_FROZENSET          '>'
#define TYPE_CODE               'c'

/* Back-reference to an object written earlier in the stream */
#define TYPE_REF                'r'
/* OR-ed into a type code: the object that follows is added to the
   reference index so that a later TYPE_REF can point at it. */
#define FLAG_REF                '\x80'
| 74 | |
/* Values stored in WFILE.error while writing. */
#define WFERR_OK              0   /* no error so far */
#define WFERR_UNMARSHALLABLE  1   /* object cannot be marshalled */
#define WFERR_NESTEDTOODEEP   2   /* MAX_MARSHAL_STACK_DEPTH exceeded */
#define WFERR_NOMEMORY        3   /* output buffer could not be grown */
| 79 | |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 80 | typedef struct { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 81 | FILE *fp; |
| 82 | int error; /* see WFERR_* values */ |
| 83 | int depth; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 84 | PyObject *str; |
| 85 | char *ptr; |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 86 | const char *end; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 87 | char *buf; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 88 | _Py_hashtable_t *hashtable; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 89 | int version; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 90 | } WFILE; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 91 | |
/* Append the single byte `c` to the output of `p`.  When the buffer is full,
   w_reserve() is asked for one more byte; if that fails the byte is silently
   dropped.  `c` is evaluated at most once, `p` several times. */
#define w_byte(c, p) do {                                   \
        if ((p)->ptr == (p)->end && !w_reserve((p), 1)) {   \
            ;                                               \
        }                                                   \
        else {                                              \
            *(p)->ptr++ = (c);                              \
        }                                                   \
    } while(0)
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 96 | |
| 97 | static void |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 98 | w_flush(WFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 99 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 100 | assert(p->fp != NULL); |
| 101 | fwrite(p->buf, 1, p->ptr - p->buf, p->fp); |
| 102 | p->ptr = p->buf; |
| 103 | } |
| 104 | |
| 105 | static int |
| 106 | w_reserve(WFILE *p, Py_ssize_t needed) |
| 107 | { |
| 108 | Py_ssize_t pos, size, delta; |
| 109 | if (p->ptr == NULL) |
| 110 | return 0; /* An error already occurred */ |
| 111 | if (p->fp != NULL) { |
| 112 | w_flush(p); |
| 113 | return needed <= p->end - p->ptr; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 114 | } |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 115 | assert(p->str != NULL); |
| 116 | pos = p->ptr - p->buf; |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 117 | size = PyBytes_GET_SIZE(p->str); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 118 | if (size > 16*1024*1024) |
| 119 | delta = (size >> 3); /* 12.5% overallocation */ |
| 120 | else |
| 121 | delta = size + 1024; |
| 122 | delta = Py_MAX(delta, needed); |
| 123 | if (delta > PY_SSIZE_T_MAX - size) { |
| 124 | p->error = WFERR_NOMEMORY; |
| 125 | return 0; |
| 126 | } |
| 127 | size += delta; |
| 128 | if (_PyBytes_Resize(&p->str, size) != 0) { |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 129 | p->end = p->ptr = p->buf = NULL; |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 130 | return 0; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 131 | } |
| 132 | else { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 133 | p->buf = PyBytes_AS_STRING(p->str); |
| 134 | p->ptr = p->buf + pos; |
| 135 | p->end = p->buf + size; |
| 136 | return 1; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 137 | } |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 138 | } |
| 139 | |
| 140 | static void |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 141 | w_string(const void *s, Py_ssize_t n, WFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 142 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 143 | Py_ssize_t m; |
| 144 | if (!n || p->ptr == NULL) |
| 145 | return; |
| 146 | m = p->end - p->ptr; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 147 | if (p->fp != NULL) { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 148 | if (n <= m) { |
Christian Heimes | f051e43 | 2016-09-13 20:22:02 +0200 | [diff] [blame] | 149 | memcpy(p->ptr, s, n); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 150 | p->ptr += n; |
| 151 | } |
| 152 | else { |
| 153 | w_flush(p); |
| 154 | fwrite(s, 1, n, p->fp); |
| 155 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 156 | } |
| 157 | else { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 158 | if (n <= m || w_reserve(p, n - m)) { |
Christian Heimes | f051e43 | 2016-09-13 20:22:02 +0200 | [diff] [blame] | 159 | memcpy(p->ptr, s, n); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 160 | p->ptr += n; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 161 | } |
| 162 | } |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 163 | } |
| 164 | |
| 165 | static void |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 166 | w_short(int x, WFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 167 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 168 | w_byte((char)( x & 0xff), p); |
| 169 | w_byte((char)((x>> 8) & 0xff), p); |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 170 | } |
| 171 | |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 172 | static void |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 173 | w_long(long x, WFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 174 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 175 | w_byte((char)( x & 0xff), p); |
| 176 | w_byte((char)((x>> 8) & 0xff), p); |
| 177 | w_byte((char)((x>>16) & 0xff), p); |
| 178 | w_byte((char)((x>>24) & 0xff), p); |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 179 | } |
| 180 | |
/* Largest length or element count that can be written: sizes go through
   w_long(), i.e. four bytes. */
#define SIZE32_MAX  0x7FFFFFFF

/* W_SIZE(n, p): write the size `n` with w_long().

   Where size_t is wider than 32 bits, a size above SIZE32_MAX cannot be
   represented: the macro then sets p->error to WFERR_UNMARSHALLABLE and
   RETURNS FROM THE ENCLOSING (void) FUNCTION without writing anything.

   The macro deliberately leaves p->depth alone.  The depth counter is
   incremented and decremented in w_object() only; decrementing it here as
   well would under-count the nesting level after every oversize error and
   weaken the MAX_MARSHAL_STACK_DEPTH guard. */
#if SIZEOF_SIZE_T > 4
# define W_SIZE(n, p)  do {                     \
        if ((n) > SIZE32_MAX) {                 \
            (p)->error = WFERR_UNMARSHALLABLE;  \
            return;                             \
        }                                       \
        w_long((long)(n), p);                   \
    } while(0)
#else
# define W_SIZE  w_long
#endif
| 195 | |
Serhiy Storchaka | dfde215 | 2013-07-11 19:14:26 +0300 | [diff] [blame] | 196 | static void |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 197 | w_pstring(const void *s, Py_ssize_t n, WFILE *p) |
Serhiy Storchaka | dfde215 | 2013-07-11 19:14:26 +0300 | [diff] [blame] | 198 | { |
| 199 | W_SIZE(n, p); |
| 200 | w_string(s, n, p); |
| 201 | } |
| 202 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 203 | static void |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 204 | w_short_pstring(const void *s, Py_ssize_t n, WFILE *p) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 205 | { |
Antoine Pitrou | b30f271 | 2013-10-12 23:14:47 +0200 | [diff] [blame] | 206 | w_byte(Py_SAFE_DOWNCAST(n, Py_ssize_t, unsigned char), p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 207 | w_string(s, n, p); |
| 208 | } |
| 209 | |
/* Python ints are assumed to be stored internally in a base that is some
   power of 2**15.  To keep the format portable they are always read and
   written in base exactly 2**15, whatever the internal digit size is. */

#define PyLong_MARSHAL_SHIFT    15
#define PyLong_MARSHAL_BASE     ((short)1 << PyLong_MARSHAL_SHIFT)
#define PyLong_MARSHAL_MASK     (PyLong_MARSHAL_BASE - 1)

#if (PyLong_SHIFT % PyLong_MARSHAL_SHIFT) != 0
#error "PyLong_SHIFT must be a multiple of PyLong_MARSHAL_SHIFT"
#endif

/* Number of marshal digits that make up one internal digit. */
#define PyLong_MARSHAL_RATIO    (PyLong_SHIFT / PyLong_MARSHAL_SHIFT)
| 221 | |
/* Write the type code `t` combined with the variable `flag`, which must be
   in scope at the point of use (it carries FLAG_REF when the object is
   being added to the reference index).  Expands to a single w_byte()
   statement. */
#define W_TYPE(t, p)    w_byte((t) | flag, (p))
| 225 | |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 226 | static void |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 227 | w_PyLong(const PyLongObject *ob, char flag, WFILE *p) |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 228 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 229 | Py_ssize_t i, j, n, l; |
| 230 | digit d; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 231 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 232 | W_TYPE(TYPE_LONG, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 233 | if (Py_SIZE(ob) == 0) { |
| 234 | w_long((long)0, p); |
| 235 | return; |
| 236 | } |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 237 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 238 | /* set l to number of base PyLong_MARSHAL_BASE digits */ |
Victor Stinner | 45e8e2f | 2014-05-14 17:24:35 +0200 | [diff] [blame] | 239 | n = Py_ABS(Py_SIZE(ob)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 240 | l = (n-1) * PyLong_MARSHAL_RATIO; |
| 241 | d = ob->ob_digit[n-1]; |
| 242 | assert(d != 0); /* a PyLong is always normalized */ |
| 243 | do { |
| 244 | d >>= PyLong_MARSHAL_SHIFT; |
| 245 | l++; |
| 246 | } while (d != 0); |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 247 | if (l > SIZE32_MAX) { |
| 248 | p->depth--; |
| 249 | p->error = WFERR_UNMARSHALLABLE; |
| 250 | return; |
| 251 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 252 | w_long((long)(Py_SIZE(ob) > 0 ? l : -l), p); |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 253 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 254 | for (i=0; i < n-1; i++) { |
| 255 | d = ob->ob_digit[i]; |
| 256 | for (j=0; j < PyLong_MARSHAL_RATIO; j++) { |
| 257 | w_short(d & PyLong_MARSHAL_MASK, p); |
| 258 | d >>= PyLong_MARSHAL_SHIFT; |
| 259 | } |
| 260 | assert (d == 0); |
| 261 | } |
| 262 | d = ob->ob_digit[n-1]; |
| 263 | do { |
| 264 | w_short(d & PyLong_MARSHAL_MASK, p); |
| 265 | d >>= PyLong_MARSHAL_SHIFT; |
| 266 | } while (d != 0); |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 267 | } |
| 268 | |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 269 | static void |
| 270 | w_float_bin(double v, WFILE *p) |
| 271 | { |
| 272 | unsigned char buf[8]; |
| 273 | if (_PyFloat_Pack8(v, buf, 1) < 0) { |
| 274 | p->error = WFERR_UNMARSHALLABLE; |
| 275 | return; |
| 276 | } |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 277 | w_string(buf, 8, p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 278 | } |
| 279 | |
| 280 | static void |
| 281 | w_float_str(double v, WFILE *p) |
| 282 | { |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 283 | char *buf = PyOS_double_to_string(v, 'g', 17, 0, NULL); |
| 284 | if (!buf) { |
| 285 | p->error = WFERR_NOMEMORY; |
| 286 | return; |
| 287 | } |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 288 | w_short_pstring(buf, strlen(buf), p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 289 | PyMem_Free(buf); |
| 290 | } |
| 291 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 292 | static int |
| 293 | w_ref(PyObject *v, char *flag, WFILE *p) |
| 294 | { |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 295 | _Py_hashtable_entry_t *entry; |
| 296 | int w; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 297 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 298 | if (p->version < 3 || p->hashtable == NULL) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 299 | return 0; /* not writing object references */ |
| 300 | |
| 301 | /* if it has only one reference, it definitely isn't shared */ |
| 302 | if (Py_REFCNT(v) == 1) |
| 303 | return 0; |
| 304 | |
Victor Stinner | 5b0a303 | 2020-05-13 04:40:30 +0200 | [diff] [blame^] | 305 | entry = _Py_hashtable_get_entry(p->hashtable, v); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 306 | if (entry != NULL) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 307 | /* write the reference index to the stream */ |
Victor Stinner | 5b0a303 | 2020-05-13 04:40:30 +0200 | [diff] [blame^] | 308 | w = (int)(uintptr_t)entry->value; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 309 | /* we don't store "long" indices in the dict */ |
| 310 | assert(0 <= w && w <= 0x7fffffff); |
| 311 | w_byte(TYPE_REF, p); |
| 312 | w_long(w, p); |
| 313 | return 1; |
| 314 | } else { |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 315 | size_t s = p->hashtable->entries; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 316 | /* we don't support long indices */ |
| 317 | if (s >= 0x7fffffff) { |
| 318 | PyErr_SetString(PyExc_ValueError, "too many objects"); |
| 319 | goto err; |
| 320 | } |
Serhiy Storchaka | 26861b0 | 2015-02-16 20:52:17 +0200 | [diff] [blame] | 321 | w = (int)s; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 322 | Py_INCREF(v); |
Victor Stinner | 5b0a303 | 2020-05-13 04:40:30 +0200 | [diff] [blame^] | 323 | if (_Py_hashtable_set(p->hashtable, v, (void *)(uintptr_t)w) < 0) { |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 324 | Py_DECREF(v); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 325 | goto err; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 326 | } |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 327 | *flag |= FLAG_REF; |
| 328 | return 0; |
| 329 | } |
| 330 | err: |
| 331 | p->error = WFERR_UNMARSHALLABLE; |
| 332 | return 1; |
| 333 | } |
| 334 | |
| 335 | static void |
| 336 | w_complex_object(PyObject *v, char flag, WFILE *p); |
| 337 | |
Guido van Rossum | b0c168c | 1996-12-05 23:15:02 +0000 | [diff] [blame] | 338 | static void |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 339 | w_object(PyObject *v, WFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 340 | { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 341 | char flag = '\0'; |
Fred Drake | 6da0b91 | 2000-06-28 18:47:56 +0000 | [diff] [blame] | 342 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 343 | p->depth++; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 344 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 345 | if (p->depth > MAX_MARSHAL_STACK_DEPTH) { |
| 346 | p->error = WFERR_NESTEDTOODEEP; |
| 347 | } |
| 348 | else if (v == NULL) { |
| 349 | w_byte(TYPE_NULL, p); |
| 350 | } |
| 351 | else if (v == Py_None) { |
| 352 | w_byte(TYPE_NONE, p); |
| 353 | } |
| 354 | else if (v == PyExc_StopIteration) { |
| 355 | w_byte(TYPE_STOPITER, p); |
| 356 | } |
| 357 | else if (v == Py_Ellipsis) { |
| 358 | w_byte(TYPE_ELLIPSIS, p); |
| 359 | } |
| 360 | else if (v == Py_False) { |
| 361 | w_byte(TYPE_FALSE, p); |
| 362 | } |
| 363 | else if (v == Py_True) { |
| 364 | w_byte(TYPE_TRUE, p); |
| 365 | } |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 366 | else if (!w_ref(v, &flag, p)) |
| 367 | w_complex_object(v, flag, p); |
| 368 | |
| 369 | p->depth--; |
| 370 | } |
| 371 | |
| 372 | static void |
| 373 | w_complex_object(PyObject *v, char flag, WFILE *p) |
| 374 | { |
| 375 | Py_ssize_t i, n; |
| 376 | |
| 377 | if (PyLong_CheckExact(v)) { |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 378 | int overflow; |
| 379 | long x = PyLong_AsLongAndOverflow(v, &overflow); |
| 380 | if (overflow) { |
| 381 | w_PyLong((PyLongObject *)v, flag, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 382 | } |
| 383 | else { |
Guido van Rossum | c1547d9 | 1996-12-10 15:39:04 +0000 | [diff] [blame] | 384 | #if SIZEOF_LONG > 4 |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 385 | long y = Py_ARITHMETIC_RIGHT_SHIFT(long, x, 31); |
| 386 | if (y && y != -1) { |
Martin v. Löwis | 7e39572 | 2012-07-28 19:44:05 +0200 | [diff] [blame] | 387 | /* Too large for TYPE_INT */ |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 388 | w_PyLong((PyLongObject*)v, flag, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 389 | } |
| 390 | else |
Guido van Rossum | c1547d9 | 1996-12-10 15:39:04 +0000 | [diff] [blame] | 391 | #endif |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 392 | { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 393 | W_TYPE(TYPE_INT, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 394 | w_long(x, p); |
| 395 | } |
| 396 | } |
| 397 | } |
| 398 | else if (PyFloat_CheckExact(v)) { |
| 399 | if (p->version > 1) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 400 | W_TYPE(TYPE_BINARY_FLOAT, p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 401 | w_float_bin(PyFloat_AS_DOUBLE(v), p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 402 | } |
| 403 | else { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 404 | W_TYPE(TYPE_FLOAT, p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 405 | w_float_str(PyFloat_AS_DOUBLE(v), p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 406 | } |
| 407 | } |
| 408 | else if (PyComplex_CheckExact(v)) { |
| 409 | if (p->version > 1) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 410 | W_TYPE(TYPE_BINARY_COMPLEX, p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 411 | w_float_bin(PyComplex_RealAsDouble(v), p); |
| 412 | w_float_bin(PyComplex_ImagAsDouble(v), p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 413 | } |
| 414 | else { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 415 | W_TYPE(TYPE_COMPLEX, p); |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 416 | w_float_str(PyComplex_RealAsDouble(v), p); |
| 417 | w_float_str(PyComplex_ImagAsDouble(v), p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 418 | } |
| 419 | } |
| 420 | else if (PyBytes_CheckExact(v)) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 421 | W_TYPE(TYPE_STRING, p); |
Serhiy Storchaka | dfde215 | 2013-07-11 19:14:26 +0300 | [diff] [blame] | 422 | w_pstring(PyBytes_AS_STRING(v), PyBytes_GET_SIZE(v), p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 423 | } |
| 424 | else if (PyUnicode_CheckExact(v)) { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 425 | if (p->version >= 4 && PyUnicode_IS_ASCII(v)) { |
| 426 | int is_short = PyUnicode_GET_LENGTH(v) < 256; |
| 427 | if (is_short) { |
| 428 | if (PyUnicode_CHECK_INTERNED(v)) |
| 429 | W_TYPE(TYPE_SHORT_ASCII_INTERNED, p); |
| 430 | else |
| 431 | W_TYPE(TYPE_SHORT_ASCII, p); |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 432 | w_short_pstring(PyUnicode_1BYTE_DATA(v), |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 433 | PyUnicode_GET_LENGTH(v), p); |
| 434 | } |
| 435 | else { |
| 436 | if (PyUnicode_CHECK_INTERNED(v)) |
| 437 | W_TYPE(TYPE_ASCII_INTERNED, p); |
| 438 | else |
| 439 | W_TYPE(TYPE_ASCII, p); |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 440 | w_pstring(PyUnicode_1BYTE_DATA(v), |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 441 | PyUnicode_GET_LENGTH(v), p); |
| 442 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 443 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 444 | else { |
| 445 | PyObject *utf8; |
| 446 | utf8 = PyUnicode_AsEncodedString(v, "utf8", "surrogatepass"); |
| 447 | if (utf8 == NULL) { |
| 448 | p->depth--; |
| 449 | p->error = WFERR_UNMARSHALLABLE; |
| 450 | return; |
| 451 | } |
| 452 | if (p->version >= 3 && PyUnicode_CHECK_INTERNED(v)) |
| 453 | W_TYPE(TYPE_INTERNED, p); |
| 454 | else |
| 455 | W_TYPE(TYPE_UNICODE, p); |
| 456 | w_pstring(PyBytes_AS_STRING(utf8), PyBytes_GET_SIZE(utf8), p); |
| 457 | Py_DECREF(utf8); |
| 458 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 459 | } |
| 460 | else if (PyTuple_CheckExact(v)) { |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 461 | n = PyTuple_GET_SIZE(v); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 462 | if (p->version >= 4 && n < 256) { |
| 463 | W_TYPE(TYPE_SMALL_TUPLE, p); |
Victor Stinner | da06255 | 2013-11-16 00:13:29 +0100 | [diff] [blame] | 464 | w_byte((unsigned char)n, p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 465 | } |
| 466 | else { |
| 467 | W_TYPE(TYPE_TUPLE, p); |
| 468 | W_SIZE(n, p); |
| 469 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 470 | for (i = 0; i < n; i++) { |
| 471 | w_object(PyTuple_GET_ITEM(v, i), p); |
| 472 | } |
| 473 | } |
| 474 | else if (PyList_CheckExact(v)) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 475 | W_TYPE(TYPE_LIST, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 476 | n = PyList_GET_SIZE(v); |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 477 | W_SIZE(n, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 478 | for (i = 0; i < n; i++) { |
| 479 | w_object(PyList_GET_ITEM(v, i), p); |
| 480 | } |
| 481 | } |
| 482 | else if (PyDict_CheckExact(v)) { |
| 483 | Py_ssize_t pos; |
| 484 | PyObject *key, *value; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 485 | W_TYPE(TYPE_DICT, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 486 | /* This one is NULL object terminated! */ |
| 487 | pos = 0; |
| 488 | while (PyDict_Next(v, &pos, &key, &value)) { |
| 489 | w_object(key, p); |
| 490 | w_object(value, p); |
| 491 | } |
| 492 | w_object((PyObject *)NULL, p); |
| 493 | } |
| 494 | else if (PyAnySet_CheckExact(v)) { |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 495 | PyObject *value; |
| 496 | Py_ssize_t pos = 0; |
| 497 | Py_hash_t hash; |
Raymond Hettinger | a422c34 | 2005-01-11 03:03:27 +0000 | [diff] [blame] | 498 | |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 499 | if (PyFrozenSet_CheckExact(v)) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 500 | W_TYPE(TYPE_FROZENSET, p); |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 501 | else |
| 502 | W_TYPE(TYPE_SET, p); |
| 503 | n = PySet_GET_SIZE(v); |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 504 | W_SIZE(n, p); |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 505 | while (_PySet_NextEntry(v, &pos, &value, &hash)) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 506 | w_object(value, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 507 | } |
| 508 | } |
| 509 | else if (PyCode_Check(v)) { |
| 510 | PyCodeObject *co = (PyCodeObject *)v; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 511 | W_TYPE(TYPE_CODE, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 512 | w_long(co->co_argcount, p); |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 513 | w_long(co->co_posonlyargcount, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 514 | w_long(co->co_kwonlyargcount, p); |
| 515 | w_long(co->co_nlocals, p); |
| 516 | w_long(co->co_stacksize, p); |
| 517 | w_long(co->co_flags, p); |
| 518 | w_object(co->co_code, p); |
| 519 | w_object(co->co_consts, p); |
| 520 | w_object(co->co_names, p); |
| 521 | w_object(co->co_varnames, p); |
| 522 | w_object(co->co_freevars, p); |
| 523 | w_object(co->co_cellvars, p); |
| 524 | w_object(co->co_filename, p); |
| 525 | w_object(co->co_name, p); |
| 526 | w_long(co->co_firstlineno, p); |
| 527 | w_object(co->co_lnotab, p); |
| 528 | } |
| 529 | else if (PyObject_CheckBuffer(v)) { |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 530 | /* Write unknown bytes-like objects as a bytes object */ |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 531 | Py_buffer view; |
Antoine Pitrou | 679e9d3 | 2012-03-02 18:12:43 +0100 | [diff] [blame] | 532 | if (PyObject_GetBuffer(v, &view, PyBUF_SIMPLE) != 0) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 533 | w_byte(TYPE_UNKNOWN, p); |
Antoine Pitrou | 679e9d3 | 2012-03-02 18:12:43 +0100 | [diff] [blame] | 534 | p->depth--; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 535 | p->error = WFERR_UNMARSHALLABLE; |
Antoine Pitrou | 679e9d3 | 2012-03-02 18:12:43 +0100 | [diff] [blame] | 536 | return; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 537 | } |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 538 | W_TYPE(TYPE_STRING, p); |
Serhiy Storchaka | dfde215 | 2013-07-11 19:14:26 +0300 | [diff] [blame] | 539 | w_pstring(view.buf, view.len, p); |
Antoine Pitrou | 679e9d3 | 2012-03-02 18:12:43 +0100 | [diff] [blame] | 540 | PyBuffer_Release(&view); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 541 | } |
| 542 | else { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 543 | W_TYPE(TYPE_UNKNOWN, p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 544 | p->error = WFERR_UNMARSHALLABLE; |
| 545 | } |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 546 | } |
| 547 | |
Victor Stinner | 2d0a3d6 | 2020-05-13 02:50:18 +0200 | [diff] [blame] | 548 | static void |
| 549 | w_decref_entry(void *key) |
| 550 | { |
| 551 | PyObject *entry_key = (PyObject *)key; |
| 552 | Py_XDECREF(entry_key); |
| 553 | } |
| 554 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 555 | static int |
| 556 | w_init_refs(WFILE *wf, int version) |
| 557 | { |
| 558 | if (version >= 3) { |
Victor Stinner | 5b0a303 | 2020-05-13 04:40:30 +0200 | [diff] [blame^] | 559 | wf->hashtable = _Py_hashtable_new_full(_Py_hashtable_hash_ptr, |
Victor Stinner | 2d0a3d6 | 2020-05-13 02:50:18 +0200 | [diff] [blame] | 560 | _Py_hashtable_compare_direct, |
| 561 | w_decref_entry, NULL, NULL); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 562 | if (wf->hashtable == NULL) { |
| 563 | PyErr_NoMemory(); |
| 564 | return -1; |
| 565 | } |
| 566 | } |
| 567 | return 0; |
| 568 | } |
| 569 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 570 | static void |
| 571 | w_clear_refs(WFILE *wf) |
| 572 | { |
| 573 | if (wf->hashtable != NULL) { |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 574 | _Py_hashtable_destroy(wf->hashtable); |
| 575 | } |
| 576 | } |
| 577 | |
Serhiy Storchaka | 9594942 | 2013-08-27 19:40:23 +0300 | [diff] [blame] | 578 | /* version currently has no effect for writing ints. */ |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 579 | void |
Martin v. Löwis | ef82d2f | 2004-06-27 16:51:46 +0000 | [diff] [blame] | 580 | PyMarshal_WriteLongToFile(long x, FILE *fp, int version) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 581 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 582 | char buf[4]; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 583 | WFILE wf; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 584 | memset(&wf, 0, sizeof(wf)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 585 | wf.fp = fp; |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 586 | wf.ptr = wf.buf = buf; |
| 587 | wf.end = wf.ptr + sizeof(buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 588 | wf.error = WFERR_OK; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 589 | wf.version = version; |
| 590 | w_long(x, &wf); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 591 | w_flush(&wf); |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 592 | } |
| 593 | |
| 594 | void |
Martin v. Löwis | ef82d2f | 2004-06-27 16:51:46 +0000 | [diff] [blame] | 595 | PyMarshal_WriteObjectToFile(PyObject *x, FILE *fp, int version) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 596 | { |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 597 | char buf[BUFSIZ]; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 598 | WFILE wf; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 599 | memset(&wf, 0, sizeof(wf)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 600 | wf.fp = fp; |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 601 | wf.ptr = wf.buf = buf; |
| 602 | wf.end = wf.ptr + sizeof(buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 603 | wf.error = WFERR_OK; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 604 | wf.version = version; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 605 | if (w_init_refs(&wf, version)) |
| 606 | return; /* caller mush check PyErr_Occurred() */ |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 607 | w_object(x, &wf); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 608 | w_clear_refs(&wf); |
Serhiy Storchaka | c1efe5f | 2015-02-11 15:54:54 +0200 | [diff] [blame] | 609 | w_flush(&wf); |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 610 | } |
| 611 | |
Serhiy Storchaka | c07422c | 2015-02-11 16:18:09 +0200 | [diff] [blame] | 612 | typedef struct { |
| 613 | FILE *fp; |
| 614 | int depth; |
| 615 | PyObject *readable; /* Stream-like object being read from */ |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 616 | const char *ptr; |
| 617 | const char *end; |
Serhiy Storchaka | c07422c | 2015-02-11 16:18:09 +0200 | [diff] [blame] | 618 | char *buf; |
| 619 | Py_ssize_t buf_size; |
| 620 | PyObject *refs; /* a list */ |
| 621 | } RFILE; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 622 | |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 623 | static const char * |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 624 | r_string(Py_ssize_t n, RFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 625 | { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 626 | Py_ssize_t read = -1; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 627 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 628 | if (p->ptr != NULL) { |
| 629 | /* Fast path for loads() */ |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 630 | const char *res = p->ptr; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 631 | Py_ssize_t left = p->end - p->ptr; |
| 632 | if (left < n) { |
| 633 | PyErr_SetString(PyExc_EOFError, |
| 634 | "marshal data too short"); |
| 635 | return NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 636 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 637 | p->ptr += n; |
| 638 | return res; |
| 639 | } |
| 640 | if (p->buf == NULL) { |
| 641 | p->buf = PyMem_MALLOC(n); |
| 642 | if (p->buf == NULL) { |
| 643 | PyErr_NoMemory(); |
| 644 | return NULL; |
| 645 | } |
| 646 | p->buf_size = n; |
| 647 | } |
| 648 | else if (p->buf_size < n) { |
Zackery Spytz | 4c49da0 | 2018-12-07 03:11:30 -0700 | [diff] [blame] | 649 | char *tmp = PyMem_REALLOC(p->buf, n); |
| 650 | if (tmp == NULL) { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 651 | PyErr_NoMemory(); |
| 652 | return NULL; |
| 653 | } |
Zackery Spytz | 4c49da0 | 2018-12-07 03:11:30 -0700 | [diff] [blame] | 654 | p->buf = tmp; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 655 | p->buf_size = n; |
| 656 | } |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 657 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 658 | if (!p->readable) { |
| 659 | assert(p->fp != NULL); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 660 | read = fread(p->buf, 1, n, p->fp); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 661 | } |
| 662 | else { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 663 | _Py_IDENTIFIER(readinto); |
| 664 | PyObject *res, *mview; |
| 665 | Py_buffer buf; |
Martin v. Löwis | afe55bb | 2011-10-09 10:38:36 +0200 | [diff] [blame] | 666 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 667 | if (PyBuffer_FillInfo(&buf, NULL, p->buf, n, 0, PyBUF_CONTIG) == -1) |
| 668 | return NULL; |
| 669 | mview = PyMemoryView_FromBuffer(&buf); |
| 670 | if (mview == NULL) |
| 671 | return NULL; |
| 672 | |
| 673 | res = _PyObject_CallMethodId(p->readable, &PyId_readinto, "N", mview); |
| 674 | if (res != NULL) { |
| 675 | read = PyNumber_AsSsize_t(res, PyExc_ValueError); |
| 676 | Py_DECREF(res); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 677 | } |
| 678 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 679 | if (read != n) { |
| 680 | if (!PyErr_Occurred()) { |
| 681 | if (read > n) |
| 682 | PyErr_Format(PyExc_ValueError, |
| 683 | "read() returned too much data: " |
| 684 | "%zd bytes requested, %zd returned", |
| 685 | n, read); |
| 686 | else |
| 687 | PyErr_SetString(PyExc_EOFError, |
| 688 | "EOF read where not expected"); |
| 689 | } |
| 690 | return NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 691 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 692 | return p->buf; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 693 | } |
| 694 | |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 695 | static int |
| 696 | r_byte(RFILE *p) |
| 697 | { |
| 698 | int c = EOF; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 699 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 700 | if (p->ptr != NULL) { |
| 701 | if (p->ptr < p->end) |
| 702 | c = (unsigned char) *p->ptr++; |
| 703 | return c; |
| 704 | } |
| 705 | if (!p->readable) { |
| 706 | assert(p->fp); |
| 707 | c = getc(p->fp); |
| 708 | } |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 709 | else { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 710 | const char *ptr = r_string(1, p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 711 | if (ptr != NULL) |
Andy Lester | e6be9b5 | 2020-02-11 20:28:35 -0600 | [diff] [blame] | 712 | c = *(const unsigned char *) ptr; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 713 | } |
| 714 | return c; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 715 | } |
| 716 | |
| 717 | static int |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 718 | r_short(RFILE *p) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 719 | { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 720 | short x = -1; |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 721 | const unsigned char *buffer; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 722 | |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 723 | buffer = (const unsigned char *) r_string(2, p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 724 | if (buffer != NULL) { |
| 725 | x = buffer[0]; |
| 726 | x |= buffer[1] << 8; |
| 727 | /* Sign-extension, in case short greater than 16 bits */ |
| 728 | x |= -(x & 0x8000); |
| 729 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 730 | return x; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 731 | } |
| 732 | |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 733 | static long |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 734 | r_long(RFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 735 | { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 736 | long x = -1; |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 737 | const unsigned char *buffer; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 738 | |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 739 | buffer = (const unsigned char *) r_string(4, p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 740 | if (buffer != NULL) { |
| 741 | x = buffer[0]; |
| 742 | x |= (long)buffer[1] << 8; |
| 743 | x |= (long)buffer[2] << 16; |
| 744 | x |= (long)buffer[3] << 24; |
Guido van Rossum | c1547d9 | 1996-12-10 15:39:04 +0000 | [diff] [blame] | 745 | #if SIZEOF_LONG > 4 |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 746 | /* Sign extension for 64-bit machines */ |
| 747 | x |= -(x & 0x80000000L); |
Guido van Rossum | c1547d9 | 1996-12-10 15:39:04 +0000 | [diff] [blame] | 748 | #endif |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 749 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 750 | return x; |
Guido van Rossum | b0c168c | 1996-12-05 23:15:02 +0000 | [diff] [blame] | 751 | } |
| 752 | |
Serhiy Storchaka | 00987f6 | 2017-11-15 17:41:05 +0200 | [diff] [blame] | 753 | /* r_long64 deals with the TYPE_INT64 code. */ |
| 754 | static PyObject * |
| 755 | r_long64(RFILE *p) |
| 756 | { |
| 757 | const unsigned char *buffer = (const unsigned char *) r_string(8, p); |
| 758 | if (buffer == NULL) { |
| 759 | return NULL; |
| 760 | } |
| 761 | return _PyLong_FromByteArray(buffer, 8, |
| 762 | 1 /* little endian */, |
| 763 | 1 /* signed */); |
| 764 | } |
| 765 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 766 | static PyObject * |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 767 | r_PyLong(RFILE *p) |
| 768 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 769 | PyLongObject *ob; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 770 | long n, size, i; |
| 771 | int j, md, shorts_in_top_digit; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 772 | digit d; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 773 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 774 | n = r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 775 | if (PyErr_Occurred()) |
| 776 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 777 | if (n == 0) |
| 778 | return (PyObject *)_PyLong_New(0); |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 779 | if (n < -SIZE32_MAX || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 780 | PyErr_SetString(PyExc_ValueError, |
| 781 | "bad marshal data (long size out of range)"); |
| 782 | return NULL; |
| 783 | } |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 784 | |
Victor Stinner | 45e8e2f | 2014-05-14 17:24:35 +0200 | [diff] [blame] | 785 | size = 1 + (Py_ABS(n) - 1) / PyLong_MARSHAL_RATIO; |
| 786 | shorts_in_top_digit = 1 + (Py_ABS(n) - 1) % PyLong_MARSHAL_RATIO; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 787 | ob = _PyLong_New(size); |
| 788 | if (ob == NULL) |
| 789 | return NULL; |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 790 | |
Victor Stinner | 60ac6ed | 2020-02-07 23:18:08 +0100 | [diff] [blame] | 791 | Py_SET_SIZE(ob, n > 0 ? size : -size); |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 792 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 793 | for (i = 0; i < size-1; i++) { |
| 794 | d = 0; |
| 795 | for (j=0; j < PyLong_MARSHAL_RATIO; j++) { |
| 796 | md = r_short(p); |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 797 | if (PyErr_Occurred()) { |
| 798 | Py_DECREF(ob); |
| 799 | return NULL; |
| 800 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 801 | if (md < 0 || md > PyLong_MARSHAL_BASE) |
| 802 | goto bad_digit; |
| 803 | d += (digit)md << j*PyLong_MARSHAL_SHIFT; |
| 804 | } |
| 805 | ob->ob_digit[i] = d; |
| 806 | } |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 807 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 808 | d = 0; |
| 809 | for (j=0; j < shorts_in_top_digit; j++) { |
| 810 | md = r_short(p); |
Victor Stinner | 763b0d1 | 2013-10-31 16:56:38 +0100 | [diff] [blame] | 811 | if (PyErr_Occurred()) { |
| 812 | Py_DECREF(ob); |
| 813 | return NULL; |
| 814 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 815 | if (md < 0 || md > PyLong_MARSHAL_BASE) |
| 816 | goto bad_digit; |
| 817 | /* topmost marshal digit should be nonzero */ |
| 818 | if (md == 0 && j == shorts_in_top_digit - 1) { |
| 819 | Py_DECREF(ob); |
| 820 | PyErr_SetString(PyExc_ValueError, |
| 821 | "bad marshal data (unnormalized long data)"); |
| 822 | return NULL; |
| 823 | } |
| 824 | d += (digit)md << j*PyLong_MARSHAL_SHIFT; |
| 825 | } |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 826 | if (PyErr_Occurred()) { |
| 827 | Py_DECREF(ob); |
| 828 | return NULL; |
| 829 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 830 | /* top digit should be nonzero, else the resulting PyLong won't be |
| 831 | normalized */ |
| 832 | ob->ob_digit[size-1] = d; |
| 833 | return (PyObject *)ob; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 834 | bad_digit: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 835 | Py_DECREF(ob); |
| 836 | PyErr_SetString(PyExc_ValueError, |
| 837 | "bad marshal data (digit out of range in long)"); |
| 838 | return NULL; |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 839 | } |
| 840 | |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 841 | static double |
| 842 | r_float_bin(RFILE *p) |
| 843 | { |
| 844 | const unsigned char *buf = (const unsigned char *) r_string(8, p); |
| 845 | if (buf == NULL) |
| 846 | return -1; |
| 847 | return _PyFloat_Unpack8(buf, 1); |
| 848 | } |
| 849 | |
| 850 | /* Issue #33720: Disable inlining for reducing the C stack consumption |
| 851 | on PGO builds. */ |
| 852 | _Py_NO_INLINE static double |
| 853 | r_float_str(RFILE *p) |
| 854 | { |
| 855 | int n; |
| 856 | char buf[256]; |
| 857 | const char *ptr; |
| 858 | n = r_byte(p); |
| 859 | if (n == EOF) { |
| 860 | PyErr_SetString(PyExc_EOFError, |
| 861 | "EOF read where object expected"); |
| 862 | return -1; |
| 863 | } |
| 864 | ptr = r_string(n, p); |
| 865 | if (ptr == NULL) { |
| 866 | return -1; |
| 867 | } |
| 868 | memcpy(buf, ptr, n); |
| 869 | buf[n] = '\0'; |
| 870 | return PyOS_string_to_double(buf, NULL, NULL); |
| 871 | } |
| 872 | |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 873 | /* allocate the reflist index for a new object. Return -1 on failure */ |
| 874 | static Py_ssize_t |
| 875 | r_ref_reserve(int flag, RFILE *p) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 876 | { |
| 877 | if (flag) { /* currently only FLAG_REF is defined */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 878 | Py_ssize_t idx = PyList_GET_SIZE(p->refs); |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 879 | if (idx >= 0x7ffffffe) { |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 880 | PyErr_SetString(PyExc_ValueError, "bad marshal data (index list too large)"); |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 881 | return -1; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 882 | } |
| 883 | if (PyList_Append(p->refs, Py_None) < 0) |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 884 | return -1; |
| 885 | return idx; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 886 | } else |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 887 | return 0; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 888 | } |
| 889 | |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 890 | /* insert the new object 'o' to the reflist at previously |
| 891 | * allocated index 'idx'. |
| 892 | * 'o' can be NULL, in which case nothing is done. |
| 893 | * if 'o' was non-NULL, and the function succeeds, 'o' is returned. |
| 894 | * if 'o' was non-NULL, and the function fails, 'o' is released and |
| 895 | * NULL returned. This simplifies error checking at the call site since |
| 896 | * a single test for NULL for the function result is enough. |
| 897 | */ |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 898 | static PyObject * |
| 899 | r_ref_insert(PyObject *o, Py_ssize_t idx, int flag, RFILE *p) |
| 900 | { |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 901 | if (o != NULL && flag) { /* currently only FLAG_REF is defined */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 902 | PyObject *tmp = PyList_GET_ITEM(p->refs, idx); |
| 903 | Py_INCREF(o); |
| 904 | PyList_SET_ITEM(p->refs, idx, o); |
| 905 | Py_DECREF(tmp); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 906 | } |
| 907 | return o; |
| 908 | } |
| 909 | |
| 910 | /* combination of both above, used when an object can be |
| 911 | * created whenever it is seen in the file, as opposed to |
| 912 | * after having loaded its sub-objects. |
| 913 | */ |
| 914 | static PyObject * |
| 915 | r_ref(PyObject *o, int flag, RFILE *p) |
| 916 | { |
Victor Stinner | 359fabc | 2013-10-31 17:09:01 +0100 | [diff] [blame] | 917 | assert(flag & FLAG_REF); |
| 918 | if (o == NULL) |
| 919 | return NULL; |
| 920 | if (PyList_Append(p->refs, o) < 0) { |
| 921 | Py_DECREF(o); /* release the new object */ |
| 922 | return NULL; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 923 | } |
| 924 | return o; |
| 925 | } |
Mark Dickinson | bd79264 | 2009-03-18 20:06:12 +0000 | [diff] [blame] | 926 | |
| 927 | static PyObject * |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 928 | r_object(RFILE *p) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 929 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 930 | /* NULL is a valid return value, it does not necessarily means that |
| 931 | an exception is set. */ |
| 932 | PyObject *v, *v2; |
Benjamin Peterson | eddb0a7 | 2013-03-20 00:40:07 -0500 | [diff] [blame] | 933 | Py_ssize_t idx = 0; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 934 | long i, n; |
Kristján Valur Jónsson | 6168362 | 2013-03-20 14:26:33 -0700 | [diff] [blame] | 935 | int type, code = r_byte(p); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 936 | int flag, is_interned = 0; |
Christian Heimes | 3572842 | 2013-10-13 02:29:06 +0200 | [diff] [blame] | 937 | PyObject *retval = NULL; |
Guido van Rossum | d59da4b | 2007-05-22 18:11:13 +0000 | [diff] [blame] | 938 | |
Kristján Valur Jónsson | 6168362 | 2013-03-20 14:26:33 -0700 | [diff] [blame] | 939 | if (code == EOF) { |
| 940 | PyErr_SetString(PyExc_EOFError, |
| 941 | "EOF read where object expected"); |
| 942 | return NULL; |
| 943 | } |
| 944 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 945 | p->depth++; |
Guido van Rossum | d59da4b | 2007-05-22 18:11:13 +0000 | [diff] [blame] | 946 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 947 | if (p->depth > MAX_MARSHAL_STACK_DEPTH) { |
| 948 | p->depth--; |
| 949 | PyErr_SetString(PyExc_ValueError, "recursion limit exceeded"); |
| 950 | return NULL; |
| 951 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 952 | |
Kristján Valur Jónsson | 6168362 | 2013-03-20 14:26:33 -0700 | [diff] [blame] | 953 | flag = code & FLAG_REF; |
| 954 | type = code & ~FLAG_REF; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 955 | |
| 956 | #define R_REF(O) do{\ |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 957 | if (flag) \ |
| 958 | O = r_ref(O, flag, p);\ |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 959 | } while (0) |
| 960 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 961 | switch (type) { |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 962 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 963 | case TYPE_NULL: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 964 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 965 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 966 | case TYPE_NONE: |
| 967 | Py_INCREF(Py_None); |
| 968 | retval = Py_None; |
| 969 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 970 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 971 | case TYPE_STOPITER: |
| 972 | Py_INCREF(PyExc_StopIteration); |
| 973 | retval = PyExc_StopIteration; |
| 974 | break; |
Tim Peters | 5ca576e | 2001-06-18 22:08:13 +0000 | [diff] [blame] | 975 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 976 | case TYPE_ELLIPSIS: |
| 977 | Py_INCREF(Py_Ellipsis); |
| 978 | retval = Py_Ellipsis; |
| 979 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 980 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 981 | case TYPE_FALSE: |
| 982 | Py_INCREF(Py_False); |
| 983 | retval = Py_False; |
| 984 | break; |
Guido van Rossum | 77f6a65 | 2002-04-03 22:41:51 +0000 | [diff] [blame] | 985 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 986 | case TYPE_TRUE: |
| 987 | Py_INCREF(Py_True); |
| 988 | retval = Py_True; |
| 989 | break; |
Guido van Rossum | 77f6a65 | 2002-04-03 22:41:51 +0000 | [diff] [blame] | 990 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 991 | case TYPE_INT: |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 992 | n = r_long(p); |
| 993 | retval = PyErr_Occurred() ? NULL : PyLong_FromLong(n); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 994 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 995 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 996 | |
Serhiy Storchaka | 00987f6 | 2017-11-15 17:41:05 +0200 | [diff] [blame] | 997 | case TYPE_INT64: |
| 998 | retval = r_long64(p); |
| 999 | R_REF(retval); |
| 1000 | break; |
| 1001 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1002 | case TYPE_LONG: |
| 1003 | retval = r_PyLong(p); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1004 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1005 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1006 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1007 | case TYPE_FLOAT: |
| 1008 | { |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1009 | double x = r_float_str(p); |
| 1010 | if (x == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1011 | break; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1012 | retval = PyFloat_FromDouble(x); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1013 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1014 | break; |
| 1015 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1016 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1017 | case TYPE_BINARY_FLOAT: |
| 1018 | { |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1019 | double x = r_float_bin(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1020 | if (x == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1021 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1022 | retval = PyFloat_FromDouble(x); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1023 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1024 | break; |
| 1025 | } |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1026 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1027 | case TYPE_COMPLEX: |
| 1028 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1029 | Py_complex c; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1030 | c.real = r_float_str(p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1031 | if (c.real == -1.0 && PyErr_Occurred()) |
| 1032 | break; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1033 | c.imag = r_float_str(p); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1034 | if (c.imag == -1.0 && PyErr_Occurred()) |
| 1035 | break; |
| 1036 | retval = PyComplex_FromCComplex(c); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1037 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1038 | break; |
| 1039 | } |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1040 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1041 | case TYPE_BINARY_COMPLEX: |
| 1042 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1043 | Py_complex c; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1044 | c.real = r_float_bin(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1045 | if (c.real == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1046 | break; |
Serhiy Storchaka | c573499 | 2018-07-24 10:55:47 +0300 | [diff] [blame] | 1047 | c.imag = r_float_bin(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1048 | if (c.imag == -1.0 && PyErr_Occurred()) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1049 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1050 | retval = PyComplex_FromCComplex(c); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1051 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1052 | break; |
| 1053 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1054 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1055 | case TYPE_STRING: |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1056 | { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 1057 | const char *ptr; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1058 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1059 | if (PyErr_Occurred()) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1060 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1061 | if (n < 0 || n > SIZE32_MAX) { |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1062 | PyErr_SetString(PyExc_ValueError, "bad marshal data (bytes object size out of range)"); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1063 | break; |
| 1064 | } |
| 1065 | v = PyBytes_FromStringAndSize((char *)NULL, n); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1066 | if (v == NULL) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1067 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1068 | ptr = r_string(n, p); |
| 1069 | if (ptr == NULL) { |
| 1070 | Py_DECREF(v); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1071 | break; |
| 1072 | } |
| 1073 | memcpy(PyBytes_AS_STRING(v), ptr, n); |
| 1074 | retval = v; |
| 1075 | R_REF(retval); |
| 1076 | break; |
| 1077 | } |
| 1078 | |
| 1079 | case TYPE_ASCII_INTERNED: |
| 1080 | is_interned = 1; |
Stefan Krah | f432a32 | 2017-08-21 13:09:59 +0200 | [diff] [blame] | 1081 | /* fall through */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1082 | case TYPE_ASCII: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1083 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1084 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1085 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1086 | if (n < 0 || n > SIZE32_MAX) { |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1087 | PyErr_SetString(PyExc_ValueError, "bad marshal data (string size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1088 | break; |
| 1089 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1090 | goto _read_ascii; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1091 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1092 | case TYPE_SHORT_ASCII_INTERNED: |
| 1093 | is_interned = 1; |
Stefan Krah | f432a32 | 2017-08-21 13:09:59 +0200 | [diff] [blame] | 1094 | /* fall through */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1095 | case TYPE_SHORT_ASCII: |
| 1096 | n = r_byte(p); |
| 1097 | if (n == EOF) { |
| 1098 | PyErr_SetString(PyExc_EOFError, |
| 1099 | "EOF read where object expected"); |
| 1100 | break; |
| 1101 | } |
| 1102 | _read_ascii: |
| 1103 | { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 1104 | const char *ptr; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1105 | ptr = r_string(n, p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1106 | if (ptr == NULL) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1107 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1108 | v = PyUnicode_FromKindAndData(PyUnicode_1BYTE_KIND, ptr, n); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1109 | if (v == NULL) |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1110 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1111 | if (is_interned) |
| 1112 | PyUnicode_InternInPlace(&v); |
| 1113 | retval = v; |
| 1114 | R_REF(retval); |
| 1115 | break; |
| 1116 | } |
| 1117 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1118 | case TYPE_INTERNED: |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1119 | is_interned = 1; |
Stefan Krah | f432a32 | 2017-08-21 13:09:59 +0200 | [diff] [blame] | 1120 | /* fall through */ |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1121 | case TYPE_UNICODE: |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1122 | { |
Serhiy Storchaka | ef1585e | 2015-12-25 20:01:53 +0200 | [diff] [blame] | 1123 | const char *buffer; |
Guido van Rossum | c279b53 | 2000-03-10 23:03:02 +0000 | [diff] [blame] | 1124 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1125 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1126 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1127 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1128 | if (n < 0 || n > SIZE32_MAX) { |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1129 | PyErr_SetString(PyExc_ValueError, "bad marshal data (string size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1130 | break; |
| 1131 | } |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1132 | if (n != 0) { |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1133 | buffer = r_string(n, p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1134 | if (buffer == NULL) |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1135 | break; |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1136 | v = PyUnicode_DecodeUTF8(buffer, n, "surrogatepass"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1137 | } |
Victor Stinner | f1913ca | 2013-06-21 19:08:06 +0200 | [diff] [blame] | 1138 | else { |
| 1139 | v = PyUnicode_New(0, 0); |
| 1140 | } |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1141 | if (v == NULL) |
Victor Stinner | 3a8b79d | 2013-07-08 22:23:32 +0200 | [diff] [blame] | 1142 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1143 | if (is_interned) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1144 | PyUnicode_InternInPlace(&v); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1145 | retval = v; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1146 | R_REF(retval); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1147 | break; |
| 1148 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1149 | |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1150 | case TYPE_SMALL_TUPLE: |
| 1151 | n = (unsigned char) r_byte(p); |
Victor Stinner | b1b7b18 | 2013-10-31 17:07:08 +0100 | [diff] [blame] | 1152 | if (PyErr_Occurred()) |
| 1153 | break; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1154 | goto _read_tuple; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1155 | case TYPE_TUPLE: |
| 1156 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1157 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1158 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1159 | if (n < 0 || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1160 | PyErr_SetString(PyExc_ValueError, "bad marshal data (tuple size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1161 | break; |
| 1162 | } |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1163 | _read_tuple: |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1164 | v = PyTuple_New(n); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1165 | R_REF(v); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1166 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1167 | break; |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1168 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1169 | for (i = 0; i < n; i++) { |
| 1170 | v2 = r_object(p); |
| 1171 | if ( v2 == NULL ) { |
| 1172 | if (!PyErr_Occurred()) |
| 1173 | PyErr_SetString(PyExc_TypeError, |
| 1174 | "NULL object in marshal data for tuple"); |
| 1175 | Py_DECREF(v); |
| 1176 | v = NULL; |
| 1177 | break; |
| 1178 | } |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1179 | PyTuple_SET_ITEM(v, i, v2); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1180 | } |
| 1181 | retval = v; |
| 1182 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1183 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1184 | case TYPE_LIST: |
| 1185 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1186 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1187 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1188 | if (n < 0 || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1189 | PyErr_SetString(PyExc_ValueError, "bad marshal data (list size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1190 | break; |
| 1191 | } |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1192 | v = PyList_New(n); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1193 | R_REF(v); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1194 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1195 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1196 | for (i = 0; i < n; i++) { |
| 1197 | v2 = r_object(p); |
| 1198 | if ( v2 == NULL ) { |
| 1199 | if (!PyErr_Occurred()) |
| 1200 | PyErr_SetString(PyExc_TypeError, |
| 1201 | "NULL object in marshal data for list"); |
| 1202 | Py_DECREF(v); |
| 1203 | v = NULL; |
| 1204 | break; |
| 1205 | } |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1206 | PyList_SET_ITEM(v, i, v2); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1207 | } |
| 1208 | retval = v; |
| 1209 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1210 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1211 | case TYPE_DICT: |
| 1212 | v = PyDict_New(); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1213 | R_REF(v); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1214 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1215 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1216 | for (;;) { |
| 1217 | PyObject *key, *val; |
| 1218 | key = r_object(p); |
| 1219 | if (key == NULL) |
| 1220 | break; |
| 1221 | val = r_object(p); |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1222 | if (val == NULL) { |
| 1223 | Py_DECREF(key); |
| 1224 | break; |
| 1225 | } |
| 1226 | if (PyDict_SetItem(v, key, val) < 0) { |
| 1227 | Py_DECREF(key); |
| 1228 | Py_DECREF(val); |
| 1229 | break; |
| 1230 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1231 | Py_DECREF(key); |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1232 | Py_DECREF(val); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1233 | } |
| 1234 | if (PyErr_Occurred()) { |
| 1235 | Py_DECREF(v); |
| 1236 | v = NULL; |
| 1237 | } |
| 1238 | retval = v; |
| 1239 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1240 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1241 | case TYPE_SET: |
| 1242 | case TYPE_FROZENSET: |
| 1243 | n = r_long(p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1244 | if (PyErr_Occurred()) |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1245 | break; |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1246 | if (n < 0 || n > SIZE32_MAX) { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1247 | PyErr_SetString(PyExc_ValueError, "bad marshal data (set size out of range)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1248 | break; |
| 1249 | } |
Victor Stinner | d5cae6f | 2013-10-31 17:14:52 +0100 | [diff] [blame] | 1250 | |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1251 | if (n == 0 && type == TYPE_FROZENSET) { |
| 1252 | /* call frozenset() to get the empty frozenset singleton */ |
Victor Stinner | 4778eab | 2016-12-01 14:51:04 +0100 | [diff] [blame] | 1253 | v = _PyObject_CallNoArg((PyObject*)&PyFrozenSet_Type); |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1254 | if (v == NULL) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1255 | break; |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1256 | R_REF(v); |
| 1257 | retval = v; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1258 | } |
Victor Stinner | 1aa7893 | 2016-01-23 14:15:48 +0100 | [diff] [blame] | 1259 | else { |
| 1260 | v = (type == TYPE_SET) ? PySet_New(NULL) : PyFrozenSet_New(NULL); |
| 1261 | if (type == TYPE_SET) { |
| 1262 | R_REF(v); |
| 1263 | } else { |
| 1264 | /* must use delayed registration of frozensets because they must |
| 1265 | * be init with a refcount of 1 |
| 1266 | */ |
| 1267 | idx = r_ref_reserve(flag, p); |
| 1268 | if (idx < 0) |
| 1269 | Py_CLEAR(v); /* signal error */ |
| 1270 | } |
| 1271 | if (v == NULL) |
| 1272 | break; |
| 1273 | |
| 1274 | for (i = 0; i < n; i++) { |
| 1275 | v2 = r_object(p); |
| 1276 | if ( v2 == NULL ) { |
| 1277 | if (!PyErr_Occurred()) |
| 1278 | PyErr_SetString(PyExc_TypeError, |
| 1279 | "NULL object in marshal data for set"); |
| 1280 | Py_DECREF(v); |
| 1281 | v = NULL; |
| 1282 | break; |
| 1283 | } |
| 1284 | if (PySet_Add(v, v2) == -1) { |
| 1285 | Py_DECREF(v); |
| 1286 | Py_DECREF(v2); |
| 1287 | v = NULL; |
| 1288 | break; |
| 1289 | } |
| 1290 | Py_DECREF(v2); |
| 1291 | } |
| 1292 | if (type != TYPE_SET) |
| 1293 | v = r_ref_insert(v, idx, flag, p); |
| 1294 | retval = v; |
| 1295 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1296 | break; |
Raymond Hettinger | a422c34 | 2005-01-11 03:03:27 +0000 | [diff] [blame] | 1297 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1298 | case TYPE_CODE: |
| 1299 | { |
| 1300 | int argcount; |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 1301 | int posonlyargcount; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1302 | int kwonlyargcount; |
| 1303 | int nlocals; |
| 1304 | int stacksize; |
| 1305 | int flags; |
| 1306 | PyObject *code = NULL; |
| 1307 | PyObject *consts = NULL; |
| 1308 | PyObject *names = NULL; |
| 1309 | PyObject *varnames = NULL; |
| 1310 | PyObject *freevars = NULL; |
| 1311 | PyObject *cellvars = NULL; |
| 1312 | PyObject *filename = NULL; |
| 1313 | PyObject *name = NULL; |
| 1314 | int firstlineno; |
| 1315 | PyObject *lnotab = NULL; |
Antoine Pitrou | e9bbe8b | 2013-04-13 22:41:09 +0200 | [diff] [blame] | 1316 | |
Kristján Valur Jónsson | e178187 | 2013-03-20 11:43:57 -0700 | [diff] [blame] | 1317 | idx = r_ref_reserve(flag, p); |
Kristján Valur Jónsson | 5983258 | 2013-10-13 13:41:59 +0000 | [diff] [blame] | 1318 | if (idx < 0) |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1319 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1320 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1321 | v = NULL; |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1322 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1323 | /* XXX ignore long->int overflows for now */ |
| 1324 | argcount = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1325 | if (PyErr_Occurred()) |
| 1326 | goto code_error; |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 1327 | posonlyargcount = (int)r_long(p); |
| 1328 | if (PyErr_Occurred()) { |
| 1329 | goto code_error; |
| 1330 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1331 | kwonlyargcount = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1332 | if (PyErr_Occurred()) |
| 1333 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1334 | nlocals = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1335 | if (PyErr_Occurred()) |
| 1336 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1337 | stacksize = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1338 | if (PyErr_Occurred()) |
| 1339 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1340 | flags = (int)r_long(p); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1341 | if (PyErr_Occurred()) |
| 1342 | goto code_error; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1343 | code = r_object(p); |
| 1344 | if (code == NULL) |
| 1345 | goto code_error; |
| 1346 | consts = r_object(p); |
| 1347 | if (consts == NULL) |
| 1348 | goto code_error; |
| 1349 | names = r_object(p); |
| 1350 | if (names == NULL) |
| 1351 | goto code_error; |
| 1352 | varnames = r_object(p); |
| 1353 | if (varnames == NULL) |
| 1354 | goto code_error; |
| 1355 | freevars = r_object(p); |
| 1356 | if (freevars == NULL) |
| 1357 | goto code_error; |
| 1358 | cellvars = r_object(p); |
| 1359 | if (cellvars == NULL) |
| 1360 | goto code_error; |
| 1361 | filename = r_object(p); |
| 1362 | if (filename == NULL) |
| 1363 | goto code_error; |
| 1364 | name = r_object(p); |
| 1365 | if (name == NULL) |
| 1366 | goto code_error; |
| 1367 | firstlineno = (int)r_long(p); |
Kristján Valur Jónsson | 0a7697b | 2013-10-13 15:19:56 +0000 | [diff] [blame] | 1368 | if (firstlineno == -1 && PyErr_Occurred()) |
| 1369 | break; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1370 | lnotab = r_object(p); |
| 1371 | if (lnotab == NULL) |
| 1372 | goto code_error; |
Michael W. Hudson | df88846 | 2005-06-03 14:41:55 +0000 | [diff] [blame] | 1373 | |
Pablo Galindo | 4a2edc3 | 2019-07-01 11:35:05 +0100 | [diff] [blame] | 1374 | v = (PyObject *) PyCode_NewWithPosOnlyArgs( |
Pablo Galindo | 8c77b8c | 2019-04-29 13:36:57 +0100 | [diff] [blame] | 1375 | argcount, posonlyargcount, kwonlyargcount, |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1376 | nlocals, stacksize, flags, |
| 1377 | code, consts, names, varnames, |
| 1378 | freevars, cellvars, filename, name, |
| 1379 | firstlineno, lnotab); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1380 | v = r_ref_insert(v, idx, flag, p); |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1381 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1382 | code_error: |
| 1383 | Py_XDECREF(code); |
| 1384 | Py_XDECREF(consts); |
| 1385 | Py_XDECREF(names); |
| 1386 | Py_XDECREF(varnames); |
| 1387 | Py_XDECREF(freevars); |
| 1388 | Py_XDECREF(cellvars); |
| 1389 | Py_XDECREF(filename); |
| 1390 | Py_XDECREF(name); |
| 1391 | Py_XDECREF(lnotab); |
| 1392 | } |
| 1393 | retval = v; |
| 1394 | break; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1395 | |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1396 | case TYPE_REF: |
| 1397 | n = r_long(p); |
| 1398 | if (n < 0 || n >= PyList_GET_SIZE(p->refs)) { |
Kristján Valur Jónsson | 0a7697b | 2013-10-13 15:19:56 +0000 | [diff] [blame] | 1399 | if (n == -1 && PyErr_Occurred()) |
| 1400 | break; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1401 | PyErr_SetString(PyExc_ValueError, "bad marshal data (invalid reference)"); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1402 | break; |
| 1403 | } |
| 1404 | v = PyList_GET_ITEM(p->refs, n); |
| 1405 | if (v == Py_None) { |
| 1406 | PyErr_SetString(PyExc_ValueError, "bad marshal data (invalid reference)"); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1407 | break; |
| 1408 | } |
| 1409 | Py_INCREF(v); |
| 1410 | retval = v; |
| 1411 | break; |
| 1412 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1413 | default: |
| 1414 | /* Bogus data got written, which isn't ideal. |
| 1415 | This will let you keep working and recover. */ |
| 1416 | PyErr_SetString(PyExc_ValueError, "bad marshal data (unknown type code)"); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1417 | break; |
| 1418 | |
| 1419 | } |
| 1420 | p->depth--; |
| 1421 | return retval; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1422 | } |
| 1423 | |
Neal Norwitz | d85c452 | 2004-06-13 20:31:49 +0000 | [diff] [blame] | 1424 | static PyObject * |
Armin Rigo | 01ab279 | 2004-03-26 15:09:27 +0000 | [diff] [blame] | 1425 | read_object(RFILE *p) |
| 1426 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1427 | PyObject *v; |
| 1428 | if (PyErr_Occurred()) { |
| 1429 | fprintf(stderr, "XXX readobject called with exception set\n"); |
| 1430 | return NULL; |
| 1431 | } |
| 1432 | v = r_object(p); |
| 1433 | if (v == NULL && !PyErr_Occurred()) |
| 1434 | PyErr_SetString(PyExc_TypeError, "NULL object in marshal data for object"); |
| 1435 | return v; |
Armin Rigo | 01ab279 | 2004-03-26 15:09:27 +0000 | [diff] [blame] | 1436 | } |
| 1437 | |
Guido van Rossum | b8cf3e6 | 2001-10-19 01:46:21 +0000 | [diff] [blame] | 1438 | int |
| 1439 | PyMarshal_ReadShortFromFile(FILE *fp) |
| 1440 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1441 | RFILE rf; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1442 | int res; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1443 | assert(fp); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1444 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1445 | rf.fp = fp; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1446 | rf.end = rf.ptr = NULL; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1447 | rf.buf = NULL; |
| 1448 | res = r_short(&rf); |
| 1449 | if (rf.buf != NULL) |
| 1450 | PyMem_FREE(rf.buf); |
| 1451 | return res; |
Guido van Rossum | b8cf3e6 | 2001-10-19 01:46:21 +0000 | [diff] [blame] | 1452 | } |
| 1453 | |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1454 | long |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 1455 | PyMarshal_ReadLongFromFile(FILE *fp) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1456 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1457 | RFILE rf; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1458 | long res; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1459 | rf.fp = fp; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1460 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1461 | rf.ptr = rf.end = NULL; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1462 | rf.buf = NULL; |
| 1463 | res = r_long(&rf); |
| 1464 | if (rf.buf != NULL) |
| 1465 | PyMem_FREE(rf.buf); |
| 1466 | return res; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1467 | } |
| 1468 | |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1469 | /* Return size of file in bytes; < 0 if unknown or INT_MAX if too big */ |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1470 | static off_t |
| 1471 | getfilesize(FILE *fp) |
| 1472 | { |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1473 | struct _Py_stat_struct st; |
Victor Stinner | e134a7f | 2015-03-30 10:09:31 +0200 | [diff] [blame] | 1474 | if (_Py_fstat_noraise(fileno(fp), &st) != 0) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1475 | return -1; |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1476 | #if SIZEOF_OFF_T == 4 |
| 1477 | else if (st.st_size >= INT_MAX) |
| 1478 | return (off_t)INT_MAX; |
| 1479 | #endif |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1480 | else |
Steve Dower | f2f373f | 2015-02-21 08:44:05 -0800 | [diff] [blame] | 1481 | return (off_t)st.st_size; |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1482 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1483 | |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1484 | /* If we can get the size of the file up-front, and it's reasonably small, |
| 1485 | * read it in one gulp and delegate to ...FromString() instead. Much quicker |
| 1486 | * than reading a byte at a time from file; speeds .pyc imports. |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1487 | * CAUTION: since this may read the entire remainder of the file, don't |
| 1488 | * call it unless you know you're done with the file. |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1489 | */ |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1490 | PyObject * |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1491 | PyMarshal_ReadLastObjectFromFile(FILE *fp) |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1492 | { |
Antoine Pitrou | 5bc7ec9 | 2010-04-21 22:56:22 +0000 | [diff] [blame] | 1493 | /* REASONABLE_FILE_LIMIT is by defn something big enough for Tkinter.pyc. */ |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1494 | #define REASONABLE_FILE_LIMIT (1L << 18) |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1495 | off_t filesize; |
| 1496 | filesize = getfilesize(fp); |
| 1497 | if (filesize > 0 && filesize <= REASONABLE_FILE_LIMIT) { |
| 1498 | char* pBuf = (char *)PyMem_MALLOC(filesize); |
| 1499 | if (pBuf != NULL) { |
Serhiy Storchaka | 7e01911 | 2013-02-13 12:08:15 +0200 | [diff] [blame] | 1500 | size_t n = fread(pBuf, 1, (size_t)filesize, fp); |
| 1501 | PyObject* v = PyMarshal_ReadObjectFromString(pBuf, n); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1502 | PyMem_FREE(pBuf); |
| 1503 | return v; |
| 1504 | } |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1505 | |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1506 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1507 | /* We don't have fstat, or we do but the file is larger than |
| 1508 | * REASONABLE_FILE_LIMIT or malloc failed -- read a byte at a time. |
| 1509 | */ |
| 1510 | return PyMarshal_ReadObjectFromFile(fp); |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1511 | |
Tim Peters | 691e0e9 | 2001-01-18 04:39:16 +0000 | [diff] [blame] | 1512 | #undef REASONABLE_FILE_LIMIT |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1513 | } |
| 1514 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1515 | PyObject * |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1516 | PyMarshal_ReadObjectFromFile(FILE *fp) |
| 1517 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1518 | RFILE rf; |
| 1519 | PyObject *result; |
| 1520 | rf.fp = fp; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1521 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1522 | rf.depth = 0; |
| 1523 | rf.ptr = rf.end = NULL; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1524 | rf.buf = NULL; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1525 | rf.refs = PyList_New(0); |
| 1526 | if (rf.refs == NULL) |
| 1527 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1528 | result = r_object(&rf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1529 | Py_DECREF(rf.refs); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1530 | if (rf.buf != NULL) |
| 1531 | PyMem_FREE(rf.buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1532 | return result; |
Tim Peters | d9b9ac8 | 2001-01-28 00:27:39 +0000 | [diff] [blame] | 1533 | } |
| 1534 | |
| 1535 | PyObject * |
Serhiy Storchaka | c679227 | 2013-10-19 21:03:34 +0300 | [diff] [blame] | 1536 | PyMarshal_ReadObjectFromString(const char *str, Py_ssize_t len) |
Guido van Rossum | f56e3db | 1993-04-01 20:59:32 +0000 | [diff] [blame] | 1537 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1538 | RFILE rf; |
| 1539 | PyObject *result; |
| 1540 | rf.fp = NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1541 | rf.readable = NULL; |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 1542 | rf.ptr = str; |
| 1543 | rf.end = str + len; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1544 | rf.buf = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1545 | rf.depth = 0; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1546 | rf.refs = PyList_New(0); |
| 1547 | if (rf.refs == NULL) |
| 1548 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1549 | result = r_object(&rf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1550 | Py_DECREF(rf.refs); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1551 | if (rf.buf != NULL) |
| 1552 | PyMem_FREE(rf.buf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1553 | return result; |
Guido van Rossum | f56e3db | 1993-04-01 20:59:32 +0000 | [diff] [blame] | 1554 | } |
| 1555 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1556 | PyObject * |
Martin v. Löwis | ef82d2f | 2004-06-27 16:51:46 +0000 | [diff] [blame] | 1557 | PyMarshal_WriteObjectToString(PyObject *x, int version) |
Guido van Rossum | 3f3bb3d | 1996-08-19 22:07:17 +0000 | [diff] [blame] | 1558 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1559 | WFILE wf; |
Guido van Rossum | e6d3904 | 2007-05-09 00:01:30 +0000 | [diff] [blame] | 1560 | |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 1561 | memset(&wf, 0, sizeof(wf)); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1562 | wf.str = PyBytes_FromStringAndSize((char *)NULL, 50); |
| 1563 | if (wf.str == NULL) |
| 1564 | return NULL; |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 1565 | wf.ptr = wf.buf = PyBytes_AS_STRING(wf.str); |
| 1566 | wf.end = wf.ptr + PyBytes_GET_SIZE(wf.str); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1567 | wf.error = WFERR_OK; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1568 | wf.version = version; |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 1569 | if (w_init_refs(&wf, version)) { |
| 1570 | Py_DECREF(wf.str); |
| 1571 | return NULL; |
| 1572 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1573 | w_object(x, &wf); |
Serhiy Storchaka | ce921c62 | 2015-02-11 15:53:31 +0200 | [diff] [blame] | 1574 | w_clear_refs(&wf); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1575 | if (wf.str != NULL) { |
Serhiy Storchaka | 2c003ef | 2020-03-31 23:23:21 +0300 | [diff] [blame] | 1576 | const char *base = PyBytes_AS_STRING(wf.str); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1577 | if (_PyBytes_Resize(&wf.str, (Py_ssize_t)(wf.ptr - base)) < 0) |
| 1578 | return NULL; |
| 1579 | } |
| 1580 | if (wf.error != WFERR_OK) { |
| 1581 | Py_XDECREF(wf.str); |
| 1582 | if (wf.error == WFERR_NOMEMORY) |
| 1583 | PyErr_NoMemory(); |
| 1584 | else |
| 1585 | PyErr_SetString(PyExc_ValueError, |
| 1586 | (wf.error==WFERR_UNMARSHALLABLE)?"unmarshallable object" |
| 1587 | :"object too deeply nested to marshal"); |
| 1588 | return NULL; |
| 1589 | } |
Antoine Pitrou | 1c13f84 | 2012-03-02 18:22:23 +0100 | [diff] [blame] | 1590 | return wf.str; |
Guido van Rossum | 3f3bb3d | 1996-08-19 22:07:17 +0000 | [diff] [blame] | 1591 | } |
| 1592 | |
Guido van Rossum | 64b4552 | 1991-06-07 13:58:22 +0000 | [diff] [blame] | 1593 | /* And an interface for Python programs... */ |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1594 | /*[clinic input] |
| 1595 | marshal.dump |
| 1596 | |
| 1597 | value: object |
| 1598 | Must be a supported type. |
| 1599 | file: object |
| 1600 | Must be a writeable binary file. |
| 1601 | version: int(c_default="Py_MARSHAL_VERSION") = version |
| 1602 | Indicates the data format that dump should use. |
| 1603 | / |
| 1604 | |
| 1605 | Write the value on the open file. |
| 1606 | |
| 1607 | If the value has (or contains an object that has) an unsupported type, a |
| 1608 | ValueError exception is raised - but garbage data will also be written |
| 1609 | to the file. The object will not be properly read back by load(). |
| 1610 | [clinic start generated code]*/ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1611 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1612 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1613 | marshal_dump_impl(PyObject *module, PyObject *value, PyObject *file, |
| 1614 | int version) |
| 1615 | /*[clinic end generated code: output=aaee62c7028a7cb2 input=6c7a3c23c6fef556]*/ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1616 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1617 | /* XXX Quick hack -- need to do this differently */ |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1618 | PyObject *s; |
| 1619 | PyObject *res; |
Martin v. Löwis | bd928fe | 2011-10-14 10:20:37 +0200 | [diff] [blame] | 1620 | _Py_IDENTIFIER(write); |
Martin v. Löwis | afe55bb | 2011-10-09 10:38:36 +0200 | [diff] [blame] | 1621 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1622 | s = PyMarshal_WriteObjectToString(value, version); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1623 | if (s == NULL) |
| 1624 | return NULL; |
Jeroen Demeyer | 59ad110 | 2019-07-11 10:59:05 +0200 | [diff] [blame] | 1625 | res = _PyObject_CallMethodIdOneArg(file, &PyId_write, s); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1626 | Py_DECREF(s); |
| 1627 | return res; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1628 | } |
| 1629 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1630 | /*[clinic input] |
| 1631 | marshal.load |
| 1632 | |
| 1633 | file: object |
| 1634 | Must be readable binary file. |
| 1635 | / |
| 1636 | |
| 1637 | Read one value from the open file and return it. |
| 1638 | |
| 1639 | If no valid value is read (e.g. because the data has a different Python |
| 1640 | version's incompatible marshal format), raise EOFError, ValueError or |
| 1641 | TypeError. |
| 1642 | |
| 1643 | Note: If an object containing an unsupported type was marshalled with |
| 1644 | dump(), load() will substitute None for the unmarshallable type. |
| 1645 | [clinic start generated code]*/ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1646 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1647 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1648 | marshal_load(PyObject *module, PyObject *file) |
| 1649 | /*[clinic end generated code: output=f8e5c33233566344 input=c85c2b594cd8124a]*/ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1650 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1651 | PyObject *data, *result; |
Martin v. Löwis | bd928fe | 2011-10-14 10:20:37 +0200 | [diff] [blame] | 1652 | _Py_IDENTIFIER(read); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1653 | RFILE rf; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1654 | |
| 1655 | /* |
| 1656 | * Make a call to the read method, but read zero bytes. |
| 1657 | * This is to ensure that the object passed in at least |
| 1658 | * has a read method which returns bytes. |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1659 | * This can be removed if we guarantee good error handling |
| 1660 | * for r_string() |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1661 | */ |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1662 | data = _PyObject_CallMethodId(file, &PyId_read, "i", 0); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1663 | if (data == NULL) |
| 1664 | return NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1665 | if (!PyBytes_Check(data)) { |
| 1666 | PyErr_Format(PyExc_TypeError, |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1667 | "file.read() returned not bytes but %.100s", |
Victor Stinner | a102ed7 | 2020-02-07 02:24:48 +0100 | [diff] [blame] | 1668 | Py_TYPE(data)->tp_name); |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1669 | result = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1670 | } |
| 1671 | else { |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1672 | rf.depth = 0; |
| 1673 | rf.fp = NULL; |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1674 | rf.readable = file; |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1675 | rf.ptr = rf.end = NULL; |
| 1676 | rf.buf = NULL; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1677 | if ((rf.refs = PyList_New(0)) != NULL) { |
| 1678 | result = read_object(&rf); |
| 1679 | Py_DECREF(rf.refs); |
Antoine Pitrou | 1164dfc | 2013-10-12 22:25:39 +0200 | [diff] [blame] | 1680 | if (rf.buf != NULL) |
| 1681 | PyMem_FREE(rf.buf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1682 | } else |
| 1683 | result = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1684 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1685 | Py_DECREF(data); |
| 1686 | return result; |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1687 | } |
| 1688 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1689 | /*[clinic input] |
| 1690 | marshal.dumps |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1691 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1692 | value: object |
| 1693 | Must be a supported type. |
| 1694 | version: int(c_default="Py_MARSHAL_VERSION") = version |
| 1695 | Indicates the data format that dumps should use. |
| 1696 | / |
| 1697 | |
| 1698 | Return the bytes object that would be written to a file by dump(value, file). |
| 1699 | |
| 1700 | Raise a ValueError exception if value has (or contains an object that has) an |
| 1701 | unsupported type. |
| 1702 | [clinic start generated code]*/ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1703 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1704 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1705 | marshal_dumps_impl(PyObject *module, PyObject *value, int version) |
| 1706 | /*[clinic end generated code: output=9c200f98d7256cad input=a2139ea8608e9b27]*/ |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1707 | { |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1708 | return PyMarshal_WriteObjectToString(value, version); |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1709 | } |
| 1710 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1711 | /*[clinic input] |
| 1712 | marshal.loads |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1713 | |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1714 | bytes: Py_buffer |
| 1715 | / |
| 1716 | |
| 1717 | Convert the bytes-like object to a value. |
| 1718 | |
| 1719 | If no valid value is found, raise EOFError, ValueError or TypeError. Extra |
| 1720 | bytes in the input are ignored. |
| 1721 | [clinic start generated code]*/ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1722 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1723 | static PyObject * |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1724 | marshal_loads_impl(PyObject *module, Py_buffer *bytes) |
| 1725 | /*[clinic end generated code: output=9fc65985c93d1bb1 input=6f426518459c8495]*/ |
Guido van Rossum | 0b0db8e | 1993-01-21 16:07:51 +0000 | [diff] [blame] | 1726 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1727 | RFILE rf; |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1728 | char *s = bytes->buf; |
| 1729 | Py_ssize_t n = bytes->len; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1730 | PyObject* result; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1731 | rf.fp = NULL; |
Vinay Sajip | 5bdae3b | 2011-07-02 16:42:47 +0100 | [diff] [blame] | 1732 | rf.readable = NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1733 | rf.ptr = s; |
| 1734 | rf.end = s + n; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1735 | rf.depth = 0; |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1736 | if ((rf.refs = PyList_New(0)) == NULL) |
| 1737 | return NULL; |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1738 | result = read_object(&rf); |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1739 | Py_DECREF(rf.refs); |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1740 | return result; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1741 | } |
| 1742 | |
Guido van Rossum | 79f25d9 | 1997-04-29 20:08:16 +0000 | [diff] [blame] | 1743 | static PyMethodDef marshal_methods[] = { |
Serhiy Storchaka | 0767ad4 | 2017-03-12 09:20:15 +0200 | [diff] [blame] | 1744 | MARSHAL_DUMP_METHODDEF |
| 1745 | MARSHAL_LOAD_METHODDEF |
| 1746 | MARSHAL_DUMPS_METHODDEF |
| 1747 | MARSHAL_LOADS_METHODDEF |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1748 | {NULL, NULL} /* sentinel */ |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1749 | }; |
| 1750 | |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1751 | |
| 1752 | PyDoc_STRVAR(module_doc, |
| 1753 | "This module contains functions that can read and write Python values in\n\ |
| 1754 | a binary format. The format is specific to Python, but independent of\n\ |
| 1755 | machine architecture issues.\n\ |
| 1756 | \n\ |
| 1757 | Not all Python object types are supported; in general, only objects\n\ |
| 1758 | whose value is independent from a particular invocation of Python can be\n\ |
| 1759 | written and read by this module. The following types are supported:\n\ |
| 1760 | None, integers, floating point numbers, strings, bytes, bytearrays,\n\ |
| 1761 | tuples, lists, sets, dictionaries, and code objects, where it\n\ |
| 1762 | should be understood that tuples, lists and dictionaries are only\n\ |
| 1763 | supported as long as the values contained therein are themselves\n\ |
| 1764 | supported; and recursive lists and dictionaries should not be written\n\ |
| 1765 | (they will cause infinite loops).\n\ |
| 1766 | \n\ |
| 1767 | Variables:\n\ |
| 1768 | \n\ |
| 1769 | version -- indicates the format that the module uses. Version 0 is the\n\ |
| 1770 | historical format, version 1 shares interned strings and version 2\n\ |
| 1771 | uses a binary format for floating point numbers.\n\ |
Kristján Valur Jónsson | d7009c6 | 2013-03-19 18:02:10 -0700 | [diff] [blame] | 1772 | Version 3 shares common object references (New in version 3.4).\n\ |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1773 | \n\ |
| 1774 | Functions:\n\ |
| 1775 | \n\ |
| 1776 | dump() -- write value to a file\n\ |
| 1777 | load() -- read value from a file\n\ |
Serhiy Storchaka | c611a5b | 2017-03-12 08:53:22 +0200 | [diff] [blame] | 1778 | dumps() -- marshal value as a bytes object\n\ |
| 1779 | loads() -- read value from a bytes-like object"); |
R. David Murray | dd226ea | 2009-05-13 12:27:21 +0000 | [diff] [blame] | 1780 | |
| 1781 | |
| 1782 | |
Brett Cannon | 429ef65 | 2008-06-27 00:35:35 +0000 | [diff] [blame] | 1783 | static struct PyModuleDef marshalmodule = { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1784 | PyModuleDef_HEAD_INIT, |
| 1785 | "marshal", |
| 1786 | module_doc, |
| 1787 | 0, |
| 1788 | marshal_methods, |
| 1789 | NULL, |
| 1790 | NULL, |
| 1791 | NULL, |
| 1792 | NULL |
Martin v. Löwis | 1a21451 | 2008-06-11 05:26:20 +0000 | [diff] [blame] | 1793 | }; |
| 1794 | |
Jason Tishler | 6bc06ec | 2003-09-04 11:59:50 +0000 | [diff] [blame] | 1795 | PyMODINIT_FUNC |
Thomas Wouters | f70ef4f | 2000-07-22 18:47:25 +0000 | [diff] [blame] | 1796 | PyMarshal_Init(void) |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1797 | { |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1798 | PyObject *mod = PyModule_Create(&marshalmodule); |
| 1799 | if (mod == NULL) |
| 1800 | return NULL; |
Brandt Bucher | 33b671e | 2019-11-19 16:59:32 -0800 | [diff] [blame] | 1801 | if (PyModule_AddIntConstant(mod, "version", Py_MARSHAL_VERSION) < 0) { |
| 1802 | Py_DECREF(mod); |
| 1803 | return NULL; |
| 1804 | } |
Antoine Pitrou | f95a1b3 | 2010-05-09 15:52:27 +0000 | [diff] [blame] | 1805 | return mod; |
Guido van Rossum | dce2e3d | 1991-06-04 19:42:30 +0000 | [diff] [blame] | 1806 | } |