blob: 2667b65c6dab286012d217a145cb80417041820d [file] [log] [blame]
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001
2/* Write Python objects to files and read them back.
3 This is intended for writing and reading compiled Python code only;
4 a true persistent storage facility would be much harder, since
5 it would have to take circular links and sharing into account. */
6
Thomas Wouters695934a2006-03-01 23:49:13 +00007#define PY_SSIZE_T_CLEAN
8
Guido van Rossum79f25d91997-04-29 20:08:16 +00009#include "Python.h"
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000010#include "longintrepr.h"
Jeremy Hylton3e0055f2005-10-20 19:59:25 +000011#include "code.h"
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000012#include "marshal.h"
13
Fred Drake6da0b912000-06-28 18:47:56 +000014/* High water mark to determine when the marshalled object is dangerously deep
15 * and risks coring the interpreter. When the object stack gets this deep,
16 * raise an exception instead of continuing.
17 */
18#define MAX_MARSHAL_STACK_DEPTH 5000
19
Michael W. Hudsondf888462005-06-03 14:41:55 +000020#define TYPE_NULL '0'
21#define TYPE_NONE 'N'
22#define TYPE_FALSE 'F'
23#define TYPE_TRUE 'T'
24#define TYPE_STOPITER 'S'
25#define TYPE_ELLIPSIS '.'
26#define TYPE_INT 'i'
27#define TYPE_INT64 'I'
28#define TYPE_FLOAT 'f'
29#define TYPE_BINARY_FLOAT 'g'
30#define TYPE_COMPLEX 'x'
31#define TYPE_BINARY_COMPLEX 'y'
32#define TYPE_LONG 'l'
33#define TYPE_STRING 's'
34#define TYPE_INTERNED 't'
35#define TYPE_STRINGREF 'R'
36#define TYPE_TUPLE '('
37#define TYPE_LIST '['
38#define TYPE_DICT '{'
39#define TYPE_CODE 'c'
40#define TYPE_UNICODE 'u'
41#define TYPE_UNKNOWN '?'
42#define TYPE_SET '<'
43#define TYPE_FROZENSET '>'
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000044
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000045typedef struct {
46 FILE *fp;
Guido van Rossumf2150601996-06-26 20:41:23 +000047 int error;
Fred Drake6da0b912000-06-28 18:47:56 +000048 int depth;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000049 /* If fp == NULL, the following are valid: */
Guido van Rossum79f25d91997-04-29 20:08:16 +000050 PyObject *str;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000051 char *ptr;
52 char *end;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +000053 PyObject *strings; /* dict on marshal, list on unmarshal */
Michael W. Hudsondf888462005-06-03 14:41:55 +000054 int version;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000055} WFILE;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000056
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000057#define w_byte(c, p) if (((p)->fp)) putc((c), (p)->fp); \
58 else if ((p)->ptr != (p)->end) *(p)->ptr++ = (c); \
59 else w_more(c, p)
60
61static void
Fredrik Lundh11534382000-07-23 18:24:06 +000062w_more(int c, WFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000063{
Martin v. Löwis18e16552006-02-15 17:27:45 +000064 Py_ssize_t size, newsize;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000065 if (p->str == NULL)
66 return; /* An error already occurred */
Guido van Rossum79f25d91997-04-29 20:08:16 +000067 size = PyString_Size(p->str);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000068 newsize = size + 1024;
Guido van Rossum79f25d91997-04-29 20:08:16 +000069 if (_PyString_Resize(&p->str, newsize) != 0) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000070 p->ptr = p->end = NULL;
71 }
72 else {
Guido van Rossum79f25d91997-04-29 20:08:16 +000073 p->ptr = PyString_AS_STRING((PyStringObject *)p->str) + size;
74 p->end =
75 PyString_AS_STRING((PyStringObject *)p->str) + newsize;
Tim Peters8315ea52000-07-23 19:28:35 +000076 *p->ptr++ = Py_SAFE_DOWNCAST(c, int, char);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000077 }
78}
79
80static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +000081w_string(char *s, int n, WFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000082{
83 if (p->fp != NULL) {
84 fwrite(s, 1, n, p->fp);
85 }
86 else {
87 while (--n >= 0) {
88 w_byte(*s, p);
89 s++;
90 }
91 }
92}
93
94static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +000095w_short(int x, WFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000096{
Thomas Heller3e1c18a2002-07-30 11:40:57 +000097 w_byte((char)( x & 0xff), p);
98 w_byte((char)((x>> 8) & 0xff), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000099}
100
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000101static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000102w_long(long x, WFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000103{
Thomas Heller37d5a152002-07-30 11:44:44 +0000104 w_byte((char)( x & 0xff), p);
105 w_byte((char)((x>> 8) & 0xff), p);
106 w_byte((char)((x>>16) & 0xff), p);
107 w_byte((char)((x>>24) & 0xff), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000108}
109
Guido van Rossumc1547d91996-12-10 15:39:04 +0000110#if SIZEOF_LONG > 4
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000111static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000112w_long64(long x, WFILE *p)
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000113{
114 w_long(x, p);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000115 w_long(x>>32, p);
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000116}
Guido van Rossumc1547d91996-12-10 15:39:04 +0000117#endif
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000118
119static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000120w_object(PyObject *v, WFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000121{
Martin v. Löwis18e16552006-02-15 17:27:45 +0000122 Py_ssize_t i, n;
Fred Drake6da0b912000-06-28 18:47:56 +0000123
124 p->depth++;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000125
Fred Drake6da0b912000-06-28 18:47:56 +0000126 if (p->depth > MAX_MARSHAL_STACK_DEPTH) {
127 p->error = 2;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000128 }
Fred Drake6da0b912000-06-28 18:47:56 +0000129 else if (v == NULL) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000130 w_byte(TYPE_NULL, p);
Guido van Rossum730806d1998-04-10 22:27:42 +0000131 }
132 else if (v == Py_None) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000133 w_byte(TYPE_NONE, p);
Guido van Rossum730806d1998-04-10 22:27:42 +0000134 }
Tim Peters5ca576e2001-06-18 22:08:13 +0000135 else if (v == PyExc_StopIteration) {
136 w_byte(TYPE_STOPITER, p);
137 }
Guido van Rossum730806d1998-04-10 22:27:42 +0000138 else if (v == Py_Ellipsis) {
139 w_byte(TYPE_ELLIPSIS, p);
140 }
Guido van Rossum77f6a652002-04-03 22:41:51 +0000141 else if (v == Py_False) {
142 w_byte(TYPE_FALSE, p);
143 }
144 else if (v == Py_True) {
145 w_byte(TYPE_TRUE, p);
146 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000147 else if (PyInt_Check(v)) {
148 long x = PyInt_AS_LONG((PyIntObject *)v);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000149#if SIZEOF_LONG > 4
Tim Peters44714002001-04-10 05:02:52 +0000150 long y = Py_ARITHMETIC_RIGHT_SHIFT(long, x, 31);
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000151 if (y && y != -1) {
152 w_byte(TYPE_INT64, p);
153 w_long64(x, p);
154 }
Guido van Rossumc1547d91996-12-10 15:39:04 +0000155 else
156#endif
157 {
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000158 w_byte(TYPE_INT, p);
159 w_long(x, p);
160 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000161 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000162 else if (PyLong_Check(v)) {
163 PyLongObject *ob = (PyLongObject *)v;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000164 w_byte(TYPE_LONG, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000165 n = ob->ob_size;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000166 w_long((long)n, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000167 if (n < 0)
168 n = -n;
169 for (i = 0; i < n; i++)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000170 w_short(ob->ob_digit[i], p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000171 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000172 else if (PyFloat_Check(v)) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000173 if (p->version > 1) {
Brett Cannonc9371d42005-06-25 08:23:41 +0000174 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000175 if (_PyFloat_Pack8(PyFloat_AsDouble(v),
176 buf, 1) < 0) {
177 p->error = 1;
178 return;
179 }
180 w_byte(TYPE_BINARY_FLOAT, p);
Brett Cannonc9371d42005-06-25 08:23:41 +0000181 w_string((char*)buf, 8, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000182 }
183 else {
184 char buf[256]; /* Plenty to format any double */
185 PyFloat_AsReprString(buf, (PyFloatObject *)v);
Martin v. Löwis67baee62006-02-16 14:37:48 +0000186 n = strlen(buf);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000187 w_byte(TYPE_FLOAT, p);
Martin v. Löwis67baee62006-02-16 14:37:48 +0000188 w_byte((int)n, p);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000189 w_string(buf, (int)n, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000190 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000191 }
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000192#ifndef WITHOUT_COMPLEX
Guido van Rossum79f25d91997-04-29 20:08:16 +0000193 else if (PyComplex_Check(v)) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000194 if (p->version > 1) {
Brett Cannonc9371d42005-06-25 08:23:41 +0000195 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000196 if (_PyFloat_Pack8(PyComplex_RealAsDouble(v),
197 buf, 1) < 0) {
198 p->error = 1;
199 return;
200 }
201 w_byte(TYPE_BINARY_COMPLEX, p);
Brett Cannonc9371d42005-06-25 08:23:41 +0000202 w_string((char*)buf, 8, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000203 if (_PyFloat_Pack8(PyComplex_ImagAsDouble(v),
204 buf, 1) < 0) {
205 p->error = 1;
206 return;
207 }
Brett Cannonc9371d42005-06-25 08:23:41 +0000208 w_string((char*)buf, 8, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000209 }
210 else {
211 char buf[256]; /* Plenty to format any double */
212 PyFloatObject *temp;
213 w_byte(TYPE_COMPLEX, p);
214 temp = (PyFloatObject*)PyFloat_FromDouble(
215 PyComplex_RealAsDouble(v));
Thomas Wouters00ee7ba2006-08-21 19:07:27 +0000216 if (!temp) {
217 p->error = 1;
218 return;
219 }
Michael W. Hudsondf888462005-06-03 14:41:55 +0000220 PyFloat_AsReprString(buf, temp);
221 Py_DECREF(temp);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000222 n = strlen(buf);
223 w_byte((int)n, p);
224 w_string(buf, (int)n, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000225 temp = (PyFloatObject*)PyFloat_FromDouble(
226 PyComplex_ImagAsDouble(v));
Thomas Wouters00ee7ba2006-08-21 19:07:27 +0000227 if (!temp) {
228 p->error = 1;
229 return;
230 }
Michael W. Hudsondf888462005-06-03 14:41:55 +0000231 PyFloat_AsReprString(buf, temp);
232 Py_DECREF(temp);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000233 n = strlen(buf);
234 w_byte((int)n, p);
235 w_string(buf, (int)n, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000236 }
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000237 }
238#endif
Guido van Rossum79f25d91997-04-29 20:08:16 +0000239 else if (PyString_Check(v)) {
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000240 if (p->strings && PyString_CHECK_INTERNED(v)) {
241 PyObject *o = PyDict_GetItem(p->strings, v);
242 if (o) {
243 long w = PyInt_AsLong(o);
244 w_byte(TYPE_STRINGREF, p);
245 w_long(w, p);
246 goto exit;
247 }
248 else {
Martin v. Löwis18e16552006-02-15 17:27:45 +0000249 o = PyInt_FromSsize_t(PyDict_Size(p->strings));
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000250 PyDict_SetItem(p->strings, v, o);
251 Py_DECREF(o);
252 w_byte(TYPE_INTERNED, p);
253 }
254 }
255 else {
256 w_byte(TYPE_STRING, p);
257 }
Guido van Rossumc279b532000-03-10 23:03:02 +0000258 n = PyString_GET_SIZE(v);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000259 if (n > INT_MAX) {
260 /* huge strings are not supported */
261 p->depth--;
262 p->error = 1;
263 return;
264 }
Guido van Rossum3a205f71995-02-17 15:10:07 +0000265 w_long((long)n, p);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000266 w_string(PyString_AS_STRING(v), (int)n, p);
Guido van Rossumc279b532000-03-10 23:03:02 +0000267 }
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000268#ifdef Py_USING_UNICODE
Guido van Rossumc279b532000-03-10 23:03:02 +0000269 else if (PyUnicode_Check(v)) {
270 PyObject *utf8;
271 utf8 = PyUnicode_AsUTF8String(v);
272 if (utf8 == NULL) {
Guido van Rossum98626cd2000-06-28 23:24:19 +0000273 p->depth--;
274 p->error = 1;
275 return;
Guido van Rossumc279b532000-03-10 23:03:02 +0000276 }
277 w_byte(TYPE_UNICODE, p);
278 n = PyString_GET_SIZE(utf8);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000279 if (n > INT_MAX) {
280 p->depth--;
281 p->error = 1;
282 return;
283 }
Guido van Rossumc279b532000-03-10 23:03:02 +0000284 w_long((long)n, p);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000285 w_string(PyString_AS_STRING(utf8), (int)n, p);
Guido van Rossumc279b532000-03-10 23:03:02 +0000286 Py_DECREF(utf8);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000287 }
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000288#endif
Guido van Rossum79f25d91997-04-29 20:08:16 +0000289 else if (PyTuple_Check(v)) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000290 w_byte(TYPE_TUPLE, p);
Guido van Rossum79f25d91997-04-29 20:08:16 +0000291 n = PyTuple_Size(v);
Guido van Rossum3a205f71995-02-17 15:10:07 +0000292 w_long((long)n, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000293 for (i = 0; i < n; i++) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000294 w_object(PyTuple_GET_ITEM(v, i), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000295 }
296 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000297 else if (PyList_Check(v)) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000298 w_byte(TYPE_LIST, p);
Guido van Rossumc279b532000-03-10 23:03:02 +0000299 n = PyList_GET_SIZE(v);
Guido van Rossum3a205f71995-02-17 15:10:07 +0000300 w_long((long)n, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000301 for (i = 0; i < n; i++) {
Guido van Rossumc279b532000-03-10 23:03:02 +0000302 w_object(PyList_GET_ITEM(v, i), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000303 }
304 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000305 else if (PyDict_Check(v)) {
Martin v. Löwis18e16552006-02-15 17:27:45 +0000306 Py_ssize_t pos;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000307 PyObject *key, *value;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000308 w_byte(TYPE_DICT, p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000309 /* This one is NULL object terminated! */
Guido van Rossum25831651993-05-19 14:50:45 +0000310 pos = 0;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000311 while (PyDict_Next(v, &pos, &key, &value)) {
Guido van Rossum25831651993-05-19 14:50:45 +0000312 w_object(key, p);
313 w_object(value, p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000314 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000315 w_object((PyObject *)NULL, p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000316 }
Raymond Hettingera422c342005-01-11 03:03:27 +0000317 else if (PyAnySet_Check(v)) {
Raymond Hettingera422c342005-01-11 03:03:27 +0000318 PyObject *value, *it;
319
320 if (PyObject_TypeCheck(v, &PySet_Type))
321 w_byte(TYPE_SET, p);
322 else
323 w_byte(TYPE_FROZENSET, p);
324 n = PyObject_Size(v);
325 if (n == -1) {
326 p->depth--;
327 p->error = 1;
328 return;
329 }
330 w_long((long)n, p);
331 it = PyObject_GetIter(v);
332 if (it == NULL) {
333 p->depth--;
334 p->error = 1;
335 return;
336 }
337 while ((value = PyIter_Next(it)) != NULL) {
338 w_object(value, p);
339 Py_DECREF(value);
340 }
341 Py_DECREF(it);
342 if (PyErr_Occurred()) {
343 p->depth--;
344 p->error = 1;
345 return;
346 }
347 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000348 else if (PyCode_Check(v)) {
349 PyCodeObject *co = (PyCodeObject *)v;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000350 w_byte(TYPE_CODE, p);
Neal Norwitz7fdcb412002-06-14 01:07:39 +0000351 w_long(co->co_argcount, p);
Guido van Rossum4f72a782006-10-27 23:31:49 +0000352 w_long(co->co_kwonlyargcount, p);
Neal Norwitz7fdcb412002-06-14 01:07:39 +0000353 w_long(co->co_nlocals, p);
354 w_long(co->co_stacksize, p);
355 w_long(co->co_flags, p);
Guido van Rossumd076c731998-10-07 19:42:25 +0000356 w_object(co->co_code, p);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000357 w_object(co->co_consts, p);
358 w_object(co->co_names, p);
Guido van Rossum681d79a1995-07-18 14:51:37 +0000359 w_object(co->co_varnames, p);
Jeremy Hylton64949cb2001-01-25 20:06:59 +0000360 w_object(co->co_freevars, p);
361 w_object(co->co_cellvars, p);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000362 w_object(co->co_filename, p);
Guido van Rossum9bfef441993-03-29 10:43:31 +0000363 w_object(co->co_name, p);
Neal Norwitz7fdcb412002-06-14 01:07:39 +0000364 w_long(co->co_firstlineno, p);
Guido van Rossumd031c891997-01-24 03:44:17 +0000365 w_object(co->co_lnotab, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000366 }
Jeremy Hylton9f64caa2001-11-09 22:02:48 +0000367 else if (PyObject_CheckReadBuffer(v)) {
Guido van Rossumd076c731998-10-07 19:42:25 +0000368 /* Write unknown buffer-style objects as a string */
369 char *s;
Jeremy Hylton9f64caa2001-11-09 22:02:48 +0000370 PyBufferProcs *pb = v->ob_type->tp_as_buffer;
Guido van Rossumd076c731998-10-07 19:42:25 +0000371 w_byte(TYPE_STRING, p);
372 n = (*pb->bf_getreadbuffer)(v, 0, (void **)&s);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000373 if (n > INT_MAX) {
374 p->depth--;
375 p->error = 1;
376 return;
377 }
Guido van Rossumd076c731998-10-07 19:42:25 +0000378 w_long((long)n, p);
Martin v. Löwis725507b2006-03-07 12:08:51 +0000379 w_string(s, (int)n, p);
Guido van Rossumd076c731998-10-07 19:42:25 +0000380 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000381 else {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000382 w_byte(TYPE_UNKNOWN, p);
Guido van Rossumf2150601996-06-26 20:41:23 +0000383 p->error = 1;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000384 }
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000385 exit:
Guido van Rossum98626cd2000-06-28 23:24:19 +0000386 p->depth--;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000387}
388
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000389/* version currently has no effect for writing longs. */
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000390void
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000391PyMarshal_WriteLongToFile(long x, FILE *fp, int version)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000392{
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000393 WFILE wf;
394 wf.fp = fp;
Guido van Rossumf2150601996-06-26 20:41:23 +0000395 wf.error = 0;
Fred Drake6da0b912000-06-28 18:47:56 +0000396 wf.depth = 0;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000397 wf.strings = NULL;
Michael W. Hudsondf888462005-06-03 14:41:55 +0000398 wf.version = version;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000399 w_long(x, &wf);
400}
401
402void
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000403PyMarshal_WriteObjectToFile(PyObject *x, FILE *fp, int version)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000404{
405 WFILE wf;
406 wf.fp = fp;
Guido van Rossumf2150601996-06-26 20:41:23 +0000407 wf.error = 0;
Guido van Rossum98626cd2000-06-28 23:24:19 +0000408 wf.depth = 0;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000409 wf.strings = (version > 0) ? PyDict_New() : NULL;
Michael W. Hudsondf888462005-06-03 14:41:55 +0000410 wf.version = version;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000411 w_object(x, &wf);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000412 Py_XDECREF(wf.strings);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000413}
414
415typedef WFILE RFILE; /* Same struct with different invariants */
416
Guido van Rossum8d617a61995-03-09 12:12:11 +0000417#define rs_byte(p) (((p)->ptr != (p)->end) ? (unsigned char)*(p)->ptr++ : EOF)
418
419#define r_byte(p) ((p)->fp ? getc((p)->fp) : rs_byte(p))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000420
421static int
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000422r_string(char *s, int n, RFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000423{
424 if (p->fp != NULL)
Martin v. Löwis18e16552006-02-15 17:27:45 +0000425 /* The result fits into int because it must be <=n. */
426 return (int)fread(s, 1, n, p->fp);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000427 if (p->end - p->ptr < n)
Martin v. Löwis18e16552006-02-15 17:27:45 +0000428 n = (int)(p->end - p->ptr);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000429 memcpy(s, p->ptr, n);
430 p->ptr += n;
431 return n;
432}
433
434static int
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000435r_short(RFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000436{
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000437 register short x;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000438 x = r_byte(p);
439 x |= r_byte(p) << 8;
Tim Peterse84b7402000-09-19 08:54:13 +0000440 /* Sign-extension, in case short greater than 16 bits */
441 x |= -(x & 0x8000);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000442 return x;
443}
444
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000445static long
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000446r_long(RFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000447{
448 register long x;
Guido van Rossum8d617a61995-03-09 12:12:11 +0000449 register FILE *fp = p->fp;
450 if (fp) {
451 x = getc(fp);
452 x |= (long)getc(fp) << 8;
453 x |= (long)getc(fp) << 16;
454 x |= (long)getc(fp) << 24;
455 }
456 else {
457 x = rs_byte(p);
458 x |= (long)rs_byte(p) << 8;
459 x |= (long)rs_byte(p) << 16;
460 x |= (long)rs_byte(p) << 24;
461 }
Guido van Rossumc1547d91996-12-10 15:39:04 +0000462#if SIZEOF_LONG > 4
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000463 /* Sign extension for 64-bit machines */
Tim Peterse84b7402000-09-19 08:54:13 +0000464 x |= -(x & 0x80000000L);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000465#endif
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000466 return x;
467}
468
Tim Peters82112372001-08-29 02:28:42 +0000469/* r_long64 deals with the TYPE_INT64 code. On a machine with
470 sizeof(long) > 4, it returns a Python int object, else a Python long
471 object. Note that w_long64 writes out TYPE_INT if 32 bits is enough,
472 so there's no inefficiency here in returning a PyLong on 32-bit boxes
473 for everything written via TYPE_INT64 (i.e., if an int is written via
474 TYPE_INT64, it *needs* more than 32 bits).
475*/
476static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000477r_long64(RFILE *p)
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000478{
Tim Peters82112372001-08-29 02:28:42 +0000479 long lo4 = r_long(p);
480 long hi4 = r_long(p);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000481#if SIZEOF_LONG > 4
Tim Peters82112372001-08-29 02:28:42 +0000482 long x = (hi4 << 32) | (lo4 & 0xFFFFFFFFL);
483 return PyInt_FromLong(x);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000484#else
Tim Peters82112372001-08-29 02:28:42 +0000485 unsigned char buf[8];
486 int one = 1;
487 int is_little_endian = (int)*(char*)&one;
488 if (is_little_endian) {
489 memcpy(buf, &lo4, 4);
490 memcpy(buf+4, &hi4, 4);
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000491 }
Tim Peters82112372001-08-29 02:28:42 +0000492 else {
493 memcpy(buf, &hi4, 4);
494 memcpy(buf+4, &lo4, 4);
495 }
496 return _PyLong_FromByteArray(buf, 8, is_little_endian, 1);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000497#endif
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000498}
499
Guido van Rossum79f25d91997-04-29 20:08:16 +0000500static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000501r_object(RFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000502{
Armin Rigo01ab2792004-03-26 15:09:27 +0000503 /* NULL is a valid return value, it does not necessarily means that
504 an exception is set. */
Raymond Hettingera422c342005-01-11 03:03:27 +0000505 PyObject *v, *v2, *v3;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000506 long i, n;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000507 int type = r_byte(p);
Tim Petersd9b9ac82001-01-28 00:27:39 +0000508
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000509 switch (type) {
Tim Petersd9b9ac82001-01-28 00:27:39 +0000510
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000511 case EOF:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000512 PyErr_SetString(PyExc_EOFError,
513 "EOF read where object expected");
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000514 return NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000515
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000516 case TYPE_NULL:
517 return NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000518
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000519 case TYPE_NONE:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000520 Py_INCREF(Py_None);
521 return Py_None;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000522
Tim Peters5ca576e2001-06-18 22:08:13 +0000523 case TYPE_STOPITER:
524 Py_INCREF(PyExc_StopIteration);
525 return PyExc_StopIteration;
526
Guido van Rossume449af71996-10-11 16:25:41 +0000527 case TYPE_ELLIPSIS:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000528 Py_INCREF(Py_Ellipsis);
Guido van Rossume449af71996-10-11 16:25:41 +0000529 return Py_Ellipsis;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000530
Guido van Rossum77f6a652002-04-03 22:41:51 +0000531 case TYPE_FALSE:
532 Py_INCREF(Py_False);
533 return Py_False;
534
535 case TYPE_TRUE:
536 Py_INCREF(Py_True);
537 return Py_True;
538
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000539 case TYPE_INT:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000540 return PyInt_FromLong(r_long(p));
Tim Petersd9b9ac82001-01-28 00:27:39 +0000541
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000542 case TYPE_INT64:
Tim Peters82112372001-08-29 02:28:42 +0000543 return r_long64(p);
Tim Petersd9b9ac82001-01-28 00:27:39 +0000544
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000545 case TYPE_LONG:
546 {
547 int size;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000548 PyLongObject *ob;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000549 n = r_long(p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000550 size = n<0 ? -n : n;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000551 ob = _PyLong_New(size);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000552 if (ob == NULL)
553 return NULL;
554 ob->ob_size = n;
Armin Rigo01ab2792004-03-26 15:09:27 +0000555 for (i = 0; i < size; i++) {
556 int digit = r_short(p);
557 if (digit < 0) {
558 Py_DECREF(ob);
559 PyErr_SetString(PyExc_ValueError,
560 "bad marshal data");
561 return NULL;
562 }
563 ob->ob_digit[i] = digit;
564 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000565 return (PyObject *)ob;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000566 }
Tim Petersd9b9ac82001-01-28 00:27:39 +0000567
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000568 case TYPE_FLOAT:
569 {
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000570 char buf[256];
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000571 double dx;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000572 n = r_byte(p);
Armin Rigo01ab2792004-03-26 15:09:27 +0000573 if (n == EOF || r_string(buf, (int)n, p) != n) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000574 PyErr_SetString(PyExc_EOFError,
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000575 "EOF read where object expected");
576 return NULL;
577 }
578 buf[n] = '\0';
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000579 PyFPE_START_PROTECT("atof", return 0)
Martin v. Löwis737ea822004-06-08 18:52:54 +0000580 dx = PyOS_ascii_atof(buf);
Guido van Rossum45b83911997-03-14 04:32:50 +0000581 PyFPE_END_PROTECT(dx)
Guido van Rossum79f25d91997-04-29 20:08:16 +0000582 return PyFloat_FromDouble(dx);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000583 }
Tim Petersd9b9ac82001-01-28 00:27:39 +0000584
Michael W. Hudsondf888462005-06-03 14:41:55 +0000585 case TYPE_BINARY_FLOAT:
586 {
Brett Cannonc9371d42005-06-25 08:23:41 +0000587 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000588 double x;
Brett Cannonc9371d42005-06-25 08:23:41 +0000589 if (r_string((char*)buf, 8, p) != 8) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000590 PyErr_SetString(PyExc_EOFError,
591 "EOF read where object expected");
592 return NULL;
593 }
594 x = _PyFloat_Unpack8(buf, 1);
595 if (x == -1.0 && PyErr_Occurred()) {
596 return NULL;
597 }
598 return PyFloat_FromDouble(x);
599 }
600
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000601#ifndef WITHOUT_COMPLEX
602 case TYPE_COMPLEX:
603 {
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000604 char buf[256];
Guido van Rossum530956d1996-07-21 02:27:43 +0000605 Py_complex c;
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000606 n = r_byte(p);
Armin Rigo01ab2792004-03-26 15:09:27 +0000607 if (n == EOF || r_string(buf, (int)n, p) != n) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000608 PyErr_SetString(PyExc_EOFError,
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000609 "EOF read where object expected");
610 return NULL;
611 }
612 buf[n] = '\0';
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000613 PyFPE_START_PROTECT("atof", return 0)
Martin v. Löwis737ea822004-06-08 18:52:54 +0000614 c.real = PyOS_ascii_atof(buf);
Guido van Rossum45b83911997-03-14 04:32:50 +0000615 PyFPE_END_PROTECT(c)
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000616 n = r_byte(p);
Armin Rigo01ab2792004-03-26 15:09:27 +0000617 if (n == EOF || r_string(buf, (int)n, p) != n) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000618 PyErr_SetString(PyExc_EOFError,
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000619 "EOF read where object expected");
620 return NULL;
621 }
622 buf[n] = '\0';
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000623 PyFPE_START_PROTECT("atof", return 0)
Martin v. Löwis737ea822004-06-08 18:52:54 +0000624 c.imag = PyOS_ascii_atof(buf);
Guido van Rossum45b83911997-03-14 04:32:50 +0000625 PyFPE_END_PROTECT(c)
Guido van Rossum79f25d91997-04-29 20:08:16 +0000626 return PyComplex_FromCComplex(c);
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000627 }
Michael W. Hudsondf888462005-06-03 14:41:55 +0000628
629 case TYPE_BINARY_COMPLEX:
630 {
Brett Cannonc9371d42005-06-25 08:23:41 +0000631 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000632 Py_complex c;
Brett Cannonc9371d42005-06-25 08:23:41 +0000633 if (r_string((char*)buf, 8, p) != 8) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000634 PyErr_SetString(PyExc_EOFError,
635 "EOF read where object expected");
636 return NULL;
637 }
638 c.real = _PyFloat_Unpack8(buf, 1);
639 if (c.real == -1.0 && PyErr_Occurred()) {
640 return NULL;
641 }
Brett Cannonc9371d42005-06-25 08:23:41 +0000642 if (r_string((char*)buf, 8, p) != 8) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000643 PyErr_SetString(PyExc_EOFError,
644 "EOF read where object expected");
645 return NULL;
646 }
647 c.imag = _PyFloat_Unpack8(buf, 1);
648 if (c.imag == -1.0 && PyErr_Occurred()) {
649 return NULL;
650 }
651 return PyComplex_FromCComplex(c);
652 }
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000653#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000654
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000655 case TYPE_INTERNED:
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000656 case TYPE_STRING:
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000657 n = r_long(p);
Guido van Rossuma45cb451998-06-08 20:27:29 +0000658 if (n < 0) {
659 PyErr_SetString(PyExc_ValueError, "bad marshal data");
660 return NULL;
661 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000662 v = PyString_FromStringAndSize((char *)NULL, n);
Michael W. Hudson6d6917b2005-06-03 15:17:16 +0000663 if (v == NULL)
664 return v;
665 if (r_string(PyString_AS_STRING(v), (int)n, p) != n) {
666 Py_DECREF(v);
667 PyErr_SetString(PyExc_EOFError,
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000668 "EOF read where object expected");
Michael W. Hudson6d6917b2005-06-03 15:17:16 +0000669 return NULL;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000670 }
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000671 if (type == TYPE_INTERNED) {
672 PyString_InternInPlace(&v);
673 PyList_Append(p->strings, v);
674 }
675 return v;
676
677 case TYPE_STRINGREF:
678 n = r_long(p);
Michael W. Hudsonf2ca5af2005-06-13 18:28:46 +0000679 if (n < 0 || n >= PyList_GET_SIZE(p->strings)) {
680 PyErr_SetString(PyExc_ValueError, "bad marshal data");
681 return NULL;
682 }
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000683 v = PyList_GET_ITEM(p->strings, n);
684 Py_INCREF(v);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000685 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000686
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000687#ifdef Py_USING_UNICODE
Guido van Rossumc279b532000-03-10 23:03:02 +0000688 case TYPE_UNICODE:
689 {
690 char *buffer;
691
692 n = r_long(p);
693 if (n < 0) {
694 PyErr_SetString(PyExc_ValueError, "bad marshal data");
695 return NULL;
696 }
Guido van Rossumb18618d2000-05-03 23:44:39 +0000697 buffer = PyMem_NEW(char, n);
Guido van Rossumc279b532000-03-10 23:03:02 +0000698 if (buffer == NULL)
Guido van Rossumb18618d2000-05-03 23:44:39 +0000699 return PyErr_NoMemory();
Guido van Rossumc279b532000-03-10 23:03:02 +0000700 if (r_string(buffer, (int)n, p) != n) {
Guido van Rossumb18618d2000-05-03 23:44:39 +0000701 PyMem_DEL(buffer);
Guido van Rossumc279b532000-03-10 23:03:02 +0000702 PyErr_SetString(PyExc_EOFError,
703 "EOF read where object expected");
704 return NULL;
705 }
706 v = PyUnicode_DecodeUTF8(buffer, n, NULL);
Guido van Rossumb18618d2000-05-03 23:44:39 +0000707 PyMem_DEL(buffer);
Guido van Rossumc279b532000-03-10 23:03:02 +0000708 return v;
709 }
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000710#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000711
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000712 case TYPE_TUPLE:
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000713 n = r_long(p);
Guido van Rossuma45cb451998-06-08 20:27:29 +0000714 if (n < 0) {
715 PyErr_SetString(PyExc_ValueError, "bad marshal data");
716 return NULL;
717 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000718 v = PyTuple_New((int)n);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000719 if (v == NULL)
720 return v;
Jack Jansen9513f2c1995-10-27 13:21:28 +0000721 for (i = 0; i < n; i++) {
722 v2 = r_object(p);
723 if ( v2 == NULL ) {
Armin Rigo01ab2792004-03-26 15:09:27 +0000724 if (!PyErr_Occurred())
725 PyErr_SetString(PyExc_TypeError,
726 "NULL object in marshal data");
Guido van Rossum79f25d91997-04-29 20:08:16 +0000727 Py_DECREF(v);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000728 v = NULL;
729 break;
730 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000731 PyTuple_SET_ITEM(v, (int)i, v2);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000732 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000733 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000734
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000735 case TYPE_LIST:
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000736 n = r_long(p);
Guido van Rossuma45cb451998-06-08 20:27:29 +0000737 if (n < 0) {
738 PyErr_SetString(PyExc_ValueError, "bad marshal data");
739 return NULL;
740 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000741 v = PyList_New((int)n);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000742 if (v == NULL)
743 return v;
Jack Jansen9513f2c1995-10-27 13:21:28 +0000744 for (i = 0; i < n; i++) {
745 v2 = r_object(p);
746 if ( v2 == NULL ) {
Armin Rigo01ab2792004-03-26 15:09:27 +0000747 if (!PyErr_Occurred())
748 PyErr_SetString(PyExc_TypeError,
749 "NULL object in marshal data");
Guido van Rossum79f25d91997-04-29 20:08:16 +0000750 Py_DECREF(v);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000751 v = NULL;
752 break;
753 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000754 PyList_SetItem(v, (int)i, v2);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000755 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000756 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000757
Guido van Rossum64b45521991-06-07 13:58:22 +0000758 case TYPE_DICT:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000759 v = PyDict_New();
Guido van Rossum64b45521991-06-07 13:58:22 +0000760 if (v == NULL)
761 return NULL;
762 for (;;) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000763 PyObject *key, *val;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000764 key = r_object(p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000765 if (key == NULL)
Armin Rigo01ab2792004-03-26 15:09:27 +0000766 break;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000767 val = r_object(p);
Guido van Rossumf2150601996-06-26 20:41:23 +0000768 if (val != NULL)
Guido van Rossum79f25d91997-04-29 20:08:16 +0000769 PyDict_SetItem(v, key, val);
770 Py_DECREF(key);
771 Py_XDECREF(val);
Guido van Rossum64b45521991-06-07 13:58:22 +0000772 }
Armin Rigo01ab2792004-03-26 15:09:27 +0000773 if (PyErr_Occurred()) {
774 Py_DECREF(v);
775 v = NULL;
776 }
Guido van Rossum64b45521991-06-07 13:58:22 +0000777 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000778
Raymond Hettingera422c342005-01-11 03:03:27 +0000779 case TYPE_SET:
780 case TYPE_FROZENSET:
781 n = r_long(p);
782 if (n < 0) {
783 PyErr_SetString(PyExc_ValueError, "bad marshal data");
784 return NULL;
785 }
786 v = PyTuple_New((int)n);
787 if (v == NULL)
788 return v;
789 for (i = 0; i < n; i++) {
790 v2 = r_object(p);
791 if ( v2 == NULL ) {
792 if (!PyErr_Occurred())
793 PyErr_SetString(PyExc_TypeError,
794 "NULL object in marshal data");
795 Py_DECREF(v);
796 v = NULL;
797 break;
798 }
799 PyTuple_SET_ITEM(v, (int)i, v2);
800 }
Michael W. Hudson6d6917b2005-06-03 15:17:16 +0000801 if (v == NULL)
802 return v;
Raymond Hettingera422c342005-01-11 03:03:27 +0000803 if (type == TYPE_SET)
Raymond Hettingerbeb31012005-08-16 03:47:52 +0000804 v3 = PySet_New(v);
Raymond Hettingera422c342005-01-11 03:03:27 +0000805 else
Raymond Hettingerbeb31012005-08-16 03:47:52 +0000806 v3 = PyFrozenSet_New(v);
Raymond Hettingera422c342005-01-11 03:03:27 +0000807 Py_DECREF(v);
808 return v3;
809
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000810 case TYPE_CODE:
Michael W. Hudson80199132001-08-30 14:50:20 +0000811 if (PyEval_GetRestricted()) {
812 PyErr_SetString(PyExc_RuntimeError,
813 "cannot unmarshal code objects in "
814 "restricted execution mode");
815 return NULL;
816 }
817 else {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000818 int argcount;
Guido van Rossum4f72a782006-10-27 23:31:49 +0000819 int kwonlyargcount;
Michael W. Hudsondf888462005-06-03 14:41:55 +0000820 int nlocals;
821 int stacksize;
822 int flags;
823 PyObject *code = NULL;
824 PyObject *consts = NULL;
825 PyObject *names = NULL;
826 PyObject *varnames = NULL;
827 PyObject *freevars = NULL;
828 PyObject *cellvars = NULL;
829 PyObject *filename = NULL;
830 PyObject *name = NULL;
831 int firstlineno;
832 PyObject *lnotab = NULL;
833
834 v = NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000835
Michael W. Hudsondf888462005-06-03 14:41:55 +0000836 argcount = r_long(p);
Guido van Rossum4f72a782006-10-27 23:31:49 +0000837 kwonlyargcount = r_long(p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000838 nlocals = r_long(p);
839 stacksize = r_long(p);
840 flags = r_long(p);
841 code = r_object(p);
842 if (code == NULL)
843 goto code_error;
844 consts = r_object(p);
845 if (consts == NULL)
846 goto code_error;
847 names = r_object(p);
848 if (names == NULL)
849 goto code_error;
850 varnames = r_object(p);
851 if (varnames == NULL)
852 goto code_error;
853 freevars = r_object(p);
854 if (freevars == NULL)
855 goto code_error;
856 cellvars = r_object(p);
857 if (cellvars == NULL)
858 goto code_error;
859 filename = r_object(p);
860 if (filename == NULL)
861 goto code_error;
862 name = r_object(p);
863 if (name == NULL)
864 goto code_error;
865 firstlineno = r_long(p);
866 lnotab = r_object(p);
867 if (lnotab == NULL)
868 goto code_error;
869
870 v = (PyObject *) PyCode_New(
Guido van Rossum4f72a782006-10-27 23:31:49 +0000871 argcount, kwonlyargcount,
872 nlocals, stacksize, flags,
Guido van Rossum681d79a1995-07-18 14:51:37 +0000873 code, consts, names, varnames,
Tim Petersd9b9ac82001-01-28 00:27:39 +0000874 freevars, cellvars, filename, name,
875 firstlineno, lnotab);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000876
877 code_error:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000878 Py_XDECREF(code);
879 Py_XDECREF(consts);
880 Py_XDECREF(names);
881 Py_XDECREF(varnames);
Jeremy Hylton64949cb2001-01-25 20:06:59 +0000882 Py_XDECREF(freevars);
883 Py_XDECREF(cellvars);
Guido van Rossum79f25d91997-04-29 20:08:16 +0000884 Py_XDECREF(filename);
885 Py_XDECREF(name);
Guido van Rossum6fc06e71997-07-26 23:30:18 +0000886 Py_XDECREF(lnotab);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000887
888 }
889 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000890
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000891 default:
Guido van Rossumf2150601996-06-26 20:41:23 +0000892 /* Bogus data got written, which isn't ideal.
893 This will let you keep working and recover. */
Guido van Rossuma45cb451998-06-08 20:27:29 +0000894 PyErr_SetString(PyExc_ValueError, "bad marshal data");
895 return NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000896
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000897 }
898}
899
Neal Norwitzd85c4522004-06-13 20:31:49 +0000900static PyObject *
Armin Rigo01ab2792004-03-26 15:09:27 +0000901read_object(RFILE *p)
902{
903 PyObject *v;
904 if (PyErr_Occurred()) {
905 fprintf(stderr, "XXX readobject called with exception set\n");
906 return NULL;
907 }
908 v = r_object(p);
909 if (v == NULL && !PyErr_Occurred())
910 PyErr_SetString(PyExc_TypeError, "NULL object in marshal data");
911 return v;
912}
913
Guido van Rossumb8cf3e62001-10-19 01:46:21 +0000914int
915PyMarshal_ReadShortFromFile(FILE *fp)
916{
917 RFILE rf;
Thomas Wouters7f401ef2006-03-01 22:30:47 +0000918 assert(fp);
Guido van Rossumb8cf3e62001-10-19 01:46:21 +0000919 rf.fp = fp;
Thomas Wouters7464b432006-03-01 22:34:09 +0000920 rf.strings = NULL;
921 rf.end = rf.ptr = NULL;
Guido van Rossumb8cf3e62001-10-19 01:46:21 +0000922 return r_short(&rf);
923}
924
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000925long
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000926PyMarshal_ReadLongFromFile(FILE *fp)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000927{
928 RFILE rf;
929 rf.fp = fp;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000930 rf.strings = NULL;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000931 return r_long(&rf);
932}
933
Tim Peters691e0e92001-01-18 04:39:16 +0000934#ifdef HAVE_FSTAT
935/* Return size of file in bytes; < 0 if unknown. */
936static off_t
937getfilesize(FILE *fp)
938{
939 struct stat st;
940 if (fstat(fileno(fp), &st) != 0)
941 return -1;
942 else
943 return st.st_size;
944}
945#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000946
Tim Peters691e0e92001-01-18 04:39:16 +0000947/* If we can get the size of the file up-front, and it's reasonably small,
948 * read it in one gulp and delegate to ...FromString() instead. Much quicker
949 * than reading a byte at a time from file; speeds .pyc imports.
Tim Petersd9b9ac82001-01-28 00:27:39 +0000950 * CAUTION: since this may read the entire remainder of the file, don't
951 * call it unless you know you're done with the file.
Tim Peters691e0e92001-01-18 04:39:16 +0000952 */
Guido van Rossum79f25d91997-04-29 20:08:16 +0000953PyObject *
Tim Petersd9b9ac82001-01-28 00:27:39 +0000954PyMarshal_ReadLastObjectFromFile(FILE *fp)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000955{
Tim Peters691e0e92001-01-18 04:39:16 +0000956/* 75% of 2.1's .pyc files can exploit SMALL_FILE_LIMIT.
957 * REASONABLE_FILE_LIMIT is by defn something big enough for Tkinter.pyc.
958 */
959#define SMALL_FILE_LIMIT (1L << 14)
960#define REASONABLE_FILE_LIMIT (1L << 18)
Tim Peters691e0e92001-01-18 04:39:16 +0000961#ifdef HAVE_FSTAT
962 off_t filesize;
963#endif
Tim Peters691e0e92001-01-18 04:39:16 +0000964#ifdef HAVE_FSTAT
965 filesize = getfilesize(fp);
966 if (filesize > 0) {
967 char buf[SMALL_FILE_LIMIT];
968 char* pBuf = NULL;
969 if (filesize <= SMALL_FILE_LIMIT)
970 pBuf = buf;
971 else if (filesize <= REASONABLE_FILE_LIMIT)
972 pBuf = (char *)PyMem_MALLOC(filesize);
973 if (pBuf != NULL) {
974 PyObject* v;
Martin v. Löwis18e16552006-02-15 17:27:45 +0000975 size_t n;
976 /* filesize must fit into an int, because it
977 is smaller than REASONABLE_FILE_LIMIT */
978 n = fread(pBuf, 1, (int)filesize, fp);
Tim Peters691e0e92001-01-18 04:39:16 +0000979 v = PyMarshal_ReadObjectFromString(pBuf, n);
980 if (pBuf != buf)
981 PyMem_FREE(pBuf);
982 return v;
983 }
Tim Petersd9b9ac82001-01-28 00:27:39 +0000984
Tim Peters691e0e92001-01-18 04:39:16 +0000985 }
986#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000987 /* We don't have fstat, or we do but the file is larger than
988 * REASONABLE_FILE_LIMIT or malloc failed -- read a byte at a time.
989 */
990 return PyMarshal_ReadObjectFromFile(fp);
991
Tim Peters691e0e92001-01-18 04:39:16 +0000992#undef SMALL_FILE_LIMIT
993#undef REASONABLE_FILE_LIMIT
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000994}
995
Guido van Rossum79f25d91997-04-29 20:08:16 +0000996PyObject *
Tim Petersd9b9ac82001-01-28 00:27:39 +0000997PyMarshal_ReadObjectFromFile(FILE *fp)
998{
999 RFILE rf;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001000 PyObject *result;
Tim Petersd9b9ac82001-01-28 00:27:39 +00001001 rf.fp = fp;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001002 rf.strings = PyList_New(0);
1003 result = r_object(&rf);
1004 Py_DECREF(rf.strings);
1005 return result;
Tim Petersd9b9ac82001-01-28 00:27:39 +00001006}
1007
1008PyObject *
Martin v. Löwis18e16552006-02-15 17:27:45 +00001009PyMarshal_ReadObjectFromString(char *str, Py_ssize_t len)
Guido van Rossumf56e3db1993-04-01 20:59:32 +00001010{
1011 RFILE rf;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001012 PyObject *result;
Guido van Rossumf56e3db1993-04-01 20:59:32 +00001013 rf.fp = NULL;
Guido van Rossumf56e3db1993-04-01 20:59:32 +00001014 rf.ptr = str;
1015 rf.end = str + len;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001016 rf.strings = PyList_New(0);
1017 result = r_object(&rf);
1018 Py_DECREF(rf.strings);
1019 return result;
Guido van Rossumf56e3db1993-04-01 20:59:32 +00001020}
1021
Guido van Rossum79f25d91997-04-29 20:08:16 +00001022PyObject *
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001023PyMarshal_WriteObjectToString(PyObject *x, int version)
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001024{
1025 WFILE wf;
1026 wf.fp = NULL;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001027 wf.str = PyString_FromStringAndSize((char *)NULL, 50);
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001028 if (wf.str == NULL)
1029 return NULL;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001030 wf.ptr = PyString_AS_STRING((PyStringObject *)wf.str);
1031 wf.end = wf.ptr + PyString_Size(wf.str);
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001032 wf.error = 0;
Fred Drake6da0b912000-06-28 18:47:56 +00001033 wf.depth = 0;
Michael W. Hudsondf888462005-06-03 14:41:55 +00001034 wf.version = version;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001035 wf.strings = (version > 0) ? PyDict_New() : NULL;
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001036 w_object(x, &wf);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001037 Py_XDECREF(wf.strings);
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001038 if (wf.str != NULL)
Guido van Rossum79f25d91997-04-29 20:08:16 +00001039 _PyString_Resize(&wf.str,
1040 (int) (wf.ptr -
1041 PyString_AS_STRING((PyStringObject *)wf.str)));
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001042 if (wf.error) {
Guido van Rossum79f25d91997-04-29 20:08:16 +00001043 Py_XDECREF(wf.str);
Tim Petersd9b9ac82001-01-28 00:27:39 +00001044 PyErr_SetString(PyExc_ValueError,
Fred Drake6da0b912000-06-28 18:47:56 +00001045 (wf.error==1)?"unmarshallable object"
1046 :"object too deeply nested to marshal");
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001047 return NULL;
1048 }
1049 return wf.str;
1050}
1051
Guido van Rossum64b45521991-06-07 13:58:22 +00001052/* And an interface for Python programs... */
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001053
Guido van Rossum79f25d91997-04-29 20:08:16 +00001054static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001055marshal_dump(PyObject *self, PyObject *args)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001056{
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001057 WFILE wf;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001058 PyObject *x;
1059 PyObject *f;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001060 int version = Py_MARSHAL_VERSION;
1061 if (!PyArg_ParseTuple(args, "OO|i:dump", &x, &f, &version))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001062 return NULL;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001063 if (!PyFile_Check(f)) {
1064 PyErr_SetString(PyExc_TypeError,
1065 "marshal.dump() 2nd arg must be file");
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001066 return NULL;
1067 }
Guido van Rossum79f25d91997-04-29 20:08:16 +00001068 wf.fp = PyFile_AsFile(f);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001069 wf.str = NULL;
1070 wf.ptr = wf.end = NULL;
Guido van Rossumf2150601996-06-26 20:41:23 +00001071 wf.error = 0;
Fred Drake6da0b912000-06-28 18:47:56 +00001072 wf.depth = 0;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001073 wf.strings = (version > 0) ? PyDict_New() : 0;
Neal Norwitzef785292005-11-16 05:04:51 +00001074 wf.version = version;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001075 w_object(x, &wf);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001076 Py_XDECREF(wf.strings);
Guido van Rossumf2150601996-06-26 20:41:23 +00001077 if (wf.error) {
Tim Petersd9b9ac82001-01-28 00:27:39 +00001078 PyErr_SetString(PyExc_ValueError,
Fred Drake6da0b912000-06-28 18:47:56 +00001079 (wf.error==1)?"unmarshallable object"
1080 :"object too deeply nested to marshal");
Guido van Rossumf2150601996-06-26 20:41:23 +00001081 return NULL;
1082 }
Guido van Rossum79f25d91997-04-29 20:08:16 +00001083 Py_INCREF(Py_None);
1084 return Py_None;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001085}
1086
Guido van Rossum79f25d91997-04-29 20:08:16 +00001087static PyObject *
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001088marshal_load(PyObject *self, PyObject *f)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001089{
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001090 RFILE rf;
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001091 PyObject *result;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001092 if (!PyFile_Check(f)) {
1093 PyErr_SetString(PyExc_TypeError,
1094 "marshal.load() arg must be file");
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001095 return NULL;
1096 }
Guido van Rossum79f25d91997-04-29 20:08:16 +00001097 rf.fp = PyFile_AsFile(f);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001098 rf.strings = PyList_New(0);
1099 result = read_object(&rf);
1100 Py_DECREF(rf.strings);
1101 return result;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001102}
1103
Guido van Rossum79f25d91997-04-29 20:08:16 +00001104static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001105marshal_dumps(PyObject *self, PyObject *args)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001106{
Guido van Rossum79f25d91997-04-29 20:08:16 +00001107 PyObject *x;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001108 int version = Py_MARSHAL_VERSION;
Armin Rigo2ccea172004-12-20 12:25:57 +00001109 if (!PyArg_ParseTuple(args, "O|i:dumps", &x, &version))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001110 return NULL;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001111 return PyMarshal_WriteObjectToString(x, version);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001112}
1113
Guido van Rossum79f25d91997-04-29 20:08:16 +00001114static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001115marshal_loads(PyObject *self, PyObject *args)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001116{
1117 RFILE rf;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001118 char *s;
Thomas Wouters695934a2006-03-01 23:49:13 +00001119 Py_ssize_t n;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001120 PyObject* result;
Michael W. Hudson01fca112005-06-13 17:50:18 +00001121 if (!PyArg_ParseTuple(args, "s#:loads", &s, &n))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001122 return NULL;
1123 rf.fp = NULL;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001124 rf.ptr = s;
1125 rf.end = s + n;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001126 rf.strings = PyList_New(0);
1127 result = read_object(&rf);
1128 Py_DECREF(rf.strings);
1129 return result;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001130}
1131
Guido van Rossum79f25d91997-04-29 20:08:16 +00001132static PyMethodDef marshal_methods[] = {
Neal Norwitz031829d2002-03-31 14:37:44 +00001133 {"dump", marshal_dump, METH_VARARGS},
Thomas Wouters4d70c3d2006-06-08 14:42:34 +00001134 {"load", marshal_load, METH_O},
Neal Norwitz031829d2002-03-31 14:37:44 +00001135 {"dumps", marshal_dumps, METH_VARARGS},
1136 {"loads", marshal_loads, METH_VARARGS},
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001137 {NULL, NULL} /* sentinel */
1138};
1139
Jason Tishler6bc06ec2003-09-04 11:59:50 +00001140PyMODINIT_FUNC
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001141PyMarshal_Init(void)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001142{
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001143 PyObject *mod = Py_InitModule("marshal", marshal_methods);
Neal Norwitz1ac754f2006-01-19 06:09:39 +00001144 if (mod == NULL)
1145 return;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001146 PyModule_AddIntConstant(mod, "version", Py_MARSHAL_VERSION);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001147}