blob: 4114c8edc3fb289cebeb04645c2f34d78f063451 [file] [log] [blame]
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001
2/* Write Python objects to files and read them back.
3 This is intended for writing and reading compiled Python code only;
4 a true persistent storage facility would be much harder, since
5 it would have to take circular links and sharing into account. */
6
Guido van Rossum79f25d91997-04-29 20:08:16 +00007#include "Python.h"
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00008#include "longintrepr.h"
Jeremy Hylton3e0055f2005-10-20 19:59:25 +00009#include "code.h"
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000010#include "compile.h"
11#include "marshal.h"
12
Fred Drake6da0b912000-06-28 18:47:56 +000013/* High water mark to determine when the marshalled object is dangerously deep
14 * and risks coring the interpreter. When the object stack gets this deep,
15 * raise an exception instead of continuing.
16 */
17#define MAX_MARSHAL_STACK_DEPTH 5000
18
Michael W. Hudsondf888462005-06-03 14:41:55 +000019#define TYPE_NULL '0'
20#define TYPE_NONE 'N'
21#define TYPE_FALSE 'F'
22#define TYPE_TRUE 'T'
23#define TYPE_STOPITER 'S'
24#define TYPE_ELLIPSIS '.'
25#define TYPE_INT 'i'
26#define TYPE_INT64 'I'
27#define TYPE_FLOAT 'f'
28#define TYPE_BINARY_FLOAT 'g'
29#define TYPE_COMPLEX 'x'
30#define TYPE_BINARY_COMPLEX 'y'
31#define TYPE_LONG 'l'
32#define TYPE_STRING 's'
33#define TYPE_INTERNED 't'
34#define TYPE_STRINGREF 'R'
35#define TYPE_TUPLE '('
36#define TYPE_LIST '['
37#define TYPE_DICT '{'
38#define TYPE_CODE 'c'
39#define TYPE_UNICODE 'u'
40#define TYPE_UNKNOWN '?'
41#define TYPE_SET '<'
42#define TYPE_FROZENSET '>'
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000043
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000044typedef struct {
45 FILE *fp;
Guido van Rossumf2150601996-06-26 20:41:23 +000046 int error;
Fred Drake6da0b912000-06-28 18:47:56 +000047 int depth;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000048 /* If fp == NULL, the following are valid: */
Guido van Rossum79f25d91997-04-29 20:08:16 +000049 PyObject *str;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000050 char *ptr;
51 char *end;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +000052 PyObject *strings; /* dict on marshal, list on unmarshal */
Michael W. Hudsondf888462005-06-03 14:41:55 +000053 int version;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000054} WFILE;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000055
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000056#define w_byte(c, p) if (((p)->fp)) putc((c), (p)->fp); \
57 else if ((p)->ptr != (p)->end) *(p)->ptr++ = (c); \
58 else w_more(c, p)
59
60static void
Fredrik Lundh11534382000-07-23 18:24:06 +000061w_more(int c, WFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000062{
63 int size, newsize;
64 if (p->str == NULL)
65 return; /* An error already occurred */
Guido van Rossum79f25d91997-04-29 20:08:16 +000066 size = PyString_Size(p->str);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000067 newsize = size + 1024;
Guido van Rossum79f25d91997-04-29 20:08:16 +000068 if (_PyString_Resize(&p->str, newsize) != 0) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000069 p->ptr = p->end = NULL;
70 }
71 else {
Guido van Rossum79f25d91997-04-29 20:08:16 +000072 p->ptr = PyString_AS_STRING((PyStringObject *)p->str) + size;
73 p->end =
74 PyString_AS_STRING((PyStringObject *)p->str) + newsize;
Tim Peters8315ea52000-07-23 19:28:35 +000075 *p->ptr++ = Py_SAFE_DOWNCAST(c, int, char);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000076 }
77}
78
79static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +000080w_string(char *s, int n, WFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +000081{
82 if (p->fp != NULL) {
83 fwrite(s, 1, n, p->fp);
84 }
85 else {
86 while (--n >= 0) {
87 w_byte(*s, p);
88 s++;
89 }
90 }
91}
92
93static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +000094w_short(int x, WFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000095{
Thomas Heller3e1c18a2002-07-30 11:40:57 +000096 w_byte((char)( x & 0xff), p);
97 w_byte((char)((x>> 8) & 0xff), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +000098}
99
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000100static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000101w_long(long x, WFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000102{
Thomas Heller37d5a152002-07-30 11:44:44 +0000103 w_byte((char)( x & 0xff), p);
104 w_byte((char)((x>> 8) & 0xff), p);
105 w_byte((char)((x>>16) & 0xff), p);
106 w_byte((char)((x>>24) & 0xff), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000107}
108
Guido van Rossumc1547d91996-12-10 15:39:04 +0000109#if SIZEOF_LONG > 4
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000110static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000111w_long64(long x, WFILE *p)
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000112{
113 w_long(x, p);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000114 w_long(x>>32, p);
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000115}
Guido van Rossumc1547d91996-12-10 15:39:04 +0000116#endif
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000117
118static void
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000119w_object(PyObject *v, WFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000120{
Guido van Rossum3a205f71995-02-17 15:10:07 +0000121 int i, n;
Fred Drake6da0b912000-06-28 18:47:56 +0000122
123 p->depth++;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000124
Fred Drake6da0b912000-06-28 18:47:56 +0000125 if (p->depth > MAX_MARSHAL_STACK_DEPTH) {
126 p->error = 2;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000127 }
Fred Drake6da0b912000-06-28 18:47:56 +0000128 else if (v == NULL) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000129 w_byte(TYPE_NULL, p);
Guido van Rossum730806d1998-04-10 22:27:42 +0000130 }
131 else if (v == Py_None) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000132 w_byte(TYPE_NONE, p);
Guido van Rossum730806d1998-04-10 22:27:42 +0000133 }
Tim Peters5ca576e2001-06-18 22:08:13 +0000134 else if (v == PyExc_StopIteration) {
135 w_byte(TYPE_STOPITER, p);
136 }
Guido van Rossum730806d1998-04-10 22:27:42 +0000137 else if (v == Py_Ellipsis) {
138 w_byte(TYPE_ELLIPSIS, p);
139 }
Guido van Rossum77f6a652002-04-03 22:41:51 +0000140 else if (v == Py_False) {
141 w_byte(TYPE_FALSE, p);
142 }
143 else if (v == Py_True) {
144 w_byte(TYPE_TRUE, p);
145 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000146 else if (PyInt_Check(v)) {
147 long x = PyInt_AS_LONG((PyIntObject *)v);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000148#if SIZEOF_LONG > 4
Tim Peters44714002001-04-10 05:02:52 +0000149 long y = Py_ARITHMETIC_RIGHT_SHIFT(long, x, 31);
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000150 if (y && y != -1) {
151 w_byte(TYPE_INT64, p);
152 w_long64(x, p);
153 }
Guido van Rossumc1547d91996-12-10 15:39:04 +0000154 else
155#endif
156 {
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000157 w_byte(TYPE_INT, p);
158 w_long(x, p);
159 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000160 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000161 else if (PyLong_Check(v)) {
162 PyLongObject *ob = (PyLongObject *)v;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000163 w_byte(TYPE_LONG, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000164 n = ob->ob_size;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000165 w_long((long)n, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000166 if (n < 0)
167 n = -n;
168 for (i = 0; i < n; i++)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000169 w_short(ob->ob_digit[i], p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000170 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000171 else if (PyFloat_Check(v)) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000172 if (p->version > 1) {
Brett Cannonc9371d42005-06-25 08:23:41 +0000173 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000174 if (_PyFloat_Pack8(PyFloat_AsDouble(v),
175 buf, 1) < 0) {
176 p->error = 1;
177 return;
178 }
179 w_byte(TYPE_BINARY_FLOAT, p);
Brett Cannonc9371d42005-06-25 08:23:41 +0000180 w_string((char*)buf, 8, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000181 }
182 else {
183 char buf[256]; /* Plenty to format any double */
184 PyFloat_AsReprString(buf, (PyFloatObject *)v);
185 n = strlen(buf);
186 w_byte(TYPE_FLOAT, p);
187 w_byte(n, p);
188 w_string(buf, n, p);
189 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000190 }
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000191#ifndef WITHOUT_COMPLEX
Guido van Rossum79f25d91997-04-29 20:08:16 +0000192 else if (PyComplex_Check(v)) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000193 if (p->version > 1) {
Brett Cannonc9371d42005-06-25 08:23:41 +0000194 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000195 if (_PyFloat_Pack8(PyComplex_RealAsDouble(v),
196 buf, 1) < 0) {
197 p->error = 1;
198 return;
199 }
200 w_byte(TYPE_BINARY_COMPLEX, p);
Brett Cannonc9371d42005-06-25 08:23:41 +0000201 w_string((char*)buf, 8, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000202 if (_PyFloat_Pack8(PyComplex_ImagAsDouble(v),
203 buf, 1) < 0) {
204 p->error = 1;
205 return;
206 }
Brett Cannonc9371d42005-06-25 08:23:41 +0000207 w_string((char*)buf, 8, p);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000208 }
209 else {
210 char buf[256]; /* Plenty to format any double */
211 PyFloatObject *temp;
212 w_byte(TYPE_COMPLEX, p);
213 temp = (PyFloatObject*)PyFloat_FromDouble(
214 PyComplex_RealAsDouble(v));
215 PyFloat_AsReprString(buf, temp);
216 Py_DECREF(temp);
217 n = strlen(buf);
218 w_byte(n, p);
219 w_string(buf, n, p);
220 temp = (PyFloatObject*)PyFloat_FromDouble(
221 PyComplex_ImagAsDouble(v));
222 PyFloat_AsReprString(buf, temp);
223 Py_DECREF(temp);
224 n = strlen(buf);
225 w_byte(n, p);
226 w_string(buf, n, p);
227 }
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000228 }
229#endif
Guido van Rossum79f25d91997-04-29 20:08:16 +0000230 else if (PyString_Check(v)) {
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000231 if (p->strings && PyString_CHECK_INTERNED(v)) {
232 PyObject *o = PyDict_GetItem(p->strings, v);
233 if (o) {
234 long w = PyInt_AsLong(o);
235 w_byte(TYPE_STRINGREF, p);
236 w_long(w, p);
237 goto exit;
238 }
239 else {
240 o = PyInt_FromLong(PyDict_Size(p->strings));
241 PyDict_SetItem(p->strings, v, o);
242 Py_DECREF(o);
243 w_byte(TYPE_INTERNED, p);
244 }
245 }
246 else {
247 w_byte(TYPE_STRING, p);
248 }
Guido van Rossumc279b532000-03-10 23:03:02 +0000249 n = PyString_GET_SIZE(v);
Guido van Rossum3a205f71995-02-17 15:10:07 +0000250 w_long((long)n, p);
Guido van Rossumc279b532000-03-10 23:03:02 +0000251 w_string(PyString_AS_STRING(v), n, p);
252 }
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000253#ifdef Py_USING_UNICODE
Guido van Rossumc279b532000-03-10 23:03:02 +0000254 else if (PyUnicode_Check(v)) {
255 PyObject *utf8;
256 utf8 = PyUnicode_AsUTF8String(v);
257 if (utf8 == NULL) {
Guido van Rossum98626cd2000-06-28 23:24:19 +0000258 p->depth--;
259 p->error = 1;
260 return;
Guido van Rossumc279b532000-03-10 23:03:02 +0000261 }
262 w_byte(TYPE_UNICODE, p);
263 n = PyString_GET_SIZE(utf8);
264 w_long((long)n, p);
265 w_string(PyString_AS_STRING(utf8), n, p);
266 Py_DECREF(utf8);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000267 }
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000268#endif
Guido van Rossum79f25d91997-04-29 20:08:16 +0000269 else if (PyTuple_Check(v)) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000270 w_byte(TYPE_TUPLE, p);
Guido van Rossum79f25d91997-04-29 20:08:16 +0000271 n = PyTuple_Size(v);
Guido van Rossum3a205f71995-02-17 15:10:07 +0000272 w_long((long)n, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000273 for (i = 0; i < n; i++) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000274 w_object(PyTuple_GET_ITEM(v, i), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000275 }
276 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000277 else if (PyList_Check(v)) {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000278 w_byte(TYPE_LIST, p);
Guido van Rossumc279b532000-03-10 23:03:02 +0000279 n = PyList_GET_SIZE(v);
Guido van Rossum3a205f71995-02-17 15:10:07 +0000280 w_long((long)n, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000281 for (i = 0; i < n; i++) {
Guido van Rossumc279b532000-03-10 23:03:02 +0000282 w_object(PyList_GET_ITEM(v, i), p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000283 }
284 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000285 else if (PyDict_Check(v)) {
Guido van Rossum25831651993-05-19 14:50:45 +0000286 int pos;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000287 PyObject *key, *value;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000288 w_byte(TYPE_DICT, p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000289 /* This one is NULL object terminated! */
Guido van Rossum25831651993-05-19 14:50:45 +0000290 pos = 0;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000291 while (PyDict_Next(v, &pos, &key, &value)) {
Guido van Rossum25831651993-05-19 14:50:45 +0000292 w_object(key, p);
293 w_object(value, p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000294 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000295 w_object((PyObject *)NULL, p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000296 }
Raymond Hettingera422c342005-01-11 03:03:27 +0000297 else if (PyAnySet_Check(v)) {
Raymond Hettingera422c342005-01-11 03:03:27 +0000298 PyObject *value, *it;
299
300 if (PyObject_TypeCheck(v, &PySet_Type))
301 w_byte(TYPE_SET, p);
302 else
303 w_byte(TYPE_FROZENSET, p);
304 n = PyObject_Size(v);
305 if (n == -1) {
306 p->depth--;
307 p->error = 1;
308 return;
309 }
310 w_long((long)n, p);
311 it = PyObject_GetIter(v);
312 if (it == NULL) {
313 p->depth--;
314 p->error = 1;
315 return;
316 }
317 while ((value = PyIter_Next(it)) != NULL) {
318 w_object(value, p);
319 Py_DECREF(value);
320 }
321 Py_DECREF(it);
322 if (PyErr_Occurred()) {
323 p->depth--;
324 p->error = 1;
325 return;
326 }
327 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000328 else if (PyCode_Check(v)) {
329 PyCodeObject *co = (PyCodeObject *)v;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000330 w_byte(TYPE_CODE, p);
Neal Norwitz7fdcb412002-06-14 01:07:39 +0000331 w_long(co->co_argcount, p);
332 w_long(co->co_nlocals, p);
333 w_long(co->co_stacksize, p);
334 w_long(co->co_flags, p);
Guido van Rossumd076c731998-10-07 19:42:25 +0000335 w_object(co->co_code, p);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000336 w_object(co->co_consts, p);
337 w_object(co->co_names, p);
Guido van Rossum681d79a1995-07-18 14:51:37 +0000338 w_object(co->co_varnames, p);
Jeremy Hylton64949cb2001-01-25 20:06:59 +0000339 w_object(co->co_freevars, p);
340 w_object(co->co_cellvars, p);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000341 w_object(co->co_filename, p);
Guido van Rossum9bfef441993-03-29 10:43:31 +0000342 w_object(co->co_name, p);
Neal Norwitz7fdcb412002-06-14 01:07:39 +0000343 w_long(co->co_firstlineno, p);
Guido van Rossumd031c891997-01-24 03:44:17 +0000344 w_object(co->co_lnotab, p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000345 }
Jeremy Hylton9f64caa2001-11-09 22:02:48 +0000346 else if (PyObject_CheckReadBuffer(v)) {
Guido van Rossumd076c731998-10-07 19:42:25 +0000347 /* Write unknown buffer-style objects as a string */
348 char *s;
Jeremy Hylton9f64caa2001-11-09 22:02:48 +0000349 PyBufferProcs *pb = v->ob_type->tp_as_buffer;
Guido van Rossumd076c731998-10-07 19:42:25 +0000350 w_byte(TYPE_STRING, p);
351 n = (*pb->bf_getreadbuffer)(v, 0, (void **)&s);
352 w_long((long)n, p);
353 w_string(s, n, p);
354 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000355 else {
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000356 w_byte(TYPE_UNKNOWN, p);
Guido van Rossumf2150601996-06-26 20:41:23 +0000357 p->error = 1;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000358 }
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000359 exit:
Guido van Rossum98626cd2000-06-28 23:24:19 +0000360 p->depth--;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000361}
362
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000363/* version currently has no effect for writing longs. */
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000364void
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000365PyMarshal_WriteLongToFile(long x, FILE *fp, int version)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000366{
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000367 WFILE wf;
368 wf.fp = fp;
Guido van Rossumf2150601996-06-26 20:41:23 +0000369 wf.error = 0;
Fred Drake6da0b912000-06-28 18:47:56 +0000370 wf.depth = 0;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000371 wf.strings = NULL;
Michael W. Hudsondf888462005-06-03 14:41:55 +0000372 wf.version = version;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000373 w_long(x, &wf);
374}
375
376void
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000377PyMarshal_WriteObjectToFile(PyObject *x, FILE *fp, int version)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000378{
379 WFILE wf;
380 wf.fp = fp;
Guido van Rossumf2150601996-06-26 20:41:23 +0000381 wf.error = 0;
Guido van Rossum98626cd2000-06-28 23:24:19 +0000382 wf.depth = 0;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000383 wf.strings = (version > 0) ? PyDict_New() : NULL;
Michael W. Hudsondf888462005-06-03 14:41:55 +0000384 wf.version = version;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000385 w_object(x, &wf);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000386 Py_XDECREF(wf.strings);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000387}
388
389typedef WFILE RFILE; /* Same struct with different invariants */
390
Guido van Rossum8d617a61995-03-09 12:12:11 +0000391#define rs_byte(p) (((p)->ptr != (p)->end) ? (unsigned char)*(p)->ptr++ : EOF)
392
393#define r_byte(p) ((p)->fp ? getc((p)->fp) : rs_byte(p))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000394
395static int
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000396r_string(char *s, int n, RFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000397{
398 if (p->fp != NULL)
399 return fread(s, 1, n, p->fp);
400 if (p->end - p->ptr < n)
401 n = p->end - p->ptr;
402 memcpy(s, p->ptr, n);
403 p->ptr += n;
404 return n;
405}
406
407static int
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000408r_short(RFILE *p)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000409{
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000410 register short x;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000411 x = r_byte(p);
412 x |= r_byte(p) << 8;
Tim Peterse84b7402000-09-19 08:54:13 +0000413 /* Sign-extension, in case short greater than 16 bits */
414 x |= -(x & 0x8000);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000415 return x;
416}
417
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000418static long
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000419r_long(RFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000420{
421 register long x;
Guido van Rossum8d617a61995-03-09 12:12:11 +0000422 register FILE *fp = p->fp;
423 if (fp) {
424 x = getc(fp);
425 x |= (long)getc(fp) << 8;
426 x |= (long)getc(fp) << 16;
427 x |= (long)getc(fp) << 24;
428 }
429 else {
430 x = rs_byte(p);
431 x |= (long)rs_byte(p) << 8;
432 x |= (long)rs_byte(p) << 16;
433 x |= (long)rs_byte(p) << 24;
434 }
Guido van Rossumc1547d91996-12-10 15:39:04 +0000435#if SIZEOF_LONG > 4
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000436 /* Sign extension for 64-bit machines */
Tim Peterse84b7402000-09-19 08:54:13 +0000437 x |= -(x & 0x80000000L);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000438#endif
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000439 return x;
440}
441
Tim Peters82112372001-08-29 02:28:42 +0000442/* r_long64 deals with the TYPE_INT64 code. On a machine with
443 sizeof(long) > 4, it returns a Python int object, else a Python long
444 object. Note that w_long64 writes out TYPE_INT if 32 bits is enough,
445 so there's no inefficiency here in returning a PyLong on 32-bit boxes
446 for everything written via TYPE_INT64 (i.e., if an int is written via
447 TYPE_INT64, it *needs* more than 32 bits).
448*/
449static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000450r_long64(RFILE *p)
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000451{
Tim Peters82112372001-08-29 02:28:42 +0000452 long lo4 = r_long(p);
453 long hi4 = r_long(p);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000454#if SIZEOF_LONG > 4
Tim Peters82112372001-08-29 02:28:42 +0000455 long x = (hi4 << 32) | (lo4 & 0xFFFFFFFFL);
456 return PyInt_FromLong(x);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000457#else
Tim Peters82112372001-08-29 02:28:42 +0000458 unsigned char buf[8];
459 int one = 1;
460 int is_little_endian = (int)*(char*)&one;
461 if (is_little_endian) {
462 memcpy(buf, &lo4, 4);
463 memcpy(buf+4, &hi4, 4);
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000464 }
Tim Peters82112372001-08-29 02:28:42 +0000465 else {
466 memcpy(buf, &hi4, 4);
467 memcpy(buf+4, &lo4, 4);
468 }
469 return _PyLong_FromByteArray(buf, 8, is_little_endian, 1);
Guido van Rossumc1547d91996-12-10 15:39:04 +0000470#endif
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000471}
472
Guido van Rossum79f25d91997-04-29 20:08:16 +0000473static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000474r_object(RFILE *p)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000475{
Armin Rigo01ab2792004-03-26 15:09:27 +0000476 /* NULL is a valid return value, it does not necessarily means that
477 an exception is set. */
Raymond Hettingera422c342005-01-11 03:03:27 +0000478 PyObject *v, *v2, *v3;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000479 long i, n;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000480 int type = r_byte(p);
Tim Petersd9b9ac82001-01-28 00:27:39 +0000481
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000482 switch (type) {
Tim Petersd9b9ac82001-01-28 00:27:39 +0000483
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000484 case EOF:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000485 PyErr_SetString(PyExc_EOFError,
486 "EOF read where object expected");
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000487 return NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000488
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000489 case TYPE_NULL:
490 return NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000491
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000492 case TYPE_NONE:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000493 Py_INCREF(Py_None);
494 return Py_None;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000495
Tim Peters5ca576e2001-06-18 22:08:13 +0000496 case TYPE_STOPITER:
497 Py_INCREF(PyExc_StopIteration);
498 return PyExc_StopIteration;
499
Guido van Rossume449af71996-10-11 16:25:41 +0000500 case TYPE_ELLIPSIS:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000501 Py_INCREF(Py_Ellipsis);
Guido van Rossume449af71996-10-11 16:25:41 +0000502 return Py_Ellipsis;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000503
Guido van Rossum77f6a652002-04-03 22:41:51 +0000504 case TYPE_FALSE:
505 Py_INCREF(Py_False);
506 return Py_False;
507
508 case TYPE_TRUE:
509 Py_INCREF(Py_True);
510 return Py_True;
511
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000512 case TYPE_INT:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000513 return PyInt_FromLong(r_long(p));
Tim Petersd9b9ac82001-01-28 00:27:39 +0000514
Guido van Rossumb0c168c1996-12-05 23:15:02 +0000515 case TYPE_INT64:
Tim Peters82112372001-08-29 02:28:42 +0000516 return r_long64(p);
Tim Petersd9b9ac82001-01-28 00:27:39 +0000517
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000518 case TYPE_LONG:
519 {
520 int size;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000521 PyLongObject *ob;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000522 n = r_long(p);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000523 size = n<0 ? -n : n;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000524 ob = _PyLong_New(size);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000525 if (ob == NULL)
526 return NULL;
527 ob->ob_size = n;
Armin Rigo01ab2792004-03-26 15:09:27 +0000528 for (i = 0; i < size; i++) {
529 int digit = r_short(p);
530 if (digit < 0) {
531 Py_DECREF(ob);
532 PyErr_SetString(PyExc_ValueError,
533 "bad marshal data");
534 return NULL;
535 }
536 ob->ob_digit[i] = digit;
537 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000538 return (PyObject *)ob;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000539 }
Tim Petersd9b9ac82001-01-28 00:27:39 +0000540
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000541 case TYPE_FLOAT:
542 {
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000543 char buf[256];
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000544 double dx;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000545 n = r_byte(p);
Armin Rigo01ab2792004-03-26 15:09:27 +0000546 if (n == EOF || r_string(buf, (int)n, p) != n) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000547 PyErr_SetString(PyExc_EOFError,
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000548 "EOF read where object expected");
549 return NULL;
550 }
551 buf[n] = '\0';
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000552 PyFPE_START_PROTECT("atof", return 0)
Martin v. Löwis737ea822004-06-08 18:52:54 +0000553 dx = PyOS_ascii_atof(buf);
Guido van Rossum45b83911997-03-14 04:32:50 +0000554 PyFPE_END_PROTECT(dx)
Guido van Rossum79f25d91997-04-29 20:08:16 +0000555 return PyFloat_FromDouble(dx);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000556 }
Tim Petersd9b9ac82001-01-28 00:27:39 +0000557
Michael W. Hudsondf888462005-06-03 14:41:55 +0000558 case TYPE_BINARY_FLOAT:
559 {
Brett Cannonc9371d42005-06-25 08:23:41 +0000560 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000561 double x;
Brett Cannonc9371d42005-06-25 08:23:41 +0000562 if (r_string((char*)buf, 8, p) != 8) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000563 PyErr_SetString(PyExc_EOFError,
564 "EOF read where object expected");
565 return NULL;
566 }
567 x = _PyFloat_Unpack8(buf, 1);
568 if (x == -1.0 && PyErr_Occurred()) {
569 return NULL;
570 }
571 return PyFloat_FromDouble(x);
572 }
573
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000574#ifndef WITHOUT_COMPLEX
575 case TYPE_COMPLEX:
576 {
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000577 char buf[256];
Guido van Rossum530956d1996-07-21 02:27:43 +0000578 Py_complex c;
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000579 n = r_byte(p);
Armin Rigo01ab2792004-03-26 15:09:27 +0000580 if (n == EOF || r_string(buf, (int)n, p) != n) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000581 PyErr_SetString(PyExc_EOFError,
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000582 "EOF read where object expected");
583 return NULL;
584 }
585 buf[n] = '\0';
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000586 PyFPE_START_PROTECT("atof", return 0)
Martin v. Löwis737ea822004-06-08 18:52:54 +0000587 c.real = PyOS_ascii_atof(buf);
Guido van Rossum45b83911997-03-14 04:32:50 +0000588 PyFPE_END_PROTECT(c)
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000589 n = r_byte(p);
Armin Rigo01ab2792004-03-26 15:09:27 +0000590 if (n == EOF || r_string(buf, (int)n, p) != n) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000591 PyErr_SetString(PyExc_EOFError,
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000592 "EOF read where object expected");
593 return NULL;
594 }
595 buf[n] = '\0';
Guido van Rossum0ae748d1997-02-14 22:58:07 +0000596 PyFPE_START_PROTECT("atof", return 0)
Martin v. Löwis737ea822004-06-08 18:52:54 +0000597 c.imag = PyOS_ascii_atof(buf);
Guido van Rossum45b83911997-03-14 04:32:50 +0000598 PyFPE_END_PROTECT(c)
Guido van Rossum79f25d91997-04-29 20:08:16 +0000599 return PyComplex_FromCComplex(c);
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000600 }
Michael W. Hudsondf888462005-06-03 14:41:55 +0000601
602 case TYPE_BINARY_COMPLEX:
603 {
Brett Cannonc9371d42005-06-25 08:23:41 +0000604 unsigned char buf[8];
Michael W. Hudsondf888462005-06-03 14:41:55 +0000605 Py_complex c;
Brett Cannonc9371d42005-06-25 08:23:41 +0000606 if (r_string((char*)buf, 8, p) != 8) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000607 PyErr_SetString(PyExc_EOFError,
608 "EOF read where object expected");
609 return NULL;
610 }
611 c.real = _PyFloat_Unpack8(buf, 1);
612 if (c.real == -1.0 && PyErr_Occurred()) {
613 return NULL;
614 }
Brett Cannonc9371d42005-06-25 08:23:41 +0000615 if (r_string((char*)buf, 8, p) != 8) {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000616 PyErr_SetString(PyExc_EOFError,
617 "EOF read where object expected");
618 return NULL;
619 }
620 c.imag = _PyFloat_Unpack8(buf, 1);
621 if (c.imag == -1.0 && PyErr_Occurred()) {
622 return NULL;
623 }
624 return PyComplex_FromCComplex(c);
625 }
Guido van Rossum8a5c5d21996-01-12 01:09:56 +0000626#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000627
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000628 case TYPE_INTERNED:
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000629 case TYPE_STRING:
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000630 n = r_long(p);
Guido van Rossuma45cb451998-06-08 20:27:29 +0000631 if (n < 0) {
632 PyErr_SetString(PyExc_ValueError, "bad marshal data");
633 return NULL;
634 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000635 v = PyString_FromStringAndSize((char *)NULL, n);
Michael W. Hudson6d6917b2005-06-03 15:17:16 +0000636 if (v == NULL)
637 return v;
638 if (r_string(PyString_AS_STRING(v), (int)n, p) != n) {
639 Py_DECREF(v);
640 PyErr_SetString(PyExc_EOFError,
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000641 "EOF read where object expected");
Michael W. Hudson6d6917b2005-06-03 15:17:16 +0000642 return NULL;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000643 }
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000644 if (type == TYPE_INTERNED) {
645 PyString_InternInPlace(&v);
646 PyList_Append(p->strings, v);
647 }
648 return v;
649
650 case TYPE_STRINGREF:
651 n = r_long(p);
Michael W. Hudsonf2ca5af2005-06-13 18:28:46 +0000652 if (n < 0 || n >= PyList_GET_SIZE(p->strings)) {
653 PyErr_SetString(PyExc_ValueError, "bad marshal data");
654 return NULL;
655 }
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000656 v = PyList_GET_ITEM(p->strings, n);
657 Py_INCREF(v);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000658 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000659
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000660#ifdef Py_USING_UNICODE
Guido van Rossumc279b532000-03-10 23:03:02 +0000661 case TYPE_UNICODE:
662 {
663 char *buffer;
664
665 n = r_long(p);
666 if (n < 0) {
667 PyErr_SetString(PyExc_ValueError, "bad marshal data");
668 return NULL;
669 }
Guido van Rossumb18618d2000-05-03 23:44:39 +0000670 buffer = PyMem_NEW(char, n);
Guido van Rossumc279b532000-03-10 23:03:02 +0000671 if (buffer == NULL)
Guido van Rossumb18618d2000-05-03 23:44:39 +0000672 return PyErr_NoMemory();
Guido van Rossumc279b532000-03-10 23:03:02 +0000673 if (r_string(buffer, (int)n, p) != n) {
Guido van Rossumb18618d2000-05-03 23:44:39 +0000674 PyMem_DEL(buffer);
Guido van Rossumc279b532000-03-10 23:03:02 +0000675 PyErr_SetString(PyExc_EOFError,
676 "EOF read where object expected");
677 return NULL;
678 }
679 v = PyUnicode_DecodeUTF8(buffer, n, NULL);
Guido van Rossumb18618d2000-05-03 23:44:39 +0000680 PyMem_DEL(buffer);
Guido van Rossumc279b532000-03-10 23:03:02 +0000681 return v;
682 }
Martin v. Löwis339d0f72001-08-17 18:39:25 +0000683#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000684
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000685 case TYPE_TUPLE:
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000686 n = r_long(p);
Guido van Rossuma45cb451998-06-08 20:27:29 +0000687 if (n < 0) {
688 PyErr_SetString(PyExc_ValueError, "bad marshal data");
689 return NULL;
690 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000691 v = PyTuple_New((int)n);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000692 if (v == NULL)
693 return v;
Jack Jansen9513f2c1995-10-27 13:21:28 +0000694 for (i = 0; i < n; i++) {
695 v2 = r_object(p);
696 if ( v2 == NULL ) {
Armin Rigo01ab2792004-03-26 15:09:27 +0000697 if (!PyErr_Occurred())
698 PyErr_SetString(PyExc_TypeError,
699 "NULL object in marshal data");
Guido van Rossum79f25d91997-04-29 20:08:16 +0000700 Py_DECREF(v);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000701 v = NULL;
702 break;
703 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000704 PyTuple_SET_ITEM(v, (int)i, v2);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000705 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000706 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000707
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000708 case TYPE_LIST:
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000709 n = r_long(p);
Guido van Rossuma45cb451998-06-08 20:27:29 +0000710 if (n < 0) {
711 PyErr_SetString(PyExc_ValueError, "bad marshal data");
712 return NULL;
713 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000714 v = PyList_New((int)n);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000715 if (v == NULL)
716 return v;
Jack Jansen9513f2c1995-10-27 13:21:28 +0000717 for (i = 0; i < n; i++) {
718 v2 = r_object(p);
719 if ( v2 == NULL ) {
Armin Rigo01ab2792004-03-26 15:09:27 +0000720 if (!PyErr_Occurred())
721 PyErr_SetString(PyExc_TypeError,
722 "NULL object in marshal data");
Guido van Rossum79f25d91997-04-29 20:08:16 +0000723 Py_DECREF(v);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000724 v = NULL;
725 break;
726 }
Guido van Rossum79f25d91997-04-29 20:08:16 +0000727 PyList_SetItem(v, (int)i, v2);
Jack Jansen9513f2c1995-10-27 13:21:28 +0000728 }
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000729 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000730
Guido van Rossum64b45521991-06-07 13:58:22 +0000731 case TYPE_DICT:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000732 v = PyDict_New();
Guido van Rossum64b45521991-06-07 13:58:22 +0000733 if (v == NULL)
734 return NULL;
735 for (;;) {
Guido van Rossum79f25d91997-04-29 20:08:16 +0000736 PyObject *key, *val;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000737 key = r_object(p);
Guido van Rossum64b45521991-06-07 13:58:22 +0000738 if (key == NULL)
Armin Rigo01ab2792004-03-26 15:09:27 +0000739 break;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000740 val = r_object(p);
Guido van Rossumf2150601996-06-26 20:41:23 +0000741 if (val != NULL)
Guido van Rossum79f25d91997-04-29 20:08:16 +0000742 PyDict_SetItem(v, key, val);
743 Py_DECREF(key);
744 Py_XDECREF(val);
Guido van Rossum64b45521991-06-07 13:58:22 +0000745 }
Armin Rigo01ab2792004-03-26 15:09:27 +0000746 if (PyErr_Occurred()) {
747 Py_DECREF(v);
748 v = NULL;
749 }
Guido van Rossum64b45521991-06-07 13:58:22 +0000750 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000751
Raymond Hettingera422c342005-01-11 03:03:27 +0000752 case TYPE_SET:
753 case TYPE_FROZENSET:
754 n = r_long(p);
755 if (n < 0) {
756 PyErr_SetString(PyExc_ValueError, "bad marshal data");
757 return NULL;
758 }
759 v = PyTuple_New((int)n);
760 if (v == NULL)
761 return v;
762 for (i = 0; i < n; i++) {
763 v2 = r_object(p);
764 if ( v2 == NULL ) {
765 if (!PyErr_Occurred())
766 PyErr_SetString(PyExc_TypeError,
767 "NULL object in marshal data");
768 Py_DECREF(v);
769 v = NULL;
770 break;
771 }
772 PyTuple_SET_ITEM(v, (int)i, v2);
773 }
Michael W. Hudson6d6917b2005-06-03 15:17:16 +0000774 if (v == NULL)
775 return v;
Raymond Hettingera422c342005-01-11 03:03:27 +0000776 if (type == TYPE_SET)
Raymond Hettingerbeb31012005-08-16 03:47:52 +0000777 v3 = PySet_New(v);
Raymond Hettingera422c342005-01-11 03:03:27 +0000778 else
Raymond Hettingerbeb31012005-08-16 03:47:52 +0000779 v3 = PyFrozenSet_New(v);
Raymond Hettingera422c342005-01-11 03:03:27 +0000780 Py_DECREF(v);
781 return v3;
782
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000783 case TYPE_CODE:
Michael W. Hudson80199132001-08-30 14:50:20 +0000784 if (PyEval_GetRestricted()) {
785 PyErr_SetString(PyExc_RuntimeError,
786 "cannot unmarshal code objects in "
787 "restricted execution mode");
788 return NULL;
789 }
790 else {
Michael W. Hudsondf888462005-06-03 14:41:55 +0000791 int argcount;
792 int nlocals;
793 int stacksize;
794 int flags;
795 PyObject *code = NULL;
796 PyObject *consts = NULL;
797 PyObject *names = NULL;
798 PyObject *varnames = NULL;
799 PyObject *freevars = NULL;
800 PyObject *cellvars = NULL;
801 PyObject *filename = NULL;
802 PyObject *name = NULL;
803 int firstlineno;
804 PyObject *lnotab = NULL;
805
806 v = NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000807
Michael W. Hudsondf888462005-06-03 14:41:55 +0000808 argcount = r_long(p);
809 nlocals = r_long(p);
810 stacksize = r_long(p);
811 flags = r_long(p);
812 code = r_object(p);
813 if (code == NULL)
814 goto code_error;
815 consts = r_object(p);
816 if (consts == NULL)
817 goto code_error;
818 names = r_object(p);
819 if (names == NULL)
820 goto code_error;
821 varnames = r_object(p);
822 if (varnames == NULL)
823 goto code_error;
824 freevars = r_object(p);
825 if (freevars == NULL)
826 goto code_error;
827 cellvars = r_object(p);
828 if (cellvars == NULL)
829 goto code_error;
830 filename = r_object(p);
831 if (filename == NULL)
832 goto code_error;
833 name = r_object(p);
834 if (name == NULL)
835 goto code_error;
836 firstlineno = r_long(p);
837 lnotab = r_object(p);
838 if (lnotab == NULL)
839 goto code_error;
840
841 v = (PyObject *) PyCode_New(
Tim Petersd9b9ac82001-01-28 00:27:39 +0000842 argcount, nlocals, stacksize, flags,
Guido van Rossum681d79a1995-07-18 14:51:37 +0000843 code, consts, names, varnames,
Tim Petersd9b9ac82001-01-28 00:27:39 +0000844 freevars, cellvars, filename, name,
845 firstlineno, lnotab);
Michael W. Hudsondf888462005-06-03 14:41:55 +0000846
847 code_error:
Guido van Rossum79f25d91997-04-29 20:08:16 +0000848 Py_XDECREF(code);
849 Py_XDECREF(consts);
850 Py_XDECREF(names);
851 Py_XDECREF(varnames);
Jeremy Hylton64949cb2001-01-25 20:06:59 +0000852 Py_XDECREF(freevars);
853 Py_XDECREF(cellvars);
Guido van Rossum79f25d91997-04-29 20:08:16 +0000854 Py_XDECREF(filename);
855 Py_XDECREF(name);
Guido van Rossum6fc06e71997-07-26 23:30:18 +0000856 Py_XDECREF(lnotab);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000857
858 }
859 return v;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000860
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000861 default:
Guido van Rossumf2150601996-06-26 20:41:23 +0000862 /* Bogus data got written, which isn't ideal.
863 This will let you keep working and recover. */
Guido van Rossuma45cb451998-06-08 20:27:29 +0000864 PyErr_SetString(PyExc_ValueError, "bad marshal data");
865 return NULL;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000866
Guido van Rossumdce2e3d1991-06-04 19:42:30 +0000867 }
868}
869
Neal Norwitzd85c4522004-06-13 20:31:49 +0000870static PyObject *
Armin Rigo01ab2792004-03-26 15:09:27 +0000871read_object(RFILE *p)
872{
873 PyObject *v;
874 if (PyErr_Occurred()) {
875 fprintf(stderr, "XXX readobject called with exception set\n");
876 return NULL;
877 }
878 v = r_object(p);
879 if (v == NULL && !PyErr_Occurred())
880 PyErr_SetString(PyExc_TypeError, "NULL object in marshal data");
881 return v;
882}
883
Guido van Rossumb8cf3e62001-10-19 01:46:21 +0000884int
885PyMarshal_ReadShortFromFile(FILE *fp)
886{
887 RFILE rf;
888 rf.fp = fp;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000889 rf.strings = NULL;
Guido van Rossumb8cf3e62001-10-19 01:46:21 +0000890 return r_short(&rf);
891}
892
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000893long
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000894PyMarshal_ReadLongFromFile(FILE *fp)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000895{
896 RFILE rf;
897 rf.fp = fp;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000898 rf.strings = NULL;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000899 return r_long(&rf);
900}
901
Tim Peters691e0e92001-01-18 04:39:16 +0000902#ifdef HAVE_FSTAT
903/* Return size of file in bytes; < 0 if unknown. */
904static off_t
905getfilesize(FILE *fp)
906{
907 struct stat st;
908 if (fstat(fileno(fp), &st) != 0)
909 return -1;
910 else
911 return st.st_size;
912}
913#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000914
Tim Peters691e0e92001-01-18 04:39:16 +0000915/* If we can get the size of the file up-front, and it's reasonably small,
916 * read it in one gulp and delegate to ...FromString() instead. Much quicker
917 * than reading a byte at a time from file; speeds .pyc imports.
Tim Petersd9b9ac82001-01-28 00:27:39 +0000918 * CAUTION: since this may read the entire remainder of the file, don't
919 * call it unless you know you're done with the file.
Tim Peters691e0e92001-01-18 04:39:16 +0000920 */
Guido van Rossum79f25d91997-04-29 20:08:16 +0000921PyObject *
Tim Petersd9b9ac82001-01-28 00:27:39 +0000922PyMarshal_ReadLastObjectFromFile(FILE *fp)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000923{
Tim Peters691e0e92001-01-18 04:39:16 +0000924/* 75% of 2.1's .pyc files can exploit SMALL_FILE_LIMIT.
925 * REASONABLE_FILE_LIMIT is by defn something big enough for Tkinter.pyc.
926 */
927#define SMALL_FILE_LIMIT (1L << 14)
928#define REASONABLE_FILE_LIMIT (1L << 18)
Tim Peters691e0e92001-01-18 04:39:16 +0000929#ifdef HAVE_FSTAT
930 off_t filesize;
931#endif
Tim Peters691e0e92001-01-18 04:39:16 +0000932#ifdef HAVE_FSTAT
933 filesize = getfilesize(fp);
934 if (filesize > 0) {
935 char buf[SMALL_FILE_LIMIT];
936 char* pBuf = NULL;
937 if (filesize <= SMALL_FILE_LIMIT)
938 pBuf = buf;
939 else if (filesize <= REASONABLE_FILE_LIMIT)
940 pBuf = (char *)PyMem_MALLOC(filesize);
941 if (pBuf != NULL) {
942 PyObject* v;
943 size_t n = fread(pBuf, 1, filesize, fp);
944 v = PyMarshal_ReadObjectFromString(pBuf, n);
945 if (pBuf != buf)
946 PyMem_FREE(pBuf);
947 return v;
948 }
Tim Petersd9b9ac82001-01-28 00:27:39 +0000949
Tim Peters691e0e92001-01-18 04:39:16 +0000950 }
951#endif
Tim Petersd9b9ac82001-01-28 00:27:39 +0000952 /* We don't have fstat, or we do but the file is larger than
953 * REASONABLE_FILE_LIMIT or malloc failed -- read a byte at a time.
954 */
955 return PyMarshal_ReadObjectFromFile(fp);
956
Tim Peters691e0e92001-01-18 04:39:16 +0000957#undef SMALL_FILE_LIMIT
958#undef REASONABLE_FILE_LIMIT
Guido van Rossum0b0db8e1993-01-21 16:07:51 +0000959}
960
Guido van Rossum79f25d91997-04-29 20:08:16 +0000961PyObject *
Tim Petersd9b9ac82001-01-28 00:27:39 +0000962PyMarshal_ReadObjectFromFile(FILE *fp)
963{
964 RFILE rf;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000965 PyObject *result;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000966 rf.fp = fp;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000967 rf.strings = PyList_New(0);
968 result = r_object(&rf);
969 Py_DECREF(rf.strings);
970 return result;
Tim Petersd9b9ac82001-01-28 00:27:39 +0000971}
972
973PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +0000974PyMarshal_ReadObjectFromString(char *str, int len)
Guido van Rossumf56e3db1993-04-01 20:59:32 +0000975{
976 RFILE rf;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000977 PyObject *result;
Guido van Rossumf56e3db1993-04-01 20:59:32 +0000978 rf.fp = NULL;
Guido van Rossumf56e3db1993-04-01 20:59:32 +0000979 rf.ptr = str;
980 rf.end = str + len;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000981 rf.strings = PyList_New(0);
982 result = r_object(&rf);
983 Py_DECREF(rf.strings);
984 return result;
Guido van Rossumf56e3db1993-04-01 20:59:32 +0000985}
986
Guido van Rossum79f25d91997-04-29 20:08:16 +0000987PyObject *
Martin v. Löwisef82d2f2004-06-27 16:51:46 +0000988PyMarshal_WriteObjectToString(PyObject *x, int version)
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +0000989{
990 WFILE wf;
991 wf.fp = NULL;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000992 wf.str = PyString_FromStringAndSize((char *)NULL, 50);
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +0000993 if (wf.str == NULL)
994 return NULL;
Guido van Rossum79f25d91997-04-29 20:08:16 +0000995 wf.ptr = PyString_AS_STRING((PyStringObject *)wf.str);
996 wf.end = wf.ptr + PyString_Size(wf.str);
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +0000997 wf.error = 0;
Fred Drake6da0b912000-06-28 18:47:56 +0000998 wf.depth = 0;
Michael W. Hudsondf888462005-06-03 14:41:55 +0000999 wf.version = version;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001000 wf.strings = (version > 0) ? PyDict_New() : NULL;
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001001 w_object(x, &wf);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001002 Py_XDECREF(wf.strings);
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001003 if (wf.str != NULL)
Guido van Rossum79f25d91997-04-29 20:08:16 +00001004 _PyString_Resize(&wf.str,
1005 (int) (wf.ptr -
1006 PyString_AS_STRING((PyStringObject *)wf.str)));
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001007 if (wf.error) {
Guido van Rossum79f25d91997-04-29 20:08:16 +00001008 Py_XDECREF(wf.str);
Tim Petersd9b9ac82001-01-28 00:27:39 +00001009 PyErr_SetString(PyExc_ValueError,
Fred Drake6da0b912000-06-28 18:47:56 +00001010 (wf.error==1)?"unmarshallable object"
1011 :"object too deeply nested to marshal");
Guido van Rossum3f3bb3d1996-08-19 22:07:17 +00001012 return NULL;
1013 }
1014 return wf.str;
1015}
1016
Guido van Rossum64b45521991-06-07 13:58:22 +00001017/* And an interface for Python programs... */
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001018
Guido van Rossum79f25d91997-04-29 20:08:16 +00001019static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001020marshal_dump(PyObject *self, PyObject *args)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001021{
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001022 WFILE wf;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001023 PyObject *x;
1024 PyObject *f;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001025 int version = Py_MARSHAL_VERSION;
1026 if (!PyArg_ParseTuple(args, "OO|i:dump", &x, &f, &version))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001027 return NULL;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001028 if (!PyFile_Check(f)) {
1029 PyErr_SetString(PyExc_TypeError,
1030 "marshal.dump() 2nd arg must be file");
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001031 return NULL;
1032 }
Guido van Rossum79f25d91997-04-29 20:08:16 +00001033 wf.fp = PyFile_AsFile(f);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001034 wf.str = NULL;
1035 wf.ptr = wf.end = NULL;
Guido van Rossumf2150601996-06-26 20:41:23 +00001036 wf.error = 0;
Fred Drake6da0b912000-06-28 18:47:56 +00001037 wf.depth = 0;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001038 wf.strings = (version > 0) ? PyDict_New() : 0;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001039 w_object(x, &wf);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001040 Py_XDECREF(wf.strings);
Guido van Rossumf2150601996-06-26 20:41:23 +00001041 if (wf.error) {
Tim Petersd9b9ac82001-01-28 00:27:39 +00001042 PyErr_SetString(PyExc_ValueError,
Fred Drake6da0b912000-06-28 18:47:56 +00001043 (wf.error==1)?"unmarshallable object"
1044 :"object too deeply nested to marshal");
Guido van Rossumf2150601996-06-26 20:41:23 +00001045 return NULL;
1046 }
Guido van Rossum79f25d91997-04-29 20:08:16 +00001047 Py_INCREF(Py_None);
1048 return Py_None;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001049}
1050
Guido van Rossum79f25d91997-04-29 20:08:16 +00001051static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001052marshal_load(PyObject *self, PyObject *args)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001053{
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001054 RFILE rf;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001055 PyObject *f, *result;
Guido van Rossum2efa3692000-03-31 00:37:41 +00001056 if (!PyArg_ParseTuple(args, "O:load", &f))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001057 return NULL;
Guido van Rossum79f25d91997-04-29 20:08:16 +00001058 if (!PyFile_Check(f)) {
1059 PyErr_SetString(PyExc_TypeError,
1060 "marshal.load() arg must be file");
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001061 return NULL;
1062 }
Guido van Rossum79f25d91997-04-29 20:08:16 +00001063 rf.fp = PyFile_AsFile(f);
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001064 rf.strings = PyList_New(0);
1065 result = read_object(&rf);
1066 Py_DECREF(rf.strings);
1067 return result;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001068}
1069
Guido van Rossum79f25d91997-04-29 20:08:16 +00001070static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001071marshal_dumps(PyObject *self, PyObject *args)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001072{
Guido van Rossum79f25d91997-04-29 20:08:16 +00001073 PyObject *x;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001074 int version = Py_MARSHAL_VERSION;
Armin Rigo2ccea172004-12-20 12:25:57 +00001075 if (!PyArg_ParseTuple(args, "O|i:dumps", &x, &version))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001076 return NULL;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001077 return PyMarshal_WriteObjectToString(x, version);
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001078}
1079
Guido van Rossum79f25d91997-04-29 20:08:16 +00001080static PyObject *
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001081marshal_loads(PyObject *self, PyObject *args)
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001082{
1083 RFILE rf;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001084 char *s;
1085 int n;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001086 PyObject* result;
Michael W. Hudson01fca112005-06-13 17:50:18 +00001087 if (!PyArg_ParseTuple(args, "s#:loads", &s, &n))
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001088 return NULL;
1089 rf.fp = NULL;
Guido van Rossum0b0db8e1993-01-21 16:07:51 +00001090 rf.ptr = s;
1091 rf.end = s + n;
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001092 rf.strings = PyList_New(0);
1093 result = read_object(&rf);
1094 Py_DECREF(rf.strings);
1095 return result;
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001096}
1097
Guido van Rossum79f25d91997-04-29 20:08:16 +00001098static PyMethodDef marshal_methods[] = {
Neal Norwitz031829d2002-03-31 14:37:44 +00001099 {"dump", marshal_dump, METH_VARARGS},
1100 {"load", marshal_load, METH_VARARGS},
1101 {"dumps", marshal_dumps, METH_VARARGS},
1102 {"loads", marshal_loads, METH_VARARGS},
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001103 {NULL, NULL} /* sentinel */
1104};
1105
Jason Tishler6bc06ec2003-09-04 11:59:50 +00001106PyMODINIT_FUNC
Thomas Woutersf70ef4f2000-07-22 18:47:25 +00001107PyMarshal_Init(void)
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001108{
Martin v. Löwisef82d2f2004-06-27 16:51:46 +00001109 PyObject *mod = Py_InitModule("marshal", marshal_methods);
1110 PyModule_AddIntConstant(mod, "version", Py_MARSHAL_VERSION);
Guido van Rossumdce2e3d1991-06-04 19:42:30 +00001111}