blob: 4cc6629d532e97304b382d9bf3937b7c3e477a06 [file] [log] [blame]
Guido van Rossum54f22ed2000-02-04 15:10:34 +00001"""Create portable serialized representations of Python objects.
Guido van Rossuma48061a1995-01-10 00:31:14 +00002
Guido van Rossume467be61997-12-05 19:42:42 +00003See module cPickle for a (much) faster implementation.
4See module copy_reg for a mechanism for registering custom picklers.
Guido van Rossuma48061a1995-01-10 00:31:14 +00005
Guido van Rossume467be61997-12-05 19:42:42 +00006Classes:
Guido van Rossuma48061a1995-01-10 00:31:14 +00007
Guido van Rossume467be61997-12-05 19:42:42 +00008 Pickler
9 Unpickler
Guido van Rossuma48061a1995-01-10 00:31:14 +000010
Guido van Rossume467be61997-12-05 19:42:42 +000011Functions:
Guido van Rossuma48061a1995-01-10 00:31:14 +000012
Guido van Rossume467be61997-12-05 19:42:42 +000013 dump(object, file)
14 dumps(object) -> string
15 load(file) -> object
16 loads(string) -> object
Guido van Rossuma48061a1995-01-10 00:31:14 +000017
Guido van Rossume467be61997-12-05 19:42:42 +000018Misc variables:
Guido van Rossuma48061a1995-01-10 00:31:14 +000019
Fred Drakefe82acc1998-02-13 03:24:48 +000020 __version__
Guido van Rossume467be61997-12-05 19:42:42 +000021 format_version
22 compatible_formats
Guido van Rossuma48061a1995-01-10 00:31:14 +000023
Guido van Rossuma48061a1995-01-10 00:31:14 +000024"""
25
Guido van Rossum743d17e1998-09-15 20:25:57 +000026__version__ = "$Revision$" # Code version
Guido van Rossuma48061a1995-01-10 00:31:14 +000027
28from types import *
Guido van Rossum4fb5b281997-09-12 20:07:24 +000029from copy_reg import dispatch_table, safe_constructors
Guido van Rossumd3703791998-10-22 20:15:36 +000030import marshal
31import sys
32import struct
Skip Montanaro23bafc62001-02-18 03:10:09 +000033import re
Guido van Rossuma48061a1995-01-10 00:31:14 +000034
Skip Montanaro352674d2001-02-07 23:14:30 +000035__all__ = ["PickleError", "PicklingError", "UnpicklingError", "Pickler",
36 "Unpickler", "dump", "dumps", "load", "loads"]
37
Guido van Rossumd3703791998-10-22 20:15:36 +000038format_version = "1.3" # File format version we write
39compatible_formats = ["1.0", "1.1", "1.2"] # Old format versions we can read
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000040
41mdumps = marshal.dumps
42mloads = marshal.loads
Guido van Rossum0c891ce1995-03-14 15:09:05 +000043
Guido van Rossum26e89d02000-06-29 16:15:52 +000044class PickleError(Exception): pass
45class PicklingError(PickleError): pass
46class UnpicklingError(PickleError): pass
Guido van Rossum7849da81995-03-09 14:08:35 +000047
Guido van Rossumff871742000-12-13 18:11:56 +000048class _Stop(Exception):
49 def __init__(self, value):
50 self.value = value
51
Jeremy Hylton2b9d0291998-05-27 22:38:22 +000052try:
53 from org.python.core import PyStringMap
54except ImportError:
55 PyStringMap = None
56
Guido van Rossumdbb718f2001-09-21 19:22:34 +000057try:
58 UnicodeType
59except NameError:
60 UnicodeType = None
61
62
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000063MARK = '('
64STOP = '.'
65POP = '0'
66POP_MARK = '1'
67DUP = '2'
68FLOAT = 'F'
69INT = 'I'
70BININT = 'J'
71BININT1 = 'K'
72LONG = 'L'
73BININT2 = 'M'
74NONE = 'N'
75PERSID = 'P'
76BINPERSID = 'Q'
77REDUCE = 'R'
78STRING = 'S'
79BINSTRING = 'T'
80SHORT_BINSTRING = 'U'
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +000081UNICODE = 'V'
82BINUNICODE = 'X'
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000083APPEND = 'a'
84BUILD = 'b'
85GLOBAL = 'c'
86DICT = 'd'
87EMPTY_DICT = '}'
88APPENDS = 'e'
89GET = 'g'
90BINGET = 'h'
91INST = 'i'
92LONG_BINGET = 'j'
93LIST = 'l'
94EMPTY_LIST = ']'
95OBJ = 'o'
96PUT = 'p'
97BINPUT = 'q'
98LONG_BINPUT = 'r'
99SETITEM = 's'
100TUPLE = 't'
101EMPTY_TUPLE = ')'
102SETITEMS = 'u'
Guido van Rossumd3703791998-10-22 20:15:36 +0000103BINFLOAT = 'G'
Guido van Rossuma48061a1995-01-10 00:31:14 +0000104
Skip Montanaro23bafc62001-02-18 03:10:09 +0000105__all__.extend([x for x in dir() if re.match("[A-Z][A-Z0-9_]+$",x)])
106
Guido van Rossuma48061a1995-01-10 00:31:14 +0000107class Pickler:
108
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000109 def __init__(self, file, bin = 0):
110 self.write = file.write
111 self.memo = {}
112 self.bin = bin
Guido van Rossuma48061a1995-01-10 00:31:14 +0000113
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000114 def dump(self, object):
115 self.save(object)
116 self.write(STOP)
Guido van Rossuma48061a1995-01-10 00:31:14 +0000117
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000118 def put(self, i):
Tim Petersc32d8242001-04-10 02:48:53 +0000119 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000120 s = mdumps(i)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000121 if i < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000122 return BINPUT + s[0]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000123
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000124 return LONG_BINPUT + s
Guido van Rossuma48061a1995-01-10 00:31:14 +0000125
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000126 return PUT + `i` + '\n'
Guido van Rossuma48061a1995-01-10 00:31:14 +0000127
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000128 def get(self, i):
Tim Petersc32d8242001-04-10 02:48:53 +0000129 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000130 s = mdumps(i)[1:]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000131
Tim Petersc32d8242001-04-10 02:48:53 +0000132 if i < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000133 return BINGET + s[0]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000134
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000135 return LONG_BINGET + s
Guido van Rossuma48061a1995-01-10 00:31:14 +0000136
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000137 return GET + `i` + '\n'
Tim Peters2344fae2001-01-15 00:50:52 +0000138
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000139 def save(self, object, pers_save = 0):
140 memo = self.memo
Guido van Rossuma48061a1995-01-10 00:31:14 +0000141
Tim Petersc32d8242001-04-10 02:48:53 +0000142 if not pers_save:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000143 pid = self.persistent_id(object)
Tim Petersc32d8242001-04-10 02:48:53 +0000144 if pid is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000145 self.save_pers(pid)
146 return
Guido van Rossuma48061a1995-01-10 00:31:14 +0000147
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000148 d = id(object)
Tim Peters2344fae2001-01-15 00:50:52 +0000149
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000150 t = type(object)
Guido van Rossuma48061a1995-01-10 00:31:14 +0000151
Tim Petersc32d8242001-04-10 02:48:53 +0000152 if (t is TupleType) and (len(object) == 0):
153 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000154 self.save_empty_tuple(object)
155 else:
156 self.save_tuple(object)
157 return
Guido van Rossuma48061a1995-01-10 00:31:14 +0000158
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000159 if memo.has_key(d):
160 self.write(self.get(memo[d][0]))
161 return
162
163 try:
164 f = self.dispatch[t]
165 except KeyError:
Guido van Rossumf048a8f2001-12-19 16:55:02 +0000166 if issubclass(t, TypeType):
167 self.save_global(object)
168 return
169
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000170 pid = self.inst_persistent_id(object)
171 if pid is not None:
172 self.save_pers(pid)
173 return
174
175 try:
176 reduce = dispatch_table[t]
177 except KeyError:
178 try:
179 reduce = object.__reduce__
180 except AttributeError:
181 raise PicklingError, \
Guido van Rossum08a92cb1999-10-10 21:14:25 +0000182 "can't pickle %s object: %s" % (`t.__name__`,
183 `object`)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000184 else:
185 tup = reduce()
186 else:
187 tup = reduce(object)
188
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000189 if type(tup) is StringType:
190 self.save_global(object, tup)
191 return
Guido van Rossumd1f49841997-12-10 23:40:18 +0000192
Tim Petersc32d8242001-04-10 02:48:53 +0000193 if type(tup) is not TupleType:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000194 raise PicklingError, "Value returned by %s must be a " \
195 "tuple" % reduce
196
197 l = len(tup)
Tim Peters2344fae2001-01-15 00:50:52 +0000198
Tim Petersc32d8242001-04-10 02:48:53 +0000199 if (l != 2) and (l != 3):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000200 raise PicklingError, "tuple returned by %s must contain " \
201 "only two or three elements" % reduce
202
203 callable = tup[0]
204 arg_tup = tup[1]
Tim Peters2344fae2001-01-15 00:50:52 +0000205
Tim Petersc32d8242001-04-10 02:48:53 +0000206 if l > 2:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000207 state = tup[2]
208 else:
209 state = None
210
Guido van Rossumd1f49841997-12-10 23:40:18 +0000211 if type(arg_tup) is not TupleType and arg_tup is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000212 raise PicklingError, "Second element of tuple returned " \
213 "by %s must be a tuple" % reduce
214
Tim Peters2344fae2001-01-15 00:50:52 +0000215 self.save_reduce(callable, arg_tup, state)
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000216 memo_len = len(memo)
217 self.write(self.put(memo_len))
218 memo[d] = (memo_len, object)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000219 return
220
221 f(self, object)
222
223 def persistent_id(self, object):
224 return None
225
226 def inst_persistent_id(self, object):
227 return None
228
229 def save_pers(self, pid):
Tim Petersc32d8242001-04-10 02:48:53 +0000230 if not self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000231 self.write(PERSID + str(pid) + '\n')
232 else:
233 self.save(pid, 1)
234 self.write(BINPERSID)
235
236 def save_reduce(self, callable, arg_tup, state = None):
237 write = self.write
238 save = self.save
239
240 save(callable)
241 save(arg_tup)
242 write(REDUCE)
Tim Peters2344fae2001-01-15 00:50:52 +0000243
Tim Petersc32d8242001-04-10 02:48:53 +0000244 if state is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000245 save(state)
246 write(BUILD)
247
248 dispatch = {}
249
250 def save_none(self, object):
251 self.write(NONE)
252 dispatch[NoneType] = save_none
253
254 def save_int(self, object):
Tim Petersc32d8242001-04-10 02:48:53 +0000255 if self.bin:
Tim Peters44714002001-04-10 05:02:52 +0000256 # If the int is small enough to fit in a signed 4-byte 2's-comp
257 # format, we can store it more efficiently than the general
258 # case.
259 high_bits = object >> 31 # note that Python shift sign-extends
260 if high_bits == 0 or high_bits == -1:
261 # All high bits are copies of bit 2**31, so the value
262 # fits in a 4-byte signed int.
263 i = mdumps(object)[1:]
264 assert len(i) == 4
265 if i[-2:] == '\000\000': # fits in 2-byte unsigned int
266 if i[-3] == '\000': # fits in 1-byte unsigned int
267 self.write(BININT1 + i[0])
268 else:
269 self.write(BININT2 + i[:2])
270 else:
271 self.write(BININT + i)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000272 return
Tim Peters44714002001-04-10 05:02:52 +0000273 # Text pickle, or int too big to fit in signed 4-byte format.
274 self.write(INT + `object` + '\n')
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000275 dispatch[IntType] = save_int
276
277 def save_long(self, object):
278 self.write(LONG + `object` + '\n')
279 dispatch[LongType] = save_long
280
Guido van Rossumd3703791998-10-22 20:15:36 +0000281 def save_float(self, object, pack=struct.pack):
282 if self.bin:
283 self.write(BINFLOAT + pack('>d', object))
284 else:
285 self.write(FLOAT + `object` + '\n')
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000286 dispatch[FloatType] = save_float
287
288 def save_string(self, object):
289 d = id(object)
290 memo = self.memo
291
Tim Petersc32d8242001-04-10 02:48:53 +0000292 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000293 l = len(object)
294 s = mdumps(l)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000295 if l < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000296 self.write(SHORT_BINSTRING + s[0] + object)
297 else:
298 self.write(BINSTRING + s + object)
299 else:
300 self.write(STRING + `object` + '\n')
301
302 memo_len = len(memo)
303 self.write(self.put(memo_len))
304 memo[d] = (memo_len, object)
305 dispatch[StringType] = save_string
306
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000307 def save_unicode(self, object):
308 d = id(object)
309 memo = self.memo
310
Tim Petersc32d8242001-04-10 02:48:53 +0000311 if self.bin:
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000312 encoding = object.encode('utf-8')
313 l = len(encoding)
314 s = mdumps(l)[1:]
315 self.write(BINUNICODE + s + encoding)
316 else:
Guido van Rossumdbb718f2001-09-21 19:22:34 +0000317 object = object.replace("\\", "\\u005c")
318 object = object.replace("\n", "\\u000a")
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000319 self.write(UNICODE + object.encode('raw-unicode-escape') + '\n')
320
321 memo_len = len(memo)
322 self.write(self.put(memo_len))
323 memo[d] = (memo_len, object)
324 dispatch[UnicodeType] = save_unicode
325
Guido van Rossum31584cb2001-01-22 14:53:29 +0000326 if StringType == UnicodeType:
327 # This is true for Jython
328 def save_string(self, object):
329 d = id(object)
330 memo = self.memo
331 unicode = object.isunicode()
332
Tim Petersc32d8242001-04-10 02:48:53 +0000333 if self.bin:
Guido van Rossum31584cb2001-01-22 14:53:29 +0000334 if unicode:
335 object = object.encode("utf-8")
336 l = len(object)
337 s = mdumps(l)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000338 if l < 256 and not unicode:
Guido van Rossum31584cb2001-01-22 14:53:29 +0000339 self.write(SHORT_BINSTRING + s[0] + object)
340 else:
341 if unicode:
342 self.write(BINUNICODE + s + object)
343 else:
344 self.write(BINSTRING + s + object)
345 else:
Tim Peters658cba62001-02-09 20:06:00 +0000346 if unicode:
Guido van Rossumdbb718f2001-09-21 19:22:34 +0000347 object = object.replace("\\", "\\u005c")
348 object = object.replace("\n", "\\u000a")
Guido van Rossum31584cb2001-01-22 14:53:29 +0000349 object = object.encode('raw-unicode-escape')
350 self.write(UNICODE + object + '\n')
351 else:
352 self.write(STRING + `object` + '\n')
353
354 memo_len = len(memo)
355 self.write(self.put(memo_len))
356 memo[d] = (memo_len, object)
357 dispatch[StringType] = save_string
Tim Peters658cba62001-02-09 20:06:00 +0000358
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000359 def save_tuple(self, object):
360
361 write = self.write
362 save = self.save
363 memo = self.memo
364
365 d = id(object)
366
367 write(MARK)
368
369 for element in object:
370 save(element)
371
Tim Petersc32d8242001-04-10 02:48:53 +0000372 if len(object) and memo.has_key(d):
373 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000374 write(POP_MARK + self.get(memo[d][0]))
375 return
Tim Peters2344fae2001-01-15 00:50:52 +0000376
Guido van Rossum599174f1998-03-31 16:30:28 +0000377 write(POP * (len(object) + 1) + self.get(memo[d][0]))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000378 return
379
380 memo_len = len(memo)
381 self.write(TUPLE + self.put(memo_len))
382 memo[d] = (memo_len, object)
383 dispatch[TupleType] = save_tuple
384
385 def save_empty_tuple(self, object):
386 self.write(EMPTY_TUPLE)
387
388 def save_list(self, object):
389 d = id(object)
390
391 write = self.write
392 save = self.save
393 memo = self.memo
394
Tim Petersc32d8242001-04-10 02:48:53 +0000395 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000396 write(EMPTY_LIST)
397 else:
398 write(MARK + LIST)
399
400 memo_len = len(memo)
401 write(self.put(memo_len))
402 memo[d] = (memo_len, object)
403
404 using_appends = (self.bin and (len(object) > 1))
405
Tim Petersc32d8242001-04-10 02:48:53 +0000406 if using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000407 write(MARK)
408
409 for element in object:
410 save(element)
Tim Peters2344fae2001-01-15 00:50:52 +0000411
Tim Petersc32d8242001-04-10 02:48:53 +0000412 if not using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000413 write(APPEND)
414
Tim Petersc32d8242001-04-10 02:48:53 +0000415 if using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000416 write(APPENDS)
417 dispatch[ListType] = save_list
418
419 def save_dict(self, object):
420 d = id(object)
421
422 write = self.write
423 save = self.save
424 memo = self.memo
425
Tim Petersc32d8242001-04-10 02:48:53 +0000426 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000427 write(EMPTY_DICT)
428 else:
429 write(MARK + DICT)
430
431 memo_len = len(memo)
432 self.write(self.put(memo_len))
433 memo[d] = (memo_len, object)
434
435 using_setitems = (self.bin and (len(object) > 1))
436
Tim Petersc32d8242001-04-10 02:48:53 +0000437 if using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000438 write(MARK)
439
440 items = object.items()
441 for key, value in items:
442 save(key)
443 save(value)
444
Tim Petersc32d8242001-04-10 02:48:53 +0000445 if not using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000446 write(SETITEM)
447
Tim Petersc32d8242001-04-10 02:48:53 +0000448 if using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000449 write(SETITEMS)
450
451 dispatch[DictionaryType] = save_dict
Jeremy Hylton2b9d0291998-05-27 22:38:22 +0000452 if not PyStringMap is None:
453 dispatch[PyStringMap] = save_dict
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000454
455 def save_inst(self, object):
456 d = id(object)
457 cls = object.__class__
458
459 memo = self.memo
460 write = self.write
461 save = self.save
462
463 if hasattr(object, '__getinitargs__'):
464 args = object.__getinitargs__()
465 len(args) # XXX Assert it's a sequence
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000466 _keep_alive(args, memo)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000467 else:
468 args = ()
469
470 write(MARK)
471
Tim Petersc32d8242001-04-10 02:48:53 +0000472 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000473 save(cls)
474
475 for arg in args:
476 save(arg)
477
478 memo_len = len(memo)
Tim Petersc32d8242001-04-10 02:48:53 +0000479 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000480 write(OBJ + self.put(memo_len))
481 else:
Guido van Rossum4fb5b281997-09-12 20:07:24 +0000482 write(INST + cls.__module__ + '\n' + cls.__name__ + '\n' +
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000483 self.put(memo_len))
484
485 memo[d] = (memo_len, object)
486
487 try:
488 getstate = object.__getstate__
489 except AttributeError:
490 stuff = object.__dict__
491 else:
492 stuff = getstate()
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000493 _keep_alive(stuff, memo)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000494 save(stuff)
495 write(BUILD)
496 dispatch[InstanceType] = save_inst
497
498 def save_global(self, object, name = None):
499 write = self.write
500 memo = self.memo
501
Tim Petersc32d8242001-04-10 02:48:53 +0000502 if name is None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000503 name = object.__name__
504
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000505 try:
506 module = object.__module__
507 except AttributeError:
508 module = whichmodule(object, name)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000509
Guido van Rossumb0a98e92001-08-17 18:49:52 +0000510 try:
511 __import__(module)
512 mod = sys.modules[module]
513 klass = getattr(mod, name)
514 except (ImportError, KeyError, AttributeError):
515 raise PicklingError(
516 "Can't pickle %r: it's not found as %s.%s" %
517 (object, module, name))
518 else:
519 if klass is not object:
520 raise PicklingError(
521 "Can't pickle %r: it's not the same object as %s.%s" %
522 (object, module, name))
523
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000524 memo_len = len(memo)
525 write(GLOBAL + module + '\n' + name + '\n' +
526 self.put(memo_len))
527 memo[id(object)] = (memo_len, object)
528 dispatch[ClassType] = save_global
529 dispatch[FunctionType] = save_global
530 dispatch[BuiltinFunctionType] = save_global
Tim Peters6d6c1a32001-08-02 04:15:00 +0000531 dispatch[TypeType] = save_global
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000532
Guido van Rossuma48061a1995-01-10 00:31:14 +0000533
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000534def _keep_alive(x, memo):
535 """Keeps a reference to the object x in the memo.
536
537 Because we remember objects by their id, we have
538 to assure that possibly temporary objects are kept
539 alive by referencing them.
540 We store a reference at the id of the memo, which should
541 normally not be used unless someone tries to deepcopy
542 the memo itself...
543 """
544 try:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000545 memo[id(memo)].append(x)
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000546 except KeyError:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000547 # aha, this is the first one :-)
548 memo[id(memo)]=[x]
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000549
550
Guido van Rossuma48061a1995-01-10 00:31:14 +0000551classmap = {}
552
Guido van Rossum4fb5b281997-09-12 20:07:24 +0000553# This is no longer used to find classes, but still for functions
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000554def whichmodule(cls, clsname):
555 """Figure out the module in which a class occurs.
Guido van Rossuma48061a1995-01-10 00:31:14 +0000556
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000557 Search sys.modules for the module.
558 Cache in classmap.
559 Return a module name.
560 If the class cannot be found, return __main__.
561 """
562 if classmap.has_key(cls):
563 return classmap[cls]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000564
565 for name, module in sys.modules.items():
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000566 if name != '__main__' and \
567 hasattr(module, clsname) and \
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000568 getattr(module, clsname) is cls:
569 break
570 else:
571 name = '__main__'
572 classmap[cls] = name
573 return name
Guido van Rossuma48061a1995-01-10 00:31:14 +0000574
575
576class Unpickler:
577
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000578 def __init__(self, file):
579 self.readline = file.readline
580 self.read = file.read
581 self.memo = {}
Guido van Rossuma48061a1995-01-10 00:31:14 +0000582
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000583 def load(self):
Jeremy Hylton20747fa2001-11-09 16:15:04 +0000584 self.mark = object() # any new unique object
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000585 self.stack = []
586 self.append = self.stack.append
587 read = self.read
588 dispatch = self.dispatch
589 try:
590 while 1:
591 key = read(1)
592 dispatch[key](self)
Guido van Rossumff871742000-12-13 18:11:56 +0000593 except _Stop, stopinst:
594 return stopinst.value
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000595
596 def marker(self):
597 stack = self.stack
598 mark = self.mark
599 k = len(stack)-1
600 while stack[k] is not mark: k = k-1
601 return k
602
603 dispatch = {}
604
605 def load_eof(self):
606 raise EOFError
607 dispatch[''] = load_eof
608
609 def load_persid(self):
610 pid = self.readline()[:-1]
611 self.append(self.persistent_load(pid))
612 dispatch[PERSID] = load_persid
613
614 def load_binpersid(self):
615 stack = self.stack
Tim Peters2344fae2001-01-15 00:50:52 +0000616
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000617 pid = stack[-1]
618 del stack[-1]
619
620 self.append(self.persistent_load(pid))
621 dispatch[BINPERSID] = load_binpersid
622
623 def load_none(self):
624 self.append(None)
625 dispatch[NONE] = load_none
626
627 def load_int(self):
Tim Peters19ef62d2001-08-28 22:21:18 +0000628 data = self.readline()
629 try:
630 self.append(int(data))
631 except ValueError:
632 self.append(long(data))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000633 dispatch[INT] = load_int
634
635 def load_binint(self):
636 self.append(mloads('i' + self.read(4)))
637 dispatch[BININT] = load_binint
638
639 def load_binint1(self):
640 self.append(mloads('i' + self.read(1) + '\000\000\000'))
641 dispatch[BININT1] = load_binint1
642
643 def load_binint2(self):
644 self.append(mloads('i' + self.read(2) + '\000\000'))
645 dispatch[BININT2] = load_binint2
Tim Peters2344fae2001-01-15 00:50:52 +0000646
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000647 def load_long(self):
Guido van Rossumff871742000-12-13 18:11:56 +0000648 self.append(long(self.readline()[:-1], 0))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000649 dispatch[LONG] = load_long
650
651 def load_float(self):
Guido van Rossumff871742000-12-13 18:11:56 +0000652 self.append(float(self.readline()[:-1]))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000653 dispatch[FLOAT] = load_float
654
Guido van Rossumd3703791998-10-22 20:15:36 +0000655 def load_binfloat(self, unpack=struct.unpack):
656 self.append(unpack('>d', self.read(8))[0])
657 dispatch[BINFLOAT] = load_binfloat
658
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000659 def load_string(self):
Jeremy Hyltonbe467e52000-09-15 15:14:51 +0000660 rep = self.readline()[:-1]
661 if not self._is_string_secure(rep):
662 raise ValueError, "insecure string pickle"
663 self.append(eval(rep,
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000664 {'__builtins__': {}})) # Let's be careful
665 dispatch[STRING] = load_string
666
Jeremy Hyltonbe467e52000-09-15 15:14:51 +0000667 def _is_string_secure(self, s):
668 """Return true if s contains a string that is safe to eval
669
670 The definition of secure string is based on the implementation
671 in cPickle. s is secure as long as it only contains a quoted
672 string and optional trailing whitespace.
673 """
674 q = s[0]
675 if q not in ("'", '"'):
676 return 0
677 # find the closing quote
678 offset = 1
679 i = None
680 while 1:
681 try:
682 i = s.index(q, offset)
683 except ValueError:
684 # if there is an error the first time, there is no
685 # close quote
686 if offset == 1:
687 return 0
688 if s[i-1] != '\\':
689 break
690 # check to see if this one is escaped
691 nslash = 0
692 j = i - 1
693 while j >= offset and s[j] == '\\':
694 j = j - 1
695 nslash = nslash + 1
696 if nslash % 2 == 0:
697 break
698 offset = i + 1
699 for c in s[i+1:]:
700 if ord(c) > 32:
701 return 0
702 return 1
703
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000704 def load_binstring(self):
705 len = mloads('i' + self.read(4))
706 self.append(self.read(len))
707 dispatch[BINSTRING] = load_binstring
708
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000709 def load_unicode(self):
710 self.append(unicode(self.readline()[:-1],'raw-unicode-escape'))
711 dispatch[UNICODE] = load_unicode
712
713 def load_binunicode(self):
714 len = mloads('i' + self.read(4))
715 self.append(unicode(self.read(len),'utf-8'))
716 dispatch[BINUNICODE] = load_binunicode
717
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000718 def load_short_binstring(self):
719 len = mloads('i' + self.read(1) + '\000\000\000')
720 self.append(self.read(len))
721 dispatch[SHORT_BINSTRING] = load_short_binstring
722
723 def load_tuple(self):
724 k = self.marker()
725 self.stack[k:] = [tuple(self.stack[k+1:])]
726 dispatch[TUPLE] = load_tuple
727
728 def load_empty_tuple(self):
729 self.stack.append(())
730 dispatch[EMPTY_TUPLE] = load_empty_tuple
731
732 def load_empty_list(self):
733 self.stack.append([])
734 dispatch[EMPTY_LIST] = load_empty_list
735
736 def load_empty_dictionary(self):
737 self.stack.append({})
738 dispatch[EMPTY_DICT] = load_empty_dictionary
739
740 def load_list(self):
741 k = self.marker()
742 self.stack[k:] = [self.stack[k+1:]]
743 dispatch[LIST] = load_list
744
745 def load_dict(self):
746 k = self.marker()
747 d = {}
748 items = self.stack[k+1:]
749 for i in range(0, len(items), 2):
750 key = items[i]
751 value = items[i+1]
752 d[key] = value
753 self.stack[k:] = [d]
754 dispatch[DICT] = load_dict
755
756 def load_inst(self):
757 k = self.marker()
758 args = tuple(self.stack[k+1:])
759 del self.stack[k:]
760 module = self.readline()[:-1]
761 name = self.readline()[:-1]
762 klass = self.find_class(module, name)
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000763 instantiated = 0
764 if (not args and type(klass) is ClassType and
765 not hasattr(klass, "__getinitargs__")):
766 try:
767 value = _EmptyClass()
768 value.__class__ = klass
Guido van Rossumb19e2a31998-04-13 18:08:45 +0000769 instantiated = 1
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000770 except RuntimeError:
771 # In restricted execution, assignment to inst.__class__ is
772 # prohibited
773 pass
774 if not instantiated:
Guido van Rossum743d17e1998-09-15 20:25:57 +0000775 try:
Barry Warsawbf4d9592001-11-15 23:42:58 +0000776 if not hasattr(klass, '__safe_for_unpickling__'):
777 raise UnpicklingError('%s is not safe for unpickling' %
778 klass)
Guido van Rossum743d17e1998-09-15 20:25:57 +0000779 value = apply(klass, args)
780 except TypeError, err:
781 raise TypeError, "in constructor for %s: %s" % (
782 klass.__name__, str(err)), sys.exc_info()[2]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000783 self.append(value)
784 dispatch[INST] = load_inst
785
786 def load_obj(self):
787 stack = self.stack
788 k = self.marker()
789 klass = stack[k + 1]
790 del stack[k + 1]
Tim Peters2344fae2001-01-15 00:50:52 +0000791 args = tuple(stack[k + 1:])
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000792 del stack[k:]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000793 instantiated = 0
794 if (not args and type(klass) is ClassType and
795 not hasattr(klass, "__getinitargs__")):
796 try:
797 value = _EmptyClass()
798 value.__class__ = klass
799 instantiated = 1
800 except RuntimeError:
801 # In restricted execution, assignment to inst.__class__ is
802 # prohibited
803 pass
804 if not instantiated:
805 value = apply(klass, args)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000806 self.append(value)
Tim Peters2344fae2001-01-15 00:50:52 +0000807 dispatch[OBJ] = load_obj
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000808
809 def load_global(self):
810 module = self.readline()[:-1]
811 name = self.readline()[:-1]
812 klass = self.find_class(module, name)
813 self.append(klass)
814 dispatch[GLOBAL] = load_global
815
816 def find_class(self, module, name):
Barry Warsawbf4d9592001-11-15 23:42:58 +0000817 __import__(module)
818 mod = sys.modules[module]
819 klass = getattr(mod, name)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000820 return klass
821
822 def load_reduce(self):
823 stack = self.stack
824
825 callable = stack[-2]
826 arg_tup = stack[-1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000827 del stack[-2:]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000828
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000829 if type(callable) is not ClassType:
830 if not safe_constructors.has_key(callable):
831 try:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000832 safe = callable.__safe_for_unpickling__
833 except AttributeError:
834 safe = None
Guido van Rossuma48061a1995-01-10 00:31:14 +0000835
Tim Petersc32d8242001-04-10 02:48:53 +0000836 if not safe:
Tim Peters2344fae2001-01-15 00:50:52 +0000837 raise UnpicklingError, "%s is not safe for " \
838 "unpickling" % callable
Guido van Rossuma48061a1995-01-10 00:31:14 +0000839
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000840 if arg_tup is None:
841 value = callable.__basicnew__()
842 else:
843 value = apply(callable, arg_tup)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000844 self.append(value)
845 dispatch[REDUCE] = load_reduce
Guido van Rossuma48061a1995-01-10 00:31:14 +0000846
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000847 def load_pop(self):
848 del self.stack[-1]
849 dispatch[POP] = load_pop
Guido van Rossum7b5430f1995-03-04 22:25:21 +0000850
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000851 def load_pop_mark(self):
852 k = self.marker()
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000853 del self.stack[k:]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000854 dispatch[POP_MARK] = load_pop_mark
Guido van Rossuma48061a1995-01-10 00:31:14 +0000855
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000856 def load_dup(self):
Guido van Rossumb1062fc1998-03-31 17:00:46 +0000857 self.append(self.stack[-1])
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000858 dispatch[DUP] = load_dup
Guido van Rossuma48061a1995-01-10 00:31:14 +0000859
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000860 def load_get(self):
861 self.append(self.memo[self.readline()[:-1]])
862 dispatch[GET] = load_get
Guido van Rossum78536471996-04-12 13:36:27 +0000863
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000864 def load_binget(self):
865 i = mloads('i' + self.read(1) + '\000\000\000')
866 self.append(self.memo[`i`])
867 dispatch[BINGET] = load_binget
Guido van Rossum78536471996-04-12 13:36:27 +0000868
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000869 def load_long_binget(self):
870 i = mloads('i' + self.read(4))
871 self.append(self.memo[`i`])
872 dispatch[LONG_BINGET] = load_long_binget
Guido van Rossum78536471996-04-12 13:36:27 +0000873
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000874 def load_put(self):
875 self.memo[self.readline()[:-1]] = self.stack[-1]
876 dispatch[PUT] = load_put
Guido van Rossuma48061a1995-01-10 00:31:14 +0000877
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000878 def load_binput(self):
879 i = mloads('i' + self.read(1) + '\000\000\000')
880 self.memo[`i`] = self.stack[-1]
881 dispatch[BINPUT] = load_binput
Guido van Rossuma48061a1995-01-10 00:31:14 +0000882
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000883 def load_long_binput(self):
884 i = mloads('i' + self.read(4))
885 self.memo[`i`] = self.stack[-1]
886 dispatch[LONG_BINPUT] = load_long_binput
Guido van Rossuma48061a1995-01-10 00:31:14 +0000887
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000888 def load_append(self):
889 stack = self.stack
890 value = stack[-1]
891 del stack[-1]
892 list = stack[-1]
893 list.append(value)
894 dispatch[APPEND] = load_append
Guido van Rossuma48061a1995-01-10 00:31:14 +0000895
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000896 def load_appends(self):
897 stack = self.stack
898 mark = self.marker()
899 list = stack[mark - 1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000900 for i in range(mark + 1, len(stack)):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000901 list.append(stack[i])
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000902
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000903 del stack[mark:]
904 dispatch[APPENDS] = load_appends
Tim Peters2344fae2001-01-15 00:50:52 +0000905
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000906 def load_setitem(self):
907 stack = self.stack
908 value = stack[-1]
909 key = stack[-2]
910 del stack[-2:]
911 dict = stack[-1]
912 dict[key] = value
913 dispatch[SETITEM] = load_setitem
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000914
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000915 def load_setitems(self):
916 stack = self.stack
917 mark = self.marker()
918 dict = stack[mark - 1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000919 for i in range(mark + 1, len(stack), 2):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000920 dict[stack[i]] = stack[i + 1]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000921
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000922 del stack[mark:]
923 dispatch[SETITEMS] = load_setitems
Guido van Rossuma48061a1995-01-10 00:31:14 +0000924
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000925 def load_build(self):
926 stack = self.stack
927 value = stack[-1]
928 del stack[-1]
929 inst = stack[-1]
930 try:
931 setstate = inst.__setstate__
932 except AttributeError:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000933 try:
934 inst.__dict__.update(value)
935 except RuntimeError:
936 # XXX In restricted execution, the instance's __dict__ is not
937 # accessible. Use the old way of unpickling the instance
938 # variables. This is a semantic different when unpickling in
939 # restricted vs. unrestricted modes.
940 for k, v in value.items():
941 setattr(inst, k, v)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000942 else:
943 setstate(value)
944 dispatch[BUILD] = load_build
Guido van Rossuma48061a1995-01-10 00:31:14 +0000945
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000946 def load_mark(self):
947 self.append(self.mark)
948 dispatch[MARK] = load_mark
Guido van Rossuma48061a1995-01-10 00:31:14 +0000949
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000950 def load_stop(self):
951 value = self.stack[-1]
952 del self.stack[-1]
Guido van Rossumff871742000-12-13 18:11:56 +0000953 raise _Stop(value)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000954 dispatch[STOP] = load_stop
Guido van Rossuma48061a1995-01-10 00:31:14 +0000955
Guido van Rossume467be61997-12-05 19:42:42 +0000956# Helper class for load_inst/load_obj
957
958class _EmptyClass:
959 pass
Guido van Rossuma48061a1995-01-10 00:31:14 +0000960
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000961# Shorthands
962
Jeremy Hyltonabe2c622001-10-15 21:29:28 +0000963try:
964 from cStringIO import StringIO
965except ImportError:
966 from StringIO import StringIO
Guido van Rossumc7c5e691996-07-22 22:26:07 +0000967
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000968def dump(object, file, bin = 0):
969 Pickler(file, bin).dump(object)
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000970
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000971def dumps(object, bin = 0):
972 file = StringIO()
973 Pickler(file, bin).dump(object)
974 return file.getvalue()
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000975
976def load(file):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000977 return Unpickler(file).load()
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000978
979def loads(str):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000980 file = StringIO(str)
981 return Unpickler(file).load()