blob: 7e8e6656683ef10f73e1b14446ff3c5e33b0c662 [file] [log] [blame]
Guido van Rossum54f22ed2000-02-04 15:10:34 +00001"""Create portable serialized representations of Python objects.
Guido van Rossuma48061a1995-01-10 00:31:14 +00002
Guido van Rossume467be61997-12-05 19:42:42 +00003See module cPickle for a (much) faster implementation.
4See module copy_reg for a mechanism for registering custom picklers.
Guido van Rossuma48061a1995-01-10 00:31:14 +00005
Guido van Rossume467be61997-12-05 19:42:42 +00006Classes:
Guido van Rossuma48061a1995-01-10 00:31:14 +00007
Guido van Rossume467be61997-12-05 19:42:42 +00008 Pickler
9 Unpickler
Guido van Rossuma48061a1995-01-10 00:31:14 +000010
Guido van Rossume467be61997-12-05 19:42:42 +000011Functions:
Guido van Rossuma48061a1995-01-10 00:31:14 +000012
Guido van Rossume467be61997-12-05 19:42:42 +000013 dump(object, file)
14 dumps(object) -> string
15 load(file) -> object
16 loads(string) -> object
Guido van Rossuma48061a1995-01-10 00:31:14 +000017
Guido van Rossume467be61997-12-05 19:42:42 +000018Misc variables:
Guido van Rossuma48061a1995-01-10 00:31:14 +000019
Fred Drakefe82acc1998-02-13 03:24:48 +000020 __version__
Guido van Rossume467be61997-12-05 19:42:42 +000021 format_version
22 compatible_formats
Guido van Rossuma48061a1995-01-10 00:31:14 +000023
Guido van Rossuma48061a1995-01-10 00:31:14 +000024"""
25
Guido van Rossum743d17e1998-09-15 20:25:57 +000026__version__ = "$Revision$" # Code version
Guido van Rossuma48061a1995-01-10 00:31:14 +000027
28from types import *
Guido van Rossum4fb5b281997-09-12 20:07:24 +000029from copy_reg import dispatch_table, safe_constructors
Guido van Rossumd3703791998-10-22 20:15:36 +000030import marshal
31import sys
32import struct
Skip Montanaro23bafc62001-02-18 03:10:09 +000033import re
Guido van Rossuma48061a1995-01-10 00:31:14 +000034
Skip Montanaro352674d2001-02-07 23:14:30 +000035__all__ = ["PickleError", "PicklingError", "UnpicklingError", "Pickler",
36 "Unpickler", "dump", "dumps", "load", "loads"]
37
Guido van Rossumd3703791998-10-22 20:15:36 +000038format_version = "1.3" # File format version we write
39compatible_formats = ["1.0", "1.1", "1.2"] # Old format versions we can read
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000040
41mdumps = marshal.dumps
42mloads = marshal.loads
Guido van Rossum0c891ce1995-03-14 15:09:05 +000043
Guido van Rossum26e89d02000-06-29 16:15:52 +000044class PickleError(Exception): pass
45class PicklingError(PickleError): pass
46class UnpicklingError(PickleError): pass
Guido van Rossum7849da81995-03-09 14:08:35 +000047
Guido van Rossumff871742000-12-13 18:11:56 +000048class _Stop(Exception):
49 def __init__(self, value):
50 self.value = value
51
Jeremy Hylton2b9d0291998-05-27 22:38:22 +000052try:
53 from org.python.core import PyStringMap
54except ImportError:
55 PyStringMap = None
56
Guido van Rossumdbb718f2001-09-21 19:22:34 +000057try:
58 UnicodeType
59except NameError:
60 UnicodeType = None
61
62
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000063MARK = '('
64STOP = '.'
65POP = '0'
66POP_MARK = '1'
67DUP = '2'
68FLOAT = 'F'
69INT = 'I'
70BININT = 'J'
71BININT1 = 'K'
72LONG = 'L'
73BININT2 = 'M'
74NONE = 'N'
75PERSID = 'P'
76BINPERSID = 'Q'
77REDUCE = 'R'
78STRING = 'S'
79BINSTRING = 'T'
80SHORT_BINSTRING = 'U'
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +000081UNICODE = 'V'
82BINUNICODE = 'X'
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000083APPEND = 'a'
84BUILD = 'b'
85GLOBAL = 'c'
86DICT = 'd'
87EMPTY_DICT = '}'
88APPENDS = 'e'
89GET = 'g'
90BINGET = 'h'
91INST = 'i'
92LONG_BINGET = 'j'
93LIST = 'l'
94EMPTY_LIST = ']'
95OBJ = 'o'
96PUT = 'p'
97BINPUT = 'q'
98LONG_BINPUT = 'r'
99SETITEM = 's'
100TUPLE = 't'
101EMPTY_TUPLE = ')'
102SETITEMS = 'u'
Guido van Rossumd3703791998-10-22 20:15:36 +0000103BINFLOAT = 'G'
Guido van Rossuma48061a1995-01-10 00:31:14 +0000104
Skip Montanaro23bafc62001-02-18 03:10:09 +0000105__all__.extend([x for x in dir() if re.match("[A-Z][A-Z0-9_]+$",x)])
Neal Norwitzd5ba4ae2002-02-11 18:12:06 +0000106del x
Skip Montanaro23bafc62001-02-18 03:10:09 +0000107
Guido van Rossuma48061a1995-01-10 00:31:14 +0000108class Pickler:
109
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000110 def __init__(self, file, bin = 0):
111 self.write = file.write
112 self.memo = {}
113 self.bin = bin
Guido van Rossuma48061a1995-01-10 00:31:14 +0000114
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000115 def dump(self, object):
116 self.save(object)
117 self.write(STOP)
Guido van Rossuma48061a1995-01-10 00:31:14 +0000118
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000119 def put(self, i):
Tim Petersc32d8242001-04-10 02:48:53 +0000120 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000121 s = mdumps(i)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000122 if i < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000123 return BINPUT + s[0]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000124
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000125 return LONG_BINPUT + s
Guido van Rossuma48061a1995-01-10 00:31:14 +0000126
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000127 return PUT + `i` + '\n'
Guido van Rossuma48061a1995-01-10 00:31:14 +0000128
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000129 def get(self, i):
Tim Petersc32d8242001-04-10 02:48:53 +0000130 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000131 s = mdumps(i)[1:]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000132
Tim Petersc32d8242001-04-10 02:48:53 +0000133 if i < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000134 return BINGET + s[0]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000135
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000136 return LONG_BINGET + s
Guido van Rossuma48061a1995-01-10 00:31:14 +0000137
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000138 return GET + `i` + '\n'
Tim Peters2344fae2001-01-15 00:50:52 +0000139
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000140 def save(self, object, pers_save = 0):
141 memo = self.memo
Guido van Rossuma48061a1995-01-10 00:31:14 +0000142
Tim Petersc32d8242001-04-10 02:48:53 +0000143 if not pers_save:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000144 pid = self.persistent_id(object)
Tim Petersc32d8242001-04-10 02:48:53 +0000145 if pid is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000146 self.save_pers(pid)
147 return
Guido van Rossuma48061a1995-01-10 00:31:14 +0000148
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000149 d = id(object)
Tim Peters2344fae2001-01-15 00:50:52 +0000150
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000151 t = type(object)
Guido van Rossuma48061a1995-01-10 00:31:14 +0000152
Tim Petersc32d8242001-04-10 02:48:53 +0000153 if (t is TupleType) and (len(object) == 0):
154 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000155 self.save_empty_tuple(object)
156 else:
157 self.save_tuple(object)
158 return
Guido van Rossuma48061a1995-01-10 00:31:14 +0000159
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000160 if memo.has_key(d):
161 self.write(self.get(memo[d][0]))
162 return
163
164 try:
165 f = self.dispatch[t]
166 except KeyError:
Guido van Rossumf048a8f2001-12-19 16:55:02 +0000167 if issubclass(t, TypeType):
168 self.save_global(object)
169 return
170
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000171 pid = self.inst_persistent_id(object)
172 if pid is not None:
173 self.save_pers(pid)
174 return
175
176 try:
177 reduce = dispatch_table[t]
178 except KeyError:
179 try:
180 reduce = object.__reduce__
181 except AttributeError:
182 raise PicklingError, \
Guido van Rossum08a92cb1999-10-10 21:14:25 +0000183 "can't pickle %s object: %s" % (`t.__name__`,
184 `object`)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000185 else:
186 tup = reduce()
187 else:
188 tup = reduce(object)
189
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000190 if type(tup) is StringType:
191 self.save_global(object, tup)
192 return
Guido van Rossumd1f49841997-12-10 23:40:18 +0000193
Tim Petersc32d8242001-04-10 02:48:53 +0000194 if type(tup) is not TupleType:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000195 raise PicklingError, "Value returned by %s must be a " \
196 "tuple" % reduce
197
198 l = len(tup)
Tim Peters2344fae2001-01-15 00:50:52 +0000199
Tim Petersc32d8242001-04-10 02:48:53 +0000200 if (l != 2) and (l != 3):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000201 raise PicklingError, "tuple returned by %s must contain " \
202 "only two or three elements" % reduce
203
204 callable = tup[0]
205 arg_tup = tup[1]
Tim Peters2344fae2001-01-15 00:50:52 +0000206
Tim Petersc32d8242001-04-10 02:48:53 +0000207 if l > 2:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000208 state = tup[2]
209 else:
210 state = None
211
Guido van Rossumd1f49841997-12-10 23:40:18 +0000212 if type(arg_tup) is not TupleType and arg_tup is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000213 raise PicklingError, "Second element of tuple returned " \
214 "by %s must be a tuple" % reduce
215
Tim Peters2344fae2001-01-15 00:50:52 +0000216 self.save_reduce(callable, arg_tup, state)
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000217 memo_len = len(memo)
218 self.write(self.put(memo_len))
219 memo[d] = (memo_len, object)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000220 return
221
222 f(self, object)
223
224 def persistent_id(self, object):
225 return None
226
227 def inst_persistent_id(self, object):
228 return None
229
230 def save_pers(self, pid):
Tim Petersc32d8242001-04-10 02:48:53 +0000231 if not self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000232 self.write(PERSID + str(pid) + '\n')
233 else:
234 self.save(pid, 1)
235 self.write(BINPERSID)
236
237 def save_reduce(self, callable, arg_tup, state = None):
238 write = self.write
239 save = self.save
240
241 save(callable)
242 save(arg_tup)
243 write(REDUCE)
Tim Peters2344fae2001-01-15 00:50:52 +0000244
Tim Petersc32d8242001-04-10 02:48:53 +0000245 if state is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000246 save(state)
247 write(BUILD)
248
249 dispatch = {}
250
251 def save_none(self, object):
252 self.write(NONE)
253 dispatch[NoneType] = save_none
254
255 def save_int(self, object):
Tim Petersc32d8242001-04-10 02:48:53 +0000256 if self.bin:
Tim Peters44714002001-04-10 05:02:52 +0000257 # If the int is small enough to fit in a signed 4-byte 2's-comp
258 # format, we can store it more efficiently than the general
259 # case.
260 high_bits = object >> 31 # note that Python shift sign-extends
261 if high_bits == 0 or high_bits == -1:
262 # All high bits are copies of bit 2**31, so the value
263 # fits in a 4-byte signed int.
264 i = mdumps(object)[1:]
265 assert len(i) == 4
266 if i[-2:] == '\000\000': # fits in 2-byte unsigned int
267 if i[-3] == '\000': # fits in 1-byte unsigned int
268 self.write(BININT1 + i[0])
269 else:
270 self.write(BININT2 + i[:2])
271 else:
272 self.write(BININT + i)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000273 return
Tim Peters44714002001-04-10 05:02:52 +0000274 # Text pickle, or int too big to fit in signed 4-byte format.
275 self.write(INT + `object` + '\n')
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000276 dispatch[IntType] = save_int
277
278 def save_long(self, object):
279 self.write(LONG + `object` + '\n')
280 dispatch[LongType] = save_long
281
Guido van Rossumd3703791998-10-22 20:15:36 +0000282 def save_float(self, object, pack=struct.pack):
283 if self.bin:
284 self.write(BINFLOAT + pack('>d', object))
285 else:
286 self.write(FLOAT + `object` + '\n')
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000287 dispatch[FloatType] = save_float
288
289 def save_string(self, object):
290 d = id(object)
291 memo = self.memo
292
Tim Petersc32d8242001-04-10 02:48:53 +0000293 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000294 l = len(object)
295 s = mdumps(l)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000296 if l < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000297 self.write(SHORT_BINSTRING + s[0] + object)
298 else:
299 self.write(BINSTRING + s + object)
300 else:
301 self.write(STRING + `object` + '\n')
302
303 memo_len = len(memo)
304 self.write(self.put(memo_len))
305 memo[d] = (memo_len, object)
306 dispatch[StringType] = save_string
307
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000308 def save_unicode(self, object):
309 d = id(object)
310 memo = self.memo
311
Tim Petersc32d8242001-04-10 02:48:53 +0000312 if self.bin:
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000313 encoding = object.encode('utf-8')
314 l = len(encoding)
315 s = mdumps(l)[1:]
316 self.write(BINUNICODE + s + encoding)
317 else:
Guido van Rossumdbb718f2001-09-21 19:22:34 +0000318 object = object.replace("\\", "\\u005c")
319 object = object.replace("\n", "\\u000a")
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000320 self.write(UNICODE + object.encode('raw-unicode-escape') + '\n')
321
322 memo_len = len(memo)
323 self.write(self.put(memo_len))
324 memo[d] = (memo_len, object)
325 dispatch[UnicodeType] = save_unicode
326
Guido van Rossum31584cb2001-01-22 14:53:29 +0000327 if StringType == UnicodeType:
328 # This is true for Jython
329 def save_string(self, object):
330 d = id(object)
331 memo = self.memo
332 unicode = object.isunicode()
333
Tim Petersc32d8242001-04-10 02:48:53 +0000334 if self.bin:
Guido van Rossum31584cb2001-01-22 14:53:29 +0000335 if unicode:
336 object = object.encode("utf-8")
337 l = len(object)
338 s = mdumps(l)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000339 if l < 256 and not unicode:
Guido van Rossum31584cb2001-01-22 14:53:29 +0000340 self.write(SHORT_BINSTRING + s[0] + object)
341 else:
342 if unicode:
343 self.write(BINUNICODE + s + object)
344 else:
345 self.write(BINSTRING + s + object)
346 else:
Tim Peters658cba62001-02-09 20:06:00 +0000347 if unicode:
Guido van Rossumdbb718f2001-09-21 19:22:34 +0000348 object = object.replace("\\", "\\u005c")
349 object = object.replace("\n", "\\u000a")
Guido van Rossum31584cb2001-01-22 14:53:29 +0000350 object = object.encode('raw-unicode-escape')
351 self.write(UNICODE + object + '\n')
352 else:
353 self.write(STRING + `object` + '\n')
354
355 memo_len = len(memo)
356 self.write(self.put(memo_len))
357 memo[d] = (memo_len, object)
358 dispatch[StringType] = save_string
Tim Peters658cba62001-02-09 20:06:00 +0000359
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000360 def save_tuple(self, object):
361
362 write = self.write
363 save = self.save
364 memo = self.memo
365
366 d = id(object)
367
368 write(MARK)
369
370 for element in object:
371 save(element)
372
Tim Petersc32d8242001-04-10 02:48:53 +0000373 if len(object) and memo.has_key(d):
374 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000375 write(POP_MARK + self.get(memo[d][0]))
376 return
Tim Peters2344fae2001-01-15 00:50:52 +0000377
Guido van Rossum599174f1998-03-31 16:30:28 +0000378 write(POP * (len(object) + 1) + self.get(memo[d][0]))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000379 return
380
381 memo_len = len(memo)
382 self.write(TUPLE + self.put(memo_len))
383 memo[d] = (memo_len, object)
384 dispatch[TupleType] = save_tuple
385
386 def save_empty_tuple(self, object):
387 self.write(EMPTY_TUPLE)
388
389 def save_list(self, object):
390 d = id(object)
391
392 write = self.write
393 save = self.save
394 memo = self.memo
395
Tim Petersc32d8242001-04-10 02:48:53 +0000396 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000397 write(EMPTY_LIST)
398 else:
399 write(MARK + LIST)
400
401 memo_len = len(memo)
402 write(self.put(memo_len))
403 memo[d] = (memo_len, object)
404
405 using_appends = (self.bin and (len(object) > 1))
406
Tim Petersc32d8242001-04-10 02:48:53 +0000407 if using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000408 write(MARK)
409
410 for element in object:
411 save(element)
Tim Peters2344fae2001-01-15 00:50:52 +0000412
Tim Petersc32d8242001-04-10 02:48:53 +0000413 if not using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000414 write(APPEND)
415
Tim Petersc32d8242001-04-10 02:48:53 +0000416 if using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000417 write(APPENDS)
418 dispatch[ListType] = save_list
419
420 def save_dict(self, object):
421 d = id(object)
422
423 write = self.write
424 save = self.save
425 memo = self.memo
426
Tim Petersc32d8242001-04-10 02:48:53 +0000427 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000428 write(EMPTY_DICT)
429 else:
430 write(MARK + DICT)
431
432 memo_len = len(memo)
433 self.write(self.put(memo_len))
434 memo[d] = (memo_len, object)
435
436 using_setitems = (self.bin and (len(object) > 1))
437
Tim Petersc32d8242001-04-10 02:48:53 +0000438 if using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000439 write(MARK)
440
441 items = object.items()
442 for key, value in items:
443 save(key)
444 save(value)
445
Tim Petersc32d8242001-04-10 02:48:53 +0000446 if not using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000447 write(SETITEM)
448
Tim Petersc32d8242001-04-10 02:48:53 +0000449 if using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000450 write(SETITEMS)
451
452 dispatch[DictionaryType] = save_dict
Jeremy Hylton2b9d0291998-05-27 22:38:22 +0000453 if not PyStringMap is None:
454 dispatch[PyStringMap] = save_dict
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000455
456 def save_inst(self, object):
457 d = id(object)
458 cls = object.__class__
459
460 memo = self.memo
461 write = self.write
462 save = self.save
463
464 if hasattr(object, '__getinitargs__'):
465 args = object.__getinitargs__()
466 len(args) # XXX Assert it's a sequence
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000467 _keep_alive(args, memo)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000468 else:
469 args = ()
470
471 write(MARK)
472
Tim Petersc32d8242001-04-10 02:48:53 +0000473 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000474 save(cls)
475
476 for arg in args:
477 save(arg)
478
479 memo_len = len(memo)
Tim Petersc32d8242001-04-10 02:48:53 +0000480 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000481 write(OBJ + self.put(memo_len))
482 else:
Guido van Rossum4fb5b281997-09-12 20:07:24 +0000483 write(INST + cls.__module__ + '\n' + cls.__name__ + '\n' +
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000484 self.put(memo_len))
485
486 memo[d] = (memo_len, object)
487
488 try:
489 getstate = object.__getstate__
490 except AttributeError:
491 stuff = object.__dict__
492 else:
493 stuff = getstate()
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000494 _keep_alive(stuff, memo)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000495 save(stuff)
496 write(BUILD)
497 dispatch[InstanceType] = save_inst
498
499 def save_global(self, object, name = None):
500 write = self.write
501 memo = self.memo
502
Tim Petersc32d8242001-04-10 02:48:53 +0000503 if name is None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000504 name = object.__name__
505
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000506 try:
507 module = object.__module__
508 except AttributeError:
509 module = whichmodule(object, name)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000510
Guido van Rossumb0a98e92001-08-17 18:49:52 +0000511 try:
512 __import__(module)
513 mod = sys.modules[module]
514 klass = getattr(mod, name)
515 except (ImportError, KeyError, AttributeError):
516 raise PicklingError(
517 "Can't pickle %r: it's not found as %s.%s" %
518 (object, module, name))
519 else:
520 if klass is not object:
521 raise PicklingError(
522 "Can't pickle %r: it's not the same object as %s.%s" %
523 (object, module, name))
524
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000525 memo_len = len(memo)
526 write(GLOBAL + module + '\n' + name + '\n' +
527 self.put(memo_len))
528 memo[id(object)] = (memo_len, object)
529 dispatch[ClassType] = save_global
530 dispatch[FunctionType] = save_global
531 dispatch[BuiltinFunctionType] = save_global
Tim Peters6d6c1a32001-08-02 04:15:00 +0000532 dispatch[TypeType] = save_global
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000533
Guido van Rossuma48061a1995-01-10 00:31:14 +0000534
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000535def _keep_alive(x, memo):
536 """Keeps a reference to the object x in the memo.
537
538 Because we remember objects by their id, we have
539 to assure that possibly temporary objects are kept
540 alive by referencing them.
541 We store a reference at the id of the memo, which should
542 normally not be used unless someone tries to deepcopy
543 the memo itself...
544 """
545 try:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000546 memo[id(memo)].append(x)
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000547 except KeyError:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000548 # aha, this is the first one :-)
549 memo[id(memo)]=[x]
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000550
551
Guido van Rossuma48061a1995-01-10 00:31:14 +0000552classmap = {}
553
Guido van Rossum4fb5b281997-09-12 20:07:24 +0000554# This is no longer used to find classes, but still for functions
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000555def whichmodule(cls, clsname):
556 """Figure out the module in which a class occurs.
Guido van Rossuma48061a1995-01-10 00:31:14 +0000557
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000558 Search sys.modules for the module.
559 Cache in classmap.
560 Return a module name.
561 If the class cannot be found, return __main__.
562 """
563 if classmap.has_key(cls):
564 return classmap[cls]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000565
566 for name, module in sys.modules.items():
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000567 if name != '__main__' and \
568 hasattr(module, clsname) and \
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000569 getattr(module, clsname) is cls:
570 break
571 else:
572 name = '__main__'
573 classmap[cls] = name
574 return name
Guido van Rossuma48061a1995-01-10 00:31:14 +0000575
576
577class Unpickler:
578
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000579 def __init__(self, file):
580 self.readline = file.readline
581 self.read = file.read
582 self.memo = {}
Guido van Rossuma48061a1995-01-10 00:31:14 +0000583
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000584 def load(self):
Jeremy Hylton20747fa2001-11-09 16:15:04 +0000585 self.mark = object() # any new unique object
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000586 self.stack = []
587 self.append = self.stack.append
588 read = self.read
589 dispatch = self.dispatch
590 try:
591 while 1:
592 key = read(1)
593 dispatch[key](self)
Guido van Rossumff871742000-12-13 18:11:56 +0000594 except _Stop, stopinst:
595 return stopinst.value
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000596
597 def marker(self):
598 stack = self.stack
599 mark = self.mark
600 k = len(stack)-1
601 while stack[k] is not mark: k = k-1
602 return k
603
604 dispatch = {}
605
606 def load_eof(self):
607 raise EOFError
608 dispatch[''] = load_eof
609
610 def load_persid(self):
611 pid = self.readline()[:-1]
612 self.append(self.persistent_load(pid))
613 dispatch[PERSID] = load_persid
614
615 def load_binpersid(self):
616 stack = self.stack
Tim Peters2344fae2001-01-15 00:50:52 +0000617
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000618 pid = stack[-1]
619 del stack[-1]
620
621 self.append(self.persistent_load(pid))
622 dispatch[BINPERSID] = load_binpersid
623
624 def load_none(self):
625 self.append(None)
626 dispatch[NONE] = load_none
627
628 def load_int(self):
Tim Peters19ef62d2001-08-28 22:21:18 +0000629 data = self.readline()
630 try:
631 self.append(int(data))
632 except ValueError:
633 self.append(long(data))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000634 dispatch[INT] = load_int
635
636 def load_binint(self):
637 self.append(mloads('i' + self.read(4)))
638 dispatch[BININT] = load_binint
639
640 def load_binint1(self):
641 self.append(mloads('i' + self.read(1) + '\000\000\000'))
642 dispatch[BININT1] = load_binint1
643
644 def load_binint2(self):
645 self.append(mloads('i' + self.read(2) + '\000\000'))
646 dispatch[BININT2] = load_binint2
Tim Peters2344fae2001-01-15 00:50:52 +0000647
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000648 def load_long(self):
Guido van Rossumff871742000-12-13 18:11:56 +0000649 self.append(long(self.readline()[:-1], 0))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000650 dispatch[LONG] = load_long
651
652 def load_float(self):
Guido van Rossumff871742000-12-13 18:11:56 +0000653 self.append(float(self.readline()[:-1]))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000654 dispatch[FLOAT] = load_float
655
Guido van Rossumd3703791998-10-22 20:15:36 +0000656 def load_binfloat(self, unpack=struct.unpack):
657 self.append(unpack('>d', self.read(8))[0])
658 dispatch[BINFLOAT] = load_binfloat
659
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000660 def load_string(self):
Jeremy Hyltonbe467e52000-09-15 15:14:51 +0000661 rep = self.readline()[:-1]
662 if not self._is_string_secure(rep):
663 raise ValueError, "insecure string pickle"
664 self.append(eval(rep,
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000665 {'__builtins__': {}})) # Let's be careful
666 dispatch[STRING] = load_string
667
Jeremy Hyltonbe467e52000-09-15 15:14:51 +0000668 def _is_string_secure(self, s):
669 """Return true if s contains a string that is safe to eval
670
671 The definition of secure string is based on the implementation
672 in cPickle. s is secure as long as it only contains a quoted
673 string and optional trailing whitespace.
674 """
675 q = s[0]
676 if q not in ("'", '"'):
677 return 0
678 # find the closing quote
679 offset = 1
680 i = None
681 while 1:
682 try:
683 i = s.index(q, offset)
684 except ValueError:
685 # if there is an error the first time, there is no
686 # close quote
687 if offset == 1:
688 return 0
689 if s[i-1] != '\\':
690 break
691 # check to see if this one is escaped
692 nslash = 0
693 j = i - 1
694 while j >= offset and s[j] == '\\':
695 j = j - 1
696 nslash = nslash + 1
697 if nslash % 2 == 0:
698 break
699 offset = i + 1
700 for c in s[i+1:]:
701 if ord(c) > 32:
702 return 0
703 return 1
704
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000705 def load_binstring(self):
706 len = mloads('i' + self.read(4))
707 self.append(self.read(len))
708 dispatch[BINSTRING] = load_binstring
709
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000710 def load_unicode(self):
711 self.append(unicode(self.readline()[:-1],'raw-unicode-escape'))
712 dispatch[UNICODE] = load_unicode
713
714 def load_binunicode(self):
715 len = mloads('i' + self.read(4))
716 self.append(unicode(self.read(len),'utf-8'))
717 dispatch[BINUNICODE] = load_binunicode
718
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000719 def load_short_binstring(self):
720 len = mloads('i' + self.read(1) + '\000\000\000')
721 self.append(self.read(len))
722 dispatch[SHORT_BINSTRING] = load_short_binstring
723
724 def load_tuple(self):
725 k = self.marker()
726 self.stack[k:] = [tuple(self.stack[k+1:])]
727 dispatch[TUPLE] = load_tuple
728
729 def load_empty_tuple(self):
730 self.stack.append(())
731 dispatch[EMPTY_TUPLE] = load_empty_tuple
732
733 def load_empty_list(self):
734 self.stack.append([])
735 dispatch[EMPTY_LIST] = load_empty_list
736
737 def load_empty_dictionary(self):
738 self.stack.append({})
739 dispatch[EMPTY_DICT] = load_empty_dictionary
740
741 def load_list(self):
742 k = self.marker()
743 self.stack[k:] = [self.stack[k+1:]]
744 dispatch[LIST] = load_list
745
746 def load_dict(self):
747 k = self.marker()
748 d = {}
749 items = self.stack[k+1:]
750 for i in range(0, len(items), 2):
751 key = items[i]
752 value = items[i+1]
753 d[key] = value
754 self.stack[k:] = [d]
755 dispatch[DICT] = load_dict
756
757 def load_inst(self):
758 k = self.marker()
759 args = tuple(self.stack[k+1:])
760 del self.stack[k:]
761 module = self.readline()[:-1]
762 name = self.readline()[:-1]
763 klass = self.find_class(module, name)
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000764 instantiated = 0
765 if (not args and type(klass) is ClassType and
766 not hasattr(klass, "__getinitargs__")):
767 try:
768 value = _EmptyClass()
769 value.__class__ = klass
Guido van Rossumb19e2a31998-04-13 18:08:45 +0000770 instantiated = 1
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000771 except RuntimeError:
772 # In restricted execution, assignment to inst.__class__ is
773 # prohibited
774 pass
775 if not instantiated:
Guido van Rossum743d17e1998-09-15 20:25:57 +0000776 try:
Barry Warsawbf4d9592001-11-15 23:42:58 +0000777 if not hasattr(klass, '__safe_for_unpickling__'):
778 raise UnpicklingError('%s is not safe for unpickling' %
779 klass)
Guido van Rossum743d17e1998-09-15 20:25:57 +0000780 value = apply(klass, args)
781 except TypeError, err:
782 raise TypeError, "in constructor for %s: %s" % (
783 klass.__name__, str(err)), sys.exc_info()[2]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000784 self.append(value)
785 dispatch[INST] = load_inst
786
787 def load_obj(self):
788 stack = self.stack
789 k = self.marker()
790 klass = stack[k + 1]
791 del stack[k + 1]
Tim Peters2344fae2001-01-15 00:50:52 +0000792 args = tuple(stack[k + 1:])
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000793 del stack[k:]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000794 instantiated = 0
795 if (not args and type(klass) is ClassType and
796 not hasattr(klass, "__getinitargs__")):
797 try:
798 value = _EmptyClass()
799 value.__class__ = klass
800 instantiated = 1
801 except RuntimeError:
802 # In restricted execution, assignment to inst.__class__ is
803 # prohibited
804 pass
805 if not instantiated:
806 value = apply(klass, args)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000807 self.append(value)
Tim Peters2344fae2001-01-15 00:50:52 +0000808 dispatch[OBJ] = load_obj
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000809
810 def load_global(self):
811 module = self.readline()[:-1]
812 name = self.readline()[:-1]
813 klass = self.find_class(module, name)
814 self.append(klass)
815 dispatch[GLOBAL] = load_global
816
817 def find_class(self, module, name):
Barry Warsawbf4d9592001-11-15 23:42:58 +0000818 __import__(module)
819 mod = sys.modules[module]
820 klass = getattr(mod, name)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000821 return klass
822
823 def load_reduce(self):
824 stack = self.stack
825
826 callable = stack[-2]
827 arg_tup = stack[-1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000828 del stack[-2:]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000829
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000830 if type(callable) is not ClassType:
831 if not safe_constructors.has_key(callable):
832 try:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000833 safe = callable.__safe_for_unpickling__
834 except AttributeError:
835 safe = None
Guido van Rossuma48061a1995-01-10 00:31:14 +0000836
Tim Petersc32d8242001-04-10 02:48:53 +0000837 if not safe:
Tim Peters2344fae2001-01-15 00:50:52 +0000838 raise UnpicklingError, "%s is not safe for " \
839 "unpickling" % callable
Guido van Rossuma48061a1995-01-10 00:31:14 +0000840
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000841 if arg_tup is None:
842 value = callable.__basicnew__()
843 else:
844 value = apply(callable, arg_tup)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000845 self.append(value)
846 dispatch[REDUCE] = load_reduce
Guido van Rossuma48061a1995-01-10 00:31:14 +0000847
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000848 def load_pop(self):
849 del self.stack[-1]
850 dispatch[POP] = load_pop
Guido van Rossum7b5430f1995-03-04 22:25:21 +0000851
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000852 def load_pop_mark(self):
853 k = self.marker()
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000854 del self.stack[k:]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000855 dispatch[POP_MARK] = load_pop_mark
Guido van Rossuma48061a1995-01-10 00:31:14 +0000856
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000857 def load_dup(self):
Guido van Rossumb1062fc1998-03-31 17:00:46 +0000858 self.append(self.stack[-1])
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000859 dispatch[DUP] = load_dup
Guido van Rossuma48061a1995-01-10 00:31:14 +0000860
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000861 def load_get(self):
862 self.append(self.memo[self.readline()[:-1]])
863 dispatch[GET] = load_get
Guido van Rossum78536471996-04-12 13:36:27 +0000864
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000865 def load_binget(self):
866 i = mloads('i' + self.read(1) + '\000\000\000')
867 self.append(self.memo[`i`])
868 dispatch[BINGET] = load_binget
Guido van Rossum78536471996-04-12 13:36:27 +0000869
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000870 def load_long_binget(self):
871 i = mloads('i' + self.read(4))
872 self.append(self.memo[`i`])
873 dispatch[LONG_BINGET] = load_long_binget
Guido van Rossum78536471996-04-12 13:36:27 +0000874
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000875 def load_put(self):
876 self.memo[self.readline()[:-1]] = self.stack[-1]
877 dispatch[PUT] = load_put
Guido van Rossuma48061a1995-01-10 00:31:14 +0000878
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000879 def load_binput(self):
880 i = mloads('i' + self.read(1) + '\000\000\000')
881 self.memo[`i`] = self.stack[-1]
882 dispatch[BINPUT] = load_binput
Guido van Rossuma48061a1995-01-10 00:31:14 +0000883
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000884 def load_long_binput(self):
885 i = mloads('i' + self.read(4))
886 self.memo[`i`] = self.stack[-1]
887 dispatch[LONG_BINPUT] = load_long_binput
Guido van Rossuma48061a1995-01-10 00:31:14 +0000888
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000889 def load_append(self):
890 stack = self.stack
891 value = stack[-1]
892 del stack[-1]
893 list = stack[-1]
894 list.append(value)
895 dispatch[APPEND] = load_append
Guido van Rossuma48061a1995-01-10 00:31:14 +0000896
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000897 def load_appends(self):
898 stack = self.stack
899 mark = self.marker()
900 list = stack[mark - 1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000901 for i in range(mark + 1, len(stack)):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000902 list.append(stack[i])
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000903
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000904 del stack[mark:]
905 dispatch[APPENDS] = load_appends
Tim Peters2344fae2001-01-15 00:50:52 +0000906
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000907 def load_setitem(self):
908 stack = self.stack
909 value = stack[-1]
910 key = stack[-2]
911 del stack[-2:]
912 dict = stack[-1]
913 dict[key] = value
914 dispatch[SETITEM] = load_setitem
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000915
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000916 def load_setitems(self):
917 stack = self.stack
918 mark = self.marker()
919 dict = stack[mark - 1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000920 for i in range(mark + 1, len(stack), 2):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000921 dict[stack[i]] = stack[i + 1]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000922
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000923 del stack[mark:]
924 dispatch[SETITEMS] = load_setitems
Guido van Rossuma48061a1995-01-10 00:31:14 +0000925
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000926 def load_build(self):
927 stack = self.stack
928 value = stack[-1]
929 del stack[-1]
930 inst = stack[-1]
931 try:
932 setstate = inst.__setstate__
933 except AttributeError:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000934 try:
935 inst.__dict__.update(value)
936 except RuntimeError:
937 # XXX In restricted execution, the instance's __dict__ is not
938 # accessible. Use the old way of unpickling the instance
939 # variables. This is a semantic different when unpickling in
940 # restricted vs. unrestricted modes.
941 for k, v in value.items():
942 setattr(inst, k, v)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000943 else:
944 setstate(value)
945 dispatch[BUILD] = load_build
Guido van Rossuma48061a1995-01-10 00:31:14 +0000946
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000947 def load_mark(self):
948 self.append(self.mark)
949 dispatch[MARK] = load_mark
Guido van Rossuma48061a1995-01-10 00:31:14 +0000950
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000951 def load_stop(self):
952 value = self.stack[-1]
953 del self.stack[-1]
Guido van Rossumff871742000-12-13 18:11:56 +0000954 raise _Stop(value)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000955 dispatch[STOP] = load_stop
Guido van Rossuma48061a1995-01-10 00:31:14 +0000956
Guido van Rossume467be61997-12-05 19:42:42 +0000957# Helper class for load_inst/load_obj
958
959class _EmptyClass:
960 pass
Guido van Rossuma48061a1995-01-10 00:31:14 +0000961
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000962# Shorthands
963
Jeremy Hyltonabe2c622001-10-15 21:29:28 +0000964try:
965 from cStringIO import StringIO
966except ImportError:
967 from StringIO import StringIO
Guido van Rossumc7c5e691996-07-22 22:26:07 +0000968
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000969def dump(object, file, bin = 0):
970 Pickler(file, bin).dump(object)
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000971
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000972def dumps(object, bin = 0):
973 file = StringIO()
974 Pickler(file, bin).dump(object)
975 return file.getvalue()
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000976
977def load(file):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000978 return Unpickler(file).load()
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000979
980def loads(str):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000981 file = StringIO(str)
982 return Unpickler(file).load()