blob: 96ee5c17e22d15a17d075424d04bad4d9d4b1f9e [file] [log] [blame]
Guido van Rossum54f22ed2000-02-04 15:10:34 +00001"""Create portable serialized representations of Python objects.
Guido van Rossuma48061a1995-01-10 00:31:14 +00002
Guido van Rossume467be61997-12-05 19:42:42 +00003See module cPickle for a (much) faster implementation.
4See module copy_reg for a mechanism for registering custom picklers.
Guido van Rossuma48061a1995-01-10 00:31:14 +00005
Guido van Rossume467be61997-12-05 19:42:42 +00006Classes:
Guido van Rossuma48061a1995-01-10 00:31:14 +00007
Guido van Rossume467be61997-12-05 19:42:42 +00008 Pickler
9 Unpickler
Guido van Rossuma48061a1995-01-10 00:31:14 +000010
Guido van Rossume467be61997-12-05 19:42:42 +000011Functions:
Guido van Rossuma48061a1995-01-10 00:31:14 +000012
Guido van Rossume467be61997-12-05 19:42:42 +000013 dump(object, file)
14 dumps(object) -> string
15 load(file) -> object
16 loads(string) -> object
Guido van Rossuma48061a1995-01-10 00:31:14 +000017
Guido van Rossume467be61997-12-05 19:42:42 +000018Misc variables:
Guido van Rossuma48061a1995-01-10 00:31:14 +000019
Fred Drakefe82acc1998-02-13 03:24:48 +000020 __version__
Guido van Rossume467be61997-12-05 19:42:42 +000021 format_version
22 compatible_formats
Guido van Rossuma48061a1995-01-10 00:31:14 +000023
Guido van Rossuma48061a1995-01-10 00:31:14 +000024"""
25
Guido van Rossum743d17e1998-09-15 20:25:57 +000026__version__ = "$Revision$" # Code version
Guido van Rossuma48061a1995-01-10 00:31:14 +000027
28from types import *
Guido van Rossum4fb5b281997-09-12 20:07:24 +000029from copy_reg import dispatch_table, safe_constructors
Guido van Rossumd3703791998-10-22 20:15:36 +000030import marshal
31import sys
32import struct
Skip Montanaro23bafc62001-02-18 03:10:09 +000033import re
Guido van Rossuma48061a1995-01-10 00:31:14 +000034
Skip Montanaro352674d2001-02-07 23:14:30 +000035__all__ = ["PickleError", "PicklingError", "UnpicklingError", "Pickler",
36 "Unpickler", "dump", "dumps", "load", "loads"]
37
Guido van Rossumd3703791998-10-22 20:15:36 +000038format_version = "1.3" # File format version we write
39compatible_formats = ["1.0", "1.1", "1.2"] # Old format versions we can read
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000040
41mdumps = marshal.dumps
42mloads = marshal.loads
Guido van Rossum0c891ce1995-03-14 15:09:05 +000043
Guido van Rossum26e89d02000-06-29 16:15:52 +000044class PickleError(Exception): pass
45class PicklingError(PickleError): pass
46class UnpicklingError(PickleError): pass
Guido van Rossum7849da81995-03-09 14:08:35 +000047
Guido van Rossumff871742000-12-13 18:11:56 +000048class _Stop(Exception):
49 def __init__(self, value):
50 self.value = value
51
Jeremy Hylton2b9d0291998-05-27 22:38:22 +000052try:
53 from org.python.core import PyStringMap
54except ImportError:
55 PyStringMap = None
56
Guido van Rossumdbb718f2001-09-21 19:22:34 +000057try:
58 UnicodeType
59except NameError:
60 UnicodeType = None
61
62
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000063MARK = '('
64STOP = '.'
65POP = '0'
66POP_MARK = '1'
67DUP = '2'
68FLOAT = 'F'
69INT = 'I'
70BININT = 'J'
71BININT1 = 'K'
72LONG = 'L'
73BININT2 = 'M'
74NONE = 'N'
75PERSID = 'P'
76BINPERSID = 'Q'
77REDUCE = 'R'
78STRING = 'S'
79BINSTRING = 'T'
80SHORT_BINSTRING = 'U'
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +000081UNICODE = 'V'
82BINUNICODE = 'X'
Guido van Rossumb72cf2d1997-04-09 17:32:51 +000083APPEND = 'a'
84BUILD = 'b'
85GLOBAL = 'c'
86DICT = 'd'
87EMPTY_DICT = '}'
88APPENDS = 'e'
89GET = 'g'
90BINGET = 'h'
91INST = 'i'
92LONG_BINGET = 'j'
93LIST = 'l'
94EMPTY_LIST = ']'
95OBJ = 'o'
96PUT = 'p'
97BINPUT = 'q'
98LONG_BINPUT = 'r'
99SETITEM = 's'
100TUPLE = 't'
101EMPTY_TUPLE = ')'
102SETITEMS = 'u'
Guido van Rossumd3703791998-10-22 20:15:36 +0000103BINFLOAT = 'G'
Guido van Rossum77f6a652002-04-03 22:41:51 +0000104TRUE = 'Z'
105FALSE = 'z'
106
Guido van Rossuma48061a1995-01-10 00:31:14 +0000107
Skip Montanaro23bafc62001-02-18 03:10:09 +0000108__all__.extend([x for x in dir() if re.match("[A-Z][A-Z0-9_]+$",x)])
Neal Norwitzd5ba4ae2002-02-11 18:12:06 +0000109del x
Skip Montanaro23bafc62001-02-18 03:10:09 +0000110
Guido van Rossuma48061a1995-01-10 00:31:14 +0000111class Pickler:
112
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000113 def __init__(self, file, bin = 0):
114 self.write = file.write
115 self.memo = {}
116 self.bin = bin
Guido van Rossuma48061a1995-01-10 00:31:14 +0000117
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000118 def dump(self, object):
119 self.save(object)
120 self.write(STOP)
Guido van Rossuma48061a1995-01-10 00:31:14 +0000121
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000122 def put(self, i):
Tim Petersc32d8242001-04-10 02:48:53 +0000123 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000124 s = mdumps(i)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000125 if i < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000126 return BINPUT + s[0]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000127
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000128 return LONG_BINPUT + s
Guido van Rossuma48061a1995-01-10 00:31:14 +0000129
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000130 return PUT + `i` + '\n'
Guido van Rossuma48061a1995-01-10 00:31:14 +0000131
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000132 def get(self, i):
Tim Petersc32d8242001-04-10 02:48:53 +0000133 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000134 s = mdumps(i)[1:]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000135
Tim Petersc32d8242001-04-10 02:48:53 +0000136 if i < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000137 return BINGET + s[0]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000138
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000139 return LONG_BINGET + s
Guido van Rossuma48061a1995-01-10 00:31:14 +0000140
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000141 return GET + `i` + '\n'
Tim Peters2344fae2001-01-15 00:50:52 +0000142
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000143 def save(self, object, pers_save = 0):
144 memo = self.memo
Guido van Rossuma48061a1995-01-10 00:31:14 +0000145
Tim Petersc32d8242001-04-10 02:48:53 +0000146 if not pers_save:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000147 pid = self.persistent_id(object)
Tim Petersc32d8242001-04-10 02:48:53 +0000148 if pid is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000149 self.save_pers(pid)
150 return
Guido van Rossuma48061a1995-01-10 00:31:14 +0000151
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000152 d = id(object)
Tim Peters2344fae2001-01-15 00:50:52 +0000153
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000154 t = type(object)
Guido van Rossuma48061a1995-01-10 00:31:14 +0000155
Tim Petersc32d8242001-04-10 02:48:53 +0000156 if (t is TupleType) and (len(object) == 0):
157 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000158 self.save_empty_tuple(object)
159 else:
160 self.save_tuple(object)
161 return
Guido van Rossuma48061a1995-01-10 00:31:14 +0000162
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000163 if memo.has_key(d):
164 self.write(self.get(memo[d][0]))
165 return
166
167 try:
168 f = self.dispatch[t]
169 except KeyError:
Guido van Rossum85ee4912002-03-26 00:51:56 +0000170 try:
171 issc = issubclass(t, TypeType)
172 except TypeError: # t is not a class
173 issc = 0
174 if issc:
Guido van Rossumf048a8f2001-12-19 16:55:02 +0000175 self.save_global(object)
176 return
177
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000178 pid = self.inst_persistent_id(object)
179 if pid is not None:
180 self.save_pers(pid)
181 return
182
183 try:
184 reduce = dispatch_table[t]
185 except KeyError:
186 try:
187 reduce = object.__reduce__
188 except AttributeError:
189 raise PicklingError, \
Guido van Rossum08a92cb1999-10-10 21:14:25 +0000190 "can't pickle %s object: %s" % (`t.__name__`,
191 `object`)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000192 else:
193 tup = reduce()
194 else:
195 tup = reduce(object)
196
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000197 if type(tup) is StringType:
198 self.save_global(object, tup)
199 return
Guido van Rossumd1f49841997-12-10 23:40:18 +0000200
Tim Petersc32d8242001-04-10 02:48:53 +0000201 if type(tup) is not TupleType:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000202 raise PicklingError, "Value returned by %s must be a " \
203 "tuple" % reduce
204
205 l = len(tup)
Tim Peters2344fae2001-01-15 00:50:52 +0000206
Tim Petersc32d8242001-04-10 02:48:53 +0000207 if (l != 2) and (l != 3):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000208 raise PicklingError, "tuple returned by %s must contain " \
209 "only two or three elements" % reduce
210
211 callable = tup[0]
212 arg_tup = tup[1]
Tim Peters2344fae2001-01-15 00:50:52 +0000213
Tim Petersc32d8242001-04-10 02:48:53 +0000214 if l > 2:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000215 state = tup[2]
216 else:
217 state = None
218
Guido van Rossumd1f49841997-12-10 23:40:18 +0000219 if type(arg_tup) is not TupleType and arg_tup is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000220 raise PicklingError, "Second element of tuple returned " \
221 "by %s must be a tuple" % reduce
222
Tim Peters2344fae2001-01-15 00:50:52 +0000223 self.save_reduce(callable, arg_tup, state)
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000224 memo_len = len(memo)
225 self.write(self.put(memo_len))
226 memo[d] = (memo_len, object)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000227 return
228
229 f(self, object)
230
231 def persistent_id(self, object):
232 return None
233
234 def inst_persistent_id(self, object):
235 return None
236
237 def save_pers(self, pid):
Tim Petersc32d8242001-04-10 02:48:53 +0000238 if not self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000239 self.write(PERSID + str(pid) + '\n')
240 else:
241 self.save(pid, 1)
242 self.write(BINPERSID)
243
244 def save_reduce(self, callable, arg_tup, state = None):
245 write = self.write
246 save = self.save
247
248 save(callable)
249 save(arg_tup)
250 write(REDUCE)
Tim Peters2344fae2001-01-15 00:50:52 +0000251
Tim Petersc32d8242001-04-10 02:48:53 +0000252 if state is not None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000253 save(state)
254 write(BUILD)
255
256 dispatch = {}
257
258 def save_none(self, object):
259 self.write(NONE)
260 dispatch[NoneType] = save_none
261
Guido van Rossum77f6a652002-04-03 22:41:51 +0000262 def save_bool(self, object):
263 if object:
264 self.write(TRUE)
265 else:
266 self.write(FALSE)
267 dispatch[bool] = save_bool
268
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000269 def save_int(self, object):
Tim Petersc32d8242001-04-10 02:48:53 +0000270 if self.bin:
Tim Peters44714002001-04-10 05:02:52 +0000271 # If the int is small enough to fit in a signed 4-byte 2's-comp
272 # format, we can store it more efficiently than the general
273 # case.
274 high_bits = object >> 31 # note that Python shift sign-extends
275 if high_bits == 0 or high_bits == -1:
276 # All high bits are copies of bit 2**31, so the value
277 # fits in a 4-byte signed int.
278 i = mdumps(object)[1:]
279 assert len(i) == 4
280 if i[-2:] == '\000\000': # fits in 2-byte unsigned int
281 if i[-3] == '\000': # fits in 1-byte unsigned int
282 self.write(BININT1 + i[0])
283 else:
284 self.write(BININT2 + i[:2])
285 else:
286 self.write(BININT + i)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000287 return
Tim Peters44714002001-04-10 05:02:52 +0000288 # Text pickle, or int too big to fit in signed 4-byte format.
289 self.write(INT + `object` + '\n')
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000290 dispatch[IntType] = save_int
291
292 def save_long(self, object):
293 self.write(LONG + `object` + '\n')
294 dispatch[LongType] = save_long
295
Guido van Rossumd3703791998-10-22 20:15:36 +0000296 def save_float(self, object, pack=struct.pack):
297 if self.bin:
298 self.write(BINFLOAT + pack('>d', object))
299 else:
300 self.write(FLOAT + `object` + '\n')
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000301 dispatch[FloatType] = save_float
302
303 def save_string(self, object):
304 d = id(object)
305 memo = self.memo
306
Tim Petersc32d8242001-04-10 02:48:53 +0000307 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000308 l = len(object)
309 s = mdumps(l)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000310 if l < 256:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000311 self.write(SHORT_BINSTRING + s[0] + object)
312 else:
313 self.write(BINSTRING + s + object)
314 else:
315 self.write(STRING + `object` + '\n')
316
317 memo_len = len(memo)
318 self.write(self.put(memo_len))
319 memo[d] = (memo_len, object)
320 dispatch[StringType] = save_string
321
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000322 def save_unicode(self, object):
323 d = id(object)
324 memo = self.memo
325
Tim Petersc32d8242001-04-10 02:48:53 +0000326 if self.bin:
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000327 encoding = object.encode('utf-8')
328 l = len(encoding)
329 s = mdumps(l)[1:]
330 self.write(BINUNICODE + s + encoding)
331 else:
Guido van Rossumdbb718f2001-09-21 19:22:34 +0000332 object = object.replace("\\", "\\u005c")
333 object = object.replace("\n", "\\u000a")
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000334 self.write(UNICODE + object.encode('raw-unicode-escape') + '\n')
335
336 memo_len = len(memo)
337 self.write(self.put(memo_len))
338 memo[d] = (memo_len, object)
339 dispatch[UnicodeType] = save_unicode
340
Guido van Rossum31584cb2001-01-22 14:53:29 +0000341 if StringType == UnicodeType:
342 # This is true for Jython
343 def save_string(self, object):
344 d = id(object)
345 memo = self.memo
346 unicode = object.isunicode()
347
Tim Petersc32d8242001-04-10 02:48:53 +0000348 if self.bin:
Guido van Rossum31584cb2001-01-22 14:53:29 +0000349 if unicode:
350 object = object.encode("utf-8")
351 l = len(object)
352 s = mdumps(l)[1:]
Tim Petersc32d8242001-04-10 02:48:53 +0000353 if l < 256 and not unicode:
Guido van Rossum31584cb2001-01-22 14:53:29 +0000354 self.write(SHORT_BINSTRING + s[0] + object)
355 else:
356 if unicode:
357 self.write(BINUNICODE + s + object)
358 else:
359 self.write(BINSTRING + s + object)
360 else:
Tim Peters658cba62001-02-09 20:06:00 +0000361 if unicode:
Guido van Rossumdbb718f2001-09-21 19:22:34 +0000362 object = object.replace("\\", "\\u005c")
363 object = object.replace("\n", "\\u000a")
Guido van Rossum31584cb2001-01-22 14:53:29 +0000364 object = object.encode('raw-unicode-escape')
365 self.write(UNICODE + object + '\n')
366 else:
367 self.write(STRING + `object` + '\n')
368
369 memo_len = len(memo)
370 self.write(self.put(memo_len))
371 memo[d] = (memo_len, object)
372 dispatch[StringType] = save_string
Tim Peters658cba62001-02-09 20:06:00 +0000373
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000374 def save_tuple(self, object):
375
376 write = self.write
377 save = self.save
378 memo = self.memo
379
380 d = id(object)
381
382 write(MARK)
383
384 for element in object:
385 save(element)
386
Tim Petersc32d8242001-04-10 02:48:53 +0000387 if len(object) and memo.has_key(d):
388 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000389 write(POP_MARK + self.get(memo[d][0]))
390 return
Tim Peters2344fae2001-01-15 00:50:52 +0000391
Guido van Rossum599174f1998-03-31 16:30:28 +0000392 write(POP * (len(object) + 1) + self.get(memo[d][0]))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000393 return
394
395 memo_len = len(memo)
396 self.write(TUPLE + self.put(memo_len))
397 memo[d] = (memo_len, object)
398 dispatch[TupleType] = save_tuple
399
400 def save_empty_tuple(self, object):
401 self.write(EMPTY_TUPLE)
402
403 def save_list(self, object):
404 d = id(object)
405
406 write = self.write
407 save = self.save
408 memo = self.memo
409
Tim Petersc32d8242001-04-10 02:48:53 +0000410 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000411 write(EMPTY_LIST)
412 else:
413 write(MARK + LIST)
414
415 memo_len = len(memo)
416 write(self.put(memo_len))
417 memo[d] = (memo_len, object)
418
419 using_appends = (self.bin and (len(object) > 1))
420
Tim Petersc32d8242001-04-10 02:48:53 +0000421 if using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000422 write(MARK)
423
424 for element in object:
425 save(element)
Tim Peters2344fae2001-01-15 00:50:52 +0000426
Tim Petersc32d8242001-04-10 02:48:53 +0000427 if not using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000428 write(APPEND)
429
Tim Petersc32d8242001-04-10 02:48:53 +0000430 if using_appends:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000431 write(APPENDS)
432 dispatch[ListType] = save_list
433
434 def save_dict(self, object):
435 d = id(object)
436
437 write = self.write
438 save = self.save
439 memo = self.memo
440
Tim Petersc32d8242001-04-10 02:48:53 +0000441 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000442 write(EMPTY_DICT)
443 else:
444 write(MARK + DICT)
445
446 memo_len = len(memo)
447 self.write(self.put(memo_len))
448 memo[d] = (memo_len, object)
449
450 using_setitems = (self.bin and (len(object) > 1))
451
Tim Petersc32d8242001-04-10 02:48:53 +0000452 if using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000453 write(MARK)
454
455 items = object.items()
456 for key, value in items:
457 save(key)
458 save(value)
459
Tim Petersc32d8242001-04-10 02:48:53 +0000460 if not using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000461 write(SETITEM)
462
Tim Petersc32d8242001-04-10 02:48:53 +0000463 if using_setitems:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000464 write(SETITEMS)
465
466 dispatch[DictionaryType] = save_dict
Jeremy Hylton2b9d0291998-05-27 22:38:22 +0000467 if not PyStringMap is None:
468 dispatch[PyStringMap] = save_dict
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000469
470 def save_inst(self, object):
471 d = id(object)
472 cls = object.__class__
473
474 memo = self.memo
475 write = self.write
476 save = self.save
477
478 if hasattr(object, '__getinitargs__'):
479 args = object.__getinitargs__()
480 len(args) # XXX Assert it's a sequence
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000481 _keep_alive(args, memo)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000482 else:
483 args = ()
484
485 write(MARK)
486
Tim Petersc32d8242001-04-10 02:48:53 +0000487 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000488 save(cls)
489
490 for arg in args:
491 save(arg)
492
493 memo_len = len(memo)
Tim Petersc32d8242001-04-10 02:48:53 +0000494 if self.bin:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000495 write(OBJ + self.put(memo_len))
496 else:
Guido van Rossum4fb5b281997-09-12 20:07:24 +0000497 write(INST + cls.__module__ + '\n' + cls.__name__ + '\n' +
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000498 self.put(memo_len))
499
500 memo[d] = (memo_len, object)
501
502 try:
503 getstate = object.__getstate__
504 except AttributeError:
505 stuff = object.__dict__
506 else:
507 stuff = getstate()
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000508 _keep_alive(stuff, memo)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000509 save(stuff)
510 write(BUILD)
511 dispatch[InstanceType] = save_inst
512
513 def save_global(self, object, name = None):
514 write = self.write
515 memo = self.memo
516
Tim Petersc32d8242001-04-10 02:48:53 +0000517 if name is None:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000518 name = object.__name__
519
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000520 try:
521 module = object.__module__
522 except AttributeError:
523 module = whichmodule(object, name)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000524
Guido van Rossumb0a98e92001-08-17 18:49:52 +0000525 try:
526 __import__(module)
527 mod = sys.modules[module]
528 klass = getattr(mod, name)
529 except (ImportError, KeyError, AttributeError):
530 raise PicklingError(
531 "Can't pickle %r: it's not found as %s.%s" %
532 (object, module, name))
533 else:
534 if klass is not object:
535 raise PicklingError(
536 "Can't pickle %r: it's not the same object as %s.%s" %
537 (object, module, name))
538
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000539 memo_len = len(memo)
540 write(GLOBAL + module + '\n' + name + '\n' +
541 self.put(memo_len))
542 memo[id(object)] = (memo_len, object)
543 dispatch[ClassType] = save_global
544 dispatch[FunctionType] = save_global
545 dispatch[BuiltinFunctionType] = save_global
Tim Peters6d6c1a32001-08-02 04:15:00 +0000546 dispatch[TypeType] = save_global
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000547
Guido van Rossuma48061a1995-01-10 00:31:14 +0000548
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000549def _keep_alive(x, memo):
550 """Keeps a reference to the object x in the memo.
551
552 Because we remember objects by their id, we have
553 to assure that possibly temporary objects are kept
554 alive by referencing them.
555 We store a reference at the id of the memo, which should
556 normally not be used unless someone tries to deepcopy
557 the memo itself...
558 """
559 try:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000560 memo[id(memo)].append(x)
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000561 except KeyError:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000562 # aha, this is the first one :-)
563 memo[id(memo)]=[x]
Guido van Rossum5ed5c4c1997-09-03 00:23:54 +0000564
565
Guido van Rossuma48061a1995-01-10 00:31:14 +0000566classmap = {}
567
Guido van Rossum4fb5b281997-09-12 20:07:24 +0000568# This is no longer used to find classes, but still for functions
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000569def whichmodule(cls, clsname):
570 """Figure out the module in which a class occurs.
Guido van Rossuma48061a1995-01-10 00:31:14 +0000571
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000572 Search sys.modules for the module.
573 Cache in classmap.
574 Return a module name.
575 If the class cannot be found, return __main__.
576 """
577 if classmap.has_key(cls):
578 return classmap[cls]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000579
580 for name, module in sys.modules.items():
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000581 if name != '__main__' and \
582 hasattr(module, clsname) and \
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000583 getattr(module, clsname) is cls:
584 break
585 else:
586 name = '__main__'
587 classmap[cls] = name
588 return name
Guido van Rossuma48061a1995-01-10 00:31:14 +0000589
590
591class Unpickler:
592
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000593 def __init__(self, file):
594 self.readline = file.readline
595 self.read = file.read
596 self.memo = {}
Guido van Rossuma48061a1995-01-10 00:31:14 +0000597
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000598 def load(self):
Jeremy Hylton20747fa2001-11-09 16:15:04 +0000599 self.mark = object() # any new unique object
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000600 self.stack = []
601 self.append = self.stack.append
602 read = self.read
603 dispatch = self.dispatch
604 try:
605 while 1:
606 key = read(1)
607 dispatch[key](self)
Guido van Rossumff871742000-12-13 18:11:56 +0000608 except _Stop, stopinst:
609 return stopinst.value
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000610
611 def marker(self):
612 stack = self.stack
613 mark = self.mark
614 k = len(stack)-1
615 while stack[k] is not mark: k = k-1
616 return k
617
618 dispatch = {}
619
620 def load_eof(self):
621 raise EOFError
622 dispatch[''] = load_eof
623
624 def load_persid(self):
625 pid = self.readline()[:-1]
626 self.append(self.persistent_load(pid))
627 dispatch[PERSID] = load_persid
628
629 def load_binpersid(self):
630 stack = self.stack
Tim Peters2344fae2001-01-15 00:50:52 +0000631
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000632 pid = stack[-1]
633 del stack[-1]
634
635 self.append(self.persistent_load(pid))
636 dispatch[BINPERSID] = load_binpersid
637
638 def load_none(self):
639 self.append(None)
640 dispatch[NONE] = load_none
641
Guido van Rossum77f6a652002-04-03 22:41:51 +0000642 def load_false(self):
643 self.append(False)
644 dispatch[FALSE] = load_false
645
646 def load_true(self):
647 self.append(True)
648 dispatch[TRUE] = load_true
649
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000650 def load_int(self):
Tim Peters19ef62d2001-08-28 22:21:18 +0000651 data = self.readline()
652 try:
653 self.append(int(data))
654 except ValueError:
655 self.append(long(data))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000656 dispatch[INT] = load_int
657
658 def load_binint(self):
659 self.append(mloads('i' + self.read(4)))
660 dispatch[BININT] = load_binint
661
662 def load_binint1(self):
663 self.append(mloads('i' + self.read(1) + '\000\000\000'))
664 dispatch[BININT1] = load_binint1
665
666 def load_binint2(self):
667 self.append(mloads('i' + self.read(2) + '\000\000'))
668 dispatch[BININT2] = load_binint2
Tim Peters2344fae2001-01-15 00:50:52 +0000669
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000670 def load_long(self):
Guido van Rossumff871742000-12-13 18:11:56 +0000671 self.append(long(self.readline()[:-1], 0))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000672 dispatch[LONG] = load_long
673
674 def load_float(self):
Guido van Rossumff871742000-12-13 18:11:56 +0000675 self.append(float(self.readline()[:-1]))
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000676 dispatch[FLOAT] = load_float
677
Guido van Rossumd3703791998-10-22 20:15:36 +0000678 def load_binfloat(self, unpack=struct.unpack):
679 self.append(unpack('>d', self.read(8))[0])
680 dispatch[BINFLOAT] = load_binfloat
681
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000682 def load_string(self):
Jeremy Hyltonbe467e52000-09-15 15:14:51 +0000683 rep = self.readline()[:-1]
684 if not self._is_string_secure(rep):
685 raise ValueError, "insecure string pickle"
686 self.append(eval(rep,
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000687 {'__builtins__': {}})) # Let's be careful
688 dispatch[STRING] = load_string
689
Jeremy Hyltonbe467e52000-09-15 15:14:51 +0000690 def _is_string_secure(self, s):
691 """Return true if s contains a string that is safe to eval
692
693 The definition of secure string is based on the implementation
694 in cPickle. s is secure as long as it only contains a quoted
695 string and optional trailing whitespace.
696 """
697 q = s[0]
698 if q not in ("'", '"'):
699 return 0
700 # find the closing quote
701 offset = 1
702 i = None
703 while 1:
704 try:
705 i = s.index(q, offset)
706 except ValueError:
707 # if there is an error the first time, there is no
708 # close quote
709 if offset == 1:
710 return 0
711 if s[i-1] != '\\':
712 break
713 # check to see if this one is escaped
714 nslash = 0
715 j = i - 1
716 while j >= offset and s[j] == '\\':
717 j = j - 1
718 nslash = nslash + 1
719 if nslash % 2 == 0:
720 break
721 offset = i + 1
722 for c in s[i+1:]:
723 if ord(c) > 32:
724 return 0
725 return 1
726
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000727 def load_binstring(self):
728 len = mloads('i' + self.read(4))
729 self.append(self.read(len))
730 dispatch[BINSTRING] = load_binstring
731
Guido van Rossumb5f2f1b2000-03-10 23:20:09 +0000732 def load_unicode(self):
733 self.append(unicode(self.readline()[:-1],'raw-unicode-escape'))
734 dispatch[UNICODE] = load_unicode
735
736 def load_binunicode(self):
737 len = mloads('i' + self.read(4))
738 self.append(unicode(self.read(len),'utf-8'))
739 dispatch[BINUNICODE] = load_binunicode
740
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000741 def load_short_binstring(self):
742 len = mloads('i' + self.read(1) + '\000\000\000')
743 self.append(self.read(len))
744 dispatch[SHORT_BINSTRING] = load_short_binstring
745
746 def load_tuple(self):
747 k = self.marker()
748 self.stack[k:] = [tuple(self.stack[k+1:])]
749 dispatch[TUPLE] = load_tuple
750
751 def load_empty_tuple(self):
752 self.stack.append(())
753 dispatch[EMPTY_TUPLE] = load_empty_tuple
754
755 def load_empty_list(self):
756 self.stack.append([])
757 dispatch[EMPTY_LIST] = load_empty_list
758
759 def load_empty_dictionary(self):
760 self.stack.append({})
761 dispatch[EMPTY_DICT] = load_empty_dictionary
762
763 def load_list(self):
764 k = self.marker()
765 self.stack[k:] = [self.stack[k+1:]]
766 dispatch[LIST] = load_list
767
768 def load_dict(self):
769 k = self.marker()
770 d = {}
771 items = self.stack[k+1:]
772 for i in range(0, len(items), 2):
773 key = items[i]
774 value = items[i+1]
775 d[key] = value
776 self.stack[k:] = [d]
777 dispatch[DICT] = load_dict
778
779 def load_inst(self):
780 k = self.marker()
781 args = tuple(self.stack[k+1:])
782 del self.stack[k:]
783 module = self.readline()[:-1]
784 name = self.readline()[:-1]
785 klass = self.find_class(module, name)
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000786 instantiated = 0
787 if (not args and type(klass) is ClassType and
788 not hasattr(klass, "__getinitargs__")):
789 try:
790 value = _EmptyClass()
791 value.__class__ = klass
Guido van Rossumb19e2a31998-04-13 18:08:45 +0000792 instantiated = 1
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000793 except RuntimeError:
794 # In restricted execution, assignment to inst.__class__ is
795 # prohibited
796 pass
797 if not instantiated:
Guido van Rossum743d17e1998-09-15 20:25:57 +0000798 try:
Barry Warsawbf4d9592001-11-15 23:42:58 +0000799 if not hasattr(klass, '__safe_for_unpickling__'):
800 raise UnpicklingError('%s is not safe for unpickling' %
801 klass)
Guido van Rossum743d17e1998-09-15 20:25:57 +0000802 value = apply(klass, args)
803 except TypeError, err:
804 raise TypeError, "in constructor for %s: %s" % (
805 klass.__name__, str(err)), sys.exc_info()[2]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000806 self.append(value)
807 dispatch[INST] = load_inst
808
809 def load_obj(self):
810 stack = self.stack
811 k = self.marker()
812 klass = stack[k + 1]
813 del stack[k + 1]
Tim Peters2344fae2001-01-15 00:50:52 +0000814 args = tuple(stack[k + 1:])
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000815 del stack[k:]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000816 instantiated = 0
817 if (not args and type(klass) is ClassType and
818 not hasattr(klass, "__getinitargs__")):
819 try:
820 value = _EmptyClass()
821 value.__class__ = klass
822 instantiated = 1
823 except RuntimeError:
824 # In restricted execution, assignment to inst.__class__ is
825 # prohibited
826 pass
827 if not instantiated:
828 value = apply(klass, args)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000829 self.append(value)
Tim Peters2344fae2001-01-15 00:50:52 +0000830 dispatch[OBJ] = load_obj
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000831
832 def load_global(self):
833 module = self.readline()[:-1]
834 name = self.readline()[:-1]
835 klass = self.find_class(module, name)
836 self.append(klass)
837 dispatch[GLOBAL] = load_global
838
839 def find_class(self, module, name):
Barry Warsawbf4d9592001-11-15 23:42:58 +0000840 __import__(module)
841 mod = sys.modules[module]
842 klass = getattr(mod, name)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000843 return klass
844
845 def load_reduce(self):
846 stack = self.stack
847
848 callable = stack[-2]
849 arg_tup = stack[-1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000850 del stack[-2:]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000851
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000852 if type(callable) is not ClassType:
853 if not safe_constructors.has_key(callable):
854 try:
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000855 safe = callable.__safe_for_unpickling__
856 except AttributeError:
857 safe = None
Guido van Rossuma48061a1995-01-10 00:31:14 +0000858
Tim Petersc32d8242001-04-10 02:48:53 +0000859 if not safe:
Tim Peters2344fae2001-01-15 00:50:52 +0000860 raise UnpicklingError, "%s is not safe for " \
861 "unpickling" % callable
Guido van Rossuma48061a1995-01-10 00:31:14 +0000862
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000863 if arg_tup is None:
864 value = callable.__basicnew__()
865 else:
866 value = apply(callable, arg_tup)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000867 self.append(value)
868 dispatch[REDUCE] = load_reduce
Guido van Rossuma48061a1995-01-10 00:31:14 +0000869
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000870 def load_pop(self):
871 del self.stack[-1]
872 dispatch[POP] = load_pop
Guido van Rossum7b5430f1995-03-04 22:25:21 +0000873
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000874 def load_pop_mark(self):
875 k = self.marker()
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000876 del self.stack[k:]
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000877 dispatch[POP_MARK] = load_pop_mark
Guido van Rossuma48061a1995-01-10 00:31:14 +0000878
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000879 def load_dup(self):
Guido van Rossumb1062fc1998-03-31 17:00:46 +0000880 self.append(self.stack[-1])
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000881 dispatch[DUP] = load_dup
Guido van Rossuma48061a1995-01-10 00:31:14 +0000882
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000883 def load_get(self):
884 self.append(self.memo[self.readline()[:-1]])
885 dispatch[GET] = load_get
Guido van Rossum78536471996-04-12 13:36:27 +0000886
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000887 def load_binget(self):
888 i = mloads('i' + self.read(1) + '\000\000\000')
889 self.append(self.memo[`i`])
890 dispatch[BINGET] = load_binget
Guido van Rossum78536471996-04-12 13:36:27 +0000891
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000892 def load_long_binget(self):
893 i = mloads('i' + self.read(4))
894 self.append(self.memo[`i`])
895 dispatch[LONG_BINGET] = load_long_binget
Guido van Rossum78536471996-04-12 13:36:27 +0000896
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000897 def load_put(self):
898 self.memo[self.readline()[:-1]] = self.stack[-1]
899 dispatch[PUT] = load_put
Guido van Rossuma48061a1995-01-10 00:31:14 +0000900
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000901 def load_binput(self):
902 i = mloads('i' + self.read(1) + '\000\000\000')
903 self.memo[`i`] = self.stack[-1]
904 dispatch[BINPUT] = load_binput
Guido van Rossuma48061a1995-01-10 00:31:14 +0000905
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000906 def load_long_binput(self):
907 i = mloads('i' + self.read(4))
908 self.memo[`i`] = self.stack[-1]
909 dispatch[LONG_BINPUT] = load_long_binput
Guido van Rossuma48061a1995-01-10 00:31:14 +0000910
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000911 def load_append(self):
912 stack = self.stack
913 value = stack[-1]
914 del stack[-1]
915 list = stack[-1]
916 list.append(value)
917 dispatch[APPEND] = load_append
Guido van Rossuma48061a1995-01-10 00:31:14 +0000918
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000919 def load_appends(self):
920 stack = self.stack
921 mark = self.marker()
922 list = stack[mark - 1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000923 for i in range(mark + 1, len(stack)):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000924 list.append(stack[i])
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000925
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000926 del stack[mark:]
927 dispatch[APPENDS] = load_appends
Tim Peters2344fae2001-01-15 00:50:52 +0000928
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000929 def load_setitem(self):
930 stack = self.stack
931 value = stack[-1]
932 key = stack[-2]
933 del stack[-2:]
934 dict = stack[-1]
935 dict[key] = value
936 dispatch[SETITEM] = load_setitem
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000937
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000938 def load_setitems(self):
939 stack = self.stack
940 mark = self.marker()
941 dict = stack[mark - 1]
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000942 for i in range(mark + 1, len(stack), 2):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000943 dict[stack[i]] = stack[i + 1]
Guido van Rossuma48061a1995-01-10 00:31:14 +0000944
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000945 del stack[mark:]
946 dispatch[SETITEMS] = load_setitems
Guido van Rossuma48061a1995-01-10 00:31:14 +0000947
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000948 def load_build(self):
949 stack = self.stack
950 value = stack[-1]
951 del stack[-1]
952 inst = stack[-1]
953 try:
954 setstate = inst.__setstate__
955 except AttributeError:
Guido van Rossum45e2fbc1998-03-26 21:13:24 +0000956 try:
957 inst.__dict__.update(value)
958 except RuntimeError:
959 # XXX In restricted execution, the instance's __dict__ is not
960 # accessible. Use the old way of unpickling the instance
961 # variables. This is a semantic different when unpickling in
962 # restricted vs. unrestricted modes.
963 for k, v in value.items():
964 setattr(inst, k, v)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000965 else:
966 setstate(value)
967 dispatch[BUILD] = load_build
Guido van Rossuma48061a1995-01-10 00:31:14 +0000968
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000969 def load_mark(self):
970 self.append(self.mark)
971 dispatch[MARK] = load_mark
Guido van Rossuma48061a1995-01-10 00:31:14 +0000972
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000973 def load_stop(self):
974 value = self.stack[-1]
975 del self.stack[-1]
Guido van Rossumff871742000-12-13 18:11:56 +0000976 raise _Stop(value)
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000977 dispatch[STOP] = load_stop
Guido van Rossuma48061a1995-01-10 00:31:14 +0000978
Guido van Rossume467be61997-12-05 19:42:42 +0000979# Helper class for load_inst/load_obj
980
981class _EmptyClass:
982 pass
Guido van Rossuma48061a1995-01-10 00:31:14 +0000983
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000984# Shorthands
985
Jeremy Hyltonabe2c622001-10-15 21:29:28 +0000986try:
987 from cStringIO import StringIO
988except ImportError:
989 from StringIO import StringIO
Guido van Rossumc7c5e691996-07-22 22:26:07 +0000990
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000991def dump(object, file, bin = 0):
992 Pickler(file, bin).dump(object)
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000993
Guido van Rossumb72cf2d1997-04-09 17:32:51 +0000994def dumps(object, bin = 0):
995 file = StringIO()
996 Pickler(file, bin).dump(object)
997 return file.getvalue()
Guido van Rossum0c891ce1995-03-14 15:09:05 +0000998
999def load(file):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +00001000 return Unpickler(file).load()
Guido van Rossum0c891ce1995-03-14 15:09:05 +00001001
1002def loads(str):
Guido van Rossumb72cf2d1997-04-09 17:32:51 +00001003 file = StringIO(str)
1004 return Unpickler(file).load()