blob: 73c43e22f7ada3a6f398848a68b9b8e48d339984 [file] [log] [blame]
Benjamin Peterson90f5ba52010-03-11 22:53:45 +00001#! /usr/bin/env python3
Guido van Rossum62448671996-09-17 21:33:15 +00002
Thomas Wouters477c8d52006-05-27 19:21:47 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
Thomas Wouters89f507f2006-12-13 04:49:30 +00005# Notes for authors of new mailbox subclasses:
6#
7# Remember to fsync() changes to disk before closing a modified file
8# or returning from a flush() method. See functions _sync_flush() and
9# _sync_close().
10
Thomas Wouters477c8d52006-05-27 19:21:47 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Thomas Wouters477c8d52006-05-27 19:21:47 +000013import time
14import calendar
15import socket
16import errno
17import copy
R. David Murrayb7deff12011-01-30 06:21:28 +000018import warnings
Thomas Wouters477c8d52006-05-27 19:21:47 +000019import email
Thomas Woutersb2137042007-02-01 18:02:27 +000020import email.message
21import email.generator
Guido van Rossum34d19282007-08-09 01:03:29 +000022import io
R David Murray05ff9902011-06-17 12:54:56 -040023import contextlib
Thomas Wouters477c8d52006-05-27 19:21:47 +000024try:
Thomas Wouters0e3f5912006-08-11 14:57:12 +000025 if sys.platform == 'os2emx':
26 # OS/2 EMX fcntl() not adequate
27 raise ImportError
28 import fcntl
Thomas Wouters477c8d52006-05-27 19:21:47 +000029except ImportError:
30 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000031
Thomas Wouters477c8d52006-05-27 19:21:47 +000032__all__ = [ 'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
33 'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
Benjamin Peterson8041d472008-05-11 16:17:24 +000034 'BabylMessage', 'MMDFMessage']
Thomas Wouters477c8d52006-05-27 19:21:47 +000035
R. David Murrayb7deff12011-01-30 06:21:28 +000036linesep = os.linesep.encode('ascii')
37
class Mailbox:
    """A group of messages in a particular place.

    This base class supplies the mapping-style convenience methods (get,
    keys, values, items, pop, popitem, update, clear, ...) on top of a small
    set of primitives that raise NotImplementedError here and must be
    provided by a subclass: add, remove, __setitem__, get_message,
    get_bytes, get_file, iterkeys, __contains__, __len__, flush, lock,
    unlock and close.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded and made absolute.  factory, when set, is
        called by __getitem__ with a file-like object to build the returned
        message.  create is accepted for the benefit of subclasses; this
        base class does not use it.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Support ``del mailbox[key]`` by delegating to remove()."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist.

        Without a factory the subclass's get_message() result is returned;
        with one, the factory is applied to the message's file object.
        """
        if not self._factory:
            return self.get_message(key)
        # closing() releases the file even when the factory raises.
        with contextlib.closing(self.get_file(key)) as file:
            return self._factory(file)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError.

        Uses email.message.Message to create a 7bit clean string
        representation of the message."""
        return email.message_from_bytes(self.get_bytes(key)).as_string()

    def get_bytes(self, key):
        """Return a byte string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages.

        Keys are snapshotted first; a key whose message has vanished by the
        time it is fetched (KeyError) is silently skipped.
        """
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield value

    def __iter__(self):
        """Iterate over messages (not keys)."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples.

        Like itervalues(), keys that raise KeyError on fetch are skipped.
        """
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield (key, value)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            result = self[key]
        except KeyError:
            return default
        self.discard(key)
        return result

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError when the mailbox holds no messages.
        """
        for key in self.keys():
            return (key, self.pop(key))     # This is only run once.
        raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be an object with an iteritems() method (such as another
        Mailbox), an object with an items() method (such as a dict), or any
        iterable of (key, message) pairs.  Calling update() with no
        argument, or with None, does nothing.

        Every pair is attempted; if any key did not exist, a single
        KeyError is raised after all pairs have been processed.
        """
        if arg is None:
            return
        if hasattr(arg, 'iteritems'):
            # Call the method that was actually detected, so objects that
            # only provide iteritems() are supported.
            source = arg.iteritems()
        elif hasattr(arg, 'items'):
            source = arg.items()
        else:
            source = arg
        bad_key = False
        for key, message in source:
            try:
                self[key] = message
            except KeyError:
                bad_key = True
        if bad_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _string_to_bytes(self, message):
        """Encode an ASCII-only str as bytes; raise ValueError otherwise."""
        # If a message is not 7bit clean, we refuse to handle it since it
        # likely came from reading invalid messages in text mode, and that way
        # lies mojibake.
        try:
            return message.encode('ascii')
        except UnicodeError:
            raise ValueError("String input must be ASCII-only; "
                "use bytes or a Message instead")

    def _dump_message(self, message, target, mangle_from_=False):
        """Dump message contents to target file.

        This assumes the target file is open in binary mode.  message may
        be an email.message.Message, a str, bytes, an io.StringIO
        (deprecated), or any object with read()/readline() (text-mode files
        are deprecated; their underlying binary buffer is used).  Newlines
        are written using the platform line separator.  When mangle_from_
        is true, body lines beginning with "From " are escaped as ">From ".
        Raises TypeError for any other message type.
        """
        if isinstance(message, email.message.Message):
            buffer = io.BytesIO()
            gen = email.generator.BytesGenerator(buffer, mangle_from_, 0)
            gen.flatten(message)
            buffer.seek(0)
            data = buffer.read()
            data = data.replace(b'\n', linesep)
            target.write(data)
        elif isinstance(message, (str, bytes, io.StringIO)):
            if isinstance(message, io.StringIO):
                warnings.warn("Use of StringIO input is deprecated, "
                    "use BytesIO instead", DeprecationWarning, 3)
                message = message.getvalue()
            if isinstance(message, str):
                message = self._string_to_bytes(message)
            if mangle_from_:
                message = message.replace(b'\nFrom ', b'\n>From ')
            message = message.replace(b'\n', linesep)
            target.write(message)
        elif hasattr(message, 'read'):
            if hasattr(message, 'buffer'):
                warnings.warn("Use of text mode files is deprecated, "
                    "use a binary mode file instead", DeprecationWarning, 3)
                message = message.buffer
            while True:
                line = message.readline()
                # Universal newline support.
                if line.endswith(b'\r\n'):
                    line = line[:-2] + b'\n'
                elif line.endswith(b'\r'):
                    line = line[:-1] + b'\n'
                if not line:
                    break
                if mangle_from_ and line.startswith(b'From '):
                    line = b'>From ' + line[5:]
                line = line.replace(b'\n', linesep)
                target.write(line)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
253
254
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages are individual files in the 'new' and 'cur' subdirectories of
    the mailbox directory; 'tmp' holds files while they are being written.
    A message's key is the part of its file name before the `colon`
    separator; the text after the separator is the message's "info".
    """

    colon = ':'

    def __init__(self, dirname, factory=None, create=True):
        """Initialize a Maildir instance.

        If dirname does not exist it is created (together with tmp, new and
        cur, all mode 0o700) when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        self._paths = {
            'tmp': os.path.join(self._path, 'tmp'),
            'new': os.path.join(self._path, 'new'),
            'cur': os.path.join(self._path, 'cur'),
            }
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                for path in self._paths.values():
                    os.mkdir(path, 0o700)
            else:
                raise NoSuchMailboxError(self._path)
        self._toc = {}      # key -> path relative to the mailbox directory
        self._toc_mtimes = {'cur': 0, 'new': 0}
        self._last_read = 0         # Records last time we read cur/new
        self._skewfactor = 0.1      # Adjust if os/fs clocks are skewing

    def add(self, message):
        """Add message and return assigned key.

        The message is first written to a uniquely named file in tmp and
        then linked (or renamed) into its destination subdirectory.  Raises
        ExternalClashError if the destination name already exists.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        except BaseException:
            # Do not leave a half-written file behind in tmp.
            tmp_file.close()
            os.remove(tmp_file.name)
            raise
        _sync_close(tmp_file)
        if isinstance(message, MaildirMessage):
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                suffix = ''
        else:
            subdir = 'new'
            suffix = ''
        uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        try:
            if hasattr(os, 'link'):
                os.link(tmp_file.name, dest)
                os.remove(tmp_file.name)
            else:
                os.rename(tmp_file.name, dest)
        except OSError as e:
            os.remove(tmp_file.name)
            if e.errno == errno.EEXIST:
                raise ExternalClashError('Name clash with existing message: %s'
                                         % dest)
            else:
                raise
        if isinstance(message, MaildirMessage):
            # Carry the message's date over as the file's mtime.
            os.utime(dest, (os.path.getatime(dest), message.get_date()))
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        os.remove(os.path.join(self._path, self._lookup(key)))

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass.
        try:
            self.remove(key)
        except KeyError:
            pass
        except OSError as e:
            # The file may have disappeared between lookup and removal.
            if e.errno != errno.ENOENT:
                raise

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist.

        The new message is added under a temporary key and then renamed
        over the old key.  Subdirectory and info suffix come from message
        when it is a MaildirMessage, otherwise from the message replaced.
        """
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        if isinstance(message, MaildirMessage):
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        else:
            suffix = ''
        self.discard(key)
        new_path = os.path.join(self._path, subdir, key + suffix)
        os.rename(os.path.join(self._path, temp_subpath), new_path)
        if isinstance(message, MaildirMessage):
            os.utime(new_path, (os.path.getatime(new_path),
                                message.get_date()))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The result's subdir, info and date are filled in from the file's
        location, name suffix and mtime respectively.
        """
        subpath = self._lookup(key)
        with open(os.path.join(self._path, subpath), 'rb') as f:
            if self._factory:
                msg = self._factory(f)
            else:
                msg = MaildirMessage(f)
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(os.path.join(self._path, subpath)))
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError."""
        with open(os.path.join(self._path, self._lookup(key)), 'rb') as f:
            return f.read().replace(linesep, b'\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        f = open(os.path.join(self._path, self._lookup(key)), 'rb')
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys.

        Keys that can no longer be looked up are skipped.
        """
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                continue
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        # Maildir changes are always written immediately, so there's nothing
        # to do.
        pass

    def lock(self):
        """Lock the mailbox.  This implementation does nothing."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked.  This implementation does nothing."""
        return

    def close(self):
        """Flush and close the mailbox.  This implementation does nothing."""
        return

    def list_folders(self):
        """Return a list of folder names.

        A folder is a subdirectory of the mailbox whose name starts with a
        dot and is longer than one character; the dot is stripped.
        """
        return [entry[1:] for entry in os.listdir(self._path)
                if len(entry) > 1 and entry[0] == '.' and
                os.path.isdir(os.path.join(self._path, entry))]

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        return Maildir(os.path.join(self._path, '.' + folder),
                       factory=self._factory,
                       create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it.

        An empty 'maildirfolder' marker file is created inside the folder
        if it is not already present.
        """
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        maildirfolder_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(maildirfolder_path):
            os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY,
                0o666))
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        Raises NotEmptyError if new or cur holds a non-dot file, or if the
        folder contains a subdirectory other than new, cur and tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        for entry in os.listdir(os.path.join(path, 'new')) + \
                     os.listdir(os.path.join(path, 'cur')):
            if len(entry) < 1 or entry[0] != '.':
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry not in ('new', 'cur', 'tmp') and \
               os.path.isdir(os.path.join(path, entry)):
                # Quote the offending subdirectory, then name the folder.
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (entry, folder))
        # Bottom-up walk so directories are empty by the time we rmdir them.
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp".

        A file is old when it was last accessed more than 36 hours ago.
        """
        now = time.time()
        for entry in os.listdir(os.path.join(self._path, 'tmp')):
            path = os.path.join(self._path, 'tmp', entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        The name combines the time, the process id, a class-wide counter
        and the host name.  Raises ExternalClashError if that name is
        already taken.
        """
        now = time.time()
        hostname = socket.gethostname()
        # '/' and ':' are replaced by their octal escapes in the file name.
        if '/' in hostname:
            hostname = hostname.replace('/', r'\057')
        if ':' in hostname:
            hostname = hostname.replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except OSError as e:
            if e.errno == errno.ENOENT:
                Maildir._count += 1
                try:
                    return _create_carefully(path)
                except OSError as e:
                    if e.errno != errno.EEXIST:
                        raise
            else:
                raise

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping."""
        # If it has been less than two seconds since the last _refresh() call,
        # we have to unconditionally re-read the mailbox just in case it has
        # been modified, because os.path.mtime() has a 2 sec resolution in the
        # most common worst case (FAT) and a 1 sec resolution typically.  This
        # results in a few unnecessary re-reads when _refresh() is called
        # multiple times in that interval, but once the clock ticks over, we
        # will only re-read as needed.  Because the filesystem might be being
        # served by an independent system with its own clock, we record and
        # compare with the mtimes from the filesystem.  Because the other
        # system's clock might be skewing relative to our clock, we add an
        # extra delta to our wait.  The default is one tenth second, but is an
        # instance variable and so can be adjusted if dealing with a
        # particularly skewed or irregular system.
        if time.time() - self._last_read > 2 + self._skewfactor:
            refresh = False
            for subdir in self._toc_mtimes:
                mtime = os.path.getmtime(self._paths[subdir])
                if mtime > self._toc_mtimes[subdir]:
                    refresh = True
                self._toc_mtimes[subdir] = mtime
            if not refresh:
                return
        # Refresh toc
        self._toc = {}
        for subdir in self._toc_mtimes:
            path = self._paths[subdir]
            for entry in os.listdir(path):
                p = os.path.join(path, entry)
                if os.path.isdir(p):
                    continue
                uniq = entry.split(self.colon)[0]
                self._toc[uniq] = os.path.join(subdir, entry)
        self._last_read = time.time()

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        try:
            # Fast path: the cached entry still exists on disk.
            if os.path.exists(os.path.join(self._path, self._toc[key])):
                return self._toc[key]
        except KeyError:
            pass
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration.

        Returns None once the keys captured on the first call are used up.
        """
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = iter(self.keys())
        while True:
            try:
                return self[next(self._onetime_keys)]
            except StopIteration:
                return None
            except KeyError:
                continue
567
568
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    All messages live in one file.  self._toc maps each key to the
    (start, stop) byte offsets of its message; it is built lazily by
    _generate_toc(), which, like _install_message(), is not defined in this
    class and is expected to come from a subclass.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        The file is opened for update; if that is refused (EACCES/EROFS) it
        is opened read-only.  A missing file is created when create is
        true, otherwise NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            f = open(self._path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                if create:
                    f = open(self._path, 'wb+')
                else:
                    raise NoSuchMailboxError(self._path)
            elif e.errno in (errno.EACCES, errno.EROFS):
                f = open(self._path, 'rb')
            else:
                raise
        self._file = f
        self._toc = None
        self._next_key = 0
        self._pending = False       # No changes require rewriting the file.
        self._pending_sync = False  # No need to sync the file
        self._locked = False
        self._file_length = None    # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        self._toc[self._next_key] = self._append_message(message)
        self._next_key += 1
        # _append_message appends the message to the mailbox file. We
        # don't need a full rewrite + rename, sync is enough.
        self._pending_sync = True
        return self._next_key - 1

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        for key in self._toc.keys():
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        If messages were only appended, the file is just synced.  If
        messages were removed or replaced, the surviving messages are
        copied to a temporary file which then replaces the mailbox file.
        Raises ExternalClashError if the file's size differs from the size
        recorded at the last scan or append.
        """
        if not self._pending:
            if self._pending_sync:
                # Messages have only been added, so syncing the file
                # is enough.
                _sync_flush(self._file)
                self._pending_sync = False
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc.keys()):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                # Copy the message in chunks of at most 4096 bytes.
                while True:
                    buffer = self._file.read(min(4096,
                                                 stop - self._file.tell()))
                    if not buffer:
                        break
                    new_file.write(buffer)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
            self._file_length = new_file.tell()
        except BaseException:
            # Clean up the temporary file on any failure, then re-raise.
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        try:
            os.rename(new_file.name, self._path)
        except OSError as e:
            if e.errno == errno.EEXIST or \
              (os.name == 'os2' and e.errno == errno.EACCES):
                os.remove(self._path)
                os.rename(new_file.name, self._path)
            else:
                raise
        self._file = open(self._path, 'rb+')
        self._toc = new_toc
        self._pending = False
        self._pending_sync = False
        if self._locked:
            # Re-acquire the lock on the freshly opened file object.
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox.

        The mailbox is unlocked and its file closed even if flushing (or
        unlocking) raises; the exception then propagates to the caller.
        """
        try:
            self.flush()
        finally:
            try:
                if self._locked:
                    self.unlock()
            finally:
                self._file.close()  # Sync has been done by self.flush() above.

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        Generates the table of contents on first use.  With key=None the
        call only ensures the table exists and returns None.
        """
        if self._toc is None:
            self._generate_toc()
        if key is not None:
            try:
                return self._toc[key]
            except KeyError:
                raise KeyError('No message with key: %s' % key)

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets.

        If writing fails, the file is truncated back to its previous length
        before the exception is re-raised.
        """
        self._file.seek(0, 2)
        before = self._file.tell()
        if len(self._toc) == 0 and not self._pending:
            # This is the first message, and the _pre_mailbox_hook
            # hasn't yet been called. If self._pending is True,
            # messages have been removed, so _pre_mailbox_hook must
            # have been called already.
            self._pre_mailbox_hook(self._file)
        try:
            self._pre_message_hook(self._file)
            offsets = self._install_message(message)
            self._post_message_hook(self._file)
        except BaseException:
            self._file.truncate(before)
            raise
        self._file.flush()
        self._file_length = self._file.tell()  # Record current length of mailbox
        return offsets
759
760
761
class _mboxMMDF(_singlefileMailbox):
    """An mbox or MMDF mailbox.

    Shared implementation for the two single-file formats in which every
    stored message starts with a "From " envelope line.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        # The first stored line is the "From " envelope line.
        from_line = self._file.readline().replace(linesep, b'')
        string = self._file.read(stop - self._file.tell())
        msg = self._message_factory(string.replace(linesep, b'\n'))
        # Drop the leading b'From ' (5 bytes); the rest is the envelope data.
        msg.set_from(from_line[5:].decode('ascii'))
        return msg

    def get_string(self, key, from_=False):
        """Return a string representation or raise a KeyError.

        When from_ is true the stored "From " envelope line is included.
        """
        # from_ must be forwarded to get_bytes(): otherwise the stored
        # envelope line is stripped before parsing and as_string() has no
        # real "From " line to emit.
        return email.message_from_bytes(
            self.get_bytes(key, from_)).as_string(unixfrom=from_)

    def get_bytes(self, key, from_=False):
        """Return a bytes representation or raise a KeyError.

        When from_ is false the leading "From " envelope line is skipped.
        Platform line separators are converted to b'\\n'.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        if not from_:
            self._file.readline()
        string = self._file.read(stop - self._file.tell())
        return string.replace(linesep, b'\n')

    def get_file(self, key, from_=False):
        """Return a file-like representation or raise a KeyError.

        When from_ is false the returned view starts after the "From "
        envelope line.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        if not from_:
            self._file.readline()
        return _PartialFile(self._file, self._file.tell(), stop)

    def _install_message(self, message):
        """Format a message and blindly write to self._file.

        Returns the (start, stop) file offsets of the written message.
        The envelope line is taken from the message when it provides one;
        otherwise a "From MAILER-DAEMON <UTC asctime>" line is generated.
        """
        from_line = None
        if isinstance(message, str):
            message = self._string_to_bytes(message)
        if isinstance(message, bytes) and message.startswith(b'From '):
            # Split an embedded envelope line off the front of the payload.
            newline = message.find(b'\n')
            if newline != -1:
                from_line = message[:newline]
                message = message[newline + 1:]
            else:
                from_line = message
                message = b''
        elif isinstance(message, _mboxMMDFMessage):
            author = message.get_from().encode('ascii')
            from_line = b'From ' + author
        elif isinstance(message, email.message.Message):
            from_line = message.get_unixfrom()  # May be None.
            if from_line is not None:
                from_line = from_line.encode('ascii')
        if from_line is None:
            from_line = b'From MAILER-DAEMON ' + time.asctime(time.gmtime()).encode()
        start = self._file.tell()
        self._file.write(from_line + linesep)
        self._dump_message(message, self._file, self._mangle_from_)
        stop = self._file.tell()
        return (start, stop)
826
827
class mbox(_mboxMMDF):
    """A classic mbox mailbox."""

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Set the mbox message factory, then run the shared initializer."""
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Write a separating line before every message but the first."""
        at_file_start = f.tell() == 0
        if not at_file_start:
            f.write(linesep)

    def _generate_toc(self):
        """Scan the file and build the key-to-(start, stop) table."""
        begin_offsets = []
        end_offsets = []
        self._file.seek(0)
        while True:
            offset = self._file.tell()
            data = self._file.readline()
            if not data:
                # End of file: record it as a stop offset.  If no message is
                # open the extra entry is dropped by zip() below.
                end_offsets.append(offset)
                break
            if data.startswith(b'From '):
                if len(end_offsets) < len(begin_offsets):
                    # Close the previous message just before the separator
                    # line that precedes this "From " line.
                    end_offsets.append(offset - len(linesep))
                begin_offsets.append(offset)
        self._toc = dict(enumerate(zip(begin_offsets, end_offsets)))
        self._next_key = len(self._toc)
        self._file_length = self._file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000860
861
class MMDF(_mboxMMDF):
    """An MMDF mailbox."""

    def __init__(self, path, factory=None, create=True):
        """Set the MMDF message factory, then run the shared initializer."""
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Write the four-^A delimiter line that opens a message."""
        f.write(b'\001\001\001\001' + linesep)

    def _post_message_hook(self, f):
        """Write a line break and the four-^A delimiter line after a message."""
        f.write(linesep + b'\001\001\001\001' + linesep)

    def _generate_toc(self):
        """Scan the file and build the key-to-(start, stop) table."""
        delimiter = b'\001\001\001\001' + linesep
        begin_offsets = []
        end_offsets = []
        self._file.seek(0)
        while True:
            data = self._file.readline()
            if not data:
                break
            if not data.startswith(delimiter):
                continue
            # A message begins right after its opening delimiter line.
            cursor = self._file.tell()
            begin_offsets.append(cursor)
            while True:
                line_start = cursor
                data = self._file.readline()
                cursor = self._file.tell()
                if data == delimiter:
                    # Exclude the line break written before the delimiter.
                    end_offsets.append(line_start - len(linesep))
                    break
                if not data:
                    # Unterminated message: it runs to the end of the file.
                    end_offsets.append(line_start)
                    break
        self._toc = dict(enumerate(zip(begin_offsets, end_offsets)))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000905
906
class MH(Mailbox):
    """An MH mailbox.

    Each message is a file named by its integer key inside the mailbox
    directory; sequences are kept in the '.mh_sequences' file.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize an MH instance.

        If the directory does not exist it is created (together with an
        empty '.mh_sequences' file) when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, path, factory, create)
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                os.close(os.open(os.path.join(self._path, '.mh_sequences'),
                                 os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0o600))
            else:
                raise NoSuchMailboxError(self._path)
        self._locked = False

    def add(self, message):
        """Add message and return assigned key."""
        keys = self.keys()
        if len(keys) == 0:
            new_key = 1
        else:
            new_key = max(keys) + 1
        new_path = os.path.join(self._path, str(new_key))
        f = _create_carefully(new_path)
        closed = False
        try:
            if self._locked:
                _lock_file(f)
            try:
                try:
                    self._dump_message(message, f)
                except BaseException:
                    # Unlock and close so it can be deleted on Windows
                    if self._locked:
                        _unlock_file(f)
                    _sync_close(f)
                    closed = True
                    os.remove(new_path)
                    raise
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, new_key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            if not closed:
                _sync_close(f)
        return new_key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        path = os.path.join(self._path, str(key))
        try:
            # Opening the file is only an existence/accessibility probe.
            f = open(path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        else:
            f.close()
            os.remove(path)

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        path = os.path.join(self._path, str(key))
        try:
            f = open(path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        try:
            if self._locked:
                _lock_file(f)
            try:
                # Truncate through a second descriptor, then rewrite via f.
                os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
                self._dump_message(message, f)
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            _sync_close(f)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        try:
            if self._locked:
                f = open(os.path.join(self._path, str(key)), 'rb+')
            else:
                f = open(os.path.join(self._path, str(key)), 'rb')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        try:
            if self._locked:
                _lock_file(f)
            try:
                msg = MHMessage(f)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            f.close()
        # Attach every sequence that lists this key.
        for name, key_list in self.get_sequences().items():
            if key in key_list:
                msg.add_sequence(name)
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError."""
        try:
            if self._locked:
                f = open(os.path.join(self._path, str(key)), 'rb+')
            else:
                f = open(os.path.join(self._path, str(key)), 'rb')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        try:
            if self._locked:
                _lock_file(f)
            try:
                return f.read().replace(linesep, b'\n')
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            f.close()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        try:
            f = open(os.path.join(self._path, str(key)), 'rb')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        return iter(sorted(int(entry) for entry in os.listdir(self._path)
                           if entry.isdigit()))

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        return os.path.exists(os.path.join(self._path, str(key)))

    def __len__(self):
        """Return a count of messages in the mailbox."""
        return len(list(self.keys()))

    def lock(self):
        """Lock the mailbox.

        The lock is taken on the '.mh_sequences' file.  If locking fails
        the file opened for it is closed again before the exception
        propagates, so a failed lock() does not leak a file handle.
        """
        if not self._locked:
            self._file = open(os.path.join(self._path, '.mh_sequences'), 'rb+')
            try:
                _lock_file(self._file)
            except BaseException:
                self._file.close()
                del self._file
                raise
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            _sync_close(self._file)
            del self._file
            self._locked = False

    def flush(self):
        """Write any pending changes to the disk."""
        return

    def close(self):
        """Flush and close the mailbox."""
        if self._locked:
            self.unlock()

    def list_folders(self):
        """Return a list of folder names."""
        result = []
        for entry in os.listdir(self._path):
            if os.path.isdir(os.path.join(self._path, entry)):
                result.append(entry)
        return result

    def get_folder(self, folder):
        """Return an MH instance for the named folder."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory, create=False)

    def add_folder(self, folder):
        """Create a folder and return an MH instance representing it."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory)

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        A folder containing only '.mh_sequences' counts as empty.  Raises
        NotEmptyError naming the folder's path otherwise.
        """
        path = os.path.join(self._path, folder)
        entries = os.listdir(path)
        if entries == ['.mh_sequences']:
            os.remove(os.path.join(path, '.mh_sequences'))
        elif entries == []:
            pass
        else:
            # Report the folder that is not empty, not its parent mailbox.
            raise NotEmptyError('Folder not empty: %s' % path)
        os.rmdir(path)

    def get_sequences(self):
        """Return a name-to-key-list dictionary to define each sequence.

        Keys that do not correspond to an existing message are dropped, and
        sequences left empty are omitted.  Raises FormatError for a line
        that cannot be parsed.
        """
        results = {}
        with open(os.path.join(self._path, '.mh_sequences'), 'r') as f:
            all_keys = set(self.keys())
            for line in f:
                try:
                    name, contents = line.split(':')
                    keys = set()
                    for spec in contents.split():
                        if spec.isdigit():
                            keys.add(int(spec))
                        else:
                            # A "start-stop" range, inclusive on both ends.
                            start, stop = (int(x) for x in spec.split('-'))
                            keys.update(range(start, stop + 1))
                    results[name] = [key for key in sorted(keys)
                                     if key in all_keys]
                    if len(results[name]) == 0:
                        del results[name]
                except ValueError:
                    raise FormatError('Invalid sequence specification: %s' %
                                      line.rstrip())
        return results

    def set_sequences(self, sequences):
        """Set sequences using the given name-to-key-list dictionary.

        Runs of consecutive keys are written as "first-last" ranges; empty
        sequences are skipped.
        """
        f = open(os.path.join(self._path, '.mh_sequences'), 'r+')
        try:
            # Truncate through a second descriptor, then rewrite via f.
            os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
            for name, keys in sequences.items():
                if len(keys) == 0:
                    continue
                f.write(name + ':')
                prev = None
                completing = False  # True while inside a "first-" range.
                for key in sorted(set(keys)):
                    if key - 1 == prev:
                        if not completing:
                            completing = True
                            f.write('-')
                    elif completing:
                        completing = False
                        f.write('%s %s' % (prev, key))
                    else:
                        f.write(' %s' % key)
                    prev = key
                if completing:
                    f.write(str(prev) + '\n')
                else:
                    f.write('\n')
        finally:
            _sync_close(f)

    def pack(self):
        """Re-name messages to eliminate numbering gaps.  Invalidates keys."""
        sequences = self.get_sequences()
        prev = 0
        changes = []
        for key in self.keys():
            if key - 1 != prev:
                changes.append((key, prev + 1))
                if hasattr(os, 'link'):
                    os.link(os.path.join(self._path, str(key)),
                            os.path.join(self._path, str(prev + 1)))
                    os.unlink(os.path.join(self._path, str(key)))
                else:
                    os.rename(os.path.join(self._path, str(key)),
                              os.path.join(self._path, str(prev + 1)))
            prev += 1
        self._next_key = prev + 1
        if len(changes) == 0:
            return
        # Rewrite the sequences so they refer to the renumbered keys.
        for name, key_list in sequences.items():
            for old, new in changes:
                if old in key_list:
                    key_list[key_list.index(old)] = new
        self.set_sequences(sequences)

    def _dump_sequences(self, message, key):
        """Inspect a new MHMessage and update sequences appropriately."""
        pending_sequences = message.get_sequences()
        all_sequences = self.get_sequences()
        for name, key_list in all_sequences.items():
            if name in pending_sequences:
                key_list.append(key)
            elif key in key_list:
                del key_list[key_list.index(key)]
        for sequence in pending_sequences:
            if sequence not in all_sequences:
                all_sequences[sequence] = [key]
        self.set_sequences(all_sequences)
1216
1217
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox."""

    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        self._labels = {}  # Maps message key to its list of labels.

    def add(self, message):
        """Add message and return assigned key."""
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip b'1,' line specifying labels.
        original_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == b'*** EOOH ***' + linesep or not line:
                break
            original_headers.write(line.replace(linesep, b'\n'))
        visible_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == linesep or not line:
                break
            visible_headers.write(line.replace(linesep, b'\n'))
        # Read up to the stop, or to the end
        n = stop - self._file.tell()
        assert n >= 0
        body = self._file.read(n)
        body = body.replace(linesep, b'\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError.

        The result is the original headers followed by the body; the
        visible-header section stored after the EOOH marker is skipped.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip b'1,' line specifying labels.
        original_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == b'*** EOOH ***' + linesep or not line:
                break
            original_headers.write(line.replace(linesep, b'\n'))
        # Skip over the visible headers.
        while True:
            line = self._file.readline()
            if line == linesep or not line:
                break
        headers = original_headers.getvalue()
        n = stop - self._file.tell()
        assert n >= 0
        data = self._file.read(n)
        data = data.replace(linesep, b'\n')
        return headers + data

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return io.BytesIO(self.get_bytes(key).replace(b'\n', linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        self._lookup()  # Make sure the table of contents has been built.
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == b'\037\014' + linesep:
                # Start-of-message marker; it also ends any open message.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(linesep))
                starts.append(next_pos)
                # NOTE(review): labels parsed here are bytes, while
                # _pre_mailbox_hook() and _install_message() call .encode()
                # on labels -- confirm the intended label type.
                labels = [label.strip() for label
                          in self._file.readline()[1:].split(b',')
                          if label.strip()]
                label_lists.append(labels)
            elif line == b'\037' or line == b'\037' + linesep:
                if len(stops) < len(starts):
                    stops.append(line_pos - len(linesep))
            elif not line:
                stops.append(line_pos - len(linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        babyl = b'BABYL OPTIONS:' + linesep
        babyl += b'Version: 5' + linesep
        labels = self.get_labels()
        labels = (label.encode() for label in labels)
        babyl += b'Labels:' + b','.join(labels) + linesep
        babyl += b'\037'
        f.write(babyl)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write(b'\014' + linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(linesep + b'\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        The stored layout is: a labels line, the original headers, the
        '*** EOOH ***' marker, the visible headers, then the body.
        Raises TypeError for an unsupported message type.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write(b'1')
            for label in special_labels:
                self._file.write(b', ' + label.encode())
            self._file.write(b',,')
            for label in labels:
                self._file.write(b' ' + label.encode() + b',')
            self._file.write(linesep)
        else:
            self._file.write(b'1,,' + linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = io.BytesIO()
            orig_generator = email.generator.BytesGenerator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            # Copy the original headers, up to and including the blank line.
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace(b'\n', linesep))
                if line == b'\n' or not line:
                    break
            self._file.write(b'*** EOOH ***' + linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = io.BytesIO()
                vis_generator = email.generator.BytesGenerator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # Rewind before reading: flatten() leaves the position at
                # the end of the buffer, so without this the visible
                # headers (and their blank separator) would never be copied.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace(b'\n', linesep))
                    if line == b'\n' or not line:
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace(b'\n', linesep))
                    if line == b'\n' or not line:
                        break
            # orig_buffer is now positioned just past the headers.
            while True:
                buffer = orig_buffer.read(4096)  # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace(b'\n', linesep))
        elif isinstance(message, (bytes, str, io.StringIO)):
            if isinstance(message, io.StringIO):
                warnings.warn("Use of StringIO input is deprecated, "
                    "use BytesIO instead", DeprecationWarning, 3)
                message = message.getvalue()
            if isinstance(message, str):
                message = self._string_to_bytes(message)
            body_start = message.find(b'\n\n') + 2
            if body_start - 2 != -1:
                self._file.write(message[:body_start].replace(b'\n', linesep))
                self._file.write(b'*** EOOH ***' + linesep)
                self._file.write(message[:body_start].replace(b'\n', linesep))
                self._file.write(message[body_start:].replace(b'\n', linesep))
            else:
                # No header/body separator found: store everything as body.
                self._file.write(b'*** EOOH ***' + linesep + linesep)
                self._file.write(message.replace(b'\n', linesep))
        elif hasattr(message, 'readline'):
            if hasattr(message, 'buffer'):
                warnings.warn("Use of text mode files is deprecated, "
                    "use a binary mode file instead", DeprecationWarning, 3)
                message = message.buffer
            original_pos = message.tell()
            first_pass = True
            # The headers are copied twice: once as the original headers
            # and, after rewinding, once as the visible headers.
            while True:
                line = message.readline()
                # Universal newline support.
                if line.endswith(b'\r\n'):
                    line = line[:-2] + b'\n'
                elif line.endswith(b'\r'):
                    line = line[:-1] + b'\n'
                self._file.write(line.replace(b'\n', linesep))
                if line == b'\n' or not line:
                    if first_pass:
                        first_pass = False
                        # The marker belongs only between the two header
                        # copies; writing it after the second pass as well
                        # would put a stray marker in front of the body.
                        self._file.write(b'*** EOOH ***' + linesep)
                        message.seek(original_pos)
                    else:
                        break
            while True:
                buffer = message.read(4096)     # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace(b'\n', linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1458
1459
class Message(email.message.Message):
    """Message with mailbox-format-specific properties."""

    def __init__(self, message=None):
        """Build a Message from another message, bytes, str, file or None.

        Raises TypeError for any other kind of argument.
        """
        if message is None:
            email.message.Message.__init__(self)
            return
        if isinstance(message, email.message.Message):
            # Work on a deep copy so the source message is left untouched.
            self._become_message(copy.deepcopy(message))
            if isinstance(message, Message):
                message._explain_to(self)
            return
        if isinstance(message, bytes):
            parsed = email.message_from_bytes(message)
        elif isinstance(message, str):
            parsed = email.message_from_string(message)
        elif isinstance(message, io.TextIOWrapper):
            parsed = email.message_from_file(message)
        elif hasattr(message, "read"):
            parsed = email.message_from_binary_file(message)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        self._become_message(parsed)

    def _become_message(self, message):
        """Take over the non-format-specific attributes of message."""
        shared_attributes = ('_headers', '_unixfrom', '_payload', '_charset',
                             'preamble', 'epilogue', 'defects',
                             '_default_type')
        source = message.__dict__
        target = self.__dict__
        for attribute in shared_attributes:
            target[attribute] = source[attribute]

    def _explain_to(self, message):
        """Copy format-specific state to message insofar as possible."""
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
        # There's nothing format-specific to explain.
        return None
1494
1495
class MaildirMessage(Message):
    """Message with Maildir-specific properties.

    Tracks the subdirectory ('new' or 'cur'), the "info" string (which
    carries the flags when it starts with '2,') and the delivery date.
    """

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance."""
        # Defaults go in first: Message.__init__ may hand this instance to
        # another message's _explain_to(), which uses the setters below.
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set subdir to 'new' or 'cur'; raise ValueError otherwise."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return as a string the flags that are set."""
        info = self._info
        # Only the "2," style of info string carries flags.
        return info[2:] if info.startswith('2,') else ''

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        ordered = sorted(flags)
        self._info = '2,' + ''.join(ordered)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        # With no flags set there is nothing to remove, and the info
        # string is deliberately left untouched.
        if self.get_flags():
            kept = set(self.get_flags()) - set(flag)
            self.set_flags(''.join(kept))

    def get_date(self):
        """Return delivery date of message, in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set delivery date of message, in seconds since the epoch.

        Raises TypeError if date cannot be converted to a float.
        """
        try:
            self._date = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)

    def get_info(self):
        """Get the message's "info" as a string."""
        return self._info

    def set_info(self, info):
        """Set the message's "info" string; raise TypeError if not a str."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Copy Maildir-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
            return

        if isinstance(message, _mboxMMDFMessage):
            own = set(self.get_flags())
            if 'S' in own:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            for src, dst in (('T', 'D'), ('F', 'F'), ('R', 'A')):
                if src in own:
                    message.add_flag(dst)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
            return

        if isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_sequence('unseen')
            for src, dst in (('R', 'replied'), ('F', 'flagged')):
                if src in own:
                    message.add_sequence(dst)
            return

        if isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_label('unseen')
            for src, dst in (('T', 'deleted'), ('R', 'answered'),
                             ('P', 'forwarded')):
                if src in own:
                    message.add_label(dst)
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1601
1602
class _mboxMMDFMessage(Message):
    """Message with mbox- or MMDF-specific properties.

    Keeps the contents of the "From " line and stores flags in the
    Status and X-Status headers.
    """

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance."""
        # Default "From " line; replaced below when the source message
        # carries its own envelope header.
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()
            if envelope is not None and envelope.startswith('From '):
                self.set_from(envelope[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return contents of "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set "From " line, formatting and appending time_ if specified.

        time_ may be True (meaning the current UTC time) or a value
        accepted by time.asctime().
        """
        if time_ is True:
            time_ = time.gmtime()
        if time_ is not None:
            from_ = from_ + ' ' + time.asctime(time_)
        self._from = from_

    def get_flags(self):
        """Return as a string the flags that are set."""
        status = self.get('Status', '')
        xstatus = self.get('X-Status', '')
        return status + xstatus

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        pending = set(flags)
        # R and O live in Status; D, F and A lead X-Status, in this order.
        status = ''.join(f for f in ('R', 'O') if f in pending)
        xstatus = ''.join(f for f in ('D', 'F', 'A') if f in pending)
        pending.difference_update('RODFA')
        # Any other flags are appended to X-Status in sorted order.
        xstatus += ''.join(sorted(pending))
        for header, value in (('Status', status), ('X-Status', xstatus)):
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        # Without either header there are no flags, and none are created.
        if 'Status' in self or 'X-Status' in self:
            kept = set(self.get_flags()) - set(flag)
            self.set_flags(''.join(kept))

    def _explain_to(self, message):
        """Copy mbox- or MMDF-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            own = set(self.get_flags())
            if 'O' in own:
                message.set_subdir('cur')
            for src, dst in (('F', 'F'), ('A', 'R'), ('R', 'S'), ('D', 'T')):
                if src in own:
                    message.add_flag(dst)
            del message['status']
            del message['x-status']
            # The last five fields of the "From " line are tried as an
            # asctime()-style date; if they do not parse, the date is
            # simply left alone.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
            return

        if isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
            return

        if isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_sequence('unseen')
            for src, dst in (('A', 'replied'), ('F', 'flagged')):
                if src in own:
                    message.add_sequence(dst)
            del message['status']
            del message['x-status']
            return

        if isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_label('unseen')
            for src, dst in (('D', 'deleted'), ('A', 'answered')):
                if src in own:
                    message.add_label(dst)
            del message['status']
            del message['x-status']
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1712
1713
class mboxMessage(_mboxMMDFMessage):
    """Message with mbox-specific properties.

    All behavior is inherited from _mboxMMDFMessage.
    """
1716
1717
class MHMessage(Message):
    """Message with MH-specific properties.

    Keeps the list of names of the sequences that include the message.
    """

    def __init__(self, message=None):
        """Initialize an MHMessage instance."""
        # Set before Message.__init__, which may trigger a conversion
        # that calls add_sequence() on this instance.
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a list of sequences that include the message."""
        return self._sequences[:]

    def set_sequences(self, sequences):
        """Set the list of sequences that include the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence to list of sequences including the message.

        Raises TypeError if sequence is not a str.
        """
        if not isinstance(sequence, str):
            raise TypeError('sequence type must be str: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove sequence from the list of sequences including the message."""
        try:
            self._sequences.remove(sequence)
        except ValueError:
            # Not a member: nothing to do.
            pass

    def _explain_to(self, message):
        """Copy MH-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            names = set(self.get_sequences())
            # The message goes to 'cur' whether or not it is unseen; only
            # the S flag depends on the 'unseen' sequence.
            message.set_subdir('cur')
            if 'unseen' not in names:
                message.add_flag('S')
            for src, dst in (('flagged', 'F'), ('replied', 'R')):
                if src in names:
                    message.add_flag(dst)
            return

        if isinstance(message, _mboxMMDFMessage):
            names = set(self.get_sequences())
            message.add_flag('O' if 'unseen' in names else 'RO')
            for src, dst in (('flagged', 'F'), ('replied', 'A')):
                if src in names:
                    message.add_flag(dst)
            return

        if isinstance(message, MHMessage):
            for name in self.get_sequences():
                message.add_sequence(name)
            return

        if isinstance(message, BabylMessage):
            names = set(self.get_sequences())
            for src, dst in (('unseen', 'unseen'), ('replied', 'answered')):
                if src in names:
                    message.add_label(dst)
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1786
1787
class BabylMessage(Message):
    """Message with Babyl-specific properties.

    Keeps a list of labels and a separate Message holding the visible
    headers.
    """

    def __init__(self, message=None):
        """Initialize a BabylMessage instance."""
        # Set before Message.__init__, which may trigger a conversion
        # that calls add_label() or set_visible() on this instance.
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a list of labels on the message."""
        return self._labels[:]

    def set_labels(self, labels):
        """Set the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label to list of labels on the message.

        Raises TypeError if label is not a str.
        """
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove label from the list of labels on the message."""
        try:
            self._labels.remove(label)
        except ValueError:
            # Not present: nothing to do.
            pass

    def get_visible(self):
        """Return a Message representation of visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Set the Message representation of visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Update and/or sensibly generate a set of visible headers."""
        visible = self._visible
        # First pass: refresh visible headers that still exist on the
        # message and drop the ones that no longer do.
        for name in visible.keys():
            if name in self:
                visible.replace_header(name, self[name])
            else:
                del visible[name]
        # Second pass: add these headers if the message has them and
        # they are not yet visible.
        for name in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if name in self and name not in visible:
                visible[name] = self[name]

    def _explain_to(self, message):
        """Copy Babyl-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            own = set(self.get_labels())
            # The message goes to 'cur' whether or not it is unseen; only
            # the S flag depends on the 'unseen' label.
            message.set_subdir('cur')
            if 'unseen' not in own:
                message.add_flag('S')
            if 'forwarded' in own or 'resent' in own:
                message.add_flag('P')
            for src, dst in (('answered', 'R'), ('deleted', 'T')):
                if src in own:
                    message.add_flag(dst)
            return

        if isinstance(message, _mboxMMDFMessage):
            own = set(self.get_labels())
            message.add_flag('O' if 'unseen' in own else 'RO')
            for src, dst in (('deleted', 'D'), ('answered', 'A')):
                if src in own:
                    message.add_flag(dst)
            return

        if isinstance(message, MHMessage):
            own = set(self.get_labels())
            for src, dst in (('unseen', 'unseen'), ('answered', 'replied')):
                if src in own:
                    message.add_sequence(dst)
            return

        if isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
            return

        # A plain Message has no format-specific state to receive.
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1879
1880
class MMDFMessage(_mboxMMDFMessage):
    """Message with MMDF-specific properties.

    All behavior is inherited from _mboxMMDFMessage.
    """
1883
1884
class _ProxyFile:
    """A read-only wrapper of a file.

    The proxy keeps its own position and seeks the underlying file to it
    before every read, so the underlying file's position may be changed
    by others between calls.
    """

    def __init__(self, f, pos=None):
        """Initialize a _ProxyFile.

        f is the underlying file object; pos is the starting position,
        defaulting to f's current position.
        """
        self._file = f
        if pos is None:
            self._pos = f.tell()
        else:
            self._pos = pos

    def read(self, size=None):
        """Read bytes."""
        return self._read(size, self._file.read)

    def read1(self, size=None):
        """Read bytes."""
        return self._read(size, self._file.read1)

    def readline(self, size=None):
        """Read a line."""
        return self._read(size, self._file.readline)

    def readlines(self, sizehint=None):
        """Read multiple lines.

        If sizehint is given, stop once the lines read so far total at
        least sizehint bytes.
        """
        result = []
        for line in self:
            result.append(line)
            if sizehint is not None:
                sizehint -= len(line)
                if sizehint <= 0:
                    break
        return result

    def __iter__(self):
        """Iterate over lines."""
        while True:
            line = self.readline()
            if not line:
                # A generator must end with return: under PEP 479 an
                # explicit ``raise StopIteration`` here surfaces to the
                # caller as RuntimeError.
                return
            yield line

    def tell(self):
        """Return the position."""
        return self._pos

    def seek(self, offset, whence=0):
        """Change position."""
        if whence == 1:
            # Relative seeks are relative to the proxy's own position,
            # not to wherever the underlying file happens to be.
            self._file.seek(self._pos)
        self._file.seek(offset, whence)
        self._pos = self._file.tell()

    def close(self):
        """Close the file.

        Safe to call more than once.
        """
        if hasattr(self, '_file'):
            try:
                if hasattr(self._file, 'close'):
                    self._file.close()
            finally:
                # Drop the reference even if close() raised, so the
                # proxy reliably reports itself as closed afterwards.
                del self._file

    def _read(self, size, read_method):
        """Read size bytes using read_method."""
        if size is None:
            size = -1
        self._file.seek(self._pos)
        result = read_method(size)
        self._pos = self._file.tell()
        return result

    def __enter__(self):
        """Context manager protocol support."""
        return self

    def __exit__(self, *exc):
        """Close the proxy when leaving the with block."""
        self.close()

    def readable(self):
        """Return whether the underlying file is readable."""
        return self._file.readable()

    def writable(self):
        """Return whether the underlying file is writable."""
        return self._file.writable()

    def seekable(self):
        """Return whether the underlying file is seekable."""
        return self._file.seekable()

    def flush(self):
        """Flush the underlying file."""
        return self._file.flush()

    @property
    def closed(self):
        """True once close() has been called or the underlying file is closed."""
        if not hasattr(self, '_file'):
            return True
        if not hasattr(self._file, 'closed'):
            return False
        return self._file.closed
1980
Thomas Wouters477c8d52006-05-27 19:21:47 +00001981
class _PartialFile(_ProxyFile):
    """A read-only wrapper of part of a file.

    Positions reported and accepted by this class are relative to start,
    and reads never go past stop.
    """

    def __init__(self, f, start=None, stop=None):
        """Initialize a _PartialFile."""
        _ProxyFile.__init__(self, f, start)
        self._start, self._stop = start, stop

    def tell(self):
        """Return the position with respect to start."""
        absolute = _ProxyFile.tell(self)
        return absolute - self._start

    def seek(self, offset, whence=0):
        """Change position, possibly with respect to start or stop."""
        # Absolute and from-end seeks are turned into relative seeks from
        # the start or stop of the window respectively.
        if whence == 0:
            self._pos, whence = self._start, 1
        elif whence == 2:
            self._pos, whence = self._stop, 1
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, honoring start and stop."""
        available = self._stop - self._pos
        if available <= 0:
            return b''
        unbounded = size is None or size < 0
        if unbounded or size > available:
            size = available
        return _ProxyFile._read(self, size, read_method)

    def close(self):
        """Detach from the underlying file without closing it."""
        # do *not* close the underlying file object for partial files,
        # since it's global to the mailbox object
        if hasattr(self, '_file'):
            del self._file
Georg Brandl6ce29fa2010-10-30 14:33:28 +00002019
Thomas Wouters477c8d52006-05-27 19:21:47 +00002020
def _lock_file(f, dotlock=True):
    """Lock file f using lockf and dot locking.

    Raises ExternalClashError when either lock is unavailable.  If
    anything fails, any lock already taken is released before the
    exception propagates.
    """
    dotlock_done = False
    try:
        if fcntl:
            try:
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except IOError as e:
                if e.errno not in (errno.EAGAIN, errno.EACCES, errno.EROFS):
                    raise
                raise ExternalClashError('lockf: lock unavailable: %s' %
                                         f.name)
        if dotlock:
            lock_path = f.name + '.lock'
            try:
                pre_lock = _create_temporary(lock_path)
                pre_lock.close()
            except IOError as e:
                if e.errno not in (errno.EACCES, errno.EROFS):
                    raise
                return  # Without write access, just skip dotlocking.
            try:
                if hasattr(os, 'link'):
                    # Hard-link the temporary file to the lock name, then
                    # drop the temporary name.
                    os.link(pre_lock.name, lock_path)
                    dotlock_done = True
                    os.unlink(pre_lock.name)
                else:
                    os.rename(pre_lock.name, lock_path)
                    dotlock_done = True
            except OSError as e:
                clash = (e.errno == errno.EEXIST or
                         (os.name == 'os2' and e.errno == errno.EACCES))
                if not clash:
                    raise
                os.remove(pre_lock.name)
                raise ExternalClashError('dot lock unavailable: %s' %
                                         f.name)
    except BaseException:
        # Undo whatever was acquired, then let the error propagate.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if dotlock_done:
            os.remove(f.name + '.lock')
        raise
2065
def _unlock_file(f):
    """Unlock file f using lockf and dot locking."""
    if fcntl:
        fcntl.lockf(f, fcntl.LOCK_UN)
    # Remove the dot lock file if one exists next to f.
    lock_path = f.name + '.lock'
    if os.path.exists(lock_path):
        os.remove(lock_path)
2072
def _create_carefully(path):
    """Create a file if it doesn't exist and open for reading and writing.

    The file is created with O_EXCL, so the call fails with OSError if
    path already exists.  Returns a binary file object opened in 'rb+'
    mode.
    """
    flags = os.O_CREAT | os.O_EXCL | os.O_RDWR
    descriptor = os.open(path, flags, 0o666)
    try:
        return open(path, 'rb+')
    finally:
        # The descriptor was only needed for the exclusive creation.
        os.close(descriptor)
2080
def _create_temporary(path):
    """Create a temp file based on path and open for reading and writing.

    The name is path followed by the current time in whole seconds, the
    host name and the process id, separated by dots.
    """
    suffix = (int(time.time()), socket.gethostname(), os.getpid())
    return _create_carefully('%s.%s.%s.%s' % ((path,) + suffix))
2086
def _sync_flush(f):
    """Ensure changes to file f are physically on disk."""
    f.flush()
    # os.fsync is not available on every platform.
    fsync = getattr(os, 'fsync', None)
    if fsync is not None:
        fsync(f.fileno())
Thomas Wouters89f507f2006-12-13 04:49:30 +00002092
def _sync_close(f):
    """Close file f, ensuring all changes are physically on disk."""
    # Push the data out first, then release the file.
    _sync_flush(f)
    f.close()
Thomas Wouters477c8d52006-05-27 19:21:47 +00002097
Guido van Rossum62448671996-09-17 21:33:15 +00002098
class Error(Exception):
    """Base class for this module's specific errors."""


class NoSuchMailboxError(Error):
    """The specified mailbox does not exist and won't be created."""


class NotEmptyError(Error):
    """The specified mailbox is not empty and deletion was requested."""


class ExternalClashError(Error):
    """Another process caused an action to fail."""


class FormatError(Error):
    """A file appears to have an invalid format."""