blob: d86ad94478893fcc89f76cd66bb507b663b831d6 [file] [log] [blame]
Benjamin Peterson90f5ba52010-03-11 22:53:45 +00001#! /usr/bin/env python3
Guido van Rossum62448671996-09-17 21:33:15 +00002
Thomas Wouters477c8d52006-05-27 19:21:47 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
# Notes for authors of new mailbox subclasses:
#
# Remember to fsync() changes to disk before closing a modified file
# or returning from a flush() method.  See functions _sync_flush() and
# _sync_close().
10
Thomas Wouters477c8d52006-05-27 19:21:47 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Thomas Wouters477c8d52006-05-27 19:21:47 +000013import time
14import calendar
15import socket
16import errno
17import copy
R. David Murrayb7deff12011-01-30 06:21:28 +000018import warnings
Thomas Wouters477c8d52006-05-27 19:21:47 +000019import email
Thomas Woutersb2137042007-02-01 18:02:27 +000020import email.message
21import email.generator
Guido van Rossum34d19282007-08-09 01:03:29 +000022import io
R David Murray05ff9902011-06-17 12:54:56 -040023import contextlib
Thomas Wouters477c8d52006-05-27 19:21:47 +000024try:
Thomas Wouters0e3f5912006-08-11 14:57:12 +000025 if sys.platform == 'os2emx':
26 # OS/2 EMX fcntl() not adequate
27 raise ImportError
28 import fcntl
Thomas Wouters477c8d52006-05-27 19:21:47 +000029except ImportError:
30 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000031
Thomas Wouters477c8d52006-05-27 19:21:47 +000032__all__ = [ 'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
33 'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
Benjamin Peterson8041d472008-05-11 16:17:24 +000034 'BabylMessage', 'MMDFMessage']
Thomas Wouters477c8d52006-05-27 19:21:47 +000035
R. David Murrayb7deff12011-01-30 06:21:28 +000036linesep = os.linesep.encode('ascii')
37
Thomas Wouters477c8d52006-05-27 19:21:47 +000038class Mailbox:
39 """A group of messages in a particular place."""
40
41 def __init__(self, path, factory=None, create=True):
42 """Initialize a Mailbox instance."""
43 self._path = os.path.abspath(os.path.expanduser(path))
44 self._factory = factory
45
46 def add(self, message):
47 """Add message and return assigned key."""
48 raise NotImplementedError('Method must be implemented by subclass')
49
50 def remove(self, key):
51 """Remove the keyed message; raise KeyError if it doesn't exist."""
52 raise NotImplementedError('Method must be implemented by subclass')
53
54 def __delitem__(self, key):
55 self.remove(key)
56
57 def discard(self, key):
58 """If the keyed message exists, remove it."""
59 try:
60 self.remove(key)
61 except KeyError:
62 pass
63
64 def __setitem__(self, key, message):
65 """Replace the keyed message; raise KeyError if it doesn't exist."""
66 raise NotImplementedError('Method must be implemented by subclass')
67
68 def get(self, key, default=None):
69 """Return the keyed message, or default if it doesn't exist."""
70 try:
71 return self.__getitem__(key)
72 except KeyError:
73 return default
74
75 def __getitem__(self, key):
76 """Return the keyed message; raise KeyError if it doesn't exist."""
77 if not self._factory:
78 return self.get_message(key)
79 else:
R David Murray05ff9902011-06-17 12:54:56 -040080 with contextlib.closing(self.get_file(key)) as file:
81 return self._factory(file)
Thomas Wouters477c8d52006-05-27 19:21:47 +000082
83 def get_message(self, key):
84 """Return a Message representation or raise a KeyError."""
85 raise NotImplementedError('Method must be implemented by subclass')
86
87 def get_string(self, key):
R. David Murrayb7deff12011-01-30 06:21:28 +000088 """Return a string representation or raise a KeyError.
89
90 Uses email.message.Message to create a 7bit clean string
91 representation of the message."""
92 return email.message_from_bytes(self.get_bytes(key)).as_string()
93
94 def get_bytes(self, key):
95 """Return a byte string representation or raise a KeyError."""
Thomas Wouters477c8d52006-05-27 19:21:47 +000096 raise NotImplementedError('Method must be implemented by subclass')
97
98 def get_file(self, key):
99 """Return a file-like representation or raise a KeyError."""
100 raise NotImplementedError('Method must be implemented by subclass')
101
102 def iterkeys(self):
103 """Return an iterator over keys."""
104 raise NotImplementedError('Method must be implemented by subclass')
105
106 def keys(self):
107 """Return a list of keys."""
Guido van Rossumdde4c2c2007-02-12 00:22:55 +0000108 return list(self.iterkeys())
Thomas Wouters477c8d52006-05-27 19:21:47 +0000109
110 def itervalues(self):
111 """Return an iterator over all messages."""
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000112 for key in self.keys():
Thomas Wouters477c8d52006-05-27 19:21:47 +0000113 try:
114 value = self[key]
115 except KeyError:
116 continue
117 yield value
118
119 def __iter__(self):
Guido van Rossumb5a755e2007-07-18 18:15:48 +0000120 return self.itervalues()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000121
122 def values(self):
123 """Return a list of messages. Memory intensive."""
Guido van Rossumdde4c2c2007-02-12 00:22:55 +0000124 return list(self.itervalues())
Thomas Wouters477c8d52006-05-27 19:21:47 +0000125
126 def iteritems(self):
127 """Return an iterator over (key, message) tuples."""
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000128 for key in self.keys():
Thomas Wouters477c8d52006-05-27 19:21:47 +0000129 try:
130 value = self[key]
131 except KeyError:
132 continue
133 yield (key, value)
134
135 def items(self):
136 """Return a list of (key, message) tuples. Memory intensive."""
Guido van Rossumdde4c2c2007-02-12 00:22:55 +0000137 return list(self.iteritems())
Thomas Wouters477c8d52006-05-27 19:21:47 +0000138
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000139 def __contains__(self, key):
Thomas Wouters477c8d52006-05-27 19:21:47 +0000140 """Return True if the keyed message exists, False otherwise."""
141 raise NotImplementedError('Method must be implemented by subclass')
142
Thomas Wouters477c8d52006-05-27 19:21:47 +0000143 def __len__(self):
144 """Return a count of messages in the mailbox."""
145 raise NotImplementedError('Method must be implemented by subclass')
146
147 def clear(self):
148 """Delete all messages."""
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000149 for key in self.keys():
Thomas Wouters477c8d52006-05-27 19:21:47 +0000150 self.discard(key)
151
152 def pop(self, key, default=None):
153 """Delete the keyed message and return it, or default."""
154 try:
155 result = self[key]
156 except KeyError:
157 return default
158 self.discard(key)
159 return result
160
161 def popitem(self):
162 """Delete an arbitrary (key, message) pair and return it."""
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000163 for key in self.keys():
Thomas Wouters477c8d52006-05-27 19:21:47 +0000164 return (key, self.pop(key)) # This is only run once.
165 else:
166 raise KeyError('No messages in mailbox')
167
168 def update(self, arg=None):
169 """Change the messages that correspond to certain keys."""
170 if hasattr(arg, 'iteritems'):
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000171 source = arg.items()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000172 elif hasattr(arg, 'items'):
173 source = arg.items()
174 else:
175 source = arg
176 bad_key = False
177 for key, message in source:
178 try:
179 self[key] = message
180 except KeyError:
181 bad_key = True
182 if bad_key:
183 raise KeyError('No message with key(s)')
184
185 def flush(self):
186 """Write any pending changes to the disk."""
187 raise NotImplementedError('Method must be implemented by subclass')
188
189 def lock(self):
190 """Lock the mailbox."""
191 raise NotImplementedError('Method must be implemented by subclass')
192
193 def unlock(self):
194 """Unlock the mailbox if it is locked."""
195 raise NotImplementedError('Method must be implemented by subclass')
196
197 def close(self):
198 """Flush and close the mailbox."""
199 raise NotImplementedError('Method must be implemented by subclass')
200
R. David Murrayb7deff12011-01-30 06:21:28 +0000201 def _string_to_bytes(self, message):
202 # If a message is not 7bit clean, we refuse to handle it since it
203 # likely came from reading invalid messages in text mode, and that way
204 # lies mojibake.
205 try:
206 return message.encode('ascii')
207 except UnicodeError:
208 raise ValueError("String input must be ASCII-only; "
209 "use bytes or a Message instead")
210
Thomas Wouters477c8d52006-05-27 19:21:47 +0000211 def _dump_message(self, message, target, mangle_from_=False):
R. David Murrayb7deff12011-01-30 06:21:28 +0000212 # This assumes the target file is open in binary mode.
Thomas Wouters477c8d52006-05-27 19:21:47 +0000213 """Dump message contents to target file."""
Thomas Woutersb2137042007-02-01 18:02:27 +0000214 if isinstance(message, email.message.Message):
R. David Murrayb7deff12011-01-30 06:21:28 +0000215 buffer = io.BytesIO()
216 gen = email.generator.BytesGenerator(buffer, mangle_from_, 0)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000217 gen.flatten(message)
218 buffer.seek(0)
Guido van Rossum671117a2007-08-31 04:25:05 +0000219 data = buffer.read()
R. David Murrayb7deff12011-01-30 06:21:28 +0000220 data = data.replace(b'\n', linesep)
Guido van Rossum671117a2007-08-31 04:25:05 +0000221 target.write(data)
R. David Murrayb7deff12011-01-30 06:21:28 +0000222 elif isinstance(message, (str, bytes, io.StringIO)):
223 if isinstance(message, io.StringIO):
224 warnings.warn("Use of StringIO input is deprecated, "
225 "use BytesIO instead", DeprecationWarning, 3)
226 message = message.getvalue()
227 if isinstance(message, str):
228 message = self._string_to_bytes(message)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000229 if mangle_from_:
R. David Murrayb7deff12011-01-30 06:21:28 +0000230 message = message.replace(b'\nFrom ', b'\n>From ')
231 message = message.replace(b'\n', linesep)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000232 target.write(message)
233 elif hasattr(message, 'read'):
R. David Murrayb7deff12011-01-30 06:21:28 +0000234 if hasattr(message, 'buffer'):
235 warnings.warn("Use of text mode files is deprecated, "
236 "use a binary mode file instead", DeprecationWarning, 3)
237 message = message.buffer
Thomas Wouters477c8d52006-05-27 19:21:47 +0000238 while True:
239 line = message.readline()
R. David Murrayb7deff12011-01-30 06:21:28 +0000240 # Universal newline support.
241 if line.endswith(b'\r\n'):
242 line = line[:-2] + b'\n'
243 elif line.endswith(b'\r'):
244 line = line[:-1] + b'\n'
Guido van Rossum7cad4f32007-06-07 23:58:54 +0000245 if not line:
Thomas Wouters477c8d52006-05-27 19:21:47 +0000246 break
R. David Murrayb7deff12011-01-30 06:21:28 +0000247 if mangle_from_ and line.startswith(b'From '):
248 line = b'>From ' + line[5:]
249 line = line.replace(b'\n', linesep)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000250 target.write(line)
251 else:
252 raise TypeError('Invalid message type: %s' % type(message))
253
254
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages live as individual files in the ``new`` and ``cur``
    subdirectories of the mailbox directory; ``tmp`` is used while a message
    is being written.  A message's key is the part of its file name before
    the ``colon`` separator; the part after it is the "info" suffix.
    """

    # Separator between the unique name and the info suffix of a file name.
    colon = ':'

    def __init__(self, dirname, factory=None, create=True):
        """Initialize a Maildir instance.

        If dirname does not exist it is created together with its tmp, new
        and cur subdirectories (mode 0o700) when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        self._paths = {
            'tmp': os.path.join(self._path, 'tmp'),
            'new': os.path.join(self._path, 'new'),
            'cur': os.path.join(self._path, 'cur'),
            }
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                for path in self._paths.values():
                    os.mkdir(path, 0o700)
            else:
                raise NoSuchMailboxError(self._path)
        self._toc = {}                          # key -> 'subdir/filename'
        self._toc_mtimes = {'cur': 0, 'new': 0}
        self._last_read = 0         # Records last time we read cur/new
        self._skewfactor = 0.1      # Adjust if os/fs clocks are skewing

    def add(self, message):
        """Add message and return assigned key.

        The message is written to a fresh file in tmp, synced, and then
        moved into place.  Raises ExternalClashError if the destination
        name already exists.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        except BaseException:
            # Do not leave a half-written file behind in tmp.
            tmp_file.close()
            os.remove(tmp_file.name)
            raise
        _sync_close(tmp_file)
        if isinstance(message, MaildirMessage):
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                suffix = ''
        else:
            subdir = 'new'
            suffix = ''
        uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        try:
            if hasattr(os, 'link'):
                # link() fails if dest exists, so an existing message is
                # never overwritten.
                os.link(tmp_file.name, dest)
                os.remove(tmp_file.name)
            else:
                os.rename(tmp_file.name, dest)
        except OSError as e:
            os.remove(tmp_file.name)
            if e.errno == errno.EEXIST:
                raise ExternalClashError('Name clash with existing message: %s'
                                         % dest)
            else:
                raise
        if isinstance(message, MaildirMessage):
            # Carry the message's date over as the file's mtime.
            os.utime(dest, (os.path.getatime(dest), message.get_date()))
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        os.remove(os.path.join(self._path, self._lookup(key)))

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass.
        try:
            self.remove(key)
        except KeyError:
            pass
        except OSError as e:
            # The file vanishing between lookup and removal is not an error.
            if e.errno != errno.ENOENT:
                raise

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist.

        The new content is first added under a temporary key and then
        renamed over the old key.  A MaildirMessage dictates the resulting
        subdirectory and info suffix; for any other message type those of
        the replaced message are kept.
        """
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        if isinstance(message, MaildirMessage):
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        else:
            suffix = ''
        self.discard(key)
        new_path = os.path.join(self._path, subdir, key + suffix)
        os.rename(os.path.join(self._path, temp_subpath), new_path)
        if isinstance(message, MaildirMessage):
            os.utime(new_path, (os.path.getatime(new_path),
                                message.get_date()))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The message is built by the factory if one is set, else as a
        MaildirMessage; its subdir, info and date are then filled in from
        the file's location, name suffix and mtime.
        """
        subpath = self._lookup(key)
        with open(os.path.join(self._path, subpath), 'rb') as f:
            if self._factory:
                msg = self._factory(f)
            else:
                msg = MaildirMessage(f)
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(os.path.join(self._path, subpath)))
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError."""
        with open(os.path.join(self._path, self._lookup(key)), 'rb') as f:
            return f.read().replace(linesep, b'\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        f = open(os.path.join(self._path, self._lookup(key)), 'rb')
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                continue
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        # Maildir changes are always written immediately, so there's nothing
        # to do.
        pass

    def lock(self):
        """Lock the mailbox (a no-op for Maildir)."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked (a no-op for Maildir)."""
        return

    def close(self):
        """Flush and close the mailbox (a no-op for Maildir)."""
        return

    def list_folders(self):
        """Return a list of folder names.

        A folder is a subdirectory whose name starts with '.'; the leading
        dot is stripped from the returned names.
        """
        result = []
        for entry in os.listdir(self._path):
            if len(entry) > 1 and entry[0] == '.' and \
               os.path.isdir(os.path.join(self._path, entry)):
                result.append(entry[1:])
        return result

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        return Maildir(os.path.join(self._path, '.' + folder),
                       factory=self._factory,
                       create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it."""
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        maildirfolder_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(maildirfolder_path):
            # Create the empty marker file.
            os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY,
                0o666))
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        Raises NotEmptyError if new/ or cur/ hold any entry whose name does
        not start with '.', or if the folder has a subdirectory other than
        new, cur and tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        for entry in os.listdir(os.path.join(path, 'new')) + \
                     os.listdir(os.path.join(path, 'cur')):
            if len(entry) < 1 or entry[0] != '.':
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry != 'new' and entry != 'cur' and entry != 'tmp' and \
               os.path.isdir(os.path.join(path, entry)):
                # The first placeholder names the offending subdirectory,
                # the second the folder being removed.
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (entry, folder))
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp".

        A file is old when it was last accessed more than 36 hours ago.
        """
        now = time.time()
        for entry in os.listdir(os.path.join(self._path, 'tmp')):
            path = os.path.join(self._path, 'tmp', entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        The name is built from the current time, the process id, a
        class-wide counter and the host name.  Raises ExternalClashError if
        a file of that name already exists.
        """
        now = time.time()
        hostname = socket.gethostname()
        # '/' and ':' must not appear in the file name; replace them with
        # their octal escapes.
        if '/' in hostname:
            hostname = hostname.replace('/', r'\057')
        if ':' in hostname:
            hostname = hostname.replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except OSError as e:
            if e.errno == errno.ENOENT:
                Maildir._count += 1
                try:
                    return _create_carefully(path)
                except OSError as e:
                    if e.errno != errno.EEXIST:
                        raise
            else:
                raise

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping."""
        # If it has been less than two seconds since the last _refresh() call,
        # we have to unconditionally re-read the mailbox just in case it has
        # been modified, because os.path.getmtime() has a 2 sec resolution in
        # the most common worst case (FAT) and a 1 sec resolution typically.
        # This results in a few unnecessary re-reads when _refresh() is called
        # multiple times in that interval, but once the clock ticks over, we
        # will only re-read as needed.  Because the filesystem might be being
        # served by an independent system with its own clock, we record and
        # compare with the mtimes from the filesystem.  Because the other
        # system's clock might be skewing relative to our clock, we add an
        # extra delta to our wait.  The default is one tenth second, but is an
        # instance variable and so can be adjusted if dealing with a
        # particularly skewed or irregular system.
        if time.time() - self._last_read > 2 + self._skewfactor:
            refresh = False
            for subdir in self._toc_mtimes:
                mtime = os.path.getmtime(self._paths[subdir])
                if mtime > self._toc_mtimes[subdir]:
                    refresh = True
                self._toc_mtimes[subdir] = mtime
            if not refresh:
                return
        # Refresh toc
        self._toc = {}
        for subdir in self._toc_mtimes:
            path = self._paths[subdir]
            for entry in os.listdir(path):
                p = os.path.join(path, entry)
                if os.path.isdir(p):
                    continue
                uniq = entry.split(self.colon)[0]
                self._toc[uniq] = os.path.join(subdir, entry)
        self._last_read = time.time()

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        try:
            # Fast path: the cached entry still exists on disk.
            if os.path.exists(os.path.join(self._path, self._toc[key])):
                return self._toc[key]
        except KeyError:
            pass
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration.

        Returns None once the keys captured on the first call are exhausted;
        keys whose message has disappeared are skipped.
        """
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = iter(self.keys())
        while True:
            try:
                return self[next(self._onetime_keys)]
            except StopIteration:
                return None
            except KeyError:
                continue
567
568
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    All messages are stored in one file.  ``_toc`` maps each integer key to
    the (start, stop) byte offsets of its message and is built lazily by the
    subclass's _generate_toc().  New and replaced messages are appended to
    the file immediately; flush() rewrites the file so that it contains
    exactly the messages still referenced by the table of contents.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        The file is opened read/write.  If it does not exist it is created
        when create is true, otherwise NoSuchMailboxError is raised.  If it
        cannot be opened for writing (EACCES or EROFS) it is opened
        read-only instead.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            f = open(self._path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                if create:
                    f = open(self._path, 'wb+')
                else:
                    raise NoSuchMailboxError(self._path)
            elif e.errno in (errno.EACCES, errno.EROFS):
                f = open(self._path, 'rb')
            else:
                raise
        self._file = f
        self._toc = None
        self._next_key = 0
        self._pending = False   # No changes require rewriting the file.
        self._locked = False
        self._file_length = None    # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        self._toc[self._next_key] = self._append_message(message)
        self._next_key += 1
        self._pending = True
        return self._next_key - 1

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        for key in self._toc.keys():
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        The surviving messages are copied, in key order, into a temporary
        file which then replaces the mailbox file.  Raises
        ExternalClashError if the mailbox file's size differs from the size
        recorded after our last write.
        """
        if not self._pending:
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc.keys()):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                while True:
                    # Copy in chunks of at most 4096 bytes, never reading
                    # past the end of this message.
                    buffer = self._file.read(min(4096,
                                                 stop - self._file.tell()))
                    if not buffer:
                        break
                    new_file.write(buffer)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
            self._file_length = new_file.tell()
        except BaseException:
            # Discard the partial temporary file, then propagate.
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        try:
            os.rename(new_file.name, self._path)
        except OSError as e:
            if e.errno == errno.EEXIST or \
              (os.name == 'os2' and e.errno == errno.EACCES):
                # rename() refused to overwrite; remove the target first.
                os.remove(self._path)
                os.rename(new_file.name, self._path)
            else:
                raise
        self._file = open(self._path, 'rb+')
        self._toc = new_toc
        self._pending = False
        if self._locked:
            # Re-acquire the lock on the newly opened file object.
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox.

        The lock is released and the file is closed even if flush() (or
        unlock()) raises; the exception still propagates to the caller.
        """
        try:
            self.flush()
        finally:
            try:
                if self._locked:
                    self.unlock()
            finally:
                self._file.close()  # Sync has been done by self.flush() above.

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        Generates the table of contents on first use.  When key is None,
        only that generation is performed and None is returned.
        """
        if self._toc is None:
            self._generate_toc()
        if key is not None:
            try:
                return self._toc[key]
            except KeyError:
                raise KeyError('No message with key: %s' % key)

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets."""
        self._file.seek(0, 2)
        before = self._file.tell()
        try:
            self._pre_message_hook(self._file)
            offsets = self._install_message(message)
            self._post_message_hook(self._file)
        except BaseException:
            # Roll the file back to its size before the failed append.
            self._file.truncate(before)
            raise
        self._file.flush()
        self._file_length = self._file.tell()  # Record current length of mailbox
        return offsets
744
745
746
747class _mboxMMDF(_singlefileMailbox):
748 """An mbox or MMDF mailbox."""
749
750 _mangle_from_ = True
751
def get_message(self, key):
    """Return a Message representation or raise a KeyError.

    The first line of the stored message is its "From " line; the text
    after the 5-byte b'From ' prefix is decoded as ASCII and recorded on
    the message with set_from().  The remainder, with ``linesep``
    normalised to b'\\n', is passed to self._message_factory.
    """
    start, stop = self._lookup(key)
    self._file.seek(start)
    from_line = self._file.readline().replace(linesep, b'')
    string = self._file.read(stop - self._file.tell())
    msg = self._message_factory(string.replace(linesep, b'\n'))
    msg.set_from(from_line[5:].decode('ascii'))
    return msg
761
def get_string(self, key, from_=False):
    """Return a string representation or raise a KeyError.

    When from_ is true the result starts with the message's stored
    "From " line; otherwise that line is omitted.
    """
    # from_ must be forwarded to get_bytes(): without the stored "From "
    # line in the parsed bytes, as_string(unixfrom=True) would invent a
    # "From nobody <current time>" line instead of returning the real one.
    return email.message_from_bytes(
        self.get_bytes(key, from_)).as_string(unixfrom=from_)
766
def get_bytes(self, key, from_=False):
    """Return a bytes representation or raise a KeyError.

    The leading "From " line is skipped unless from_ is true.  Every
    ``linesep`` in the stored data is returned as b'\\n'.
    """
    start, stop = self._lookup(key)
    self._file.seek(start)
    if not from_:
        # Consume the "From " line so it is not part of the result.
        self._file.readline()
    string = self._file.read(stop - self._file.tell())
    return string.replace(linesep, b'\n')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000775
776 def get_file(self, key, from_=False):
777 """Return a file-like representation or raise a KeyError."""
778 start, stop = self._lookup(key)
779 self._file.seek(start)
780 if not from_:
781 self._file.readline()
782 return _PartialFile(self._file, self._file.tell(), stop)
783
784 def _install_message(self, message):
785 """Format a message and blindly write to self._file."""
786 from_line = None
R. David Murrayb7deff12011-01-30 06:21:28 +0000787 if isinstance(message, str):
788 message = self._string_to_bytes(message)
789 if isinstance(message, bytes) and message.startswith(b'From '):
790 newline = message.find(b'\n')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000791 if newline != -1:
792 from_line = message[:newline]
793 message = message[newline + 1:]
794 else:
795 from_line = message
R. David Murrayb7deff12011-01-30 06:21:28 +0000796 message = b''
Thomas Wouters477c8d52006-05-27 19:21:47 +0000797 elif isinstance(message, _mboxMMDFMessage):
R. David Murrayb7deff12011-01-30 06:21:28 +0000798 author = message.get_from().encode('ascii')
799 from_line = b'From ' + author
Thomas Woutersb2137042007-02-01 18:02:27 +0000800 elif isinstance(message, email.message.Message):
Thomas Wouters477c8d52006-05-27 19:21:47 +0000801 from_line = message.get_unixfrom() # May be None.
R. David Murrayb7deff12011-01-30 06:21:28 +0000802 if from_line is not None:
803 from_line = from_line.encode('ascii')
Thomas Wouters477c8d52006-05-27 19:21:47 +0000804 if from_line is None:
R. David Murrayb7deff12011-01-30 06:21:28 +0000805 from_line = b'From MAILER-DAEMON ' + time.asctime(time.gmtime()).encode()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000806 start = self._file.tell()
R. David Murrayb7deff12011-01-30 06:21:28 +0000807 self._file.write(from_line + linesep)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000808 self._dump_message(message, self._file, self._mangle_from_)
809 stop = self._file.tell()
810 return (start, stop)
811
812
class mbox(_mboxMMDF):
    """A classic mbox mailbox."""

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Set up an mbox mailbox whose messages are mboxMessage objects."""
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Emit a separator line before each message except the first."""
        if f.tell():
            f.write(linesep)

    def _generate_toc(self):
        """Scan the file and build the key-to-(start, stop) table."""
        begin_offsets = []
        end_offsets = []
        self._file.seek(0)
        offset = self._file.tell()
        # readline() returns b'' only at end of file, which ends the loop.
        for line in iter(self._file.readline, b''):
            if line.startswith(b'From '):
                if len(end_offsets) < len(begin_offsets):
                    # Close the previous message, excluding the separator
                    # line that precedes this "From " line.
                    end_offsets.append(offset - len(linesep))
                begin_offsets.append(offset)
            offset = self._file.tell()
        # The end-of-file position closes the last message, if any.
        end_offsets.append(offset)
        self._toc = dict(enumerate(zip(begin_offsets, end_offsets)))
        self._next_key = len(self._toc)
        self._file_length = self._file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000845
846
class MMDF(_mboxMMDF):
    """An MMDF mailbox."""

    def __init__(self, path, factory=None, create=True):
        """Set up an MMDF mailbox whose messages are MMDFMessage objects."""
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Write the delimiter line that opens each message in file f."""
        f.write(b'\001\001\001\001' + linesep)

    def _post_message_hook(self, f):
        """Write the delimiter line that closes each message in file f."""
        f.write(linesep + b'\001\001\001\001' + linesep)

    def _generate_toc(self):
        """Scan the file and build the key-to-(start, stop) table."""
        delimiter = b'\001\001\001\001' + linesep
        begin_offsets = []
        end_offsets = []
        self._file.seek(0)
        offset = 0
        inside_message = False
        while True:
            line_offset = offset
            line = self._file.readline()
            offset = self._file.tell()
            if inside_message:
                if line == delimiter:
                    # Closing delimiter: stop before the separator that
                    # precedes it.
                    end_offsets.append(line_offset - len(linesep))
                    inside_message = False
                elif not line:
                    # End of file inside a message: it ends right here.
                    # The next pass reads EOF again and leaves the loop.
                    end_offsets.append(line_offset)
                    inside_message = False
            elif line.startswith(delimiter):
                # Opening delimiter: the message starts on the next line.
                begin_offsets.append(offset)
                inside_message = True
            elif not line:
                break
        self._toc = dict(enumerate(zip(begin_offsets, end_offsets)))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000890
891
class MH(Mailbox):
    """An MH mailbox."""

    def __init__(self, path, factory=None, create=True):
        """Initialize an MH instance.

        If the directory does not exist it is created (mode 0o700, with
        an empty '.mh_sequences' file) when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, path, factory, create)
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                os.close(os.open(os.path.join(self._path, '.mh_sequences'),
                                 os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0o600))
            else:
                raise NoSuchMailboxError(self._path)
        self._locked = False

    def add(self, message):
        """Add message and return assigned key."""
        keys = self.keys()
        # Keys are positive integers; a new message gets the next one.
        new_key = max(keys) + 1 if keys else 1
        new_path = os.path.join(self._path, str(new_key))
        f = _create_carefully(new_path)
        closed = False
        try:
            if self._locked:
                _lock_file(f)
            try:
                try:
                    self._dump_message(message, f)
                except BaseException:
                    # Unlock and close so it can be deleted on Windows
                    if self._locked:
                        _unlock_file(f)
                    _sync_close(f)
                    closed = True
                    os.remove(new_path)
                    raise
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, new_key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            if not closed:
                _sync_close(f)
        return new_key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        path = os.path.join(self._path, str(key))
        try:
            # Opening for update first turns a missing file into KeyError.
            f = open(path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        else:
            f.close()
            os.remove(path)

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        path = os.path.join(self._path, str(key))
        try:
            f = open(path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        try:
            if self._locked:
                _lock_file(f)
            try:
                # Truncate through a second descriptor, then rewrite via f.
                os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
                self._dump_message(message, f)
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            _sync_close(f)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        try:
            # The file is opened for update when it is going to be locked.
            if self._locked:
                f = open(os.path.join(self._path, str(key)), 'rb+')
            else:
                f = open(os.path.join(self._path, str(key)), 'rb')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        try:
            if self._locked:
                _lock_file(f)
            try:
                msg = MHMessage(f)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            f.close()
        # Attach every sequence that lists this key.
        for name, key_list in self.get_sequences().items():
            if key in key_list:
                msg.add_sequence(name)
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError."""
        try:
            if self._locked:
                f = open(os.path.join(self._path, str(key)), 'rb+')
            else:
                f = open(os.path.join(self._path, str(key)), 'rb')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        try:
            if self._locked:
                _lock_file(f)
            try:
                return f.read().replace(linesep, b'\n')
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            f.close()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        try:
            f = open(os.path.join(self._path, str(key)), 'rb')
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            else:
                raise
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        # Message files are the directory entries with all-digit names.
        return iter(sorted(int(entry) for entry in os.listdir(self._path)
                           if entry.isdigit()))

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        return os.path.exists(os.path.join(self._path, str(key)))

    def __len__(self):
        """Return a count of messages in the mailbox."""
        return len(list(self.keys()))

    def lock(self):
        """Lock the mailbox.

        The lock is taken on the '.mh_sequences' file.  If locking fails
        the file is closed again before the exception propagates, so no
        handle is left open.
        """
        if not self._locked:
            f = open(os.path.join(self._path, '.mh_sequences'), 'rb+')
            try:
                _lock_file(f)
            except BaseException:
                f.close()
                raise
            self._file = f
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            _sync_close(self._file)
            del self._file
            self._locked = False

    def flush(self):
        """Write any pending changes to the disk."""
        return

    def close(self):
        """Flush and close the mailbox."""
        if self._locked:
            self.unlock()

    def list_folders(self):
        """Return a list of folder names."""
        return [entry for entry in os.listdir(self._path)
                if os.path.isdir(os.path.join(self._path, entry))]

    def get_folder(self, folder):
        """Return an MH instance for the named folder."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory, create=False)

    def add_folder(self, folder):
        """Create a folder and return an MH instance representing it."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory)

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        A folder counts as empty when it contains nothing, or only its
        '.mh_sequences' file.  Otherwise NotEmptyError is raised, naming
        the folder that could not be removed.
        """
        path = os.path.join(self._path, folder)
        entries = os.listdir(path)
        if entries == ['.mh_sequences']:
            os.remove(os.path.join(path, '.mh_sequences'))
        elif entries == []:
            pass
        else:
            raise NotEmptyError('Folder not empty: %s' % path)
        os.rmdir(path)

    def get_sequences(self):
        """Return a name-to-key-list dictionary to define each sequence.

        Keys that do not correspond to an existing message are dropped,
        and sequences left empty are omitted.  Raises FormatError for a
        line that cannot be parsed.
        """
        results = {}
        sequences_path = os.path.join(self._path, '.mh_sequences')
        with open(sequences_path, 'r', encoding='ASCII') as f:
            all_keys = set(self.keys())
            for line in f:
                try:
                    name, contents = line.split(':')
                    keys = set()
                    for spec in contents.split():
                        if spec.isdigit():
                            keys.add(int(spec))
                        else:
                            # A "start-stop" range, inclusive at both ends.
                            start, stop = (int(x) for x in spec.split('-'))
                            keys.update(range(start, stop + 1))
                    results[name] = [key for key in sorted(keys)
                                     if key in all_keys]
                    if len(results[name]) == 0:
                        del results[name]
                except ValueError:
                    raise FormatError('Invalid sequence specification: %s' %
                                      line.rstrip())
        return results

    def set_sequences(self, sequences):
        """Set sequences using the given name-to-key-list dictionary."""
        f = open(os.path.join(self._path, '.mh_sequences'), 'r+',
                 encoding='ASCII')
        try:
            # Empty the file through a second descriptor before rewriting.
            os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
            for name, keys in sequences.items():
                if len(keys) == 0:
                    continue
                f.write(name + ':')
                prev = None
                completing = False
                # Runs of consecutive keys are written as "first-last".
                for key in sorted(set(keys)):
                    if key - 1 == prev:
                        if not completing:
                            completing = True
                            f.write('-')
                    elif completing:
                        completing = False
                        f.write('%s %s' % (prev, key))
                    else:
                        f.write(' %s' % key)
                    prev = key
                if completing:
                    f.write(str(prev) + '\n')
                else:
                    f.write('\n')
        finally:
            _sync_close(f)

    def pack(self):
        """Re-name messages to eliminate numbering gaps.  Invalidates keys."""
        sequences = self.get_sequences()
        prev = 0
        changes = []
        for key in self.keys():
            if key - 1 != prev:
                changes.append((key, prev + 1))
                old_path = os.path.join(self._path, str(key))
                new_path = os.path.join(self._path, str(prev + 1))
                if hasattr(os, 'link'):
                    os.link(old_path, new_path)
                    os.unlink(old_path)
                else:
                    os.rename(old_path, new_path)
            prev += 1
        self._next_key = prev + 1
        if len(changes) == 0:
            return
        # Renumber the sequence entries to follow the renamed files.
        for name, key_list in sequences.items():
            for old, new in changes:
                if old in key_list:
                    key_list[key_list.index(old)] = new
        self.set_sequences(sequences)

    def _dump_sequences(self, message, key):
        """Inspect a new MHMessage and update sequences appropriately."""
        pending_sequences = message.get_sequences()
        all_sequences = self.get_sequences()
        for name, key_list in all_sequences.items():
            if name in pending_sequences:
                key_list.append(key)
            elif key in key_list:
                del key_list[key_list.index(key)]
        # Create any sequence the message names that does not exist yet.
        for sequence in pending_sequences:
            if sequence not in all_sequences:
                all_sequences[sequence] = [key]
        self.set_sequences(all_sequences)
1198
1199
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox."""

    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        self._labels = {}

    def add(self, message):
        """Add message and return assigned key."""
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip b'1,' line specifying labels.
        # Original headers run up to the '*** EOOH ***' marker line.
        original_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == b'*** EOOH ***' + linesep or not line:
                break
            original_headers.write(line.replace(linesep, b'\n'))
        # Visible headers follow, terminated by an empty line.
        visible_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == linesep or not line:
                break
            visible_headers.write(line.replace(linesep, b'\n'))
        # Read up to the stop, or to the end
        n = stop - self._file.tell()
        assert n >= 0
        body = self._file.read(n)
        body = body.replace(linesep, b'\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_bytes(self, key):
        """Return a bytes representation or raise a KeyError.

        The result is the original headers followed by the body; the
        visible-headers section stored in the file is skipped.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip b'1,' line specifying labels.
        original_headers = io.BytesIO()
        while True:
            line = self._file.readline()
            if line == b'*** EOOH ***' + linesep or not line:
                break
            original_headers.write(line.replace(linesep, b'\n'))
        # Skip over the visible headers.
        while True:
            line = self._file.readline()
            if line == linesep or not line:
                break
        headers = original_headers.getvalue()
        n = stop - self._file.tell()
        assert n >= 0
        data = self._file.read(n)
        data = data.replace(linesep, b'\n')
        return headers + data

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return io.BytesIO(self.get_bytes(key).replace(b'\n', linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == b'\037\014' + linesep:
                # Message separator: closes any open message, opens a new one.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(linesep))
                starts.append(next_pos)
                # The next line holds the labels; drop its first byte and
                # split the rest on commas, ignoring empty entries.
                labels = [label.strip() for label
                          in self._file.readline()[1:].split(b',')
                          if label.strip()]
                label_lists.append(labels)
            elif line == b'\037' or line == b'\037' + linesep:
                if len(stops) < len(starts):
                    stops.append(line_pos - len(linesep))
            elif not line:
                stops.append(line_pos - len(linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        babyl = b'BABYL OPTIONS:' + linesep
        babyl += b'Version: 5' + linesep
        labels = self.get_labels()
        labels = (label.encode() for label in labels)
        babyl += b'Labels:' + b','.join(labels) + linesep
        babyl += b'\037'
        f.write(babyl)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write(b'\014' + linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(linesep + b'\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        Layout written: a labels line, the original headers, the
        '*** EOOH ***' marker, the visible headers, then the body.
        Accepts an email Message (including BabylMessage), bytes, str,
        io.StringIO (deprecated) or an object with readline(); raises
        TypeError for anything else.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write(b'1')
            for label in special_labels:
                self._file.write(b', ' + label.encode())
            self._file.write(b',,')
            for label in labels:
                self._file.write(b' ' + label.encode() + b',')
            self._file.write(linesep)
        else:
            self._file.write(b'1,,' + linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = io.BytesIO()
            orig_generator = email.generator.BytesGenerator(orig_buffer,
                                                            False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            # Original headers, up to and including the blank line.
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace(b'\n', linesep))
                if line == b'\n' or not line:
                    break
            self._file.write(b'*** EOOH ***' + linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = io.BytesIO()
                vis_generator = email.generator.BytesGenerator(vis_buffer,
                                                               False, 0)
                vis_generator.flatten(message.get_visible())
                # flatten() leaves the position at the end of the buffer;
                # rewind, or the loop below sees EOF at once and the
                # visible headers are never written.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace(b'\n', linesep))
                    if line == b'\n' or not line:
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace(b'\n', linesep))
                    if line == b'\n' or not line:
                        break
            # orig_buffer is now positioned just past the headers.
            while True:
                buffer = orig_buffer.read(4096)   # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace(b'\n', linesep))
        elif isinstance(message, (bytes, str, io.StringIO)):
            if isinstance(message, io.StringIO):
                warnings.warn("Use of StringIO input is deprecated, "
                              "use BytesIO instead", DeprecationWarning, 3)
                message = message.getvalue()
            if isinstance(message, str):
                message = self._string_to_bytes(message)
            body_start = message.find(b'\n\n') + 2
            if body_start - 2 != -1:
                # Headers are written twice: as original and as visible.
                self._file.write(message[:body_start].replace(b'\n', linesep))
                self._file.write(b'*** EOOH ***' + linesep)
                self._file.write(message[:body_start].replace(b'\n', linesep))
                self._file.write(message[body_start:].replace(b'\n', linesep))
            else:
                # No blank line found: treat the whole input as body.
                self._file.write(b'*** EOOH ***' + linesep + linesep)
                self._file.write(message.replace(b'\n', linesep))
        elif hasattr(message, 'readline'):
            if hasattr(message, 'buffer'):
                warnings.warn("Use of text mode files is deprecated, "
                              "use a binary mode file instead",
                              DeprecationWarning, 3)
                message = message.buffer
            original_pos = message.tell()
            first_pass = True
            # The header section is read twice: the first pass writes the
            # original headers, the second the visible ones.
            while True:
                line = message.readline()
                # Universal newline support.
                if line.endswith(b'\r\n'):
                    line = line[:-2] + b'\n'
                elif line.endswith(b'\r'):
                    line = line[:-1] + b'\n'
                self._file.write(line.replace(b'\n', linesep))
                if line == b'\n' or not line:
                    self._file.write(b'*** EOOH ***' + linesep)
                    if first_pass:
                        first_pass = False
                        message.seek(original_pos)
                    else:
                        break
            while True:
                buffer = message.read(4096)   # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace(b'\n', linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1440
1441
class Message(email.message.Message):
    """Message with mailbox-format-specific properties."""

    def __init__(self, message=None):
        """Build a Message, optionally copying or parsing *message*.

        *message* may be None (empty message), an email Message (deep
        copied), bytes, str, a text-mode io.TextIOWrapper, or any other
        object with a read attribute (parsed as a binary file).  Anything
        else raises TypeError.
        """
        if message is None:
            email.message.Message.__init__(self)
            return
        if isinstance(message, email.message.Message):
            self._become_message(copy.deepcopy(message))
            if isinstance(message, Message):
                # Let the source carry over its format-specific state.
                message._explain_to(self)
            return
        if isinstance(message, bytes):
            parsed = email.message_from_bytes(message)
        elif isinstance(message, str):
            parsed = email.message_from_string(message)
        elif isinstance(message, io.TextIOWrapper):
            parsed = email.message_from_file(message)
        elif hasattr(message, "read"):
            parsed = email.message_from_binary_file(message)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        self._become_message(parsed)

    def _become_message(self, message):
        """Adopt every attribute of message that is not format-specific."""
        excluded = getattr(message, '_type_specific_attributes', [])
        self.__dict__.update(
            (attr, value) for attr, value in message.__dict__.items()
            if attr not in excluded)

    def _explain_to(self, message):
        """Copy format-specific state to message insofar as possible."""
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
        # There's nothing format-specific to explain.
        return
1477
1478
class MaildirMessage(Message):
    """Message that additionally tracks Maildir subdir, info and date."""

    # Attributes that must not be copied verbatim onto another message type.
    _type_specific_attributes = ['_subdir', '_info', '_date']

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance.

        Defaults (subdir 'new', empty info, current time) are set before
        delegating to Message.__init__, which may overwrite them when
        message is itself a format-aware Message.
        """
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return the subdirectory name, 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set the subdirectory; raise ValueError unless 'new' or 'cur'."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return the set flags as a string ('' if info is not '2,'-style)."""
        return self._info[2:] if self._info.startswith('2,') else ''

    def set_flags(self, flags):
        """Replace all flags with the given ones, stored in sorted order."""
        self._info = '2,' + ''.join(sorted(flags))

    def add_flag(self, flag):
        """Set the given flag(s) while leaving the others untouched."""
        combined = set(self.get_flags())
        combined.update(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given flag(s) while leaving the others untouched."""
        current = self.get_flags()
        if current:
            self.set_flags(''.join(set(current).difference(flag)))

    def get_date(self):
        """Return the delivery date, in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set the delivery date (seconds since the epoch) as a float.

        A value float() rejects with ValueError is reported as TypeError.
        """
        try:
            self._date = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)

    def get_info(self):
        """Return the raw "info" string."""
        return self._info

    def set_info(self, info):
        """Set the raw "info" string; raise TypeError if it is not a str."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Translate Maildir state into the target message's own terms.

        Raises TypeError when message is not a Message at all.
        """
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
        elif isinstance(message, _mboxMMDFMessage):
            own = set(self.get_flags())
            if 'S' in own:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            for maildir_flag, mbox_flag in (('T', 'D'), ('F', 'F'),
                                            ('R', 'A')):
                if maildir_flag in own:
                    message.add_flag(mbox_flag)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
        elif isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_sequence('unseen')
            for maildir_flag, sequence in (('R', 'replied'),
                                           ('F', 'flagged')):
                if maildir_flag in own:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_label('unseen')
            for maildir_flag, label in (('T', 'deleted'), ('R', 'answered'),
                                        ('P', 'forwarded')):
                if maildir_flag in own:
                    message.add_label(label)
        # A plain Message target has nothing format-specific to receive.
1586
1587
class _mboxMMDFMessage(Message):
    """Shared implementation for mbox and MMDF messages."""

    # Attributes that must not be copied verbatim onto another message type.
    _type_specific_attributes = ['_from']

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance.

        The "From " line defaults to MAILER-DAEMON plus the current time;
        if message is an email message whose unixfrom starts with 'From ',
        the remainder of that line is used instead.
        """
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()
            if envelope is not None and envelope.startswith('From '):
                self.set_from(envelope[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return the contents of the "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set the "From " line.

        When time_ is given, its time.asctime() rendering is appended after
        a space; time_=True means "use the current GMT time".
        """
        if time_ is not None:
            stamp = time.gmtime() if time_ is True else time_
            from_ += ' ' + time.asctime(stamp)
        self._from = from_

    def get_flags(self):
        """Return the flags from the Status and X-Status headers as a string."""
        return self.get('Status', '') + self.get('X-Status', '')

    def set_flags(self, flags):
        """Replace all flags with the given ones.

        'R' and 'O' go to the Status header; 'D', 'F', 'A' and then any
        remaining flags (sorted) go to X-Status.
        """
        pending = set(flags)
        status = ''.join(c for c in 'RO' if c in pending)
        xstatus = ''.join(c for c in 'DFA' if c in pending)
        pending.difference_update('RODFA')
        xstatus += ''.join(sorted(pending))
        for header, value in (('Status', status), ('X-Status', xstatus)):
            try:
                self.replace_header(header, value)
            except KeyError:
                # Header not present yet.
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) while leaving the others untouched."""
        combined = set(self.get_flags())
        combined.update(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given flag(s) while leaving the others untouched."""
        if 'Status' in self or 'X-Status' in self:
            self.set_flags(''.join(set(self.get_flags()).difference(flag)))

    def _explain_to(self, message):
        """Translate mbox/MMDF state into the target message's own terms.

        Raises TypeError when message is not a Message at all.
        """
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
        if isinstance(message, MaildirMessage):
            own = set(self.get_flags())
            if 'O' in own:
                message.set_subdir('cur')
            for mbox_flag, maildir_flag in (('F', 'F'), ('A', 'R'),
                                            ('R', 'S'), ('D', 'T')):
                if mbox_flag in own:
                    message.add_flag(maildir_flag)
            del message['status']
            del message['x-status']
            # The last five whitespace-separated fields of the "From " line
            # are tried as an asctime-style date.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
        elif isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
        elif isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_sequence('unseen')
            for mbox_flag, sequence in (('A', 'replied'), ('F', 'flagged')):
                if mbox_flag in own:
                    message.add_sequence(sequence)
            del message['status']
            del message['x-status']
        elif isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_label('unseen')
            for mbox_flag, label in (('D', 'deleted'), ('A', 'answered')):
                if mbox_flag in own:
                    message.add_label(label)
            del message['status']
            del message['x-status']
        # A plain Message target has nothing format-specific to receive.
1699
1700
class mboxMessage(_mboxMMDFMessage):
    """Message stored in an mbox mailbox; adds nothing to its base class."""
1703
1704
class MHMessage(Message):
    """Message that additionally tracks the MH sequences it belongs to."""

    # Attributes that must not be copied verbatim onto another message type.
    _type_specific_attributes = ['_sequences']

    def __init__(self, message=None):
        """Initialize an MHMessage instance with no sequences."""
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a copy of the list of sequences that include the message."""
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Replace the list of sequences that include the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence to the list unless it is already present.

        Raises TypeError if sequence is not a str.
        """
        if not isinstance(sequence, str):
            raise TypeError('sequence type must be str: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove sequence from the list; do nothing if it is absent."""
        if sequence in self._sequences:
            self._sequences.remove(sequence)

    def _explain_to(self, message):
        """Translate MH sequences into the target message's own terms.

        Raises TypeError when message is not a Message at all.
        """
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
        if isinstance(message, MaildirMessage):
            held = set(self.get_sequences())
            # The subdir becomes 'cur' whether or not the message is unseen.
            message.set_subdir('cur')
            if 'unseen' not in held:
                message.add_flag('S')
            for sequence, maildir_flag in (('flagged', 'F'),
                                           ('replied', 'R')):
                if sequence in held:
                    message.add_flag(maildir_flag)
        elif isinstance(message, _mboxMMDFMessage):
            held = set(self.get_sequences())
            message.add_flag('O' if 'unseen' in held else 'RO')
            for sequence, mbox_flag in (('flagged', 'F'), ('replied', 'A')):
                if sequence in held:
                    message.add_flag(mbox_flag)
        elif isinstance(message, MHMessage):
            for sequence in self.get_sequences():
                message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            held = set(self.get_sequences())
            for sequence, label in (('unseen', 'unseen'),
                                    ('replied', 'answered')):
                if sequence in held:
                    message.add_label(label)
        # A plain Message target has nothing format-specific to receive.
1775
1776
class BabylMessage(Message):
    """Message that additionally tracks Babyl labels and visible headers."""

    # Attributes that must not be copied verbatim onto another message type.
    _type_specific_attributes = ['_labels', '_visible']

    def __init__(self, message=None):
        """Initialize a BabylMessage with no labels and empty visible headers."""
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a copy of the list of labels on the message."""
        return list(self._labels)

    def set_labels(self, labels):
        """Replace the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label to the list unless it is already present.

        Raises TypeError if label is not a str.
        """
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove label from the list; do nothing if it is absent."""
        if label in self._labels:
            self._labels.remove(label)

    def get_visible(self):
        """Return a new Message built from the visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Store a new Message built from visible as the visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Bring the visible headers in line with the message's own headers.

        Visible headers still present on the message are refreshed, those
        no longer present are dropped, and a fixed set of common headers is
        added when the message has them and the visible set does not.
        """
        shown = self._visible
        for header in shown.keys():
            if header not in self:
                del shown[header]
            else:
                shown.replace_header(header, self[header])
        for header in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if header in self and header not in shown:
                shown[header] = self[header]

    def _explain_to(self, message):
        """Translate Babyl labels into the target message's own terms.

        Raises TypeError when message is not a Message at all.
        """
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
        if isinstance(message, MaildirMessage):
            held = set(self.get_labels())
            # The subdir becomes 'cur' whether or not the message is unseen.
            message.set_subdir('cur')
            if 'unseen' not in held:
                message.add_flag('S')
            if 'forwarded' in held or 'resent' in held:
                message.add_flag('P')
            for label, maildir_flag in (('answered', 'R'), ('deleted', 'T')):
                if label in held:
                    message.add_flag(maildir_flag)
        elif isinstance(message, _mboxMMDFMessage):
            held = set(self.get_labels())
            message.add_flag('O' if 'unseen' in held else 'RO')
            for label, mbox_flag in (('deleted', 'D'), ('answered', 'A')):
                if label in held:
                    message.add_flag(mbox_flag)
        elif isinstance(message, MHMessage):
            held = set(self.get_labels())
            for label, sequence in (('unseen', 'unseen'),
                                    ('answered', 'replied')):
                if label in held:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
        # A plain Message target has nothing format-specific to receive.
1870
1871
class MMDFMessage(_mboxMMDFMessage):
    """Message stored in an MMDF mailbox; adds nothing to its base class."""
1874
1875
1876class _ProxyFile:
1877 """A read-only wrapper of a file."""
1878
1879 def __init__(self, f, pos=None):
1880 """Initialize a _ProxyFile."""
1881 self._file = f
1882 if pos is None:
1883 self._pos = f.tell()
1884 else:
1885 self._pos = pos
1886
1887 def read(self, size=None):
1888 """Read bytes."""
Guido van Rossum98297ee2007-11-06 21:34:58 +00001889 return self._read(size, self._file.read)
Thomas Wouters477c8d52006-05-27 19:21:47 +00001890
R. David Murrayb7deff12011-01-30 06:21:28 +00001891 def read1(self, size=None):
1892 """Read bytes."""
1893 return self._read(size, self._file.read1)
1894
Thomas Wouters477c8d52006-05-27 19:21:47 +00001895 def readline(self, size=None):
1896 """Read a line."""
Guido van Rossum98297ee2007-11-06 21:34:58 +00001897 return self._read(size, self._file.readline)
Thomas Wouters477c8d52006-05-27 19:21:47 +00001898
1899 def readlines(self, sizehint=None):
1900 """Read multiple lines."""
1901 result = []
1902 for line in self:
1903 result.append(line)
1904 if sizehint is not None:
1905 sizehint -= len(line)
1906 if sizehint <= 0:
1907 break
1908 return result
1909
1910 def __iter__(self):
1911 """Iterate over lines."""
Guido van Rossum7cad4f32007-06-07 23:58:54 +00001912 while True:
1913 line = self.readline()
1914 if not line:
1915 raise StopIteration
1916 yield line
Thomas Wouters477c8d52006-05-27 19:21:47 +00001917
1918 def tell(self):
1919 """Return the position."""
1920 return self._pos
1921
1922 def seek(self, offset, whence=0):
1923 """Change position."""
1924 if whence == 1:
1925 self._file.seek(self._pos)
1926 self._file.seek(offset, whence)
1927 self._pos = self._file.tell()
1928
1929 def close(self):
1930 """Close the file."""
R David Murrayc88bce12011-06-17 22:24:05 -04001931 if hasattr(self, '_file'):
1932 if hasattr(self._file, 'close'):
1933 self._file.close()
1934 del self._file
Thomas Wouters477c8d52006-05-27 19:21:47 +00001935
1936 def _read(self, size, read_method):
1937 """Read size bytes using read_method."""
1938 if size is None:
1939 size = -1
1940 self._file.seek(self._pos)
1941 result = read_method(size)
1942 self._pos = self._file.tell()
1943 return result
1944
Georg Brandl6ce29fa2010-10-30 14:33:28 +00001945 def __enter__(self):
1946 """Context manager protocol support."""
1947 return self
1948
1949 def __exit__(self, *exc):
1950 self.close()
1951
R. David Murrayb7deff12011-01-30 06:21:28 +00001952 def readable(self):
1953 return self._file.readable()
1954
1955 def writable(self):
1956 return self._file.writable()
1957
1958 def seekable(self):
1959 return self._file.seekable()
1960
1961 def flush(self):
1962 return self._file.flush()
1963
1964 @property
1965 def closed(self):
R David Murrayc88bce12011-06-17 22:24:05 -04001966 if not hasattr(self, '_file'):
1967 return True
1968 if not hasattr(self._file, 'closed'):
1969 return False
R. David Murrayb7deff12011-01-30 06:21:28 +00001970 return self._file.closed
1971
Thomas Wouters477c8d52006-05-27 19:21:47 +00001972
class _PartialFile(_ProxyFile):
    """A read-only wrapper exposing only the [start, stop) part of a file."""

    def __init__(self, f, start=None, stop=None):
        """Initialize a _PartialFile covering f from start up to stop."""
        _ProxyFile.__init__(self, f, start)
        self._start, self._stop = start, stop

    def tell(self):
        """Return the position measured from start."""
        absolute = _ProxyFile.tell(self)
        return absolute - self._start

    def seek(self, offset, whence=0):
        """Change position, possibly with respect to start or stop.

        Seeks from the beginning (0) or the end (2) are turned into
        relative seeks from start or stop respectively.
        """
        if whence in (0, 2):
            self._pos = self._start if whence == 0 else self._stop
            whence = 1
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, never reading past stop."""
        available = self._stop - self._pos
        if available <= 0:
            return b''
        if size is None or not 0 <= size <= available:
            # No limit requested, or more than is left: clamp to the window.
            size = available
        return _ProxyFile._read(self, size, read_method)

    def close(self):
        """Drop the reference to the underlying file without closing it."""
        # do *not* close the underlying file object for partial files,
        # since it's global to the mailbox object
        if hasattr(self, '_file'):
            del self._file
Georg Brandl6ce29fa2010-10-30 14:33:28 +00002010
Thomas Wouters477c8d52006-05-27 19:21:47 +00002011
def _lock_file(f, dotlock=True):
    """Lock file f using lockf and, if dotlock is true, dot locking.

    Raises ExternalClashError when the lockf lock or the dot lock is
    unavailable.  If the temporary pre-lock file cannot be created because
    of EACCES or EROFS, dot locking is skipped.  On any failure, whatever
    was already acquired is released before the exception propagates.
    """
    dotlock_done = False
    try:
        if fcntl:
            try:
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except IOError as err:
                if err.errno not in (errno.EAGAIN, errno.EACCES,
                                     errno.EROFS):
                    raise
                raise ExternalClashError('lockf: lock unavailable: %s' %
                                         f.name)
        if dotlock:
            lock_path = f.name + '.lock'
            try:
                pre_lock = _create_temporary(lock_path)
                pre_lock.close()
            except IOError as err:
                if err.errno in (errno.EACCES, errno.EROFS):
                    return  # Without write access, just skip dotlocking.
                raise
            try:
                if hasattr(os, 'link'):
                    os.link(pre_lock.name, lock_path)
                    dotlock_done = True
                    os.unlink(pre_lock.name)
                else:
                    os.rename(pre_lock.name, lock_path)
                    dotlock_done = True
            except OSError as err:
                clash = (err.errno == errno.EEXIST or
                         (os.name == 'os2' and err.errno == errno.EACCES))
                if not clash:
                    raise
                os.remove(pre_lock.name)
                raise ExternalClashError('dot lock unavailable: %s' %
                                         f.name)
    except BaseException:
        # Undo whatever was acquired, then let the error propagate.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if dotlock_done:
            os.remove(lock_path)
        raise
2056
2057def _unlock_file(f):
Thomas Wouters0e3f5912006-08-11 14:57:12 +00002058 """Unlock file f using lockf and dot locking."""
Thomas Wouters477c8d52006-05-27 19:21:47 +00002059 if fcntl:
2060 fcntl.lockf(f, fcntl.LOCK_UN)
Thomas Wouters477c8d52006-05-27 19:21:47 +00002061 if os.path.exists(f.name + '.lock'):
2062 os.remove(f.name + '.lock')
2063
2064def _create_carefully(path):
2065 """Create a file if it doesn't exist and open for reading and writing."""
Georg Brandl6aa2d1f2008-08-12 08:35:52 +00002066 fd = os.open(path, os.O_CREAT | os.O_EXCL | os.O_RDWR, 0o666)
Thomas Wouters477c8d52006-05-27 19:21:47 +00002067 try:
R. David Murrayb7deff12011-01-30 06:21:28 +00002068 return open(path, 'rb+')
Thomas Wouters477c8d52006-05-27 19:21:47 +00002069 finally:
2070 os.close(fd)
2071
def _create_temporary(path):
    """Create and open a new file named after path.

    The name is path followed by the current time in whole seconds, the
    host name and the process id, separated by dots.
    """
    name_parts = (path, int(time.time()), socket.gethostname(), os.getpid())
    return _create_carefully('%s.%s.%s.%s' % name_parts)
2077
Thomas Wouters89f507f2006-12-13 04:49:30 +00002078def _sync_flush(f):
2079 """Ensure changes to file f are physically on disk."""
2080 f.flush()
Thomas Wouters902d6eb2007-01-09 23:18:33 +00002081 if hasattr(os, 'fsync'):
2082 os.fsync(f.fileno())
Thomas Wouters89f507f2006-12-13 04:49:30 +00002083
def _sync_close(f):
    """Sync f's pending changes via _sync_flush(), then close it."""
    # Flush and sync first; f is closed only if that succeeds.
    _sync_flush(f)
    f.close()
Thomas Wouters477c8d52006-05-27 19:21:47 +00002088
Guido van Rossum62448671996-09-17 21:33:15 +00002089
class Error(Exception):
    """Base class for the errors specific to this module."""


class NoSuchMailboxError(Error):
    """The requested mailbox does not exist and will not be created."""


class NotEmptyError(Error):
    """Deletion was requested for a mailbox that is not empty."""


class ExternalClashError(Error):
    """An action failed because of another process."""


class FormatError(Error):
    """A file does not appear to have a valid format."""