blob: 13e3eb7efa824bbca3036e4722c9b699f5d77242 [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum62448671996-09-17 21:33:15 +00002
Thomas Wouters477c8d52006-05-27 19:21:47 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
Thomas Wouters89f507f2006-12-13 04:49:30 +00005# Notes for authors of new mailbox subclasses:
6#
7# Remember to fsync() changes to disk before closing a modified file
8# or returning from a flush() method. See functions _sync_flush() and
9# _sync_close().
10
Thomas Wouters477c8d52006-05-27 19:21:47 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Thomas Wouters477c8d52006-05-27 19:21:47 +000013import time
14import calendar
15import socket
16import errno
17import copy
18import email
Thomas Woutersb2137042007-02-01 18:02:27 +000019import email.message
20import email.generator
Thomas Wouters477c8d52006-05-27 19:21:47 +000021import rfc822
Guido van Rossum34d19282007-08-09 01:03:29 +000022import io
Thomas Wouters477c8d52006-05-27 19:21:47 +000023try:
Thomas Wouters0e3f5912006-08-11 14:57:12 +000024 if sys.platform == 'os2emx':
25 # OS/2 EMX fcntl() not adequate
26 raise ImportError
27 import fcntl
Thomas Wouters477c8d52006-05-27 19:21:47 +000028except ImportError:
29 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000030
# Public names exported by ``from mailbox import *``: the mailbox classes,
# their message classes, and the legacy (pre-rewrite) mailbox class names.
__all__ = [
    'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
    'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
    'BabylMessage', 'MMDFMessage',
    'UnixMailbox', 'PortableUnixMailbox', 'MmdfMailbox', 'MHMailbox',
    'BabylMailbox',
]
35
class Mailbox:
    """A group of messages in a particular place.

    This is an abstract, dict-like base class.  Subclasses supply the
    storage primitives (add, remove, __setitem__, get_message, get_string,
    get_file, iterkeys, __contains__, __len__, flush, lock, unlock, close);
    the remaining mapping-style helpers here are built on top of those.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded and made absolute.  factory, when set, is
        called by __getitem__() with a file-like object to build the
        returned message.  create is accepted for subclasses; it is not
        used by this base class.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist.

        Without a factory the result comes from get_message(); with one,
        the factory is applied to get_file(key).
        """
        if not self._factory:
            return self.get_message(key)
        return self._factory(self.get_file(key))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages."""
        # Iterate over a snapshot of the keys; a message that vanishes
        # between the snapshot and the lookup is silently skipped.
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield value

    def __iter__(self):
        """Iterate over messages (not keys)."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples."""
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield (key, value)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            result = self[key]
        except KeyError:
            return default
        self.discard(key)
        return result

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError if the mailbox is empty.
        """
        for key in self.keys():
            return (key, self.pop(key))     # Only the first key is used.
        raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be a mapping (anything with items() or iteritems()) or an
        iterable of (key, message) pairs.  Calling update() with no
        argument is a no-op.  Every pair is attempted; if any key did not
        exist, KeyError is raised after all pairs have been processed.
        """
        if arg is None:
            # The parameter defaults to None, so there is nothing to do.
            return
        if hasattr(arg, 'items'):
            source = arg.items()
        elif hasattr(arg, 'iteritems'):
            source = arg.iteritems()
        else:
            source = arg
        bad_key = False
        for key, message in source:
            try:
                self[key] = message
            except KeyError:
                bad_key = True
        if bad_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _dump_message(self, message, target, mangle_from_=False):
        """Dump message contents to target file.

        message may be an email.message.Message, a str, or an object with
        a read attribute (consumed line by line through readline()); any
        other type raises TypeError.  When mangle_from_ is true, "From "
        at the start of a line is escaped as ">From "; for str input only
        occurrences that follow a newline are escaped.

        This assumes the target file is open in *text* mode with the
        desired encoding and newline setting; no line-ending conversion
        is done here.
        """
        if isinstance(message, email.message.Message):
            flattened = io.StringIO()
            # maxheaderlen=0: do not re-wrap header lines.
            gen = email.generator.Generator(flattened, mangle_from_, 0)
            gen.flatten(message)
            target.write(flattened.getvalue())
        elif isinstance(message, str):
            if mangle_from_:
                message = message.replace('\nFrom ', '\n>From ')
            target.write(message)
        elif hasattr(message, 'read'):
            while True:
                line = message.readline()
                if not line:
                    break
                if mangle_from_ and line.startswith('From '):
                    line = '>From ' + line[5:]
                target.write(line)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
219
220
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages live as individual files under the "new" and "cur"
    subdirectories of the mailbox directory; "tmp" is used while a message
    is being written.  A message's key is the part of its file name before
    the first `colon`; anything after the colon is the "info" suffix.
    """

    # Separator between the unique name and the info suffix in file names.
    colon = ':'

    def __init__(self, dirname, factory=rfc822.Message, create=True):
        """Initialize a Maildir instance.

        If the directory does not exist it is created (together with its
        tmp, new and cur subdirectories, mode 0o700) when create is true;
        otherwise NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                os.mkdir(os.path.join(self._path, 'tmp'), 0o700)
                os.mkdir(os.path.join(self._path, 'new'), 0o700)
                os.mkdir(os.path.join(self._path, 'cur'), 0o700)
            else:
                raise NoSuchMailboxError(self._path)
        # Maps key -> path relative to self._path ("new/..." or "cur/...").
        self._toc = {}

    def add(self, message):
        """Add message and return assigned key.

        The message is first written to a fresh file in "tmp" and then
        moved into its destination subdirectory.  Raises
        ExternalClashError if the destination name already exists.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        finally:
            _sync_close(tmp_file)
        if isinstance(message, MaildirMessage):
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                suffix = ''
        else:
            subdir = 'new'
            suffix = ''
        uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        try:
            if hasattr(os, 'link'):
                # link() fails if dest exists, so an existing message is
                # never overwritten.
                os.link(tmp_file.name, dest)
                os.remove(tmp_file.name)
            else:
                os.rename(tmp_file.name, dest)
        except OSError as e:
            os.remove(tmp_file.name)
            if e.errno == errno.EEXIST:
                raise ExternalClashError('Name clash with existing message: %s'
                                         % dest)
            else:
                raise
        if isinstance(message, MaildirMessage):
            # Keep the access time, set the modification time to the
            # message's delivery date.
            os.utime(dest, (os.path.getatime(dest), message.get_date()))
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        os.remove(os.path.join(self._path, self._lookup(key)))

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass:
        # the file may also disappear between lookup and removal.
        try:
            self.remove(key)
        except KeyError:
            pass
        except OSError as e:
            if e.errno != errno.ENOENT:
                raise

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        if isinstance(message, MaildirMessage):
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        else:
            suffix = ''
        self.discard(key)
        # Move the freshly added file onto the old key's name.
        new_path = os.path.join(self._path, subdir, key + suffix)
        os.rename(os.path.join(self._path, temp_subpath), new_path)
        if isinstance(message, MaildirMessage):
            os.utime(new_path, (os.path.getatime(new_path),
                                message.get_date()))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The returned MaildirMessage carries the subdirectory, the info
        suffix (if any) and the file's modification time as its date.
        """
        subpath = self._lookup(key)
        full_path = os.path.join(self._path, subpath)
        with open(full_path, 'r') as f:
            msg = MaildirMessage(f)
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(full_path))
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        with open(os.path.join(self._path, self._lookup(key)), 'r') as f:
            return f.read()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        # The file is deliberately left open: it is handed to the caller
        # wrapped in a _ProxyFile.
        f = open(os.path.join(self._path, self._lookup(key)), 'r')
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                continue
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        return  # Maildir changes are always written immediately.

    def lock(self):
        """Lock the mailbox (a no-op for Maildir)."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked (a no-op for Maildir)."""
        return

    def close(self):
        """Flush and close the mailbox (a no-op for Maildir)."""
        return

    def list_folders(self):
        """Return a list of folder names.

        Folders are subdirectories whose name starts with a dot; the
        leading dot is stripped from the returned names.
        """
        result = []
        for entry in os.listdir(self._path):
            if len(entry) > 1 and entry[0] == '.' and \
               os.path.isdir(os.path.join(self._path, entry)):
                result.append(entry[1:])
        return result

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        return Maildir(os.path.join(self._path, '.' + folder),
                       factory=self._factory,
                       create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it."""
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        maildirfolder_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(maildirfolder_path):
            # Create the empty marker file.
            os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY))
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        Raises NotEmptyError if "new" or "cur" holds anything other than
        dot-files, or if the folder has subdirectories besides new, cur
        and tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        for entry in os.listdir(os.path.join(path, 'new')) + \
                     os.listdir(os.path.join(path, 'cur')):
            if len(entry) < 1 or entry[0] != '.':
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry != 'new' and entry != 'cur' and entry != 'tmp' and \
               os.path.isdir(os.path.join(path, entry)):
                # Quote the offending subdirectory, then name the folder.
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (entry, folder))
        # Bottom-up walk so directories are empty by the time they are
        # removed.
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp"."""
        now = time.time()
        for entry in os.listdir(os.path.join(self._path, 'tmp')):
            path = os.path.join(self._path, 'tmp', entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        Raises ExternalClashError if the generated name already exists.
        """
        now = time.time()
        # '/' and ':' cannot appear in the file name; write them as
        # backslash-octal escapes instead.
        hostname = socket.gethostname()
        hostname = hostname.replace('/', r'\057').replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except OSError as e:
            if e.errno == errno.ENOENT:
                Maildir._count += 1
                try:
                    return _create_carefully(path)
                except OSError as e:
                    if e.errno != errno.EEXIST:
                        raise
            else:
                raise

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping."""
        self._toc = {}
        for subdir in ('new', 'cur'):
            subdir_path = os.path.join(self._path, subdir)
            for entry in os.listdir(subdir_path):
                if os.path.isdir(os.path.join(subdir_path, entry)):
                    continue
                uniq = entry.split(self.colon)[0]
                self._toc[uniq] = os.path.join(subdir, entry)

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        # Fast path: the cached entry is still valid on disk.
        try:
            if os.path.exists(os.path.join(self._path, self._toc[key])):
                return self._toc[key]
        except KeyError:
            pass
        # Otherwise rescan the directories once and try again.
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration.

        Returns None once all keys have been consumed.
        """
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = iter(self.keys())
        while True:
            try:
                return self[next(self._onetime_keys)]
            except StopIteration:
                return None
            except KeyError:
                # The message disappeared meanwhile; try the next key.
                continue
493
494
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    Base class for formats that keep every message in one file.  The table
    of contents (self._toc) maps each integer key to a (start, stop) pair
    of file offsets.  Subclasses provide _generate_toc() and
    _install_message(), and may override the _pre/_post hooks.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        The file is opened read/write; a missing file is created when
        create is true (NoSuchMailboxError otherwise), and a file that
        cannot be opened for writing is opened read-only.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            mailbox_file = open(self._path, 'r+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                if not create:
                    raise NoSuchMailboxError(self._path)
                mailbox_file = open(self._path, 'w+')
            elif e.errno == errno.EACCES:
                mailbox_file = open(self._path, 'r')
            else:
                raise
        self._file = mailbox_file
        self._toc = None            # Built lazily by _lookup().
        self._next_key = 0
        self._pending = False       # No changes require rewriting the file.
        self._locked = False
        self._file_length = None    # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        offsets = self._append_message(message)
        new_key = self._next_key
        self._toc[new_key] = offsets
        self._next_key = new_key + 1
        self._pending = True
        return new_key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        # Only the TOC entry goes away here; the file is rewritten by
        # flush().
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        # The replacement is appended and the key re-pointed at it.
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        for key in self._toc.keys():
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if self._locked:
            return
        _lock_file(self._file)
        self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if not self._locked:
            return
        _unlock_file(self._file)
        self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        The surviving messages are copied, in key order, into a temporary
        file which then replaces the mailbox file.  Raises
        ExternalClashError if the mailbox file's size differs from the
        size recorded when it was last scanned or appended to.
        """
        if not self._pending:
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                # Copy the message in chunks of at most 4096, never
                # reading past its stop offset.
                while True:
                    chunk = self._file.read(min(4096,
                                                stop - self._file.tell()))
                    if not chunk:
                        break
                    new_file.write(chunk)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
        except:
            # Whatever went wrong, discard the partial copy and re-raise.
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        try:
            os.rename(new_file.name, self._path)
        except OSError as e:
            # Where rename() refuses to replace an existing file, remove
            # the old mailbox first and retry.
            if e.errno == errno.EEXIST or \
               (os.name == 'os2' and e.errno == errno.EACCES):
                os.remove(self._path)
                os.rename(new_file.name, self._path)
            else:
                raise
        # NOTE(review): reopened in binary mode although __init__ opens
        # the file in text mode -- confirm this is intended.
        self._file = open(self._path, 'rb+')
        self._toc = new_toc
        self._pending = False
        if self._locked:
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox."""
        self.flush()
        if self._locked:
            self.unlock()
        self._file.close()  # Sync has been done by self.flush() above.

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        Generates the table of contents on first use.  With key omitted,
        nothing is looked up and None is returned.
        """
        if self._toc is None:
            self._generate_toc()
        if key is None:
            return None
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets."""
        self._file.seek(0, 2)
        self._pre_message_hook(self._file)
        offsets = self._install_message(message)
        self._post_message_hook(self._file)
        self._file.flush()
        # Record current length of mailbox so flush() can detect changes
        # made by someone else.
        self._file_length = self._file.tell()
        return offsets
664
665
666
class _mboxMMDF(_singlefileMailbox):
    """An mbox or MMDF mailbox.

    Both formats start every stored message with a "From " line; this
    class holds the code they share.  Subclasses set
    self._message_factory to the message class to instantiate.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        # The first line is the "From " envelope line; the rest, up to
        # stop, is the message proper.
        from_line = self._file.readline().replace(os.linesep, '')
        body = self._file.read(stop - self._file.tell())
        msg = self._message_factory(body.replace(os.linesep, '\n'))
        msg.set_from(from_line[5:])     # Drop the leading "From ".
        return msg

    def get_string(self, key, from_=False):
        """Return a string representation or raise a KeyError.

        The "From " line is included only when from_ is true.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        if not from_:
            self._file.readline()       # Skip the "From " line.
        text = self._file.read(stop - self._file.tell())
        return text.replace(os.linesep, '\n')

    def get_file(self, key, from_=False):
        """Return a file-like representation or raise a KeyError.

        The "From " line is included only when from_ is true.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        if not from_:
            self._file.readline()       # Skip the "From " line.
        return _PartialFile(self._file, self._file.tell(), stop)

    def _install_message(self, message):
        """Format a message and blindly write to self._file.

        Returns the (start, stop) offsets of what was written.  The
        "From " line comes from the message when it has one; otherwise a
        MAILER-DAEMON line stamped with the current UTC time is used.
        """
        from_line = None
        if isinstance(message, str) and message.startswith('From '):
            # Split a leading "From " line off the text.
            newline = message.find('\n')
            if newline == -1:
                from_line = message
                message = ''
            else:
                from_line = message[:newline]
                message = message[newline + 1:]
        elif isinstance(message, _mboxMMDFMessage):
            from_line = 'From ' + message.get_from()
        elif isinstance(message, email.message.Message):
            from_line = message.get_unixfrom()  # May be None.
        if from_line is None:
            from_line = 'From MAILER-DAEMON %s' % time.asctime(time.gmtime())
        start = self._file.tell()
        self._file.write(from_line + os.linesep)
        self._dump_message(message, self._file, self._mangle_from_)
        stop = self._file.tell()
        return (start, stop)
721
722
class mbox(_mboxMMDF):
    """A classic mbox mailbox.

    Messages are separated by lines starting with "From ".
    """

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Initialize an mbox mailbox."""
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        # Every message but the first is preceded by a line separator.
        if f.tell() != 0:
            f.write(os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts = []
        stops = []
        self._file.seek(0)
        while True:
            line_pos = self._file.tell()
            line = self._file.readline()
            if line.startswith('From '):
                # A new message begins here; close the previous one just
                # before the separator that precedes this line.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
                starts.append(line_pos)
            elif not line:
                # End of file closes the last message.
                stops.append(line_pos)
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._next_key = len(self._toc)
        self._file_length = self._file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000755
756
class MMDF(_mboxMMDF):
    """An MMDF mailbox.

    Each message is bracketed by lines consisting of four Control-A
    characters.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize an MMDF mailbox."""
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\001\001\001\001' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\001\001\001\001' + os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts = []
        stops = []
        self._file.seek(0)
        next_pos = 0
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line.startswith('\001\001\001\001' + os.linesep):
                # Opening delimiter: the message starts on the next line.
                starts.append(next_pos)
                while True:
                    line_pos = next_pos
                    line = self._file.readline()
                    next_pos = self._file.tell()
                    if line == '\001\001\001\001' + os.linesep:
                        # Closing delimiter; exclude the separator that
                        # precedes it.
                        stops.append(line_pos - len(os.linesep))
                        break
                    elif not line:
                        # File ended without a closing delimiter.
                        stops.append(line_pos)
                        break
            elif not line:
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000800
801
class MH(Mailbox):
    """An MH mailbox.

    Every message is stored in its own file, named after its integer key,
    directly inside the mailbox directory.  Sequence membership is kept in
    the '.mh_sequences' file of that same directory.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize an MH instance.

        If path does not exist it is created, together with an empty
        '.mh_sequences' file, when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, path, factory, create)
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                os.close(os.open(os.path.join(self._path, '.mh_sequences'),
                                 os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0o600))
            else:
                raise NoSuchMailboxError(self._path)
        self._locked = False

    def _open_message_file(self, key, mode):
        """Open the file of the keyed message; raise KeyError if missing."""
        try:
            return open(os.path.join(self._path, str(key)), mode)
        except IOError as e:
            if e.errno == errno.ENOENT:
                raise KeyError('No message with key: %s' % key)
            raise

    def add(self, message):
        """Add message and return assigned key.

        The key is one more than the largest key in use, or 1 when the
        mailbox is empty.  Sequences of an MHMessage are recorded too.
        """
        keys = self.keys()
        if len(keys) == 0:
            new_key = 1
        else:
            new_key = max(keys) + 1
        new_path = os.path.join(self._path, str(new_key))
        f = _create_carefully(new_path)
        try:
            if self._locked:
                _lock_file(f)
            try:
                self._dump_message(message, f)
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, new_key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            _sync_close(f)
        return new_key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        # Opening the file is only a probe that maps ENOENT to KeyError.
        # The handle is closed *before* os.remove() because some platforms
        # refuse to delete an open file.  It is deliberately not locked:
        # the previous code released the lock on the already-closed handle,
        # which made removal from a locked mailbox fail.
        self._open_message_file(key, 'rb+').close()
        os.remove(os.path.join(self._path, str(key)))

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        path = os.path.join(self._path, str(key))
        f = self._open_message_file(key, 'r+')
        try:
            if self._locked:
                _lock_file(f)
            try:
                # Truncate through a second descriptor so that f (and any
                # lock taken on it) stays valid while the old contents go.
                os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
                self._dump_message(message, f)
                if isinstance(message, MHMessage):
                    self._dump_sequences(message, key)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            _sync_close(f)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The returned MHMessage is tagged with every sequence of the
        mailbox that contains key.
        """
        # 'r+' is used while the mailbox is locked so that the message
        # file is opened writable before _lock_file() is applied to it.
        f = self._open_message_file(key, 'r+' if self._locked else 'r')
        try:
            if self._locked:
                _lock_file(f)
            try:
                msg = MHMessage(f)
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            f.close()
        # get_sequences() returns a dict, so iterate over its items; plain
        # iteration would yield only the sequence names.
        for name, key_list in self.get_sequences().items():
            if key in key_list:
                msg.add_sequence(name)
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        f = self._open_message_file(key, 'r+' if self._locked else 'r')
        try:
            if self._locked:
                _lock_file(f)
            try:
                return f.read()
            finally:
                if self._locked:
                    _unlock_file(f)
        finally:
            f.close()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return _ProxyFile(self._open_message_file(key, 'r'))

    def iterkeys(self):
        """Return an iterator over keys.

        Keys are the all-digit directory entries, in ascending order.
        """
        return iter(sorted(int(entry) for entry in os.listdir(self._path)
                           if entry.isdigit()))

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        return os.path.exists(os.path.join(self._path, str(key)))

    def __len__(self):
        """Return a count of messages in the mailbox."""
        return len(list(self.keys()))

    def lock(self):
        """Lock the mailbox.

        The lock is taken on the '.mh_sequences' file, which is kept open
        in self._file until unlock() is called.
        """
        if not self._locked:
            self._file = open(os.path.join(self._path, '.mh_sequences'), 'rb+')
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            _sync_close(self._file)
            del self._file
            self._locked = False

    def flush(self):
        """Write any pending changes to the disk."""
        # Nothing is buffered by this class, so there is nothing to do.
        return

    def close(self):
        """Flush and close the mailbox."""
        if self._locked:
            self.unlock()

    def list_folders(self):
        """Return a list of folder names."""
        return [entry for entry in os.listdir(self._path)
                if os.path.isdir(os.path.join(self._path, entry))]

    def get_folder(self, folder):
        """Return an MH instance for the named folder."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory, create=False)

    def add_folder(self, folder):
        """Create a folder and return an MH instance representing it."""
        return MH(os.path.join(self._path, folder),
                  factory=self._factory)

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        A folder holding nothing but its '.mh_sequences' file counts as
        empty.  Raise NotEmptyError otherwise.
        """
        path = os.path.join(self._path, folder)
        entries = os.listdir(path)
        if entries == ['.mh_sequences']:
            os.remove(os.path.join(path, '.mh_sequences'))
        elif entries == []:
            pass
        else:
            # Report the folder that is not empty, not its parent mailbox.
            raise NotEmptyError('Folder not empty: %s' % path)
        os.rmdir(path)

    def get_sequences(self):
        """Return a name-to-key-list dictionary to define each sequence.

        Keys that do not correspond to an existing message are dropped,
        and sequences left without keys are omitted.  Raise FormatError if
        a line of '.mh_sequences' cannot be parsed.
        """
        results = {}
        with open(os.path.join(self._path, '.mh_sequences'), 'r') as f:
            all_keys = set(self.keys())
            for line in f:
                try:
                    name, contents = line.split(':')
                    keys = set()
                    for spec in contents.split():
                        if spec.isdigit():
                            keys.add(int(spec))
                        else:
                            # A 'start-stop' range, both ends inclusive.
                            start, stop = (int(x) for x in spec.split('-'))
                            keys.update(range(start, stop + 1))
                    results[name] = [key for key in sorted(keys)
                                     if key in all_keys]
                    if len(results[name]) == 0:
                        del results[name]
                except ValueError:
                    raise FormatError('Invalid sequence specification: %s' %
                                      line.rstrip())
        return results

    def set_sequences(self, sequences):
        """Set sequences using the given name-to-key-list dictionary.

        Each non-empty sequence is written as one 'name: keys' line in
        which runs of consecutive keys are collapsed to 'first-last'.
        """
        f = open(os.path.join(self._path, '.mh_sequences'), 'r+')
        try:
            # Truncate through a second descriptor; f stays open for writing.
            os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
            for name, keys in sequences.items():
                if len(keys) == 0:
                    continue
                f.write('%s:' % name)
                prev = None
                completing = False      # True while inside a 'first-' run
                for key in sorted(set(keys)):
                    if key - 1 == prev:
                        if not completing:
                            completing = True
                            f.write('-')
                    elif completing:
                        # The run ended at prev; finish it, then start key.
                        completing = False
                        f.write('%s %s' % (prev, key))
                    else:
                        f.write(' %s' % key)
                    prev = key
                if completing:
                    f.write(str(prev) + '\n')
                else:
                    f.write('\n')
        finally:
            _sync_close(f)

    def pack(self):
        """Re-name messages to eliminate numbering gaps.  Invalidates keys."""
        sequences = self.get_sequences()
        prev = 0
        changes = []
        for key in self.keys():
            if key - 1 != prev:
                changes.append((key, prev + 1))
                source = os.path.join(self._path, str(key))
                target = os.path.join(self._path, str(prev + 1))
                if hasattr(os, 'link'):
                    os.link(source, target)
                    os.unlink(source)
                else:
                    os.rename(source, target)
            prev += 1
        self._next_key = prev + 1
        if len(changes) == 0:
            return
        # Rewrite the sequences so they refer to the new key numbers.
        for name, key_list in sequences.items():
            for old, new in changes:
                if old in key_list:
                    key_list[key_list.index(old)] = new
        self.set_sequences(sequences)

    def _dump_sequences(self, message, key):
        """Inspect a new MHMessage and update sequences appropriately."""
        pending_sequences = message.get_sequences()
        all_sequences = self.get_sequences()
        for name, key_list in all_sequences.items():
            if name in pending_sequences:
                key_list.append(key)
            elif key in key_list:
                # The message no longer belongs to this sequence.
                del key_list[key_list.index(key)]
        for sequence in pending_sequences:
            if sequence not in all_sequences:
                all_sequences[sequence] = [key]
        self.set_sequences(all_sequences)
1108
1109
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox."""

    # Labels with a predefined meaning; get_labels() reports only the
    # remaining, user-defined ones.
    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        self._labels = {}       # key -> list of labels of that message

    def add(self, message):
        """Add message and return assigned key."""
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def _read_section(self, terminator):
        """Read lines up to terminator (or EOF) and return them joined.

        The terminator line is consumed but not returned; os.linesep is
        converted to '\\n' in the result.
        """
        section = io.StringIO()
        while True:
            line = self._file.readline()
            if line == terminator or not line:
                break
            section.write(line.replace(os.linesep, '\n'))
        return section.getvalue()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = self._read_section('*** EOOH ***' + os.linesep)
        visible_headers = self._read_section(os.linesep)
        body = self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')
        msg = BabylMessage(original_headers + body)
        msg.set_visible(visible_headers)
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError.

        The result consists of the original headers and the body; the
        visible headers stored in between are skipped.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = self._read_section('*** EOOH ***' + os.linesep)
        self._read_section(os.linesep)  # Skip the visible headers.
        return original_headers + \
               self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return io.StringIO(self.get_string(key).replace('\n',
                                                        os.linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        # Called without a key; presumably this only makes sure the table
        # of contents (and with it self._labels) has been generated.
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == '\037\014' + os.linesep:
                # Start of a message; close the previous one if still open.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
                starts.append(next_pos)
                # The line after the marker is '1, special,, user,': drop
                # the leading character and keep the non-empty labels.
                labels = [label.strip() for label
                          in self._file.readline()[1:].split(',')
                          if label.strip()]
                label_lists.append(labels)
            elif line == '\037' or line == '\037' + os.linesep:
                # Bare terminator: end of the message currently open.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
            elif not line:
                stops.append(line_pos - len(os.linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        f.write('BABYL OPTIONS:%sVersion: 5%sLabels:%s%s\037' %
                (os.linesep, os.linesep, ','.join(self.get_labels()),
                 os.linesep))

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\014' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\037')

    def _copy_header_block(self, source):
        """Copy lines from source into the mailbox file.

        Copying stops after the first blank line (which is copied too) or
        at EOF; '\\n' is converted to os.linesep.
        """
        while True:
            line = source.readline()
            self._file.write(line.replace('\n', os.linesep))
            if line == '\n' or not line:
                break

    def _copy_remainder(self, source):
        """Copy everything left in source into the mailbox file."""
        while True:
            buffer = source.read(4096)  # Buffer size is arbitrary.
            if not buffer:
                break
            self._file.write(buffer.replace('\n', os.linesep))

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        A stored message consists of a labels line, the original headers,
        an '*** EOOH ***' line, the visible headers and finally the body.
        message may be an email.message.Message, a string, or an object
        with a readline() method; anything else raises TypeError.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write('1')
            for label in special_labels:
                self._file.write(', ' + label)
            self._file.write(',,')
            for label in labels:
                self._file.write(' ' + label + ',')
            self._file.write(os.linesep)
        else:
            self._file.write('1,,' + os.linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = io.StringIO()
            orig_generator = email.generator.Generator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            self._copy_header_block(orig_buffer)
            self._file.write('*** EOOH ***' + os.linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = io.StringIO()
                vis_generator = email.generator.Generator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # Rewind: flatten() leaves the position at the end, so
                # without this nothing would be read back and the visible
                # headers would silently be dropped.
                vis_buffer.seek(0)
                self._copy_header_block(vis_buffer)
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                self._copy_header_block(orig_buffer)
            # orig_buffer is now positioned just past its headers.
            self._copy_remainder(orig_buffer)
        elif isinstance(message, str):
            body_start = message.find('\n\n') + 2
            if body_start - 2 != -1:
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write('*** EOOH ***' + os.linesep)
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write(message[body_start:].replace('\n',
                                                              os.linesep))
            else:
                # No header/body separator: store everything as the body.
                self._file.write('*** EOOH ***' + os.linesep + os.linesep)
                self._file.write(message.replace('\n', os.linesep))
        elif hasattr(message, 'readline'):
            original_pos = message.tell()
            # First pass over the headers: the original headers.
            self._copy_header_block(message)
            # The marker belongs only between the two header copies;
            # writing it again after the second pass would put a stray
            # '*** EOOH ***' line at the top of the body.
            self._file.write('*** EOOH ***' + os.linesep)
            message.seek(original_pos)
            # Second pass: the same headers again, as the visible ones.
            self._copy_header_block(message)
            self._copy_remainder(message)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1329
1330
class Message(email.message.Message):
    """Message with mailbox-format-specific properties."""

    def __init__(self, message=None):
        """Initialize a Message instance.

        message may be None (empty message), an email.message.Message
        (deep-copied), a string, or an object with a read() method; any
        other type raises TypeError.
        """
        if message is None:
            email.message.Message.__init__(self)
            return
        if isinstance(message, email.message.Message):
            self._become_message(copy.deepcopy(message))
            # Let a format-aware source carry its state over as well.
            if isinstance(message, Message):
                message._explain_to(self)
            return
        if isinstance(message, str):
            self._become_message(email.message_from_string(message))
            return
        if hasattr(message, "read"):
            self._become_message(email.message_from_file(message))
            return
        raise TypeError('Invalid message type: %s' % type(message))

    def _become_message(self, message):
        """Assume the non-format-specific state of message."""
        source = message.__dict__
        target = self.__dict__
        generic_names = ('_headers', '_unixfrom', '_payload', '_charset',
                         'preamble', 'epilogue', 'defects', '_default_type')
        for attribute in generic_names:
            target[attribute] = source[attribute]

    def _explain_to(self, message):
        """Copy format-specific state to message insofar as possible."""
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
        # A plain Message has no format-specific state to hand over.
        return
1361
1362
class MaildirMessage(Message):
    """Message with Maildir-specific properties."""

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance."""
        # The defaults are set first: Message.__init__ may ask the source
        # message to overwrite them through its _explain_to().
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set subdir to 'new' or 'cur'; raise ValueError for other values."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return as a string the flags that are set."""
        info = self._info
        # Flags are only present in the '2,' form of the info string.
        return info[2:] if info.startswith('2,') else ''

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        ordered = sorted(flags)
        self._info = '2,' + ''.join(ordered)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags())
        combined.update(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        current = self.get_flags()
        if not current:
            return
        self.set_flags(''.join(set(current).difference(flag)))

    def get_date(self):
        """Return delivery date of message, in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set delivery date of message, in seconds since the epoch."""
        try:
            seconds = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)
        self._date = seconds

    def get_info(self):
        """Get the message's "info" as a string."""
        return self._info

    def set_info(self, info):
        """Set the message's "info" string; raise TypeError if not a str."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Copy Maildir-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
            return
        if isinstance(message, _mboxMMDFMessage):
            own = set(self.get_flags())
            if 'S' in own:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            # Maildir flag -> mbox/MMDF flag
            for maildir_flag, mbox_flag in (('T', 'D'), ('F', 'F'),
                                            ('R', 'A')):
                if maildir_flag in own:
                    message.add_flag(mbox_flag)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
            return
        if isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_sequence('unseen')
            # Maildir flag -> MH sequence
            for maildir_flag, sequence in (('R', 'replied'),
                                           ('F', 'flagged')):
                if maildir_flag in own:
                    message.add_sequence(sequence)
            return
        if isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'S' not in own:
                message.add_label('unseen')
            # Maildir flag -> Babyl label
            for maildir_flag, label in (('T', 'deleted'), ('R', 'answered'),
                                        ('P', 'forwarded')):
                if maildir_flag in own:
                    message.add_label(label)
            return
        if isinstance(message, Message):
            return
        raise TypeError('Cannot convert to specified type: %s' %
                        type(message))
1468
1469
class _mboxMMDFMessage(Message):
    """Message with mbox- or MMDF-specific properties."""

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance."""
        # Default "From " line; replaced below when the source message
        # carries a usable envelope header of its own.
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()
            if envelope is not None and envelope.startswith('From '):
                self.set_from(envelope[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return contents of "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set "From " line, formatting and appending time_ if specified.

        time_ may be a time tuple, or True to use the current UTC time.
        """
        if time_ is None:
            self._from = from_
            return
        stamp = time.gmtime() if time_ is True else time_
        self._from = from_ + ' ' + time.asctime(stamp)

    def get_flags(self):
        """Return as a string the flags that are set."""
        status = self.get('Status', '')
        xstatus = self.get('X-Status', '')
        return status + xstatus

    def set_flags(self, flags):
        """Set the given flags and unset all others.

        'R' and 'O' go to the Status header; 'D', 'F', 'A' and then any
        other flags (sorted) go to the X-Status header.
        """
        remaining = set(flags)
        status_flags = ''.join(f for f in ('R', 'O') if f in remaining)
        xstatus_flags = ''.join(f for f in ('D', 'F', 'A') if f in remaining)
        remaining.difference_update(('R', 'O', 'D', 'F', 'A'))
        xstatus_flags += ''.join(sorted(remaining))
        for header, value in (('Status', status_flags),
                              ('X-Status', xstatus_flags)):
            # replace_header() raises KeyError when the header is absent.
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags())
        combined.update(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        if not ('Status' in self or 'X-Status' in self):
            return
        kept = set(self.get_flags()).difference(flag)
        self.set_flags(''.join(kept))

    def _explain_to(self, message):
        """Copy mbox- or MMDF-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            own = set(self.get_flags())
            if 'O' in own:
                message.set_subdir('cur')
            # mbox/MMDF flag -> Maildir flag
            for mbox_flag, maildir_flag in (('F', 'F'), ('A', 'R'),
                                            ('R', 'S'), ('D', 'T')):
                if mbox_flag in own:
                    message.add_flag(maildir_flag)
            del message['status']
            del message['x-status']
            # The last five words of the "From " line may be an asctime()
            # style date; if they do not parse, the date is left alone.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
            return
        if isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
            return
        if isinstance(message, MHMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_sequence('unseen')
            # mbox/MMDF flag -> MH sequence
            for mbox_flag, sequence in (('A', 'replied'), ('F', 'flagged')):
                if mbox_flag in own:
                    message.add_sequence(sequence)
            del message['status']
            del message['x-status']
            return
        if isinstance(message, BabylMessage):
            own = set(self.get_flags())
            if 'R' not in own:
                message.add_label('unseen')
            # mbox/MMDF flag -> Babyl label
            for mbox_flag, label in (('D', 'deleted'), ('A', 'answered')):
                if mbox_flag in own:
                    message.add_label(label)
            del message['status']
            del message['x-status']
            return
        if isinstance(message, Message):
            return
        raise TypeError('Cannot convert to specified type: %s' %
                        type(message))
1579
1580
class mboxMessage(_mboxMMDFMessage):
    """Message with mbox-specific properties.

    All behaviour is inherited from _mboxMMDFMessage; the class only
    gives mbox messages a type of their own.
    """
1583
1584
class MHMessage(Message):
    """Message with MH-specific properties."""

    def __init__(self, message=None):
        """Initialize an MHMessage instance."""
        # Start without sequences; Message.__init__ may add some when the
        # source message explains its state to this one.
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a list of sequences that include the message."""
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Set the list of sequences that include the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence to list of sequences including the message."""
        if not isinstance(sequence, str):
            raise TypeError('sequence must be a string: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove sequence from the list of sequences including the message."""
        # Removing a sequence the message is not part of is not an error.
        try:
            self._sequences.remove(sequence)
        except ValueError:
            pass

    def _explain_to(self, message):
        """Copy MH-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            names = set(self.get_sequences())
            # The subdirectory becomes 'cur' whether or not it is unseen.
            message.set_subdir('cur')
            if 'unseen' not in names:
                message.add_flag('S')
            if 'flagged' in names:
                message.add_flag('F')
            if 'replied' in names:
                message.add_flag('R')
            return
        if isinstance(message, _mboxMMDFMessage):
            names = set(self.get_sequences())
            message.add_flag('O' if 'unseen' in names else 'RO')
            if 'flagged' in names:
                message.add_flag('F')
            if 'replied' in names:
                message.add_flag('A')
            return
        if isinstance(message, MHMessage):
            for name in self.get_sequences():
                message.add_sequence(name)
            return
        if isinstance(message, BabylMessage):
            names = set(self.get_sequences())
            if 'unseen' in names:
                message.add_label('unseen')
            if 'replied' in names:
                message.add_label('answered')
            return
        if isinstance(message, Message):
            return
        raise TypeError('Cannot convert to specified type: %s' %
                        type(message))
1653
1654
class BabylMessage(Message):
    """Message with Babyl-specific properties."""

    def __init__(self, message=None):
        """Initialize an BabylMessage instance."""
        # Defaults first; Message.__init__ may have the source message
        # fill in labels and visible headers through _explain_to().
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a list of labels on the message."""
        return list(self._labels)

    def set_labels(self, labels):
        """Set the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label to list of labels on the message."""
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove label from the list of labels on the message."""
        # A label that is not set is silently ignored.
        try:
            self._labels.remove(label)
        except ValueError:
            pass

    def get_visible(self):
        """Return a Message representation of visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Set the Message representation of visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Update and/or sensibly generate a set of visible headers."""
        visible = self._visible
        # Refresh the visible headers that still exist on the message and
        # drop those that no longer do.
        for name in visible.keys():
            if name not in self:
                del visible[name]
            else:
                visible.replace_header(name, self[name])
        # Make sure these headers are visible whenever the message has them.
        for name in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if name in self and name not in visible:
                visible[name] = self[name]

    def _explain_to(self, message):
        """Copy Babyl-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            own = set(self.get_labels())
            # The subdirectory becomes 'cur' whether or not it is unseen.
            message.set_subdir('cur')
            if 'unseen' not in own:
                message.add_flag('S')
            if 'forwarded' in own or 'resent' in own:
                message.add_flag('P')
            if 'answered' in own:
                message.add_flag('R')
            if 'deleted' in own:
                message.add_flag('T')
            return
        if isinstance(message, _mboxMMDFMessage):
            own = set(self.get_labels())
            message.add_flag('O' if 'unseen' in own else 'RO')
            if 'deleted' in own:
                message.add_flag('D')
            if 'answered' in own:
                message.add_flag('A')
            return
        if isinstance(message, MHMessage):
            own = set(self.get_labels())
            if 'unseen' in own:
                message.add_sequence('unseen')
            if 'answered' in own:
                message.add_sequence('replied')
            return
        if isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
            return
        if isinstance(message, Message):
            return
        raise TypeError('Cannot convert to specified type: %s' %
                        type(message))
1746
1747
class MMDFMessage(_mboxMMDFMessage):
    """A message carrying MMDF-specific properties.

    Everything is inherited from _mboxMMDFMessage; this class adds no
    attributes or methods of its own.
    """
1750
1751
class _ProxyFile:
    """A read-only wrapper of a file.

    The proxy keeps its own notion of the current position and seeks the
    underlying file to that position before every read, then records where
    the read ended.
    """

    def __init__(self, f, pos=None):
        """Initialize a _ProxyFile.

        f is the underlying file object.  pos is the initial position of
        the proxy; when omitted, the file's current position is used.
        """
        self._file = f
        self._pos = f.tell() if pos is None else pos

    def read(self, size=None):
        """Read bytes."""
        return self._read(size, self._file.read)

    def readline(self, size=None):
        """Read a line."""
        return self._read(size, self._file.readline)

    def readlines(self, sizehint=None):
        """Read multiple lines.

        When sizehint is given, stop once the total length of the lines
        collected so far reaches it.
        """
        result = []
        for line in self:
            result.append(line)
            if sizehint is not None:
                sizehint -= len(line)
                if sizehint <= 0:
                    break
        return result

    def __iter__(self):
        """Iterate over lines."""
        while True:
            line = self.readline()
            if not line:
                # Finish with a plain return: raising StopIteration inside
                # a generator is converted to RuntimeError (PEP 479).
                return
            yield line

    def tell(self):
        """Return the position."""
        return self._pos

    def seek(self, offset, whence=0):
        """Change position."""
        if whence == 1:
            # A relative seek must start from the proxy's position, not
            # from wherever the underlying file happens to be.
            self._file.seek(self._pos)
        self._file.seek(offset, whence)
        self._pos = self._file.tell()

    def close(self):
        """Drop the reference to the underlying file.

        The file object itself is not closed here.  Calling close() more
        than once is harmless.
        """
        if hasattr(self, '_file'):
            del self._file

    def _read(self, size, read_method):
        """Read size bytes using read_method.

        A size of None is passed to read_method as -1.
        """
        if size is None:
            size = -1
        self._file.seek(self._pos)
        result = read_method(size)
        self._pos = self._file.tell()
        return result
1813
1814
class _PartialFile(_ProxyFile):
    """A read-only wrapper of part of a file.

    Positions reported by tell() and accepted by seek() are relative to
    start, and reads never go past stop.
    """

    def __init__(self, f, start=None, stop=None):
        """Initialize a _PartialFile.

        start is the offset in f where the part begins; when omitted, the
        file's current position is used.  stop is the offset where the
        part ends; when omitted, the part is not bounded.
        """
        _ProxyFile.__init__(self, f, start)
        # The base class has already resolved a None start to f.tell();
        # reuse that value so tell() and seek() never see None.
        self._start = self._pos
        self._stop = stop

    def tell(self):
        """Return the position with respect to start."""
        return _ProxyFile.tell(self) - self._start

    def seek(self, offset, whence=0):
        """Change position, possibly with respect to start or stop."""
        if whence == 0:
            self._pos = self._start
            whence = 1
        elif whence == 2 and self._stop is not None:
            self._pos = self._stop
            whence = 1
        # With no stop, whence == 2 falls through unchanged and is
        # resolved against the end of the underlying file.
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, honoring start and stop."""
        if self._stop is None:
            return _ProxyFile._read(self, size, read_method)
        remaining = self._stop - self._pos
        if remaining <= 0:
            return ''
        if size is None or size < 0 or size > remaining:
            size = remaining
        return _ProxyFile._read(self, size, read_method)
1846
1847
def _lock_file(f, dotlock=True):
    """Lock file f using lockf and dot locking.

    A non-blocking exclusive lockf() lock is taken when fcntl is
    available.  When dotlock is true, a '<name>.lock' file is created as
    well.  ExternalClashError is raised when either lock cannot be
    obtained.  On any failure the locks taken so far are released before
    the exception propagates.
    """
    dotlock_done = False
    try:
        if fcntl:
            try:
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except IOError as e:
                if e.errno not in (errno.EAGAIN, errno.EACCES):
                    raise
                raise ExternalClashError('lockf: lock unavailable: %s' %
                                         f.name)
        if dotlock:
            lock_path = f.name + '.lock'
            try:
                pre_lock = _create_temporary(lock_path)
                pre_lock.close()
            except IOError as e:
                if e.errno != errno.EACCES:
                    raise
                return  # Without write access, just skip dotlocking.
            try:
                if hasattr(os, 'link'):
                    # Link the temporary file to the lock name, then drop
                    # the temporary name.
                    os.link(pre_lock.name, lock_path)
                    dotlock_done = True
                    os.unlink(pre_lock.name)
                else:
                    os.rename(pre_lock.name, lock_path)
                    dotlock_done = True
            except OSError as e:
                clash = (e.errno == errno.EEXIST or
                         (os.name == 'os2' and e.errno == errno.EACCES))
                if not clash:
                    raise
                os.remove(pre_lock.name)
                raise ExternalClashError('dot lock unavailable: %s' %
                                         f.name)
    except BaseException:
        # Undo whatever was acquired before letting the error propagate.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if dotlock_done:
            os.remove(lock_path)
        raise
1892
def _unlock_file(f):
    """Unlock file f using lockf and dot locking.

    The lockf() lock is released when fcntl is available, and the
    '<name>.lock' file is removed if it exists.
    """
    if fcntl:
        fcntl.lockf(f, fcntl.LOCK_UN)
    dot_lock = f.name + '.lock'
    if os.path.exists(dot_lock):
        os.remove(dot_lock)
1899
def _create_carefully(path):
    """Create a file if it doesn't exist and open for reading and writing.

    The file is created with O_EXCL, so the call fails when path already
    exists.  The returned file object is opened in 'r+' mode.
    """
    flags = os.O_CREAT | os.O_EXCL | os.O_RDWR
    fd = os.open(path, flags)
    try:
        handle = open(path, 'r+')
    finally:
        # The descriptor was only needed to create the file exclusively.
        os.close(fd)
    return handle
1907
def _create_temporary(path):
    """Create a temp file based on path and open for reading and writing.

    The file name is path followed by the current time in whole seconds,
    the host name and the process id, separated by dots.
    """
    stamp = int(time.time())
    host = socket.gethostname()
    pid = os.getpid()
    return _create_carefully('%s.%s.%s.%s' % (path, stamp, host, pid))
1913
def _sync_flush(f):
    """Ensure changes to file f are physically on disk.

    The file's own buffer is flushed first; os.fsync() is then called on
    its descriptor when the platform provides it.
    """
    f.flush()
    fsync = getattr(os, 'fsync', None)
    if fsync is not None:
        fsync(f.fileno())
Thomas Wouters89f507f2006-12-13 04:49:30 +00001919
def _sync_close(f):
    """Close file f, ensuring all changes are physically on disk.

    The file is closed even when flushing or syncing fails, so a failed
    write does not leave the file object open; the error still
    propagates to the caller.
    """
    try:
        _sync_flush(f)
    finally:
        f.close()
Thomas Wouters477c8d52006-05-27 19:21:47 +00001924
1925## Start: classes from the original module (for backward compatibility).
1926
1927# Note that the Maildir class, whose name is unchanged, itself offers a next()
1928# method for backward compatibility.
Skip Montanaro17ab1232001-01-24 06:27:27 +00001929
class _Mailbox:
    """Base class for the backward-compatible, read-only mailbox readers.

    Subclasses supply _search_start() and _search_end(), which move the
    file position to the beginning and end of the next message.
    """

    def __init__(self, fp, factory=rfc822.Message):
        """Remember the open file fp and the factory used to build messages."""
        self.fp = fp
        self.seekp = 0
        self.factory = factory

    def __iter__(self):
        """Iterate over messages by calling next() until it returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the next message, or None when the file is exhausted.

        The message is built by calling the factory on a _PartialFile that
        spans the message.  Empty spans are skipped.
        """
        while True:
            self.fp.seek(self.seekp)
            try:
                self._search_start()
            except EOFError:
                self.seekp = self.fp.tell()
                return None
            start = self.fp.tell()
            self._search_end()
            stop = self.fp.tell()
            self.seekp = stop
            if start != stop:
                return self.factory(_PartialFile(self.fp, start, stop))
Guido van Rossumc7b68821994-04-28 09:53:33 +00001954
Barry Warsawffd05ee2002-03-01 22:39:14 +00001955# Recommended to use PortableUnixMailbox instead!
class UnixMailbox(_Mailbox):
    """Reader for Unix (mbox) mailboxes with strict From_ line checking."""

    def _search_start(self):
        """Position the file at the next From_ line; EOFError if none."""
        while True:
            pos = self.fp.tell()
            line = self.fp.readline()
            if not line:
                raise EOFError
            if line[:5] == 'From ' and self._isrealfromline(line):
                self.fp.seek(pos)
                return

    def _search_end(self):
        """Position the file at the following From_ line or at end of file."""
        self.fp.readline()      # Throw away header line
        while True:
            pos = self.fp.tell()
            line = self.fp.readline()
            if not line:
                return
            if line[:5] == 'From ' and self._isrealfromline(line):
                self.fp.seek(pos)
                return

    # An overridable mechanism to test for From-line-ness.  You can either
    # specify a different regular expression or define a whole new
    # _isrealfromline() method.  Note that this only gets called for lines
    # starting with the 5 characters "From ".
    #
    # BAW: According to
    #http://home.netscape.com/eng/mozilla/2.0/relnotes/demo/content-length.html
    # the only portable, reliable way to find message delimiters in a BSD
    # (i.e. Unix mailbox) style folder is to search for "\n\nFrom .*\n", or
    # at the beginning of the file, "^From .*\n".  While _fromlinepattern
    # below seems like a good idea, in practice, there are too many
    # variations for more strict parsing of the line to be completely
    # accurate.
    #
    # _strict_isrealfromline() is the old version which tries to do stricter
    # parsing of the From_ line.  _portable_isrealfromline() simply returns
    # true, since it's never called if the line doesn't already start with
    # "From ".
    #
    # This algorithm, and the way it interacts with _search_start() and
    # _search_end() may not be completely correct, because it doesn't check
    # that the two characters preceding "From " are \n\n or the beginning of
    # the file.  Fixing this would require a more extensive rewrite than is
    # necessary.  For convenience, we've added a PortableUnixMailbox class
    # which does no checking of the format of the 'From' line.

    _fromlinepattern = (r"From \s*[^\s]+\s+\w\w\w\s+\w\w\w\s+\d?\d\s+"
                        r"\d?\d:\d\d(:\d\d)?(\s+[^\s]+)?\s+\d\d\d\d\s*"
                        r"[^\s]*\s*"
                        "$")
    _regexp = None

    def _strict_isrealfromline(self, line):
        """Match line against _fromlinepattern, compiling it on first use."""
        if not self._regexp:
            import re
            self._regexp = re.compile(self._fromlinepattern)
        return self._regexp.match(line)

    def _portable_isrealfromline(self, line):
        """Accept every candidate line."""
        return True

    _isrealfromline = _strict_isrealfromline
2020
2021
class PortableUnixMailbox(UnixMailbox):
    """A UnixMailbox that does no checking of the 'From' line format."""

    _isrealfromline = UnixMailbox._portable_isrealfromline
2024
Guido van Rossumfbe63de1998-04-03 16:04:05 +00002025
class MmdfMailbox(_Mailbox):
    """Reader for MMDF mailboxes, delimited by lines of four ^A characters."""

    def _search_start(self):
        """Read past the next delimiter line; EOFError if there is none."""
        while True:
            line = self.fp.readline()
            if not line:
                raise EOFError
            if line[:5] == '\001\001\001\001\n':
                return

    def _search_end(self):
        """Position the file at the next delimiter line or at end of file."""
        while True:
            pos = self.fp.tell()
            line = self.fp.readline()
            if not line:
                return
            if line == '\001\001\001\001\n':
                self.fp.seek(pos)
                return
Guido van Rossumc7b68821994-04-28 09:53:33 +00002045
Guido van Rossumc7b68821994-04-28 09:53:33 +00002046
class MHMailbox:
    """Reader for an MH mailbox directory.

    Messages are the files in the directory whose names are positive
    decimal numbers without leading zeros; they are returned in ascending
    numeric order.
    """

    def __init__(self, dirname, factory=rfc822.Message):
        """Collect the message numbers found in dirname.

        factory is called with the open file of each message to build the
        object returned by next().
        """
        import re
        pat = re.compile('^[1-9][0-9]*$')
        self.dirname = dirname
        # Sort numerically, not lexically.  Real lists are built here
        # because filter() and map() return iterators without sort() or
        # reverse() on Python 3.
        numbers = sorted((int(name) for name in os.listdir(self.dirname)
                          if pat.match(name)), reverse=True)
        # Kept in descending order so that next() can pop() the smallest
        # remaining number from the end.
        self.boxes = [str(number) for number in numbers]
        self.factory = factory

    def __iter__(self):
        """Iterate over messages by calling next() until it returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the next message, or None when none are left."""
        if not self.boxes:
            return None
        fn = self.boxes.pop()
        fp = open(os.path.join(self.dirname, fn))
        msg = self.factory(fp)
        try:
            msg._mh_msgno = fn
        except (AttributeError, TypeError):
            # Not every factory result accepts new attributes.
            pass
        return msg
Guido van Rossum8ca84201998-03-26 20:56:10 +00002079
Guido van Rossum9a4d6371998-12-23 22:05:42 +00002080
class BabylMailbox(_Mailbox):
    """Reader for Babyl mailboxes."""

    def _search_start(self):
        """Read past the next '*** EOOH ***' line; EOFError if none."""
        while True:
            line = self.fp.readline()
            if not line:
                raise EOFError
            if line == '*** EOOH ***\n':
                return

    def _search_end(self):
        """Position the file at the next end-of-message marker or at EOF."""
        while True:
            pos = self.fp.tell()
            line = self.fp.readline()
            if not line:
                return
            if line in ('\037\014\n', '\037'):
                self.fp.seek(pos)
                return
Guido van Rossumfdf58fe1997-05-15 14:33:09 +00002100
Thomas Wouters477c8d52006-05-27 19:21:47 +00002101## End: classes from the original module (for backward compatibility).
Guido van Rossum62448671996-09-17 21:33:15 +00002102
2103
class Error(Exception):
    """Base class for the errors specific to this module."""


class NoSuchMailboxError(Error):
    """The requested mailbox does not exist and won't be created."""


class NotEmptyError(Error):
    """Deletion was requested for a mailbox that is not empty."""


class ExternalClashError(Error):
    """An action failed because of another process."""


class FormatError(Error):
    """A file does not appear to have a valid format."""