blob: d2db53fa693efcd999c9d0aa55ffbd0eb81b6220 [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum62448671996-09-17 21:33:15 +00002
Thomas Wouters477c8d52006-05-27 19:21:47 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
# Notes for authors of new mailbox subclasses:
#
# Remember to fsync() changes to disk before closing a modified file
# or returning from a flush() method.  See functions _sync_flush() and
# _sync_close().
10
Thomas Wouters477c8d52006-05-27 19:21:47 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Thomas Wouters477c8d52006-05-27 19:21:47 +000013import time
14import calendar
15import socket
16import errno
17import copy
18import email
Thomas Woutersb2137042007-02-01 18:02:27 +000019import email.message
20import email.generator
Thomas Wouters477c8d52006-05-27 19:21:47 +000021import rfc822
Guido van Rossum34d19282007-08-09 01:03:29 +000022import io
Thomas Wouters477c8d52006-05-27 19:21:47 +000023try:
Thomas Wouters0e3f5912006-08-11 14:57:12 +000024 if sys.platform == 'os2emx':
25 # OS/2 EMX fcntl() not adequate
26 raise ImportError
27 import fcntl
Thomas Wouters477c8d52006-05-27 19:21:47 +000028except ImportError:
29 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000030
Thomas Wouters477c8d52006-05-27 19:21:47 +000031__all__ = [ 'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
32 'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
33 'BabylMessage', 'MMDFMessage', 'UnixMailbox',
34 'PortableUnixMailbox', 'MmdfMailbox', 'MHMailbox', 'BabylMailbox' ]
35
class Mailbox:
    """A group of messages in a particular place.

    This is the abstract base for the concrete mailbox formats.  Subclasses
    supply the storage primitives (add, remove, __setitem__, get_message,
    get_string, get_file, iterkeys, __contains__, __len__, flush, lock,
    unlock and close); the dictionary-style conveniences defined here are
    built on top of those primitives.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded and made absolute.  factory, when given, is
        called by __getitem__() with a file-like object to build the
        returned message.  create is not used by this base class; it is
        accepted so that subclasses share one constructor signature.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist.

        Without a factory the result comes from get_message(); with one,
        the factory is applied to the file returned by get_file().
        """
        if not self._factory:
            return self.get_message(key)
        return self._factory(self.get_file(key))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages.

        Keys that disappear between listing and retrieval are skipped.
        """
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield value

    def __iter__(self):
        """Iterate over the messages (not the keys) of the mailbox."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples.

        Keys that disappear between listing and retrieval are skipped.
        """
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield (key, value)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            result = self[key]
        except KeyError:
            return default
        self.discard(key)
        return result

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError when the mailbox holds no messages.
        """
        for key in self.keys():
            return (key, self.pop(key))     # This is only run once.
        raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be a mapping-like object (anything offering iteritems()
        or items()) or an iterable of (key, message) pairs.  None, the
        default, means "nothing to update".  Every pair is attempted even
        if an earlier key was missing; a single KeyError is raised at the
        end when at least one key did not exist.
        """
        if arg is None:
            return
        if hasattr(arg, 'iteritems'):
            # Honor the attribute that was actually detected; such an
            # object is not guaranteed to offer items() as well.
            source = arg.iteritems()
        elif hasattr(arg, 'items'):
            source = arg.items()
        else:
            source = arg
        bad_key = False
        for key, message in source:
            try:
                self[key] = message
            except KeyError:
                bad_key = True
        if bad_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _dump_message(self, message, target, mangle_from_=False):
        """Dump message contents to target file.

        message may be an email.message.Message, a str, or an object with
        read()/readline().  When mangle_from_ is true, lines starting with
        'From ' are escaped as '>From '.  Any other message type raises
        TypeError.
        """
        # This assumes the target file is open in *text* mode with the
        # desired encoding and newline setting, so no explicit translation
        # of '\n' to os.linesep is performed here.
        if isinstance(message, email.message.Message):
            buffer = io.StringIO()
            gen = email.generator.Generator(buffer, mangle_from_, 0)
            gen.flatten(message)
            buffer.seek(0)
            target.write(buffer.read())
        elif isinstance(message, str):
            if mangle_from_:
                message = message.replace('\nFrom ', '\n>From ')
            target.write(message)
        elif hasattr(message, 'read'):
            while True:
                line = message.readline()
                if not line:
                    break
                if mangle_from_ and line.startswith('From '):
                    line = '>From ' + line[5:]
                target.write(line)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
219
220
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages live as individual files in the 'new' and 'cur'
    subdirectories; 'tmp' is used while a message is being written.  A
    key is the part of the file name before the first `colon`.
    """

    # Separator between a message's unique name and its info suffix.
    colon = ':'

    def __init__(self, dirname, factory=rfc822.Message, create=True):
        """Initialize a Maildir instance.

        A missing mailbox directory is created (with its tmp/new/cur
        subdirectories) when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        if not os.path.exists(self._path):
            if not create:
                raise NoSuchMailboxError(self._path)
            os.mkdir(self._path, 0o700)
            for subdir in ('tmp', 'new', 'cur'):
                os.mkdir(os.path.join(self._path, subdir), 0o700)
        self._toc = {}

    def add(self, message):
        """Add message and return assigned key.

        The message is first written to a file in 'tmp' and then moved
        into place.  ExternalClashError is raised if the destination name
        already exists.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        finally:
            _sync_close(tmp_file)
        is_maildir_message = isinstance(message, MaildirMessage)
        if is_maildir_message:
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                # Empty info: no suffix at all rather than a bare colon.
                suffix = ''
        else:
            subdir, suffix = 'new', ''
        tmp_path = tmp_file.name
        uniq = os.path.basename(tmp_path).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        try:
            if hasattr(os, 'link'):
                # link() fails if dest exists, so nothing gets clobbered.
                os.link(tmp_path, dest)
                os.remove(tmp_path)
            else:
                os.rename(tmp_path, dest)
        except OSError as e:
            os.remove(tmp_path)
            if e.errno != errno.EEXIST:
                raise
            raise ExternalClashError('Name clash with existing message: %s'
                                     % dest)
        if is_maildir_message:
            os.utime(dest, (os.path.getatime(dest), message.get_date()))
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        subpath = self._lookup(key)
        os.remove(os.path.join(self._path, subpath))

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass:
        # the file may also vanish between lookup and removal.
        try:
            self.remove(key)
        except KeyError:
            pass
        except OSError as e:
            if e.errno != errno.ENOENT:
                raise

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        is_maildir_message = isinstance(message, MaildirMessage)
        if is_maildir_message:
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        suffix = ''
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        self.discard(key)
        new_path = os.path.join(self._path, subdir, key + suffix)
        os.rename(os.path.join(self._path, temp_subpath), new_path)
        if is_maildir_message:
            os.utime(new_path, (os.path.getatime(new_path),
                                message.get_date()))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The message's subdir, info and date are filled in from the file's
        location, name suffix and modification time.
        """
        subpath = self._lookup(key)
        full_path = os.path.join(self._path, subpath)
        f = open(full_path, 'r')
        try:
            msg = self._factory(f) if self._factory else MaildirMessage(f)
        finally:
            f.close()
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(full_path))
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        full_path = os.path.join(self._path, self._lookup(key))
        f = open(full_path, 'r')
        try:
            return f.read()
        finally:
            f.close()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        full_path = os.path.join(self._path, self._lookup(key))
        return _ProxyFile(open(full_path, 'r'))

    def iterkeys(self):
        """Return an iterator over keys."""
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                # Vanished since the refresh; do not report it.
                continue
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        return  # Maildir changes are always written immediately.

    def lock(self):
        """Lock the mailbox (a no-op for Maildir)."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked (a no-op for Maildir)."""
        return

    def close(self):
        """Flush and close the mailbox (a no-op for Maildir)."""
        return

    def list_folders(self):
        """Return a list of folder names.

        Folders are the subdirectories whose names start with a dot; the
        dot is stripped from the returned names.
        """
        return [entry[1:] for entry in os.listdir(self._path)
                if len(entry) > 1 and entry[0] == '.' and
                os.path.isdir(os.path.join(self._path, entry))]

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        folder_path = os.path.join(self._path, '.' + folder)
        return Maildir(folder_path, factory=self._factory, create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it."""
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        marker_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(marker_path):
            # Create the empty 'maildirfolder' marker file.
            fd = os.open(marker_path, os.O_CREAT | os.O_WRONLY)
            os.close(fd)
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        NotEmptyError is raised if the folder still holds messages or
        contains subdirectories other than new/cur/tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        candidates = (os.listdir(os.path.join(path, 'new')) +
                      os.listdir(os.path.join(path, 'cur')))
        for entry in candidates:
            # Dot-files do not count as messages.
            if not entry.startswith('.'):
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry not in ('new', 'cur', 'tmp') and \
               os.path.isdir(os.path.join(path, entry)):
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (folder, entry))
        # Bottom-up walk so directories are empty by the time we rmdir them.
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp"."""
        now = time.time()
        tmp_dir = os.path.join(self._path, 'tmp')
        for entry in os.listdir(tmp_dir):
            path = os.path.join(self._path, 'tmp', entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        ExternalClashError is raised if the generated name already exists.
        """
        now = time.time()
        # Escape the characters that may not appear in a Maildir name.
        hostname = socket.gethostname()
        hostname = hostname.replace('/', r'\057').replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except OSError as e:
            if e.errno != errno.ENOENT:
                raise
            Maildir._count += 1
            try:
                return _create_carefully(path)
            except OSError as e:
                if e.errno != errno.EEXIST:
                    raise

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping."""
        toc = self._toc = {}
        for subdir in ('new', 'cur'):
            subdir_path = os.path.join(self._path, subdir)
            for entry in os.listdir(subdir_path):
                if os.path.isdir(os.path.join(subdir_path, entry)):
                    continue
                uniq = entry.split(self.colon)[0]
                toc[uniq] = os.path.join(subdir, entry)

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        try:
            cached = self._toc[key]
            if os.path.exists(os.path.join(self._path, cached)):
                return cached
        except KeyError:
            pass
        # Unknown or stale entry: rescan the directories and try once more.
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration.

        Returns None once the keys captured on the first call are
        exhausted; messages removed in the meantime are skipped.
        """
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = iter(self.keys())
        while True:
            try:
                return self[next(self._onetime_keys)]
            except StopIteration:
                return None
            except KeyError:
                continue
496
497
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    Messages are addressed through a table of contents (self._toc) that
    maps integer keys to (start, stop) offsets in the file.  Additions and
    replacements are appended to the file straight away; removals only
    edit the table.  flush() rewrites the file so that it contains exactly
    the messages still listed in the table.

    Subclasses provide _generate_toc() and _install_message(), and may
    override the _pre_/_post_ hooks to emit format-specific separators.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        The file is opened read/write in text mode.  If it does not exist
        it is created when create is true, otherwise NoSuchMailboxError is
        raised.  If it cannot be opened for writing (EACCES) it is opened
        read-only instead.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            f = open(self._path, 'r+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                if create:
                    f = open(self._path, 'w+')
                else:
                    raise NoSuchMailboxError(self._path)
            elif e.errno == errno.EACCES:
                f = open(self._path, 'r')
            else:
                raise
        self._file = f
        self._toc = None            # Built lazily by _lookup().
        self._next_key = 0
        self._pending = False       # No changes require rewriting the file.
        self._locked = False
        self._file_length = None    # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        self._toc[self._next_key] = self._append_message(message)
        self._next_key += 1
        self._pending = True
        return self._next_key - 1

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        for key in self._toc.keys():
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        The surviving messages are copied to a temporary file which then
        replaces the mailbox file.  ExternalClashError is raised if the
        mailbox file's size no longer matches the size recorded when it
        was last scanned or appended to.
        """
        if not self._pending:
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                while True:
                    # Never read past the end of this message.
                    buffer = self._file.read(min(4096,
                                                 stop - self._file.tell()))
                    if not buffer:
                        break
                    new_file.write(buffer)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
            new_length = new_file.tell()
        except BaseException:
            # Whatever went wrong, do not leave the temporary file behind.
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        try:
            os.rename(new_file.name, self._path)
        except OSError as e:
            if e.errno == errno.EEXIST or \
               (os.name == 'os2' and e.errno == errno.EACCES):
                # rename() cannot overwrite here; remove the target first.
                os.remove(self._path)
                os.rename(new_file.name, self._path)
            else:
                raise
        # Reopen in the same text mode used by __init__(); the methods
        # that write to self._file all emit str.
        self._file = open(self._path, 'r+')
        self._toc = new_toc
        self._pending = False
        # The rewritten file is generally a different size.  Record it so
        # the next flush() does not mistake our own rewrite for an
        # external modification.
        self._file_length = new_length
        if self._locked:
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox."""
        self.flush()
        if self._locked:
            self.unlock()
        self._file.close()  # Sync has been done by self.flush() above.

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        The table of contents is generated on first use.  With key left
        as None nothing is looked up and None is returned.
        """
        if self._toc is None:
            self._generate_toc()
        if key is not None:
            try:
                return self._toc[key]
            except KeyError:
                raise KeyError('No message with key: %s' % key)

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets."""
        self._file.seek(0, 2)
        self._pre_message_hook(self._file)
        offsets = self._install_message(message)
        self._post_message_hook(self._file)
        self._file.flush()
        self._file_length = self._file.tell()  # Record current length of mailbox
        return offsets
667
668
669
class _mboxMMDF(_singlefileMailbox):
    """An mbox or MMDF mailbox.

    Each stored message begins with a 'From ' line, which is kept apart
    from the message text proper.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        mailbox_file = self._file
        mailbox_file.seek(start)
        # The first line is the 'From ' line; the remainder is the message.
        from_line = mailbox_file.readline().replace(os.linesep, '')
        remaining = stop - mailbox_file.tell()
        text = mailbox_file.read(remaining).replace(os.linesep, '\n')
        msg = self._message_factory(text)
        msg.set_from(from_line[5:])     # Drop the leading 'From '.
        return msg

    def get_string(self, key, from_=False):
        """Return a string representation or raise a KeyError.

        The leading 'From ' line is included only when from_ is true.
        """
        start, stop = self._lookup(key)
        mailbox_file = self._file
        mailbox_file.seek(start)
        if not from_:
            mailbox_file.readline()
        remaining = stop - mailbox_file.tell()
        return mailbox_file.read(remaining).replace(os.linesep, '\n')

    def get_file(self, key, from_=False):
        """Return a file-like representation or raise a KeyError.

        The leading 'From ' line is included only when from_ is true.
        """
        start, stop = self._lookup(key)
        mailbox_file = self._file
        mailbox_file.seek(start)
        if not from_:
            mailbox_file.readline()
        return _PartialFile(mailbox_file, mailbox_file.tell(), stop)

    def _install_message(self, message):
        """Format a message and blindly write to self._file.

        Returns the (start, stop) offsets of what was written, 'From '
        line included.
        """
        from_line = None
        if isinstance(message, str) and message.startswith('From '):
            # Peel the first line off; without a newline the whole string
            # is the 'From ' line and the message text is empty.
            from_line, _, message = message.partition('\n')
        elif isinstance(message, _mboxMMDFMessage):
            from_line = 'From ' + message.get_from()
        elif isinstance(message, email.message.Message):
            from_line = message.get_unixfrom()  # May be None.
        if from_line is None:
            timestamp = time.asctime(time.gmtime())
            from_line = 'From MAILER-DAEMON %s' % timestamp
        mailbox_file = self._file
        start = mailbox_file.tell()
        mailbox_file.write(from_line + os.linesep)
        self._dump_message(message, mailbox_file, self._mangle_from_)
        return (start, mailbox_file.tell())
724
725
class mbox(_mboxMMDF):
    """A classic mbox mailbox.

    Messages start at lines beginning with 'From ' and are separated by
    a line separator.
    """

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Initialize an mbox mailbox."""
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        # Every message but the first is preceded by a separator line.
        if f.tell() != 0:
            f.write(os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts = []
        stops = []
        mailbox_file = self._file
        mailbox_file.seek(0)
        while True:
            line_pos = mailbox_file.tell()
            line = mailbox_file.readline()
            if not line:
                # End of file also ends the last message.
                stops.append(line_pos)
                break
            if line.startswith('From '):
                if len(stops) < len(starts):
                    # Close the previous message just before the
                    # separator that precedes this 'From ' line.
                    stops.append(line_pos - len(os.linesep))
                starts.append(line_pos)
        self._toc = dict(enumerate(zip(starts, stops)))
        self._next_key = len(self._toc)
        self._file_length = mailbox_file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000758
759
class MMDF(_mboxMMDF):
    """An MMDF mailbox.

    Each message is bracketed by lines consisting of four Control-A
    characters.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize an MMDF mailbox."""
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\001\001\001\001' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\001\001\001\001' + os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        delimiter = '\001\001\001\001' + os.linesep
        starts = []
        stops = []
        mailbox_file = self._file
        mailbox_file.seek(0)
        while True:
            line = mailbox_file.readline()
            next_pos = mailbox_file.tell()
            if line.startswith(delimiter):
                # Opening delimiter: the message starts right after it.
                starts.append(next_pos)
                while True:
                    line_pos = next_pos
                    line = mailbox_file.readline()
                    next_pos = mailbox_file.tell()
                    if line == delimiter:
                        # Closing delimiter; leave out the separator that
                        # precedes it.
                        stops.append(line_pos - len(os.linesep))
                        break
                    elif not line:
                        # File ended before the closing delimiter.
                        stops.append(line_pos)
                        break
            elif not line:
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._next_key = len(self._toc)
        mailbox_file.seek(0, 2)
        self._file_length = mailbox_file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000803
804
805class MH(Mailbox):
806 """An MH mailbox."""
807
def __init__(self, path, factory=None, create=True):
    """Initialize an MH instance.

    A missing mailbox directory is created, together with an empty
    '.mh_sequences' file, when create is true; otherwise
    NoSuchMailboxError is raised.
    """
    Mailbox.__init__(self, path, factory, create)
    if not os.path.exists(self._path):
        if not create:
            raise NoSuchMailboxError(self._path)
        os.mkdir(self._path, 0o700)
        sequences_path = os.path.join(self._path, '.mh_sequences')
        fd = os.open(sequences_path,
                     os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0o600)
        os.close(fd)
    self._locked = False
819
def add(self, message):
    """Add message and return assigned key.

    The new key is one more than the largest existing key, or 1 for an
    empty mailbox.
    """
    existing = self.keys()
    new_key = 1 if len(existing) == 0 else max(existing) + 1
    target_path = os.path.join(self._path, str(new_key))
    f = _create_carefully(target_path)
    try:
        if self._locked:
            _lock_file(f)
        try:
            self._dump_message(message, f)
            if isinstance(message, MHMessage):
                self._dump_sequences(message, new_key)
        finally:
            if self._locked:
                _unlock_file(f)
    finally:
        _sync_close(f)
    return new_key
842
def remove(self, key):
    """Remove the keyed message; raise KeyError if it doesn't exist."""
    path = os.path.join(self._path, str(key))
    try:
        # Opening the file doubles as the existence check.
        f = open(path, 'rb+')
    except IOError as e:
        if e.errno != errno.ENOENT:
            raise
        raise KeyError('No message with key: %s' % key)
    try:
        if self._locked:
            _lock_file(f)
        try:
            f.close()
            os.remove(path)
        finally:
            # NOTE(review): f is already closed at this point when the
            # mailbox is locked -- confirm that _unlock_file() copes with
            # a closed file object.
            if self._locked:
                _unlock_file(f)
    finally:
        f.close()
864
865 def __setitem__(self, key, message):
866 """Replace the keyed message; raise KeyError if it doesn't exist."""
867 path = os.path.join(self._path, str(key))
868 try:
Guido van Rossum671117a2007-08-31 04:25:05 +0000869 f = open(path, 'r+')
Guido van Rossumb940e112007-01-10 16:19:56 +0000870 except IOError as e:
Thomas Wouters477c8d52006-05-27 19:21:47 +0000871 if e.errno == errno.ENOENT:
872 raise KeyError('No message with key: %s' % key)
873 else:
874 raise
875 try:
876 if self._locked:
877 _lock_file(f)
878 try:
879 os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
880 self._dump_message(message, f)
881 if isinstance(message, MHMessage):
882 self._dump_sequences(message, key)
883 finally:
884 if self._locked:
885 _unlock_file(f)
886 finally:
Thomas Wouters89f507f2006-12-13 04:49:30 +0000887 _sync_close(f)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000888
889 def get_message(self, key):
890 """Return a Message representation or raise a KeyError."""
891 try:
892 if self._locked:
893 f = open(os.path.join(self._path, str(key)), 'r+')
894 else:
895 f = open(os.path.join(self._path, str(key)), 'r')
Guido van Rossumb940e112007-01-10 16:19:56 +0000896 except IOError as e:
Thomas Wouters477c8d52006-05-27 19:21:47 +0000897 if e.errno == errno.ENOENT:
898 raise KeyError('No message with key: %s' % key)
899 else:
900 raise
901 try:
902 if self._locked:
903 _lock_file(f)
904 try:
905 msg = MHMessage(f)
906 finally:
907 if self._locked:
908 _unlock_file(f)
909 finally:
910 f.close()
911 for name, key_list in self.get_sequences():
912 if key in key_list:
913 msg.add_sequence(name)
914 return msg
915
916 def get_string(self, key):
917 """Return a string representation or raise a KeyError."""
918 try:
919 if self._locked:
920 f = open(os.path.join(self._path, str(key)), 'r+')
921 else:
922 f = open(os.path.join(self._path, str(key)), 'r')
Guido van Rossumb940e112007-01-10 16:19:56 +0000923 except IOError as e:
Thomas Wouters477c8d52006-05-27 19:21:47 +0000924 if e.errno == errno.ENOENT:
925 raise KeyError('No message with key: %s' % key)
926 else:
927 raise
928 try:
929 if self._locked:
930 _lock_file(f)
931 try:
932 return f.read()
933 finally:
934 if self._locked:
935 _unlock_file(f)
936 finally:
937 f.close()
938
939 def get_file(self, key):
940 """Return a file-like representation or raise a KeyError."""
941 try:
Guido van Rossum98297ee2007-11-06 21:34:58 +0000942 f = open(os.path.join(self._path, str(key)), 'r')
Guido van Rossumb940e112007-01-10 16:19:56 +0000943 except IOError as e:
Thomas Wouters477c8d52006-05-27 19:21:47 +0000944 if e.errno == errno.ENOENT:
945 raise KeyError('No message with key: %s' % key)
946 else:
947 raise
948 return _ProxyFile(f)
949
950 def iterkeys(self):
951 """Return an iterator over keys."""
952 return iter(sorted(int(entry) for entry in os.listdir(self._path)
953 if entry.isdigit()))
954
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000955 def __contains__(self, key):
Thomas Wouters477c8d52006-05-27 19:21:47 +0000956 """Return True if the keyed message exists, False otherwise."""
957 return os.path.exists(os.path.join(self._path, str(key)))
958
959 def __len__(self):
960 """Return a count of messages in the mailbox."""
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000961 return len(list(self.keys()))
Thomas Wouters477c8d52006-05-27 19:21:47 +0000962
963 def lock(self):
964 """Lock the mailbox."""
965 if not self._locked:
966 self._file = open(os.path.join(self._path, '.mh_sequences'), 'rb+')
967 _lock_file(self._file)
968 self._locked = True
969
970 def unlock(self):
971 """Unlock the mailbox if it is locked."""
972 if self._locked:
973 _unlock_file(self._file)
Thomas Wouters89f507f2006-12-13 04:49:30 +0000974 _sync_close(self._file)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000975 del self._file
976 self._locked = False
977
978 def flush(self):
979 """Write any pending changes to the disk."""
980 return
981
982 def close(self):
983 """Flush and close the mailbox."""
984 if self._locked:
985 self.unlock()
986
987 def list_folders(self):
988 """Return a list of folder names."""
989 result = []
990 for entry in os.listdir(self._path):
991 if os.path.isdir(os.path.join(self._path, entry)):
992 result.append(entry)
993 return result
994
995 def get_folder(self, folder):
996 """Return an MH instance for the named folder."""
Thomas Wouters89f507f2006-12-13 04:49:30 +0000997 return MH(os.path.join(self._path, folder),
998 factory=self._factory, create=False)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000999
1000 def add_folder(self, folder):
1001 """Create a folder and return an MH instance representing it."""
Thomas Wouters89f507f2006-12-13 04:49:30 +00001002 return MH(os.path.join(self._path, folder),
1003 factory=self._factory)
Thomas Wouters477c8d52006-05-27 19:21:47 +00001004
1005 def remove_folder(self, folder):
1006 """Delete the named folder, which must be empty."""
1007 path = os.path.join(self._path, folder)
1008 entries = os.listdir(path)
1009 if entries == ['.mh_sequences']:
1010 os.remove(os.path.join(path, '.mh_sequences'))
1011 elif entries == []:
1012 pass
1013 else:
1014 raise NotEmptyError('Folder not empty: %s' % self._path)
1015 os.rmdir(path)
1016
1017 def get_sequences(self):
1018 """Return a name-to-key-list dictionary to define each sequence."""
1019 results = {}
1020 f = open(os.path.join(self._path, '.mh_sequences'), 'r')
1021 try:
1022 all_keys = set(self.keys())
1023 for line in f:
1024 try:
1025 name, contents = line.split(':')
1026 keys = set()
1027 for spec in contents.split():
1028 if spec.isdigit():
1029 keys.add(int(spec))
1030 else:
1031 start, stop = (int(x) for x in spec.split('-'))
1032 keys.update(range(start, stop + 1))
1033 results[name] = [key for key in sorted(keys) \
1034 if key in all_keys]
1035 if len(results[name]) == 0:
1036 del results[name]
1037 except ValueError:
1038 raise FormatError('Invalid sequence specification: %s' %
1039 line.rstrip())
1040 finally:
1041 f.close()
1042 return results
1043
1044 def set_sequences(self, sequences):
1045 """Set sequences using the given name-to-key-list dictionary."""
1046 f = open(os.path.join(self._path, '.mh_sequences'), 'r+')
1047 try:
1048 os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
Guido van Rossumcc2b0162007-02-11 06:12:03 +00001049 for name, keys in sequences.items():
Thomas Wouters477c8d52006-05-27 19:21:47 +00001050 if len(keys) == 0:
1051 continue
1052 f.write('%s:' % name)
1053 prev = None
1054 completing = False
1055 for key in sorted(set(keys)):
1056 if key - 1 == prev:
1057 if not completing:
1058 completing = True
1059 f.write('-')
1060 elif completing:
1061 completing = False
1062 f.write('%s %s' % (prev, key))
1063 else:
1064 f.write(' %s' % key)
1065 prev = key
1066 if completing:
1067 f.write(str(prev) + '\n')
1068 else:
1069 f.write('\n')
1070 finally:
Thomas Wouters89f507f2006-12-13 04:49:30 +00001071 _sync_close(f)
Thomas Wouters477c8d52006-05-27 19:21:47 +00001072
1073 def pack(self):
1074 """Re-name messages to eliminate numbering gaps. Invalidates keys."""
1075 sequences = self.get_sequences()
1076 prev = 0
1077 changes = []
Guido van Rossumcc2b0162007-02-11 06:12:03 +00001078 for key in self.keys():
Thomas Wouters477c8d52006-05-27 19:21:47 +00001079 if key - 1 != prev:
1080 changes.append((key, prev + 1))
Thomas Wouters89f507f2006-12-13 04:49:30 +00001081 if hasattr(os, 'link'):
1082 os.link(os.path.join(self._path, str(key)),
1083 os.path.join(self._path, str(prev + 1)))
1084 os.unlink(os.path.join(self._path, str(key)))
1085 else:
1086 os.rename(os.path.join(self._path, str(key)),
1087 os.path.join(self._path, str(prev + 1)))
Thomas Wouters477c8d52006-05-27 19:21:47 +00001088 prev += 1
1089 self._next_key = prev + 1
1090 if len(changes) == 0:
1091 return
1092 for name, key_list in sequences.items():
1093 for old, new in changes:
1094 if old in key_list:
1095 key_list[key_list.index(old)] = new
1096 self.set_sequences(sequences)
1097
1098 def _dump_sequences(self, message, key):
1099 """Inspect a new MHMessage and update sequences appropriately."""
1100 pending_sequences = message.get_sequences()
1101 all_sequences = self.get_sequences()
Guido van Rossumcc2b0162007-02-11 06:12:03 +00001102 for name, key_list in all_sequences.items():
Thomas Wouters477c8d52006-05-27 19:21:47 +00001103 if name in pending_sequences:
1104 key_list.append(key)
1105 elif key in key_list:
1106 del key_list[key_list.index(key)]
1107 for sequence in pending_sequences:
1108 if sequence not in all_sequences:
1109 all_sequences[sequence] = [key]
1110 self.set_sequences(all_sequences)
1111
1112
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox."""

    # Labels with a fixed meaning; every other label counts as user-defined.
    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        self._labels = {}

    def add(self, message):
        """Add message and return assigned key."""
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = io.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or not line:
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        visible_headers = io.StringIO()
        while True:
            line = self._file.readline()
            if line == os.linesep or not line:
                break
            visible_headers.write(line.replace(os.linesep, '\n'))
        body = self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = io.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or not line:
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        # Skip the visible headers; only the originals are returned.
        while True:
            line = self._file.readline()
            if line == os.linesep or not line:
                break
        return original_headers.getvalue() + \
               self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return io.StringIO(self.get_string(key).replace('\n',
                                                        os.linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == '\037\014' + os.linesep:
                # Start-of-message marker: close any open message, then
                # read the labels line that follows.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
                starts.append(next_pos)
                labels = [label.strip() for label
                          in self._file.readline()[1:].split(',')
                          if label.strip()]
                label_lists.append(labels)
            elif line == '\037' or line == '\037' + os.linesep:
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
            elif not line:
                stops.append(line_pos - len(os.linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        f.write('BABYL OPTIONS:%sVersion: 5%sLabels:%s%s\037' %
                (os.linesep, os.linesep, ','.join(self.get_labels()),
                 os.linesep))

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\014' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        The on-disk layout is: a labels line, the original headers, an
        '*** EOOH ***' line, the visible headers, then the body.  message
        may be an email.message.Message, a string, or an object with a
        readline() method; anything else raises TypeError.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write('1')
            for label in special_labels:
                self._file.write(', ' + label)
            self._file.write(',,')
            for label in labels:
                self._file.write(' ' + label + ',')
            self._file.write(os.linesep)
        else:
            self._file.write('1,,' + os.linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = io.StringIO()
            orig_generator = email.generator.Generator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or not line:
                    break
            self._file.write('*** EOOH ***' + os.linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = io.StringIO()
                vis_generator = email.generator.Generator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # Rewind before reading back: flatten() leaves the buffer
                # positioned at its end, so without this the loop below
                # reads nothing and no visible headers are written.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or not line:
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or not line:
                        break
            while True:
                buffer = orig_buffer.read(4096)     # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        elif isinstance(message, str):
            body_start = message.find('\n\n') + 2
            if body_start - 2 != -1:
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write('*** EOOH ***' + os.linesep)
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write(message[body_start:].replace('\n',
                                                              os.linesep))
            else:
                # No header/body separator: the whole string is the body.
                self._file.write('*** EOOH ***' + os.linesep + os.linesep)
                self._file.write(message.replace('\n', os.linesep))
        elif hasattr(message, 'readline'):
            original_pos = message.tell()
            first_pass = True
            while True:
                line = message.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or not line:
                    if first_pass:
                        # The separator belongs only between the two
                        # copies of the headers, as in the string branch.
                        # Writing it again after the second pass put a
                        # stray '*** EOOH ***' line in front of the body.
                        first_pass = False
                        self._file.write('*** EOOH ***' + os.linesep)
                        message.seek(original_pos)
                    else:
                        break
            while True:
                buffer = message.read(4096)     # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1332
1333
class Message(email.message.Message):
    """An email message carrying mailbox-format-specific properties."""

    def __init__(self, message=None):
        """Build a Message from another message, a string, a file or None.

        Raises TypeError for any other kind of argument.
        """
        if message is None:
            email.message.Message.__init__(self)
            return
        if isinstance(message, email.message.Message):
            # Work on a deep copy so the source message is left untouched.
            self._become_message(copy.deepcopy(message))
            if isinstance(message, Message):
                message._explain_to(self)
            return
        if isinstance(message, str):
            parsed = email.message_from_string(message)
        elif hasattr(message, "read"):
            parsed = email.message_from_file(message)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        self._become_message(parsed)

    def _become_message(self, message):
        """Take over the format-independent state of message."""
        shared_state = ('_headers', '_unixfrom', '_payload', '_charset',
                        'preamble', 'epilogue', 'defects', '_default_type')
        source = message.__dict__
        for attribute in shared_state:
            self.__dict__[attribute] = source[attribute]

    def _explain_to(self, message):
        """Copy format-specific state to message insofar as possible."""
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
        # A plain Message has no format-specific state to hand over.
        return
1364
1365
class MaildirMessage(Message):
    """A message that additionally tracks Maildir state.

    That state is the subdirectory ('new' or 'cur'), the "info" string
    that holds the flags, and the delivery date.
    """

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance."""
        # Defaults are set first: Message.__init__ may overwrite them
        # through the source message's _explain_to().
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set subdir to 'new' or 'cur'."""
        if subdir != 'new' and subdir != 'cur':
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return as a string the flags that are set."""
        if not self._info.startswith('2,'):
            return ''
        return self._info[2:]

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        ordered = sorted(flags)
        self._info = '2,' + ''.join(ordered)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        if self.get_flags():
            remaining = set(self.get_flags()) - set(flag)
            self.set_flags(''.join(remaining))

    def get_date(self):
        """Return delivery date of message, in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set delivery date of message, in seconds since the epoch."""
        try:
            self._date = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)

    def get_info(self):
        """Get the message's "info" as a string."""
        return self._info

    def set_info(self, info):
        """Set the message's "info" string."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Copy Maildir-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
        elif isinstance(message, _mboxMMDFMessage):
            flags = set(self.get_flags())
            if 'S' in flags:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            # Maildir flag -> mbox/MMDF status flag.
            for maildir_flag, status_flag in (('T', 'D'), ('F', 'F'),
                                              ('R', 'A')):
                if maildir_flag in flags:
                    message.add_flag(status_flag)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_sequence('unseen')
            for maildir_flag, sequence in (('R', 'replied'),
                                           ('F', 'flagged')):
                if maildir_flag in flags:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_label('unseen')
            for maildir_flag, label in (('T', 'deleted'), ('R', 'answered'),
                                        ('P', 'forwarded')):
                if maildir_flag in flags:
                    message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1471
1472
class _mboxMMDFMessage(Message):
    """A message with the state shared by the mbox and MMDF formats.

    That state is the "From " line plus the flags kept in the 'Status'
    and 'X-Status' headers.
    """

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance."""
        # Start from a default "From " line; prefer the source message's
        # own unixfrom line when it has one.
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            unixfrom = message.get_unixfrom()
            if unixfrom is not None and unixfrom.startswith('From '):
                self.set_from(unixfrom[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return contents of "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set "From " line, formatting and appending time_ if specified."""
        if time_ is not None:
            # True means "use the current time".
            stamp = time.gmtime() if time_ is True else time_
            from_ += ' ' + time.asctime(stamp)
        self._from = from_

    def get_flags(self):
        """Return as a string the flags that are set."""
        status = self.get('Status', '')
        xstatus = self.get('X-Status', '')
        return status + xstatus

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        flags = set(flags)
        # 'R' and 'O' go into Status; 'D', 'F', 'A' and any other flags
        # (sorted) go into X-Status.
        status_flags = ''.join(flag for flag in ('R', 'O') if flag in flags)
        xstatus_flags = ''.join(flag for flag in ('D', 'F', 'A')
                                if flag in flags)
        leftovers = flags - set(('R', 'O', 'D', 'F', 'A'))
        xstatus_flags += ''.join(sorted(leftovers))
        for header, value in (('Status', status_flags),
                              ('X-Status', xstatus_flags)):
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        if 'Status' in self or 'X-Status' in self:
            remaining = set(self.get_flags()) - set(flag)
            self.set_flags(''.join(remaining))

    def _explain_to(self, message):
        """Copy mbox- or MMDF-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            flags = set(self.get_flags())
            if 'O' in flags:
                message.set_subdir('cur')
            # Status flag -> Maildir flag.
            for status_flag, maildir_flag in (('F', 'F'), ('A', 'R'),
                                              ('R', 'S'), ('D', 'T')):
                if status_flag in flags:
                    message.add_flag(maildir_flag)
            del message['status']
            del message['x-status']
            # The last five words of the "From " line may be a date.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
        elif isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_sequence('unseen')
            if 'A' in flags:
                message.add_sequence('replied')
            if 'F' in flags:
                message.add_sequence('flagged')
            del message['status']
            del message['x-status']
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_label('unseen')
            if 'D' in flags:
                message.add_label('deleted')
            if 'A' in flags:
                message.add_label('answered')
            del message['status']
            del message['x-status']
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1582
1583
class mboxMessage(_mboxMMDFMessage):
    """A message with mbox-specific properties.

    All behaviour is inherited from _mboxMMDFMessage.
    """
1586
1587
class MHMessage(Message):
    """A message that remembers which MH sequences include it."""

    def __init__(self, message=None):
        """Initialize an MHMessage instance."""
        # Set before Message.__init__, which may add sequences through the
        # source message's _explain_to().
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a list of sequences that include the message."""
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Set the list of sequences that include the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence to list of sequences including the message."""
        if not isinstance(sequence, str):
            raise TypeError('sequence must be a string: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove sequence from the list of sequences including the message."""
        try:
            self._sequences.remove(sequence)
        except ValueError:
            # Not a member of that sequence; nothing to do.
            pass

    def _explain_to(self, message):
        """Copy MH-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            sequences = set(self.get_sequences())
            # The subdirectory is 'cur' either way; only messages outside
            # 'unseen' also get the 'S' flag.
            message.set_subdir('cur')
            if 'unseen' not in sequences:
                message.add_flag('S')
            if 'flagged' in sequences:
                message.add_flag('F')
            if 'replied' in sequences:
                message.add_flag('R')
        elif isinstance(message, _mboxMMDFMessage):
            sequences = set(self.get_sequences())
            message.add_flag('O' if 'unseen' in sequences else 'RO')
            if 'flagged' in sequences:
                message.add_flag('F')
            if 'replied' in sequences:
                message.add_flag('A')
        elif isinstance(message, MHMessage):
            for sequence in self.get_sequences():
                message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            sequences = set(self.get_sequences())
            if 'unseen' in sequences:
                message.add_label('unseen')
            if 'replied' in sequences:
                message.add_label('answered')
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1656
1657
class BabylMessage(Message):
    """A message with Babyl labels and a set of visible headers."""

    def __init__(self, message=None):
        """Initialize an BabylMessage instance."""
        # Set before Message.__init__, which may fill them in through the
        # source message's _explain_to().
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a list of labels on the message."""
        return list(self._labels)

    def set_labels(self, labels):
        """Set the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label to list of labels on the message."""
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove label from the list of labels on the message."""
        try:
            self._labels.remove(label)
        except ValueError:
            # The label was not set; nothing to do.
            pass

    def get_visible(self):
        """Return a Message representation of visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Set the Message representation of visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Update and/or sensibly generate a set of visible headers."""
        visible = self._visible
        # Refresh headers that are already visible; drop those the
        # message no longer has.
        for header in visible.keys():
            if header in self:
                visible.replace_header(header, self[header])
            else:
                del visible[header]
        # Then add these headers when the message has them and they are
        # not visible yet.
        for header in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if header in self and header not in visible:
                visible[header] = self[header]

    def _explain_to(self, message):
        """Copy Babyl-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            labels = set(self.get_labels())
            # The subdirectory is 'cur' either way; only messages without
            # the 'unseen' label also get the 'S' flag.
            message.set_subdir('cur')
            if 'unseen' not in labels:
                message.add_flag('S')
            if 'forwarded' in labels or 'resent' in labels:
                message.add_flag('P')
            if 'answered' in labels:
                message.add_flag('R')
            if 'deleted' in labels:
                message.add_flag('T')
        elif isinstance(message, _mboxMMDFMessage):
            labels = set(self.get_labels())
            message.add_flag('O' if 'unseen' in labels else 'RO')
            if 'deleted' in labels:
                message.add_flag('D')
            if 'answered' in labels:
                message.add_flag('A')
        elif isinstance(message, MHMessage):
            labels = set(self.get_labels())
            if 'unseen' in labels:
                message.add_sequence('unseen')
            if 'answered' in labels:
                message.add_sequence('replied')
        elif isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1749
1750
class MMDFMessage(_mboxMMDFMessage):
    """A message carrying MMDF-specific properties.

    All behaviour is inherited from _mboxMMDFMessage.
    """
1753
1754
class _ProxyFile:
    """A read-only wrapper of a file.

    The proxy tracks its own position and re-seeks the wrapped file before
    every read, so its position is independent of whatever else moves the
    underlying file pointer.
    """

    def __init__(self, f, pos=None):
        """Initialize a _ProxyFile.

        f is the file object to wrap.  pos is the starting position; when
        it is None the file's current position (f.tell()) is used.
        """
        self._file = f
        if pos is None:
            self._pos = f.tell()
        else:
            self._pos = pos

    def read(self, size=None):
        """Read up to size bytes; None reads to the end."""
        return self._read(size, self._file.read)

    def readline(self, size=None):
        """Read a line, limited to size bytes when size is given."""
        return self._read(size, self._file.readline)

    def readlines(self, sizehint=None):
        """Read multiple lines.

        When sizehint is given, reading stops after the line that brings
        the total length read to at least sizehint.
        """
        result = []
        for line in self:
            result.append(line)
            if sizehint is not None:
                sizehint -= len(line)
                if sizehint <= 0:
                    break
        return result

    def __iter__(self):
        """Iterate over lines until readline() returns an empty result."""
        while True:
            line = self.readline()
            if not line:
                # A plain return ends the generator.  Raising StopIteration
                # here is turned into RuntimeError under PEP 479.
                return
            yield line

    def tell(self):
        """Return the position."""
        return self._pos

    def seek(self, offset, whence=0):
        """Change position."""
        if whence == 1:
            # Relative seeks are relative to the proxy's position, not to
            # wherever the underlying file happens to be.
            self._file.seek(self._pos)
        self._file.seek(offset, whence)
        self._pos = self._file.tell()

    def close(self):
        """Drop the reference to the wrapped file (it is not closed here)."""
        del self._file

    def _read(self, size, read_method):
        """Read size bytes using read_method.

        A size of None is passed to read_method as -1.  The wrapped file is
        positioned at the proxy's offset first and the offset is updated
        afterwards.
        """
        if size is None:
            size = -1
        self._file.seek(self._pos)
        result = read_method(size)
        self._pos = self._file.tell()
        return result
1816
1817
class _PartialFile(_ProxyFile):
    """A read-only wrapper of part of a file.

    Positions reported by tell() and accepted by seek() are relative to the
    start of the window; reads never go past stop.
    """

    def __init__(self, f, start=None, stop=None):
        """Initialize a _PartialFile.

        start and stop are absolute offsets in f.  When start is None the
        window begins at the position resolved by _ProxyFile (f.tell());
        when stop is None the window has no upper bound.
        """
        _ProxyFile.__init__(self, f, start)
        # _ProxyFile.__init__ has already turned a missing start into a
        # concrete offset; reuse it so tell() never subtracts None.
        self._start = self._pos
        self._stop = stop

    def tell(self):
        """Return the position with respect to start."""
        return _ProxyFile.tell(self) - self._start

    def seek(self, offset, whence=0):
        """Change position, possibly with respect to start or stop."""
        if whence == 0:
            self._pos = self._start
            whence = 1
        elif whence == 2:
            if self._stop is None:
                # Unbounded window: its end is the end of the file.
                self._file.seek(0, 2)
                self._pos = self._file.tell()
            else:
                self._pos = self._stop
            whence = 1
        # Every case is now a seek relative to self._pos.
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, honoring start and stop."""
        if self._stop is None:
            # No upper bound to enforce.
            return _ProxyFile._read(self, size, read_method)
        remaining = self._stop - self._pos
        if remaining <= 0:
            return ''
        if size is None or size < 0 or size > remaining:
            size = remaining
        return _ProxyFile._read(self, size, read_method)
1849
1850
def _lock_file(f, dotlock=True):
    """Lock file f using lockf and, when dotlock is true, dot locking.

    Raises ExternalClashError when either lock is unavailable.  If the
    temporary pre-lock file cannot be created for lack of write access,
    dot locking is silently skipped.  On any failure the locks taken so
    far are released before the exception propagates.
    """
    dotlock_done = False
    try:
        if fcntl:
            try:
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except IOError as e:
                if e.errno not in (errno.EAGAIN, errno.EACCES):
                    raise
                raise ExternalClashError('lockf: lock unavailable: %s' %
                                         f.name)
        if not dotlock:
            return
        lock_path = f.name + '.lock'
        try:
            pre_lock = _create_temporary(lock_path)
            pre_lock.close()
        except IOError as e:
            if e.errno != errno.EACCES:
                raise
            return  # Without write access, just skip dotlocking.
        try:
            if hasattr(os, 'link'):
                os.link(pre_lock.name, lock_path)
                dotlock_done = True
                os.unlink(pre_lock.name)
            else:
                os.rename(pre_lock.name, lock_path)
                dotlock_done = True
        except OSError as e:
            clash = (e.errno == errno.EEXIST or
                     (os.name == 'os2' and e.errno == errno.EACCES))
            if not clash:
                raise
            os.remove(pre_lock.name)
            raise ExternalClashError('dot lock unavailable: %s' %
                                     f.name)
    except:
        # Undo whatever was acquired, then let the error propagate.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if dotlock_done:
            os.remove(f.name + '.lock')
        raise
1895
def _unlock_file(f):
    """Release the lockf lock on f and remove its dot lock file, if any."""
    if fcntl:
        fcntl.lockf(f, fcntl.LOCK_UN)
    lock_path = f.name + '.lock'
    if os.path.exists(lock_path):
        os.remove(lock_path)
1902
def _create_carefully(path):
    """Create a file if it doesn't exist and open for reading and writing.

    Creation uses O_CREAT | O_EXCL, so os.open() raises OSError when path
    already exists.  Returns a file object opened in 'r+' mode.
    """
    # Pass an explicit 0o666 (still subject to the umask): os.open()
    # defaults to 0o777, which would mark new mailbox files executable.
    fd = os.open(path, os.O_CREAT | os.O_EXCL | os.O_RDWR, 0o666)
    try:
        return open(path, 'r+')
    finally:
        # The descriptor was only needed for the exclusive create.
        os.close(fd)
1910
def _create_temporary(path):
    """Create and open a new file named after path.

    The name is path followed by the current time in whole seconds, the
    host name and the process id, separated by dots.
    """
    suffix = (int(time.time()), socket.gethostname(), os.getpid())
    return _create_carefully('%s.%s.%s.%s' % ((path,) + suffix))
1916
def _sync_flush(f):
    """Flush f and, where os.fsync exists, force its data to disk."""
    f.flush()
    fsync = getattr(os, 'fsync', None)
    if fsync is not None:
        fsync(f.fileno())
Thomas Wouters89f507f2006-12-13 04:49:30 +00001922
def _sync_close(f):
    """Sync file f with _sync_flush() and then close it."""
    # Sync before closing so the data is flushed while f is still open.
    _sync_flush(f)
    f.close()
Thomas Wouters477c8d52006-05-27 19:21:47 +00001927
1928## Start: classes from the original module (for backward compatibility).
1929
1930# Note that the Maildir class, whose name is unchanged, itself offers a next()
1931# method for backward compatibility.
Skip Montanaro17ab1232001-01-24 06:27:27 +00001932
class _Mailbox:
    """Base class for the legacy single-file mailbox readers.

    next() relies on _search_start() and _search_end(), which this class
    does not define, to locate the boundaries of each message in fp.
    """

    def __init__(self, fp, factory=rfc822.Message):
        """Remember the file, the message factory and a zero read offset."""
        self.fp = fp
        self.seekp = 0
        self.factory = factory

    def __iter__(self):
        """Iterate by calling next() until it returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the next non-empty message, or None when none is left."""
        while True:
            self.fp.seek(self.seekp)
            try:
                self._search_start()
            except EOFError:
                self.seekp = self.fp.tell()
                return None
            start = self.fp.tell()
            self._search_end()
            stop = self.fp.tell()
            self.seekp = stop
            if start != stop:
                return self.factory(_PartialFile(self.fp, start, stop))
Guido van Rossumc7b68821994-04-28 09:53:33 +00001957
Barry Warsawffd05ee2002-03-01 22:39:14 +00001958# Recommended to use PortableUnixMailbox instead!
class UnixMailbox(_Mailbox):
    """Legacy reader for mbox files whose messages begin with "From "."""

    def _search_start(self):
        """Leave fp at the next accepted "From " line; EOFError if none."""
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                raise EOFError
            if text[:5] != 'From ':
                continue
            if self._isrealfromline(text):
                self.fp.seek(here)
                return

    def _search_end(self):
        """Leave fp at the next accepted "From " line or at end of file."""
        self.fp.readline()      # Throw away header line
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                return
            if text[:5] != 'From ':
                continue
            if self._isrealfromline(text):
                self.fp.seek(here)
                return

    # An overridable mechanism to test for From-line-ness.  You can either
    # specify a different regular expression or define a whole new
    # _isrealfromline() method.  Note that this only gets called for lines
    # starting with the 5 characters "From ".
    #
    # BAW: According to
    # http://home.netscape.com/eng/mozilla/2.0/relnotes/demo/content-length.html
    # the only portable, reliable way to find message delimiters in a BSD
    # (i.e. Unix mailbox) style folder is to search for "\n\nFrom .*\n", or
    # at the beginning of the file, "^From .*\n".  While _fromlinepattern
    # below seems like a good idea, in practice, there are too many
    # variations for more strict parsing of the line to be completely
    # accurate.
    #
    # _strict_isrealfromline() is the old version which tries to do stricter
    # parsing of the From_ line.  _portable_isrealfromline() simply returns
    # true, since it's never called if the line doesn't already start with
    # "From ".
    #
    # This algorithm, and the way it interacts with _search_start() and
    # _search_end(), may not be completely correct, because it doesn't check
    # that the two characters preceding "From " are \n\n or the beginning of
    # the file.  Fixing this would require a more extensive rewrite than is
    # necessary.  For convenience, we've added a PortableUnixMailbox class
    # which does no checking of the format of the 'From' line.

    _fromlinepattern = (r"From \s*[^\s]+\s+\w\w\w\s+\w\w\w\s+\d?\d\s+"
                        r"\d?\d:\d\d(:\d\d)?(\s+[^\s]+)?\s+\d\d\d\d\s*"
                        r"[^\s]*\s*"
                        "$")
    _regexp = None

    def _strict_isrealfromline(self, line):
        """Match line against _fromlinepattern, compiling it on first use."""
        pattern = self._regexp
        if not pattern:
            import re
            pattern = self._regexp = re.compile(self._fromlinepattern)
        return pattern.match(line)

    def _portable_isrealfromline(self, line):
        """Accept every line; callers have already checked for "From "."""
        return True

    _isrealfromline = _strict_isrealfromline
2023
2024
class PortableUnixMailbox(UnixMailbox):
    """UnixMailbox variant that accepts any line starting with "From "."""

    _isrealfromline = UnixMailbox._portable_isrealfromline
2027
Guido van Rossumfbe63de1998-04-03 16:04:05 +00002028
class MmdfMailbox(_Mailbox):
    """Legacy reader for files delimited by lines of four \\001 bytes."""

    def _search_start(self):
        """Consume lines up to and including a delimiter; EOFError if none."""
        delimiter = '\001\001\001\001\n'
        while True:
            text = self.fp.readline()
            if not text:
                raise EOFError
            if text[:5] == delimiter:
                return

    def _search_end(self):
        """Leave fp at the next delimiter line or at end of file."""
        delimiter = '\001\001\001\001\n'
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                return
            if text == delimiter:
                self.fp.seek(here)
                return
Guido van Rossumc7b68821994-04-28 09:53:33 +00002048
Guido van Rossumc7b68821994-04-28 09:53:33 +00002049
class MHMailbox:
    """Legacy reader for a directory of numerically named message files."""

    def __init__(self, dirname, factory=rfc822.Message):
        """List the message files in dirname.

        Only entries whose names are positive decimal integers without
        leading zeros are considered.  factory is called with an open file
        object to build each message.
        """
        import re
        pat = re.compile('^[1-9][0-9]*$')
        self.dirname = dirname
        # Sort numerically rather than lexically.  sorted() and a list
        # comprehension are used because map() and filter() return
        # iterators on Python 3, which have no sort() or reverse().
        numbers = sorted(int(name) for name in os.listdir(self.dirname)
                         if pat.match(name))
        self.boxes = [str(number) for number in numbers]
        # Highest number first, so next() can pop() the lowest off the end.
        self.boxes.reverse()
        self.factory = factory

    def __iter__(self):
        """Iterate by calling next() until it returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the message with the lowest remaining number, or None."""
        if not self.boxes:
            return None
        fn = self.boxes.pop()
        # The file is handed to the factory and is not closed here.
        fp = open(os.path.join(self.dirname, fn))
        msg = self.factory(fp)
        try:
            msg._mh_msgno = fn
        except (AttributeError, TypeError):
            # Some factory results cannot take new attributes.
            pass
        return msg
Guido van Rossum8ca84201998-03-26 20:56:10 +00002082
Guido van Rossum9a4d6371998-12-23 22:05:42 +00002083
class BabylMailbox(_Mailbox):
    """Legacy reader for Babyl files."""

    def _search_start(self):
        """Consume lines through the '*** EOOH ***' line; EOFError if none."""
        while True:
            text = self.fp.readline()
            if not text:
                raise EOFError
            if text == '*** EOOH ***\n':
                return

    def _search_end(self):
        """Leave fp at the next message terminator or at end of file."""
        terminators = ('\037\014\n', '\037')
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                return
            if text in terminators:
                self.fp.seek(here)
                return
Guido van Rossumfdf58fe1997-05-15 14:33:09 +00002103
Thomas Wouters477c8d52006-05-27 19:21:47 +00002104## End: classes from the original module (for backward compatibility).
Guido van Rossum62448671996-09-17 21:33:15 +00002105
2106
class Error(Exception):
    """Base class for the errors defined by this module."""


class NoSuchMailboxError(Error):
    """The requested mailbox does not exist and will not be created."""


class NotEmptyError(Error):
    """Deletion was requested for a mailbox that is not empty."""


class ExternalClashError(Error):
    """An action failed because of another process."""


class FormatError(Error):
    """A file does not appear to have a valid format."""