blob: 79feae0789a007cf059c5c4c39221d5d5bbf2f6f [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum62448671996-09-17 21:33:15 +00002
Thomas Wouters477c8d52006-05-27 19:21:47 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
Thomas Wouters89f507f2006-12-13 04:49:30 +00005# Notes for authors of new mailbox subclasses:
6#
7# Remember to fsync() changes to disk before closing a modified file
8# or returning from a flush() method. See functions _sync_flush() and
9# _sync_close().
10
Thomas Wouters477c8d52006-05-27 19:21:47 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Thomas Wouters477c8d52006-05-27 19:21:47 +000013import time
14import calendar
15import socket
16import errno
17import copy
18import email
Thomas Woutersb2137042007-02-01 18:02:27 +000019import email.message
20import email.generator
Thomas Wouters477c8d52006-05-27 19:21:47 +000021import rfc822
Guido van Rossum34d19282007-08-09 01:03:29 +000022import io
Thomas Wouters477c8d52006-05-27 19:21:47 +000023try:
Thomas Wouters0e3f5912006-08-11 14:57:12 +000024 if sys.platform == 'os2emx':
25 # OS/2 EMX fcntl() not adequate
26 raise ImportError
27 import fcntl
Thomas Wouters477c8d52006-05-27 19:21:47 +000028except ImportError:
29 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000030
Thomas Wouters477c8d52006-05-27 19:21:47 +000031__all__ = [ 'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
32 'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
33 'BabylMessage', 'MMDFMessage', 'UnixMailbox',
34 'PortableUnixMailbox', 'MmdfMailbox', 'MHMailbox', 'BabylMailbox' ]
35
class Mailbox:
    """A group of messages in a particular place.

    This is the abstract interface shared by the mailbox formats.  The
    storage primitives (add, remove, __setitem__, get_message, get_string,
    get_file, iterkeys, __contains__, __len__, flush, lock, unlock and
    close) raise NotImplementedError here and must be supplied by a
    subclass; the dictionary-style conveniences are built on top of them.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded ("~") and made absolute.  factory, when
        true, is called by __getitem__ with a file-like object to build
        each message.  create is accepted but not used by this base class.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Remove the keyed message; equivalent to remove(key)."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            # A missing key is exactly what discard() is meant to tolerate.
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist.

        Without a factory the result comes from get_message(); with one,
        the factory is called on the file-like object from get_file().
        """
        if not self._factory:
            return self.get_message(key)
        else:
            return self._factory(self.get_file(key))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages.

        Keys are snapshotted first; a key whose message has disappeared by
        the time it is fetched is silently skipped.
        """
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield value

    def __iter__(self):
        """Iterate over the messages (not the keys)."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples.

        As with itervalues(), keys that vanish before being fetched are
        skipped.
        """
        for key in self.keys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield (key, value)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            result = self[key]
        except KeyError:
            return default
        self.discard(key)
        return result

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError when the mailbox holds no messages.
        """
        for key in self.keys():
            return (key, self.pop(key))     # This is only run once.
        raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be a mapping (an object with items() or, failing that,
        iteritems()) or an iterable of (key, message) pairs.  None, the
        default, means there is nothing to update.  Every pair is
        attempted; if any key was missing a single KeyError is raised
        after the loop.
        """
        if arg is None:
            # The default argument must be usable: nothing to do.
            return
        if hasattr(arg, 'items'):
            source = arg.items()
        elif hasattr(arg, 'iteritems'):
            # Legacy mappings that only expose the iterator spelling.
            source = arg.iteritems()
        else:
            source = arg
        bad_key = False
        for key, message in source:
            try:
                self[key] = message
            except KeyError:
                bad_key = True
        if bad_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _dump_message(self, message, target, mangle_from_=False):
        """Dump message contents to target file.

        message may be an email.message.Message, a str, or an object with
        read()/readline(); anything else raises TypeError.  When
        mangle_from_ is true, "From " at the start of a line is escaped
        as ">From " (for a str, only occurrences that follow a newline).
        """
        # Most files are opened in binary mode to allow predictable seeking.
        # To get native line endings on disk, the user-friendly \n line
        # endings used in strings and by email.Message are translated here.
        if isinstance(message, email.message.Message):
            flattened = io.StringIO()
            gen = email.generator.Generator(flattened, mangle_from_, 0)
            gen.flatten(message)
            flattened.seek(0)
            target.write(flattened.read().replace('\n', os.linesep))
        elif isinstance(message, str):
            if mangle_from_:
                message = message.replace('\nFrom ', '\n>From ')
            message = message.replace('\n', os.linesep)
            target.write(message)
        elif hasattr(message, 'read'):
            while True:
                line = message.readline()
                if not line:
                    break
                if mangle_from_ and line.startswith('From '):
                    line = '>From ' + line[5:]
                line = line.replace('\n', os.linesep)
                target.write(line)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
218
219
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages are individual files under the "new" and "cur"
    subdirectories; "tmp" is used while a message is being written.  A
    message's key is the part of its file name before the first `colon`.
    """

    # Separator between a message's unique name and its info suffix.
    colon = ':'

    def __init__(self, dirname, factory=rfc822.Message, create=True):
        """Initialize a Maildir instance.

        If dirname does not exist it is created (with its tmp/new/cur
        subdirectories, mode 0o700) when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                os.mkdir(os.path.join(self._path, 'tmp'), 0o700)
                os.mkdir(os.path.join(self._path, 'new'), 0o700)
                os.mkdir(os.path.join(self._path, 'cur'), 0o700)
            else:
                raise NoSuchMailboxError(self._path)
        # Maps key -> path relative to self._path ("new/..." or "cur/...").
        self._toc = {}

    def add(self, message):
        """Add message and return assigned key.

        The message is written to a fresh file in "tmp" and then moved
        into place.  Raises ExternalClashError if the destination name
        already exists.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        finally:
            _sync_close(tmp_file)
        if isinstance(message, MaildirMessage):
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                # Empty info: do not leave a dangling separator in the name.
                suffix = ''
        else:
            subdir = 'new'
            suffix = ''
        uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        try:
            if hasattr(os, 'link'):
                # link() fails if dest exists, so nothing is overwritten.
                os.link(tmp_file.name, dest)
                os.remove(tmp_file.name)
            else:
                os.rename(tmp_file.name, dest)
        except OSError as e:
            os.remove(tmp_file.name)
            if e.errno == errno.EEXIST:
                raise ExternalClashError('Name clash with existing message: %s'
                                         % dest)
            else:
                raise
        if isinstance(message, MaildirMessage):
            # Carry the message's date over as the file's mtime.
            os.utime(dest, (os.path.getatime(dest), message.get_date()))
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        os.remove(os.path.join(self._path, self._lookup(key)))

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass.
        try:
            self.remove(key)
        except KeyError:
            pass
        except OSError as e:
            # The file may vanish between lookup and removal.
            if e.errno != errno.ENOENT:
                raise

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist.

        The replacement is first added under a temporary key and then
        renamed over the old key.  Subdirectory and info suffix come from
        message when it is a MaildirMessage, else from the old file.
        """
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        if isinstance(message, MaildirMessage):
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        else:
            suffix = ''
        self.discard(key)
        new_path = os.path.join(self._path, subdir, key + suffix)
        os.rename(os.path.join(self._path, temp_subpath), new_path)
        if isinstance(message, MaildirMessage):
            os.utime(new_path, (os.path.getatime(new_path),
                                message.get_date()))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The returned MaildirMessage has its subdir, info (if the file
        name carries one) and date (the file's mtime) filled in.
        """
        subpath = self._lookup(key)
        with open(os.path.join(self._path, subpath), 'r') as f:
            msg = MaildirMessage(f)
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(os.path.join(self._path, subpath)))
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        with open(os.path.join(self._path, self._lookup(key)), 'r') as f:
            return f.read()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        f = open(os.path.join(self._path, self._lookup(key)), 'rb')
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                # Message disappeared since the refresh; skip it.
                continue
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        return  # Maildir changes are always written immediately.

    def lock(self):
        """Lock the mailbox (a no-op for Maildir)."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked (a no-op for Maildir)."""
        return

    def close(self):
        """Flush and close the mailbox (a no-op for Maildir)."""
        return

    def list_folders(self):
        """Return a list of folder names.

        Folders are subdirectories whose name starts with "." and has at
        least one further character; the leading dot is stripped.
        """
        result = []
        for entry in os.listdir(self._path):
            if len(entry) > 1 and entry[0] == '.' and \
               os.path.isdir(os.path.join(self._path, entry)):
                result.append(entry[1:])
        return result

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        return Maildir(os.path.join(self._path, '.' + folder),
                       factory=self._factory,
                       create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it."""
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        maildirfolder_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(maildirfolder_path):
            # Create the empty marker file.
            os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY))
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        Raises NotEmptyError if "new" or "cur" holds anything other than
        dot-files, or if the folder has a subdirectory other than
        new/cur/tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        for entry in os.listdir(os.path.join(path, 'new')) + \
                     os.listdir(os.path.join(path, 'cur')):
            if len(entry) < 1 or entry[0] != '.':
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry != 'new' and entry != 'cur' and entry != 'tmp' and \
               os.path.isdir(os.path.join(path, entry)):
                # The quoted name is the offending subdirectory; the
                # folder being removed follows the colon.
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (entry, folder))
        # Bottom-up so that directories are empty before rmdir().
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp".

        A file is old when its access time is more than 36 hours ago.
        """
        now = time.time()
        for entry in os.listdir(os.path.join(self._path, 'tmp')):
            path = os.path.join(self._path, 'tmp', entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        The name is built from the current time, the process id, a
        class-wide counter and the host name.  Raises ExternalClashError
        if a file of that name already exists.
        """
        now = time.time()
        hostname = socket.gethostname()
        # '/' and ':' are not allowed in the name; use octal escapes.
        if '/' in hostname:
            hostname = hostname.replace('/', r'\057')
        if ':' in hostname:
            hostname = hostname.replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except OSError as e:
            if e.errno == errno.ENOENT:
                Maildir._count += 1
                try:
                    return _create_carefully(path)
                except OSError as e:
                    if e.errno != errno.EEXIST:
                        raise
            else:
                raise

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping."""
        self._toc = {}
        for subdir in ('new', 'cur'):
            subdir_path = os.path.join(self._path, subdir)
            for entry in os.listdir(subdir_path):
                p = os.path.join(subdir_path, entry)
                if os.path.isdir(p):
                    continue
                uniq = entry.split(self.colon)[0]
                self._toc[uniq] = os.path.join(subdir, entry)

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        try:
            # Fast path: the cached entry still exists on disk.
            if os.path.exists(os.path.join(self._path, self._toc[key])):
                return self._toc[key]
        except KeyError:
            pass
        # Unknown key or stale entry: rescan the directories and retry.
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration.

        Returns None once the keys captured on the first call are
        exhausted; keys whose message has vanished are skipped.
        """
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = iter(self.keys())
        while True:
            try:
                return self[next(self._onetime_keys)]
            except StopIteration:
                return None
            except KeyError:
                continue
492
493
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    Messages live in one file; self._toc maps each integer key to the
    (start, stop) offsets of its message.  Subclasses provide
    _generate_toc() and _install_message() and may override the hook
    methods to write format-specific separators.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        The file is opened read/write.  If it does not exist it is
        created when create is true, otherwise NoSuchMailboxError is
        raised.  If access is denied it is reopened read-only.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            f = open(self._path, 'r+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                if create:
                    f = open(self._path, 'w+')
                else:
                    raise NoSuchMailboxError(self._path)
            elif e.errno == errno.EACCES:
                f = open(self._path, 'r')
            else:
                raise
        self._file = f
        self._toc = None            # Built lazily by _lookup().
        self._next_key = 0
        self._pending = False       # No changes require rewriting the file.
        self._locked = False
        self._file_length = None    # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        self._toc[self._next_key] = self._append_message(message)
        self._next_key += 1
        self._pending = True
        return self._next_key - 1

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        for key in self._toc.keys():
            yield key

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        The surviving messages are copied, in key order, into a temporary
        file that then replaces the mailbox file.  Raises
        ExternalClashError if the mailbox file's size differs from the
        size recorded when it was last scanned or appended to.
        """
        if not self._pending:
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc.keys()):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                while True:
                    # Copy in chunks, never reading past this message.
                    buffer = self._file.read(min(4096,
                                                 stop - self._file.tell()))
                    if not buffer:
                        break
                    new_file.write(buffer)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
            # The rewritten file becomes the mailbox, so its size is what
            # the next flush() must compare against.  Without this, a
            # flush that changes the file's size leaves a stale length
            # behind and the next flush reports a bogus clash.
            self._file_length = new_file.tell()
        except:
            # Clean up the temporary file on any failure, then re-raise.
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        try:
            os.rename(new_file.name, self._path)
        except OSError as e:
            # Some platforms refuse to rename over an existing file.
            if e.errno == errno.EEXIST or \
               (os.name == 'os2' and e.errno == errno.EACCES):
                os.remove(self._path)
                os.rename(new_file.name, self._path)
            else:
                raise
        self._file = open(self._path, 'rb+')
        self._toc = new_toc
        self._pending = False
        if self._locked:
            # Re-acquire the lock on the freshly opened file object.
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox."""
        self.flush()
        if self._locked:
            self.unlock()
        self._file.close()  # Sync has been done by self.flush() above.

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        Builds the table of contents on first use.  With key omitted the
        call only ensures the table exists and returns None.
        """
        if self._toc is None:
            self._generate_toc()
        if key is not None:
            try:
                return self._toc[key]
            except KeyError:
                raise KeyError('No message with key: %s' % key)

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets."""
        self._file.seek(0, 2)
        self._pre_message_hook(self._file)
        offsets = self._install_message(message)
        self._post_message_hook(self._file)
        self._file.flush()
        self._file_length = self._file.tell()  # Record current length of mailbox
        return offsets
663
664
665
class _mboxMMDF(_singlefileMailbox):
    """Behaviour common to the mbox and MMDF formats.

    Each stored message begins with a "From " envelope line, followed by
    the message text.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Build and return the message stored under key (else KeyError)."""
        begin, end = self._lookup(key)
        self._file.seek(begin)
        envelope = self._file.readline().replace(os.linesep, '')
        remaining = end - self._file.tell()
        raw = self._file.read(remaining)
        result = self._message_factory(raw.replace(os.linesep, '\n'))
        # Drop the leading "From " (5 characters) of the envelope line.
        result.set_from(envelope[5:])
        return result

    def get_string(self, key, from_=False):
        """Return the stored text for key (else KeyError).

        The envelope line is included only when from_ is true.
        """
        begin, end = self._lookup(key)
        self._file.seek(begin)
        if not from_:
            # Skip over the envelope line.
            self._file.readline()
        remaining = end - self._file.tell()
        return self._file.read(remaining).replace(os.linesep, '\n')

    def get_file(self, key, from_=False):
        """Return a file-like view of the message for key (else KeyError).

        The view starts after the envelope line unless from_ is true.
        """
        begin, end = self._lookup(key)
        self._file.seek(begin)
        if not from_:
            self._file.readline()
        view_start = self._file.tell()
        return _PartialFile(self._file, view_start, end)

    def _install_message(self, message):
        """Write an envelope line and message to self._file at its
        current position; return the (start, stop) offsets written."""
        envelope = None
        if isinstance(message, str) and message.startswith('From '):
            # The string carries its own envelope as the first line.
            envelope, _sep, message = message.partition('\n')
        elif isinstance(message, _mboxMMDFMessage):
            envelope = 'From ' + message.get_from()
        elif isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()   # May be None.
        if envelope is None:
            envelope = 'From MAILER-DAEMON %s' % time.asctime(time.gmtime())
        begin = self._file.tell()
        self._file.write(envelope + os.linesep)
        self._dump_message(message, self._file, self._mangle_from_)
        return (begin, self._file.tell())
720
721
class mbox(_mboxMMDF):
    """A classic mbox mailbox."""

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Set the message class to mboxMessage and open the mailbox."""
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Write a separating line ending before every message except one
        written at the very start of file f."""
        at_start = f.tell() == 0
        if not at_start:
            f.write(os.linesep)

    def _generate_toc(self):
        """Scan the file and build the key-to-(start, stop) table.

        Every line starting with "From " opens a message; the previous
        message stops one line ending before it, and the last message
        stops at end of file.
        """
        begins = []
        ends = []
        mailbox_file = self._file
        mailbox_file.seek(0)
        while True:
            offset = mailbox_file.tell()
            text = mailbox_file.readline()
            if text.startswith('From '):
                if len(ends) < len(begins):
                    # Close the message that was still open.
                    ends.append(offset - len(os.linesep))
                begins.append(offset)
            elif not text:
                # End of file.
                ends.append(offset)
                break
        spans = zip(begins, ends)
        self._toc = dict(enumerate(spans))
        self._next_key = len(self._toc)
        self._file_length = mailbox_file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000754
755
class MMDF(_mboxMMDF):
    """An MMDF mailbox."""

    def __init__(self, path, factory=None, create=True):
        """Set the message class to MMDFMessage and open the mailbox."""
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Write the four-Control-A delimiter line ahead of a message."""
        delimiter = '\001\001\001\001' + os.linesep
        f.write(delimiter)

    def _post_message_hook(self, f):
        """Write a line ending and the delimiter line after a message."""
        delimiter = '\001\001\001\001' + os.linesep
        f.write(os.linesep + delimiter)

    def _generate_toc(self):
        """Scan the file and build the key-to-(start, stop) table.

        A message starts after a delimiter line and stops one line
        ending before the next delimiter line, or at end of file.
        """
        delimiter = '\001\001\001\001' + os.linesep
        begins = []
        ends = []
        mailbox_file = self._file
        mailbox_file.seek(0)
        after = 0
        while True:
            text = mailbox_file.readline()
            after = mailbox_file.tell()
            if text.startswith(delimiter):
                begins.append(after)
                # Consume lines up to the closing delimiter (or EOF).
                while True:
                    before = after
                    text = mailbox_file.readline()
                    after = mailbox_file.tell()
                    if text == delimiter:
                        ends.append(before - len(os.linesep))
                        break
                    elif not text:
                        ends.append(before)
                        break
            elif not text:
                break
        spans = zip(begins, ends)
        self._toc = dict(enumerate(spans))
        self._next_key = len(self._toc)
        mailbox_file.seek(0, 2)
        self._file_length = mailbox_file.tell()
Thomas Wouters477c8d52006-05-27 19:21:47 +0000799
800
801class MH(Mailbox):
802 """An MH mailbox."""
803
def __init__(self, path, factory=None, create=True):
    """Set up an MH mailbox rooted at path.

    A missing directory is created (mode 0o700) together with an empty
    ".mh_sequences" file (mode 0o600) when create is true; otherwise
    NoSuchMailboxError is raised.
    """
    Mailbox.__init__(self, path, factory, create)
    if not os.path.exists(self._path):
        if not create:
            raise NoSuchMailboxError(self._path)
        os.mkdir(self._path, 0o700)
        sequences_path = os.path.join(self._path, '.mh_sequences')
        # O_EXCL: fail rather than reuse a file someone else just made.
        fd = os.open(sequences_path,
                     os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0o600)
        os.close(fd)
    self._locked = False
815
def add(self, message):
    """Store message under the next free key and return that key.

    The new key is one more than the largest existing key, or 1 when the
    mailbox has no keys.
    """
    existing = self.keys()
    new_key = 1 if len(existing) == 0 else max(existing) + 1
    out = _create_carefully(os.path.join(self._path, str(new_key)))
    try:
        if self._locked:
            _lock_file(out)
        try:
            self._dump_message(message, out)
            if isinstance(message, MHMessage):
                self._dump_sequences(message, new_key)
        finally:
            if self._locked:
                _unlock_file(out)
    finally:
        _sync_close(out)
    return new_key
838
def remove(self, key):
    """Delete the file holding message key; KeyError if there is none."""
    target = os.path.join(self._path, str(key))
    try:
        handle = open(target, 'rb+')
    except IOError as e:
        if e.errno != errno.ENOENT:
            raise
        raise KeyError('No message with key: %s' % key)
    try:
        if self._locked:
            _lock_file(handle)
        try:
            # The handle is closed before the file is removed.
            handle.close()
            os.remove(target)
        finally:
            if self._locked:
                # NOTE(review): handle is already closed at this point;
                # confirm _unlock_file() tolerates a closed file.
                _unlock_file(handle)
    finally:
        handle.close()
860
def __setitem__(self, key, message):
    """Overwrite the file for key with message; KeyError if none exists."""
    target = os.path.join(self._path, str(key))
    try:
        handle = open(target, 'rb+')
    except IOError as e:
        if e.errno != errno.ENOENT:
            raise
        raise KeyError('No message with key: %s' % key)
    try:
        if self._locked:
            _lock_file(handle)
        try:
            # Truncate through a second, short-lived descriptor, then
            # write the new contents through the handle opened above.
            truncate_fd = os.open(target, os.O_WRONLY | os.O_TRUNC)
            os.close(truncate_fd)
            self._dump_message(message, handle)
            if isinstance(message, MHMessage):
                self._dump_sequences(message, key)
        finally:
            if self._locked:
                _unlock_file(handle)
    finally:
        _sync_close(handle)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000884
def get_message(self, key):
    """Return a Message representation or raise a KeyError.

    The message file is parsed into an MHMessage, and every sequence
    from get_sequences() whose key list contains `key` is added to it.

    Raises KeyError when no file exists for `key`; any other IOError
    from opening the file is re-raised unchanged.
    """
    path = os.path.join(self._path, str(key))
    try:
        # A locked mailbox opens the file read/write, otherwise read-only.
        if self._locked:
            f = open(path, 'r+')
        else:
            f = open(path, 'r')
    except IOError as e:
        if e.errno == errno.ENOENT:
            raise KeyError('No message with key: %s' % key)
        else:
            raise
    try:
        if self._locked:
            _lock_file(f)
        try:
            msg = MHMessage(f)
        finally:
            if self._locked:
                _unlock_file(f)
    finally:
        f.close()
    # get_sequences() returns a name -> key-list dictionary, so iterate
    # over its items; iterating the dict itself yields only the names.
    for name, key_list in self.get_sequences().items():
        if key in key_list:
            msg.add_sequence(name)
    return msg
911
def get_string(self, key):
    """Return a string representation or raise a KeyError.

    The whole message file is read and returned.  A missing file is
    reported as KeyError; other IOErrors are re-raised unchanged.
    """
    path = os.path.join(self._path, str(key))
    # A locked mailbox opens the file read/write, otherwise read-only.
    mode = 'r+' if self._locked else 'r'
    try:
        f = open(path, mode)
    except IOError as e:
        if e.errno != errno.ENOENT:
            raise
        raise KeyError('No message with key: %s' % key)
    try:
        if self._locked:
            _lock_file(f)
        try:
            content = f.read()
        finally:
            if self._locked:
                _unlock_file(f)
        return content
    finally:
        f.close()
934
def get_file(self, key):
    """Return a file-like representation or raise a KeyError.

    The message file is opened in binary read mode and handed to
    _ProxyFile.  A missing file is reported as KeyError; other IOErrors
    are re-raised unchanged.
    """
    path = os.path.join(self._path, str(key))
    try:
        f = open(path, 'rb')
    except IOError as e:
        if e.errno != errno.ENOENT:
            raise
        raise KeyError('No message with key: %s' % key)
    return _ProxyFile(f)
945
def iterkeys(self):
    """Return an iterator over keys.

    Keys are the all-digit entry names of the mailbox directory,
    converted to int and yielded in ascending order.
    """
    numeric = [int(name) for name in os.listdir(self._path)
               if name.isdigit()]
    numeric.sort()
    return iter(numeric)
950
def __contains__(self, key):
    """Return True if the keyed message exists, False otherwise.

    Existence is decided by whether a path named str(key) exists inside
    the mailbox directory.
    """
    candidate = os.path.join(self._path, str(key))
    return os.path.exists(candidate)
954
def __len__(self):
    """Return a count of messages in the mailbox."""
    # Count by iteration so that self.keys() may be any iterable.
    count = 0
    for _ in self.keys():
        count += 1
    return count
Thomas Wouters477c8d52006-05-27 19:21:47 +0000958
def lock(self):
    """Lock the mailbox.

    Does nothing when the mailbox is already locked.  Otherwise the
    '.mh_sequences' file is opened, locked with _lock_file() and kept
    in self._file.
    """
    if self._locked:
        return
    sequences_path = os.path.join(self._path, '.mh_sequences')
    self._file = open(sequences_path, 'rb+')
    _lock_file(self._file)
    self._locked = True
965
def unlock(self):
    """Unlock the mailbox if it is locked.

    Releases the lock on self._file, closes it via _sync_close() and
    drops the attribute.  Does nothing when the mailbox is not locked.
    """
    if not self._locked:
        return
    _unlock_file(self._file)
    _sync_close(self._file)
    del self._file
    self._locked = False
973
def flush(self):
    """Write any pending changes to the disk.

    This implementation performs no work and returns None.
    """
    pass
977
def close(self):
    """Flush and close the mailbox.

    The only action taken here is releasing the lock when one is held.
    """
    if not self._locked:
        return
    self.unlock()
982
def list_folders(self):
    """Return a list of folder names.

    A folder is any entry of the mailbox directory that is itself a
    directory; names are returned in os.listdir() order.
    """
    return [entry for entry in os.listdir(self._path)
            if os.path.isdir(os.path.join(self._path, entry))]
990
def get_folder(self, folder):
    """Return an MH instance for the named folder.

    The instance is built with create=False and shares this mailbox's
    message factory.
    """
    folder_path = os.path.join(self._path, folder)
    return MH(folder_path, factory=self._factory, create=False)
Thomas Wouters477c8d52006-05-27 19:21:47 +0000995
def add_folder(self, folder):
    """Create a folder and return an MH instance representing it.

    The instance is built with MH's default `create` argument and
    shares this mailbox's message factory.
    """
    folder_path = os.path.join(self._path, folder)
    return MH(folder_path, factory=self._factory)
Thomas Wouters477c8d52006-05-27 19:21:47 +00001000
def remove_folder(self, folder):
    """Delete the named folder, which must be empty.

    A folder counts as empty when it contains nothing, or nothing but
    its '.mh_sequences' file (which is then deleted as well).

    Raises NotEmptyError, naming the folder's path, when the folder
    holds anything else.
    """
    path = os.path.join(self._path, folder)
    entries = os.listdir(path)
    if entries == ['.mh_sequences']:
        os.remove(os.path.join(path, '.mh_sequences'))
    elif entries == []:
        pass
    else:
        # Report the folder that is not empty, not the parent mailbox.
        raise NotEmptyError('Folder not empty: %s' % path)
    os.rmdir(path)
1012
def get_sequences(self):
    """Return a name-to-key-list dictionary to define each sequence.

    Each line of '.mh_sequences' has the form 'name: spec spec ...',
    where a spec is a single number or an inclusive 'start-stop' range.
    Only keys present in self.keys() are kept, in ascending order, and
    a sequence left with no keys is omitted.

    Raises FormatError for a line that cannot be parsed.
    """
    results = {}
    with open(os.path.join(self._path, '.mh_sequences'), 'r') as f:
        all_keys = set(self.keys())
        for line in f:
            try:
                name, contents = line.split(':')
                listed = set()
                for spec in contents.split():
                    if spec.isdigit():
                        listed.add(int(spec))
                        continue
                    start, stop = (int(x) for x in spec.split('-'))
                    listed.update(range(start, stop + 1))
                surviving = sorted(listed.intersection(all_keys))
                if surviving:
                    results[name] = surviving
                else:
                    # An empty result also drops any earlier entry that
                    # was stored under the same name.
                    results.pop(name, None)
            except ValueError:
                raise FormatError('Invalid sequence specification: %s' %
                                  line.rstrip())
    return results
1039
def set_sequences(self, sequences):
    """Set sequences using the given name-to-key-list dictionary.

    '.mh_sequences' is emptied and rewritten with one line per
    non-empty sequence.  Runs of consecutive keys are collapsed into
    'first-last' ranges; duplicate keys are written once.
    """
    f = open(os.path.join(self._path, '.mh_sequences'), 'r+')
    try:
        # Empty the file through a second descriptor before rewriting it.
        os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
        for name, keys in sequences.items():
            if len(keys) == 0:
                continue
            f.write('%s:' % name)
            last = None
            in_run = False
            for key in sorted(set(keys)):
                if key - 1 == last:
                    # key extends a consecutive run; '-' is written only
                    # once, when the run starts.
                    if not in_run:
                        in_run = True
                        f.write('-')
                elif in_run:
                    # The run ended at `last`: close it, then start key.
                    in_run = False
                    f.write('%s %s' % (last, key))
                else:
                    f.write(' %s' % key)
                last = key
            # A run still open at the end needs its final key written.
            f.write((str(last) if in_run else '') + '\n')
    finally:
        _sync_close(f)
Thomas Wouters477c8d52006-05-27 19:21:47 +00001068
def pack(self):
    """Re-name messages to eliminate numbering gaps.  Invalidates keys.

    Message files are renamed so that keys become 1..N in their
    existing order, and the stored sequences are rewritten with the new
    keys when at least one message was renamed.
    """
    sequences = self.get_sequences()
    renames = []
    count = 0
    for count, key in enumerate(self.keys(), 1):
        if key == count:
            continue
        renames.append((key, count))
        source = os.path.join(self._path, str(key))
        target = os.path.join(self._path, str(count))
        if hasattr(os, 'link'):
            os.link(source, target)
            os.unlink(source)
        else:
            os.rename(source, target)
    self._next_key = count + 1
    if not renames:
        return
    for key_list in sequences.values():
        for old, new in renames:
            if old in key_list:
                key_list[key_list.index(old)] = new
    self.set_sequences(sequences)
1093
def _dump_sequences(self, message, key):
    """Inspect a new MHMessage and update sequences appropriately.

    After the call, `key` belongs to exactly the sequences named by
    message.get_sequences(): it is appended to those, removed from any
    other existing sequence, and missing sequences are created.
    """
    wanted = message.get_sequences()
    stored = self.get_sequences()
    for name, members in stored.items():
        if name in wanted:
            members.append(key)
        elif key in members:
            members.remove(key)
    for name in wanted:
        stored.setdefault(name, [key])
    self.set_sequences(stored)
1107
1108
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox."""

    # Labels with a reserved meaning; they are written before the ',,'
    # separator on a message's label line and are excluded from the
    # mailbox-level list of user-defined labels.
    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        # Maps message key -> list of labels for that message.
        self._labels = {}

    def add(self, message):
        """Add message and return assigned key."""
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The stored original headers and body form the BabylMessage; the
        stored visible headers and the labels recorded for `key` are
        attached to it.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = io.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or not line:
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        visible_headers = io.StringIO()
        while True:
            line = self._file.readline()
            if line == os.linesep or not line:
                break
            visible_headers.write(line.replace(os.linesep, '\n'))
        body = self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError.

        The result is the original headers followed by the body; the
        visible-headers section is skipped.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = io.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or not line:
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        # Skip over the visible headers up to the blank line ending them.
        while True:
            line = self._file.readline()
            if line == os.linesep or not line:
                break
        return original_headers.getvalue() + \
               self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return io.StringIO(self.get_string(key).replace('\n',
                                                        os.linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        # NOTE(review): presumably this ensures the table of contents (and
        # with it self._labels) is loaded -- confirm against _lookup().
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents.

        Scans the whole file for message delimiters and also rebuilds
        self._labels from each message's label line.
        """
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == '\037\014' + os.linesep:
                # Delimiter that ends one message and starts the next.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
                starts.append(next_pos)
                labels = [label.strip() for label
                                        in self._file.readline()[1:].split(',')
                                        if label.strip()]
                label_lists.append(labels)
            elif line == '\037' or line == '\037' + os.linesep:
                # Delimiter that only ends a message.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
            elif not line:
                stops.append(line_pos - len(os.linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        f.write('BABYL OPTIONS:%sVersion: 5%sLabels:%s%s\037' %
                (os.linesep, os.linesep, ','.join(self.get_labels()),
                 os.linesep))

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\014' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        The on-disk layout is: a label line, the original headers, the
        '*** EOOH ***' marker, the visible headers, then the body.
        `message` may be an email.message.Message (including
        BabylMessage), a string, or an object with readline(), read(),
        tell() and seek().  For anything but a BabylMessage the visible
        headers are a copy of the original headers.

        Raises TypeError for any other message type.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write('1')
            for label in special_labels:
                self._file.write(', ' + label)
            self._file.write(',,')
            for label in labels:
                self._file.write(' ' + label + ',')
            self._file.write(os.linesep)
        else:
            self._file.write('1,,' + os.linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = io.StringIO()
            orig_generator = email.generator.Generator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or not line:
                    break
            self._file.write('*** EOOH ***' + os.linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = io.StringIO()
                vis_generator = email.generator.Generator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # Rewind before reading back; after flatten() the buffer
                # position is at the end and readline() would return ''
                # at once, so no visible headers would be written.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or not line:
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or not line:
                        break
            while True:
                buffer = orig_buffer.read(4096) # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        elif isinstance(message, str):
            body_start = message.find('\n\n') + 2
            if body_start - 2 != -1:
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write('*** EOOH ***' + os.linesep)
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write(message[body_start:].replace('\n',
                                                              os.linesep))
            else:
                # No blank line found: the whole string is written after
                # an empty header section.
                self._file.write('*** EOOH ***' + os.linesep + os.linesep)
                self._file.write(message.replace('\n', os.linesep))
        elif hasattr(message, 'readline'):
            original_pos = message.tell()
            first_pass = True
            while True:
                line = message.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or not line:
                    if first_pass:
                        # The marker belongs only between the original
                        # headers (first pass) and the visible headers
                        # (second pass), so it is written exactly once.
                        first_pass = False
                        self._file.write('*** EOOH ***' + os.linesep)
                        message.seek(original_pos)
                    else:
                        break
            while True:
                buffer = message.read(4096)     # Buffer size is arbitrary.
                if not buffer:
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1328
1329
class Message(email.message.Message):
    """Message with mailbox-format-specific properties."""

    def __init__(self, message=None):
        """Initialize a Message instance.

        `message` may be None (empty message), an email.message.Message
        (deep-copied), a string, or an object with a read() method (both
        parsed by the email package).  Any other type raises TypeError.
        """
        if message is None:
            email.message.Message.__init__(self)
        elif isinstance(message, email.message.Message):
            self._become_message(copy.deepcopy(message))
            # A mailbox Message also hands over its format-specific state.
            if isinstance(message, Message):
                message._explain_to(self)
        elif isinstance(message, str):
            self._become_message(email.message_from_string(message))
        elif hasattr(message, "read"):
            self._become_message(email.message_from_file(message))
        else:
            raise TypeError('Invalid message type: %s' % type(message))

    def _become_message(self, message):
        """Assume the non-format-specific state of message."""
        shared_state = ('_headers', '_unixfrom', '_payload', '_charset',
                        'preamble', 'epilogue', 'defects', '_default_type')
        source = message.__dict__
        for name in shared_state:
            self.__dict__[name] = source[name]

    def _explain_to(self, message):
        """Copy format-specific state to message insofar as possible."""
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
        # There's nothing format-specific to explain.
        return
1360
1361
class MaildirMessage(Message):
    """Message with Maildir-specific properties."""

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance.

        Defaults (subdir 'new', empty info, current time as date) are
        set before the base initializer runs.
        """
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set subdir to 'new' or 'cur'."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return as a string the flags that are set."""
        # Flags are only defined when the info string starts with '2,'.
        if not self._info.startswith('2,'):
            return ''
        return self._info[2:]

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        self._info = '2,' + ''.join(sorted(flags))

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        current = self.get_flags()
        if current:
            self.set_flags(''.join(set(current) - set(flag)))

    def get_date(self):
        """Return delivery date of message, in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set delivery date of message, in seconds since the epoch."""
        try:
            self._date = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)

    def get_info(self):
        """Get the message's "info" as a string."""
        return self._info

    def set_info(self, info):
        """Set the message's "info" string."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Copy Maildir-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
        elif isinstance(message, _mboxMMDFMessage):
            flags = set(self.get_flags())
            if 'S' in flags:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            # Remaining Maildir flag -> mbox/MMDF flag translations.
            for maildir_flag, mbox_flag in (('T', 'D'), ('F', 'F'),
                                            ('R', 'A')):
                if maildir_flag in flags:
                    message.add_flag(mbox_flag)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_sequence('unseen')
            for maildir_flag, sequence in (('R', 'replied'),
                                           ('F', 'flagged')):
                if maildir_flag in flags:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_label('unseen')
            for maildir_flag, label in (('T', 'deleted'), ('R', 'answered'),
                                        ('P', 'forwarded')):
                if maildir_flag in flags:
                    message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1467
1468
class _mboxMMDFMessage(Message):
    """Message with mbox- or MMDF-specific properties."""

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance.

        The "From " line defaults to 'MAILER-DAEMON' plus the current
        time; it is taken from the source message's unixfrom when that
        starts with 'From '.
        """
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            unixfrom = message.get_unixfrom()
            if unixfrom is not None and unixfrom.startswith('From '):
                self.set_from(unixfrom[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return contents of "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set "From " line, formatting and appending time_ if specified."""
        if time_ is not None:
            # True means "use the current time" (as UTC).
            stamp = time.gmtime() if time_ is True else time_
            from_ += ' ' + time.asctime(stamp)
        self._from = from_

    def get_flags(self):
        """Return as a string the flags that are set."""
        return self.get('Status', '') + self.get('X-Status', '')

    def set_flags(self, flags):
        """Set the given flags and unset all others.

        'R' and 'O' go into the Status header; 'D', 'F', 'A' and then
        any other flags (sorted) go into X-Status.
        """
        remaining = set(flags)
        status_flags = ''.join(c for c in ('R', 'O') if c in remaining)
        xstatus_flags = ''.join(c for c in ('D', 'F', 'A') if c in remaining)
        remaining.difference_update(('R', 'O', 'D', 'F', 'A'))
        xstatus_flags += ''.join(sorted(remaining))
        for header, value in (('Status', status_flags),
                              ('X-Status', xstatus_flags)):
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        if 'Status' in self or 'X-Status' in self:
            kept = set(self.get_flags()) - set(flag)
            self.set_flags(''.join(kept))

    def _explain_to(self, message):
        """Copy mbox- or MMDF-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            flags = set(self.get_flags())
            if 'O' in flags:
                message.set_subdir('cur')
            for mbox_flag, maildir_flag in (('F', 'F'), ('A', 'R'),
                                            ('R', 'S'), ('D', 'T')):
                if mbox_flag in flags:
                    message.add_flag(maildir_flag)
            del message['status']
            del message['x-status']
            # The last five fields of the "From " line may hold a date.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
        elif isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_sequence('unseen')
            for mbox_flag, sequence in (('A', 'replied'), ('F', 'flagged')):
                if mbox_flag in flags:
                    message.add_sequence(sequence)
            del message['status']
            del message['x-status']
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_label('unseen')
            for mbox_flag, label in (('D', 'deleted'), ('A', 'answered')):
                if mbox_flag in flags:
                    message.add_label(label)
            del message['status']
            del message['x-status']
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1578
1579
class mboxMessage(_mboxMMDFMessage):
    """Message with mbox-specific properties.

    All behaviour is inherited from _mboxMMDFMessage; this class adds
    nothing of its own.
    """
1582
1583
class MHMessage(Message):
    """Message with MH-specific properties."""

    def __init__(self, message=None):
        """Initialize an MHMessage instance."""
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a list of sequences that include the message."""
        # A copy, so callers cannot alter the internal list.
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Set the list of sequences that include the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence to list of sequences including the message."""
        if not isinstance(sequence, str):
            raise TypeError('sequence must be a string: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove sequence from the list of sequences including the message."""
        if sequence in self._sequences:
            self._sequences.remove(sequence)

    def _explain_to(self, message):
        """Copy MH-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            sequences = set(self.get_sequences())
            # The subdir becomes 'cur' whether or not the message is unseen.
            message.set_subdir('cur')
            if 'unseen' not in sequences:
                message.add_flag('S')
            if 'flagged' in sequences:
                message.add_flag('F')
            if 'replied' in sequences:
                message.add_flag('R')
        elif isinstance(message, _mboxMMDFMessage):
            sequences = set(self.get_sequences())
            message.add_flag('O' if 'unseen' in sequences else 'RO')
            if 'flagged' in sequences:
                message.add_flag('F')
            if 'replied' in sequences:
                message.add_flag('A')
        elif isinstance(message, MHMessage):
            for sequence in self.get_sequences():
                message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            sequences = set(self.get_sequences())
            for sequence, label in (('unseen', 'unseen'),
                                    ('replied', 'answered')):
                if sequence in sequences:
                    message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1652
1653
class BabylMessage(Message):
    """Message with Babyl-specific properties."""

    def __init__(self, message=None):
        """Initialize an BabylMessage instance."""
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a list of labels on the message."""
        # A copy, so callers cannot alter the internal list.
        return list(self._labels)

    def set_labels(self, labels):
        """Set the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label to list of labels on the message."""
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove label from the list of labels on the message."""
        if label in self._labels:
            self._labels.remove(label)

    def get_visible(self):
        """Return a Message representation of visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Set the Message representation of visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Update and/or sensibly generate a set of visible headers.

        Visible headers that still exist on the message are refreshed
        from it, others are dropped, and a fixed set of common headers
        is added when present on the message but not yet visible.
        """
        visible = self._visible
        for header in visible.keys():
            if header in self:
                visible.replace_header(header, self[header])
            else:
                del visible[header]
        for header in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if header in self and header not in visible:
                visible[header] = self[header]

    def _explain_to(self, message):
        """Copy Babyl-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            labels = set(self.get_labels())
            # The subdir becomes 'cur' whether or not the message is unseen.
            message.set_subdir('cur')
            if 'unseen' not in labels:
                message.add_flag('S')
            if 'forwarded' in labels or 'resent' in labels:
                message.add_flag('P')
            if 'answered' in labels:
                message.add_flag('R')
            if 'deleted' in labels:
                message.add_flag('T')
        elif isinstance(message, _mboxMMDFMessage):
            labels = set(self.get_labels())
            message.add_flag('O' if 'unseen' in labels else 'RO')
            if 'deleted' in labels:
                message.add_flag('D')
            if 'answered' in labels:
                message.add_flag('A')
        elif isinstance(message, MHMessage):
            labels = set(self.get_labels())
            for label, sequence in (('unseen', 'unseen'),
                                    ('answered', 'replied')):
                if label in labels:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1745
1746
class MMDFMessage(_mboxMMDFMessage):
    """Message with MMDF-specific properties.

    All behaviour is inherited from _mboxMMDFMessage; this class adds
    nothing of its own.
    """
1749
1750
1751class _ProxyFile:
1752 """A read-only wrapper of a file."""
1753
1754 def __init__(self, f, pos=None):
1755 """Initialize a _ProxyFile."""
1756 self._file = f
1757 if pos is None:
1758 self._pos = f.tell()
1759 else:
1760 self._pos = pos
1761
1762 def read(self, size=None):
1763 """Read bytes."""
Guido van Rossumd4eda822007-07-21 00:21:26 +00001764 return str(self._read(size, self._file.read))
Thomas Wouters477c8d52006-05-27 19:21:47 +00001765
1766 def readline(self, size=None):
1767 """Read a line."""
Guido van Rossumd4eda822007-07-21 00:21:26 +00001768 return str(self._read(size, self._file.readline))
Thomas Wouters477c8d52006-05-27 19:21:47 +00001769
1770 def readlines(self, sizehint=None):
1771 """Read multiple lines."""
1772 result = []
1773 for line in self:
1774 result.append(line)
1775 if sizehint is not None:
1776 sizehint -= len(line)
1777 if sizehint <= 0:
1778 break
1779 return result
1780
1781 def __iter__(self):
1782 """Iterate over lines."""
Guido van Rossum7cad4f32007-06-07 23:58:54 +00001783 while True:
1784 line = self.readline()
1785 if not line:
1786 raise StopIteration
1787 yield line
Thomas Wouters477c8d52006-05-27 19:21:47 +00001788
1789 def tell(self):
1790 """Return the position."""
1791 return self._pos
1792
1793 def seek(self, offset, whence=0):
1794 """Change position."""
1795 if whence == 1:
1796 self._file.seek(self._pos)
1797 self._file.seek(offset, whence)
1798 self._pos = self._file.tell()
1799
1800 def close(self):
1801 """Close the file."""
1802 del self._file
1803
1804 def _read(self, size, read_method):
1805 """Read size bytes using read_method."""
1806 if size is None:
1807 size = -1
1808 self._file.seek(self._pos)
1809 result = read_method(size)
1810 self._pos = self._file.tell()
1811 return result
1812
1813
class _PartialFile(_ProxyFile):
    """A read-only wrapper exposing only the [start, stop) span of a file."""

    def __init__(self, f, start=None, stop=None):
        """Wrap f, positioned at start and bounded by start and stop."""
        _ProxyFile.__init__(self, f, start)
        self._stop = stop
        self._start = start

    def tell(self):
        """Return the position measured from start."""
        absolute = _ProxyFile.tell(self)
        return absolute - self._start

    def seek(self, offset, whence=0):
        """Move the position; whence 0 and 2 are relative to start and stop."""
        if whence in (0, 2):
            # Re-base on the window edge, then let the parent perform an
            # ordinary relative seek from there.
            self._pos = self._start if whence == 0 else self._stop
            whence = 1
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read via read_method without ever going past stop."""
        available = self._stop - self._pos
        if available <= 0:
            return ''
        unbounded = size is None or size < 0
        if unbounded or size > available:
            size = available
        return _ProxyFile._read(self, size, read_method)
1845
1846
def _lock_file(f, dotlock=True):
    """Lock file f using lockf and dot locking.

    When the fcntl module is available, a non-blocking exclusive lockf()
    lock is taken on f first.  If dotlock is true, a dot lock file named
    f.name + '.lock' is then created by way of a uniquely named temporary
    file that is linked (or, without os.link, renamed) into place.

    Raises ExternalClashError if the lockf() lock or the dot lock is
    already held.  If the temporary file cannot be created for lack of
    write access or because the file system is read-only, dot locking is
    skipped and the function returns normally.  On any failure, locks
    acquired so far are released before the exception propagates.
    """
    dotlock_done = False
    try:
        if fcntl:
            try:
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except IOError as e:
                if e.errno in (errno.EAGAIN, errno.EACCES):
                    raise ExternalClashError('lockf: lock unavailable: %s' %
                                             f.name)
                else:
                    raise
        if dotlock:
            lock_path = f.name + '.lock'
            try:
                pre_lock = _create_temporary(lock_path)
                pre_lock.close()
            except (IOError, OSError) as e:
                # The creation goes through os.open(), which reports
                # failures as OSError; where IOError is a distinct class,
                # catching only IOError would miss the permission error.
                if e.errno in (errno.EACCES, errno.EROFS):
                    return  # Without write access, just skip dotlocking.
                else:
                    raise
            try:
                if hasattr(os, 'link'):
                    # link() fails if the target exists, which is what
                    # makes taking the dot lock atomic.
                    os.link(pre_lock.name, lock_path)
                    dotlock_done = True
                    os.unlink(pre_lock.name)
                else:
                    os.rename(pre_lock.name, lock_path)
                    dotlock_done = True
            except OSError as e:
                if e.errno == errno.EEXIST or \
                   (os.name == 'os2' and e.errno == errno.EACCES):
                    os.remove(pre_lock.name)
                    raise ExternalClashError('dot lock unavailable: %s' %
                                             f.name)
                else:
                    raise
    except:
        # Deliberately bare: whatever went wrong, undo the locking done so
        # far and let the original exception continue.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if dotlock_done:
            os.remove(f.name + '.lock')
        raise
1891
1892def _unlock_file(f):
Thomas Wouters0e3f5912006-08-11 14:57:12 +00001893 """Unlock file f using lockf and dot locking."""
Thomas Wouters477c8d52006-05-27 19:21:47 +00001894 if fcntl:
1895 fcntl.lockf(f, fcntl.LOCK_UN)
Thomas Wouters477c8d52006-05-27 19:21:47 +00001896 if os.path.exists(f.name + '.lock'):
1897 os.remove(f.name + '.lock')
1898
1899def _create_carefully(path):
1900 """Create a file if it doesn't exist and open for reading and writing."""
1901 fd = os.open(path, os.O_CREAT | os.O_EXCL | os.O_RDWR)
1902 try:
Guido van Rossumd4eda822007-07-21 00:21:26 +00001903 return open(path, 'r+')
Thomas Wouters477c8d52006-05-27 19:21:47 +00001904 finally:
1905 os.close(fd)
1906
def _create_temporary(path):
    """Create and open a new read/write file whose name is derived from path.

    The name is path followed by the current time in whole seconds, the
    host name and the process id, separated by dots.
    """
    uniquifier = (int(time.time()), socket.gethostname(), os.getpid())
    return _create_carefully('%s.%s.%s.%s' % ((path,) + uniquifier))
1912
Thomas Wouters89f507f2006-12-13 04:49:30 +00001913def _sync_flush(f):
1914 """Ensure changes to file f are physically on disk."""
1915 f.flush()
Thomas Wouters902d6eb2007-01-09 23:18:33 +00001916 if hasattr(os, 'fsync'):
1917 os.fsync(f.fileno())
Thomas Wouters89f507f2006-12-13 04:49:30 +00001918
def _sync_close(f):
    """Sync f through _sync_flush() and then close it."""
    _sync_flush(f)
    f.close()
Thomas Wouters477c8d52006-05-27 19:21:47 +00001923
1924## Start: classes from the original module (for backward compatibility).
1925
1926# Note that the Maildir class, whose name is unchanged, itself offers a next()
1927# method for backward compatibility.
Skip Montanaro17ab1232001-01-24 06:27:27 +00001928
class _Mailbox:
    """Base for the old-style, single-file mailbox readers.

    Subclasses provide _search_start() and _search_end(), which position
    self.fp at the beginning and at the end of the next message.
    """

    def __init__(self, fp, factory=rfc822.Message):
        """Remember the open file fp and the message factory."""
        self.fp = fp
        self.factory = factory
        # Offset in fp at which the search for the next message resumes.
        self.seekp = 0

    def __iter__(self):
        """Iterate by calling next() until it returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the next message built by the factory, or None at the end.

        Messages whose start and end positions coincide are skipped.
        """
        while True:
            self.fp.seek(self.seekp)
            try:
                self._search_start()
            except EOFError:
                self.seekp = self.fp.tell()
                return None
            start = self.fp.tell()
            self._search_end()
            stop = self.fp.tell()
            self.seekp = stop
            if start != stop:
                return self.factory(_PartialFile(self.fp, start, stop))
Guido van Rossumc7b68821994-04-28 09:53:33 +00001953
Barry Warsawffd05ee2002-03-01 22:39:14 +00001954# Recommended to use PortableUnixMailbox instead!
class UnixMailbox(_Mailbox):
    """Old-style reader that splits a file into messages at 'From ' lines."""

    def _search_start(self):
        """Position fp at the next accepted From_ line; EOFError if none."""
        while True:
            here = self.fp.tell()
            line = self.fp.readline()
            if not line:
                raise EOFError
            if line[:5] != 'From ':
                continue
            if self._isrealfromline(line):
                self.fp.seek(here)
                return

    def _search_end(self):
        """Position fp at the From_ line of the following message, or EOF."""
        self.fp.readline()      # Throw away header line
        while True:
            here = self.fp.tell()
            line = self.fp.readline()
            if not line:
                return
            if line[:5] != 'From ':
                continue
            if self._isrealfromline(line):
                self.fp.seek(here)
                return

    # An overridable mechanism to test for From-line-ness.  You can either
    # specify a different regular expression or define a whole new
    # _isrealfromline() method.  Note that this only gets called for lines
    # starting with the 5 characters "From ".
    #
    # BAW: According to
    #http://home.netscape.com/eng/mozilla/2.0/relnotes/demo/content-length.html
    # the only portable, reliable way to find message delimiters in a BSD
    # (i.e. Unix mailbox) style folder is to search for "\n\nFrom .*\n", or,
    # at the beginning of the file, "^From .*\n".  While _fromlinepattern
    # below seems like a good idea, in practice there are too many
    # variations for stricter parsing of the line to be completely accurate.
    #
    # _strict_isrealfromline() is the old version, which tries to do
    # stricter parsing of the From_ line.  _portable_isrealfromline() simply
    # returns true, since it is never called unless the line already starts
    # with "From ".
    #
    # This algorithm, and the way it interacts with _search_start() and
    # _search_end(), may not be completely correct, because it does not
    # check that the two characters preceding "From " are \n\n or the
    # beginning of the file.  Fixing this would require a more extensive
    # rewrite than is necessary.  For convenience, we've added a
    # PortableUnixMailbox class which does no checking of the format of the
    # 'From' line.

    _fromlinepattern = (r"From \s*[^\s]+\s+\w\w\w\s+\w\w\w\s+\d?\d\s+"
                        r"\d?\d:\d\d(:\d\d)?(\s+[^\s]+)?\s+\d\d\d\d\s*"
                        r"[^\s]*\s*"
                        "$")
    _regexp = None

    def _strict_isrealfromline(self, line):
        """Match line against _fromlinepattern, compiling it on first use."""
        compiled = self._regexp
        if not compiled:
            import re
            compiled = self._regexp = re.compile(self._fromlinepattern)
        return compiled.match(line)

    def _portable_isrealfromline(self, line):
        """Accept every line handed in."""
        return True

    _isrealfromline = _strict_isrealfromline
2019
2020
class PortableUnixMailbox(UnixMailbox):
    """UnixMailbox variant that accepts every line starting with 'From '."""

    _isrealfromline = UnixMailbox._portable_isrealfromline
2023
Guido van Rossumfbe63de1998-04-03 16:04:05 +00002024
class MmdfMailbox(_Mailbox):
    """Old-style reader for files whose messages are fenced by ^A^A^A^A lines."""

    def _search_start(self):
        """Read past the next delimiter line; raise EOFError if none is left."""
        line = self.fp.readline()
        while line:
            if line[:5] == '\001\001\001\001\n':
                return
            line = self.fp.readline()
        raise EOFError

    def _search_end(self):
        """Stop in front of the next delimiter line, or at end of file."""
        while True:
            mark = self.fp.tell()
            line = self.fp.readline()
            if not line:
                break
            if line == '\001\001\001\001\n':
                # Leave the delimiter unread so it is not part of the message.
                self.fp.seek(mark)
                break
Guido van Rossumc7b68821994-04-28 09:53:33 +00002044
Guido van Rossumc7b68821994-04-28 09:53:33 +00002045
class MHMailbox:
    """Old-style reader for a directory holding one numbered file per message."""

    def __init__(self, dirname, factory=rfc822.Message):
        """Collect the message files found in dirname.

        Only directory entries whose names are positive decimal numbers
        without leading zeros are considered.  factory is called with the
        open file of each message when it is retrieved.
        """
        import re
        pat = re.compile('^[1-9][0-9]*$')
        self.dirname = dirname
        # Sort numerically rather than lexically.  sorted() and the list
        # comprehension give real lists even where filter() and map()
        # return iterators, and avoid shadowing the builtin ``list``.
        numbers = sorted(int(name) for name in os.listdir(self.dirname)
                         if pat.match(name))
        # Kept in descending order so that next() can pop() the lowest
        # remaining number off the end.
        self.boxes = [str(number) for number in reversed(numbers)]
        self.factory = factory

    def __iter__(self):
        """Iterate by calling next() until it returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the message with the lowest remaining number, or None.

        The message file is opened and handed to the factory; it is not
        closed here.  The file name is stored on the result as _mh_msgno
        when the object accepts the attribute.
        """
        if not self.boxes:
            return None
        fn = self.boxes.pop()
        fp = open(os.path.join(self.dirname, fn))
        msg = self.factory(fp)
        try:
            msg._mh_msgno = fn
        except (AttributeError, TypeError):
            # Not every factory result allows new attributes; the number
            # is only a convenience, so carry on without it.
            pass
        return msg
Guido van Rossum8ca84201998-03-26 20:56:10 +00002078
Guido van Rossum9a4d6371998-12-23 22:05:42 +00002079
class BabylMailbox(_Mailbox):
    """Old-style reader for Babyl files."""

    def _search_start(self):
        """Read past the next '*** EOOH ***' line; EOFError if none is left."""
        line = self.fp.readline()
        while line:
            if line == '*** EOOH ***\n':
                return
            line = self.fp.readline()
        raise EOFError

    def _search_end(self):
        """Stop in front of the next message terminator, or at end of file."""
        while True:
            mark = self.fp.tell()
            line = self.fp.readline()
            if not line:
                break
            if line == '\037\014\n' or line == '\037':
                # Rewind so the terminator stays outside the message.
                self.fp.seek(mark)
                break
Guido van Rossumfdf58fe1997-05-15 14:33:09 +00002099
Thomas Wouters477c8d52006-05-27 19:21:47 +00002100## End: classes from the original module (for backward compatibility).
Guido van Rossum62448671996-09-17 21:33:15 +00002101
2102
class Error(Exception):
    """Base class for the errors specific to this module."""
2105
class NoSuchMailboxError(Error):
    """Raised when the requested mailbox is missing and will not be created."""
2108
class NotEmptyError(Error):
    """Raised when deletion is requested for a mailbox that still has content."""
2111
class ExternalClashError(Error):
    """Raised when an action fails because of another process."""
2114
class FormatError(Error):
    """Raised when a file does not appear to have a valid format."""