blob: c6b0fa00e3c13087f27b72c83c299e05878d200c [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum62448671996-09-17 21:33:15 +00002
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
# Notes for authors of new mailbox subclasses:
#
# Remember to fsync() changes to disk before closing a modified file
# or returning from a flush() method.  See functions _sync_flush() and
# _sync_close().
10
Martin v. Löwis08041d52006-05-04 14:27:52 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000013import time
14import calendar
15import socket
16import errno
17import copy
18import email
19import email.Message
20import email.Generator
21import rfc822
22import StringIO
23try:
Andrew MacIntyreafa358f2006-07-23 13:04:00 +000024 if sys.platform == 'os2emx':
25 # OS/2 EMX fcntl() not adequate
26 raise ImportError
Andrew M. Kuchlinga7ee9eb2006-06-26 13:08:24 +000027 import fcntl
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000028except ImportError:
29 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000030
# Names exported by a star-import of this module.
__all__ = [
    'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
    'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
    'BabylMessage', 'MMDFMessage', 'UnixMailbox',
    'PortableUnixMailbox', 'MmdfMailbox', 'MHMailbox', 'BabylMailbox',
]
35
class Mailbox:
    """A group of messages in a particular place.

    This base class implements the dictionary-style operations that can
    be expressed in terms of a few primitives.  The primitives themselves
    (add, remove, __setitem__, get_message, get_string, get_file,
    iterkeys, has_key, __len__, flush, lock, unlock and close) raise
    NotImplementedError here and must be supplied by subclasses.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded and made absolute before it is stored.
        factory, if true, is called by __getitem__() with the result of
        get_file() to build the returned message.  create is accepted
        for the benefit of subclasses; it is not used here.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Remove the keyed message; equivalent to remove(key)."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist.

        Without a factory the result of get_message() is returned;
        otherwise the factory is applied to the result of get_file().
        """
        if not self._factory:
            return self.get_message(key)
        else:
            return self._factory(self.get_file(key))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages.

        Keys whose message has disappeared by the time it is fetched
        (KeyError) are silently skipped.
        """
        for key in self.iterkeys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield value

    def __iter__(self):
        """Iterate over messages (not keys); see itervalues()."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples.

        Keys whose message has disappeared by the time it is fetched
        (KeyError) are silently skipped.
        """
        for key in self.iterkeys():
            try:
                value = self[key]
            except KeyError:
                continue
            yield (key, value)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def has_key(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __contains__(self, key):
        """Support "key in mailbox"; equivalent to has_key(key)."""
        return self.has_key(key)

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        # Take a snapshot of the keys first: discarding while walking a
        # live iterkeys() iterator breaks for subclasses whose iterator
        # is backed directly by the container being modified.
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            result = self[key]
        except KeyError:
            return default
        self.discard(key)
        return result

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError if the mailbox holds no messages.
        """
        for key in self.iterkeys():
            return (key, self.pop(key))     # This is only run once.
        else:
            raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be a mapping (anything with iteritems() or items()) or
        an iterable of (key, message) pairs.  Calling update() with no
        argument does nothing.  Every pair is attempted; if any key did
        not exist, a single KeyError is raised after the loop finishes.
        """
        if arg is None:
            # Nothing to apply; iterating None would raise TypeError.
            return
        if hasattr(arg, 'iteritems'):
            source = arg.iteritems()
        elif hasattr(arg, 'items'):
            source = arg.items()
        else:
            source = arg
        bad_key = False
        for key, message in source:
            try:
                self[key] = message
            except KeyError:
                bad_key = True
        if bad_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _dump_message(self, message, target, mangle_from_=False):
        """Dump message contents to target file.

        message may be an email.Message.Message, a string, or an object
        with a readline() method (tested via its 'read' attribute).  When
        mangle_from_ is true, lines beginning with 'From ' are written as
        '>From '.  Raises TypeError for any other kind of message.
        """
        # Most files are opened in binary mode to allow predictable seeking.
        # To get native line endings on disk, the user-friendly \n line
        # endings used in strings and by email.Message are translated here.
        if isinstance(message, email.Message.Message):
            flattened = StringIO.StringIO()
            gen = email.Generator.Generator(flattened, mangle_from_, 0)
            gen.flatten(message)
            flattened.seek(0)
            target.write(flattened.read().replace('\n', os.linesep))
        elif isinstance(message, str):
            if mangle_from_:
                message = message.replace('\nFrom ', '\n>From ')
            message = message.replace('\n', os.linesep)
            target.write(message)
        elif hasattr(message, 'read'):
            while True:
                line = message.readline()
                if line == '':
                    break
                if mangle_from_ and line.startswith('From '):
                    line = '>From ' + line[5:]
                line = line.replace('\n', os.linesep)
                target.write(line)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
221
222
223class Maildir(Mailbox):
224 """A qmail-style Maildir mailbox."""
225
226 colon = ':'
227
228 def __init__(self, dirname, factory=rfc822.Message, create=True):
229 """Initialize a Maildir instance."""
230 Mailbox.__init__(self, dirname, factory, create)
231 if not os.path.exists(self._path):
232 if create:
233 os.mkdir(self._path, 0700)
234 os.mkdir(os.path.join(self._path, 'tmp'), 0700)
235 os.mkdir(os.path.join(self._path, 'new'), 0700)
236 os.mkdir(os.path.join(self._path, 'cur'), 0700)
237 else:
238 raise NoSuchMailboxError(self._path)
239 self._toc = {}
240
241 def add(self, message):
242 """Add message and return assigned key."""
243 tmp_file = self._create_tmp()
244 try:
245 self._dump_message(message, tmp_file)
246 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000247 _sync_close(tmp_file)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000248 if isinstance(message, MaildirMessage):
249 subdir = message.get_subdir()
250 suffix = self.colon + message.get_info()
251 if suffix == self.colon:
252 suffix = ''
253 else:
254 subdir = 'new'
255 suffix = ''
256 uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
257 dest = os.path.join(self._path, subdir, uniq + suffix)
Andrew M. Kuchling978d8282006-11-09 21:16:46 +0000258 try:
259 if hasattr(os, 'link'):
260 os.link(tmp_file.name, dest)
261 os.remove(tmp_file.name)
262 else:
263 os.rename(tmp_file.name, dest)
264 except OSError, e:
265 os.remove(tmp_file.name)
266 if e.errno == errno.EEXIST:
267 raise ExternalClashError('Name clash with existing message: %s'
268 % dest)
269 else:
270 raise
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000271 if isinstance(message, MaildirMessage):
272 os.utime(dest, (os.path.getatime(dest), message.get_date()))
273 return uniq
274
275 def remove(self, key):
276 """Remove the keyed message; raise KeyError if it doesn't exist."""
277 os.remove(os.path.join(self._path, self._lookup(key)))
278
279 def discard(self, key):
280 """If the keyed message exists, remove it."""
281 # This overrides an inapplicable implementation in the superclass.
282 try:
283 self.remove(key)
284 except KeyError:
285 pass
286 except OSError, e:
Martin v. Löwis08041d52006-05-04 14:27:52 +0000287 if e.errno != errno.ENOENT:
Tim Peters6d7cd7d2006-04-22 05:52:59 +0000288 raise
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000289
290 def __setitem__(self, key, message):
291 """Replace the keyed message; raise KeyError if it doesn't exist."""
292 old_subpath = self._lookup(key)
293 temp_key = self.add(message)
294 temp_subpath = self._lookup(temp_key)
295 if isinstance(message, MaildirMessage):
296 # temp's subdir and suffix were specified by message.
297 dominant_subpath = temp_subpath
298 else:
299 # temp's subdir and suffix were defaults from add().
300 dominant_subpath = old_subpath
301 subdir = os.path.dirname(dominant_subpath)
302 if self.colon in dominant_subpath:
303 suffix = self.colon + dominant_subpath.split(self.colon)[-1]
304 else:
305 suffix = ''
306 self.discard(key)
307 new_path = os.path.join(self._path, subdir, key + suffix)
308 os.rename(os.path.join(self._path, temp_subpath), new_path)
309 if isinstance(message, MaildirMessage):
310 os.utime(new_path, (os.path.getatime(new_path),
311 message.get_date()))
312
313 def get_message(self, key):
314 """Return a Message representation or raise a KeyError."""
315 subpath = self._lookup(key)
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000316 f = open(os.path.join(self._path, subpath), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000317 try:
318 msg = MaildirMessage(f)
319 finally:
320 f.close()
321 subdir, name = os.path.split(subpath)
322 msg.set_subdir(subdir)
323 if self.colon in name:
324 msg.set_info(name.split(self.colon)[-1])
325 msg.set_date(os.path.getmtime(os.path.join(self._path, subpath)))
326 return msg
327
328 def get_string(self, key):
329 """Return a string representation or raise a KeyError."""
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000330 f = open(os.path.join(self._path, self._lookup(key)), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000331 try:
332 return f.read()
333 finally:
334 f.close()
335
336 def get_file(self, key):
337 """Return a file-like representation or raise a KeyError."""
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000338 f = open(os.path.join(self._path, self._lookup(key)), 'rb')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000339 return _ProxyFile(f)
340
341 def iterkeys(self):
342 """Return an iterator over keys."""
343 self._refresh()
344 for key in self._toc:
345 try:
346 self._lookup(key)
347 except KeyError:
348 continue
349 yield key
350
351 def has_key(self, key):
352 """Return True if the keyed message exists, False otherwise."""
353 self._refresh()
354 return key in self._toc
355
356 def __len__(self):
357 """Return a count of messages in the mailbox."""
358 self._refresh()
359 return len(self._toc)
360
361 def flush(self):
362 """Write any pending changes to disk."""
363 return # Maildir changes are always written immediately.
364
365 def lock(self):
366 """Lock the mailbox."""
367 return
368
369 def unlock(self):
370 """Unlock the mailbox if it is locked."""
371 return
372
373 def close(self):
374 """Flush and close the mailbox."""
375 return
376
377 def list_folders(self):
378 """Return a list of folder names."""
379 result = []
380 for entry in os.listdir(self._path):
381 if len(entry) > 1 and entry[0] == '.' and \
382 os.path.isdir(os.path.join(self._path, entry)):
383 result.append(entry[1:])
384 return result
385
386 def get_folder(self, folder):
387 """Return a Maildir instance for the named folder."""
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +0000388 return Maildir(os.path.join(self._path, '.' + folder),
389 factory=self._factory,
390 create=False)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000391
392 def add_folder(self, folder):
393 """Create a folder and return a Maildir instance representing it."""
394 path = os.path.join(self._path, '.' + folder)
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +0000395 result = Maildir(path, factory=self._factory)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000396 maildirfolder_path = os.path.join(path, 'maildirfolder')
397 if not os.path.exists(maildirfolder_path):
398 os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY))
399 return result
400
401 def remove_folder(self, folder):
402 """Delete the named folder, which must be empty."""
403 path = os.path.join(self._path, '.' + folder)
404 for entry in os.listdir(os.path.join(path, 'new')) + \
405 os.listdir(os.path.join(path, 'cur')):
406 if len(entry) < 1 or entry[0] != '.':
407 raise NotEmptyError('Folder contains message(s): %s' % folder)
408 for entry in os.listdir(path):
409 if entry != 'new' and entry != 'cur' and entry != 'tmp' and \
410 os.path.isdir(os.path.join(path, entry)):
411 raise NotEmptyError("Folder contains subdirectory '%s': %s" %
412 (folder, entry))
413 for root, dirs, files in os.walk(path, topdown=False):
414 for entry in files:
415 os.remove(os.path.join(root, entry))
416 for entry in dirs:
417 os.rmdir(os.path.join(root, entry))
418 os.rmdir(path)
419
420 def clean(self):
421 """Delete old files in "tmp"."""
422 now = time.time()
423 for entry in os.listdir(os.path.join(self._path, 'tmp')):
424 path = os.path.join(self._path, 'tmp', entry)
425 if now - os.path.getatime(path) > 129600: # 60 * 60 * 36
426 os.remove(path)
427
428 _count = 1 # This is used to generate unique file names.
429
430 def _create_tmp(self):
431 """Create a file in the tmp subdirectory and open and return it."""
432 now = time.time()
433 hostname = socket.gethostname()
434 if '/' in hostname:
435 hostname = hostname.replace('/', r'\057')
436 if ':' in hostname:
437 hostname = hostname.replace(':', r'\072')
438 uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
439 Maildir._count, hostname)
440 path = os.path.join(self._path, 'tmp', uniq)
441 try:
442 os.stat(path)
443 except OSError, e:
444 if e.errno == errno.ENOENT:
445 Maildir._count += 1
Andrew M. Kuchling978d8282006-11-09 21:16:46 +0000446 try:
447 return _create_carefully(path)
448 except OSError, e:
449 if e.errno != errno.EEXIST:
450 raise
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000451 else:
452 raise
Andrew M. Kuchling978d8282006-11-09 21:16:46 +0000453
454 # Fall through to here if stat succeeded or open raised EEXIST.
455 raise ExternalClashError('Name clash prevented file creation: %s' %
456 path)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000457
458 def _refresh(self):
459 """Update table of contents mapping."""
460 self._toc = {}
461 for subdir in ('new', 'cur'):
462 for entry in os.listdir(os.path.join(self._path, subdir)):
463 uniq = entry.split(self.colon)[0]
464 self._toc[uniq] = os.path.join(subdir, entry)
465
466 def _lookup(self, key):
467 """Use TOC to return subpath for given key, or raise a KeyError."""
468 try:
469 if os.path.exists(os.path.join(self._path, self._toc[key])):
470 return self._toc[key]
471 except KeyError:
472 pass
473 self._refresh()
474 try:
475 return self._toc[key]
476 except KeyError:
477 raise KeyError('No message with key: %s' % key)
478
479 # This method is for backward compatibility only.
480 def next(self):
481 """Return the next message in a one-time iteration."""
482 if not hasattr(self, '_onetime_keys'):
483 self._onetime_keys = self.iterkeys()
484 while True:
485 try:
486 return self[self._onetime_keys.next()]
487 except StopIteration:
488 return None
489 except KeyError:
490 continue
491
492
493class _singlefileMailbox(Mailbox):
494 """A single-file mailbox."""
495
496 def __init__(self, path, factory=None, create=True):
497 """Initialize a single-file mailbox."""
498 Mailbox.__init__(self, path, factory, create)
499 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000500 f = open(self._path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000501 except IOError, e:
502 if e.errno == errno.ENOENT:
503 if create:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000504 f = open(self._path, 'wb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000505 else:
506 raise NoSuchMailboxError(self._path)
507 elif e.errno == errno.EACCES:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000508 f = open(self._path, 'rb')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000509 else:
510 raise
511 self._file = f
512 self._toc = None
513 self._next_key = 0
514 self._pending = False # No changes require rewriting the file.
515 self._locked = False
516
517 def add(self, message):
518 """Add message and return assigned key."""
519 self._lookup()
520 self._toc[self._next_key] = self._append_message(message)
521 self._next_key += 1
522 self._pending = True
523 return self._next_key - 1
524
525 def remove(self, key):
526 """Remove the keyed message; raise KeyError if it doesn't exist."""
527 self._lookup(key)
528 del self._toc[key]
529 self._pending = True
530
531 def __setitem__(self, key, message):
532 """Replace the keyed message; raise KeyError if it doesn't exist."""
533 self._lookup(key)
534 self._toc[key] = self._append_message(message)
535 self._pending = True
536
537 def iterkeys(self):
538 """Return an iterator over keys."""
539 self._lookup()
540 for key in self._toc.keys():
541 yield key
542
543 def has_key(self, key):
544 """Return True if the keyed message exists, False otherwise."""
545 self._lookup()
546 return key in self._toc
547
548 def __len__(self):
549 """Return a count of messages in the mailbox."""
550 self._lookup()
551 return len(self._toc)
552
553 def lock(self):
554 """Lock the mailbox."""
555 if not self._locked:
556 _lock_file(self._file)
557 self._locked = True
558
559 def unlock(self):
560 """Unlock the mailbox if it is locked."""
561 if self._locked:
562 _unlock_file(self._file)
563 self._locked = False
564
565 def flush(self):
566 """Write any pending changes to disk."""
567 if not self._pending:
568 return
569 self._lookup()
570 new_file = _create_temporary(self._path)
571 try:
572 new_toc = {}
573 self._pre_mailbox_hook(new_file)
574 for key in sorted(self._toc.keys()):
575 start, stop = self._toc[key]
576 self._file.seek(start)
577 self._pre_message_hook(new_file)
578 new_start = new_file.tell()
579 while True:
580 buffer = self._file.read(min(4096,
581 stop - self._file.tell()))
582 if buffer == '':
583 break
584 new_file.write(buffer)
585 new_toc[key] = (new_start, new_file.tell())
586 self._post_message_hook(new_file)
587 except:
588 new_file.close()
589 os.remove(new_file.name)
590 raise
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000591 _sync_close(new_file)
592 # self._file is about to get replaced, so no need to sync.
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000593 self._file.close()
594 try:
595 os.rename(new_file.name, self._path)
596 except OSError, e:
Andrew MacIntyreafa358f2006-07-23 13:04:00 +0000597 if e.errno == errno.EEXIST or \
598 (os.name == 'os2' and e.errno == errno.EACCES):
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000599 os.remove(self._path)
600 os.rename(new_file.name, self._path)
601 else:
602 raise
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000603 self._file = open(self._path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000604 self._toc = new_toc
605 self._pending = False
606 if self._locked:
Andrew M. Kuchling0f871832006-10-27 16:55:34 +0000607 _lock_file(self._file, dotlock=False)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000608
609 def _pre_mailbox_hook(self, f):
610 """Called before writing the mailbox to file f."""
611 return
612
613 def _pre_message_hook(self, f):
614 """Called before writing each message to file f."""
615 return
616
617 def _post_message_hook(self, f):
618 """Called after writing each message to file f."""
619 return
620
621 def close(self):
622 """Flush and close the mailbox."""
623 self.flush()
624 if self._locked:
625 self.unlock()
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000626 self._file.close() # Sync has been done by self.flush() above.
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000627
628 def _lookup(self, key=None):
629 """Return (start, stop) or raise KeyError."""
630 if self._toc is None:
631 self._generate_toc()
632 if key is not None:
633 try:
634 return self._toc[key]
635 except KeyError:
636 raise KeyError('No message with key: %s' % key)
637
638 def _append_message(self, message):
639 """Append message to mailbox and return (start, stop) offsets."""
640 self._file.seek(0, 2)
641 self._pre_message_hook(self._file)
642 offsets = self._install_message(message)
643 self._post_message_hook(self._file)
644 self._file.flush()
645 return offsets
646
647
648
class _mboxMMDF(_singlefileMailbox):
    """Behaviour shared by the mbox and MMDF formats.

    Each stored message starts with a 'From ' line; subclasses set
    self._message_factory to the message class to instantiate.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        begin, end = self._lookup(key)
        mailfile = self._file
        mailfile.seek(begin)
        envelope = mailfile.readline().replace(os.linesep, '')
        raw = mailfile.read(end - mailfile.tell())
        result = self._message_factory(raw.replace(os.linesep, '\n'))
        # Drop the leading 'From ' (5 characters) of the first line.
        result.set_from(envelope[5:])
        return result

    def get_string(self, key, from_=False):
        """Return a string representation or raise a KeyError.

        The first ('From ') line is included only when from_ is true.
        """
        begin, end = self._lookup(key)
        mailfile = self._file
        mailfile.seek(begin)
        if not from_:
            mailfile.readline()     # Skip the first line.
        raw = mailfile.read(end - mailfile.tell())
        return raw.replace(os.linesep, '\n')

    def get_file(self, key, from_=False):
        """Return a file-like representation or raise a KeyError.

        The first ('From ') line is included only when from_ is true.
        """
        begin, end = self._lookup(key)
        mailfile = self._file
        mailfile.seek(begin)
        if not from_:
            mailfile.readline()     # Skip the first line.
        return _PartialFile(mailfile, mailfile.tell(), end)

    def _install_message(self, message):
        """Format a message and blindly write to self._file.

        Returns the (start, stop) offsets of what was written.
        """
        envelope = None
        if isinstance(message, str) and message.startswith('From '):
            # The string brings its own 'From ' line: split it off.
            pieces = message.split('\n', 1)
            envelope = pieces[0]
            if len(pieces) == 2:
                message = pieces[1]
            else:
                message = ''
        elif isinstance(message, _mboxMMDFMessage):
            envelope = 'From ' + message.get_from()
        elif isinstance(message, email.Message.Message):
            envelope = message.get_unixfrom()   # May be None.
        if envelope is None:
            stamp = time.asctime(time.gmtime())
            envelope = 'From MAILER-DAEMON %s' % stamp
        mailfile = self._file
        begin = mailfile.tell()
        mailfile.write(envelope + os.linesep)
        self._dump_message(message, mailfile, self._mangle_from_)
        end = mailfile.tell()
        return (begin, end)
703
704
class mbox(_mboxMMDF):
    """A classic mbox mailbox."""

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Initialize an mbox mailbox."""
        # Must be set before the base initializer runs.
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        # Every message but the first is preceded by a line separator.
        if f.tell() == 0:
            return
        f.write(os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        begins = []
        ends = []
        mailfile = self._file
        separator_size = len(os.linesep)
        mailfile.seek(0)
        while True:
            offset = mailfile.tell()
            line = mailfile.readline()
            if line == '':
                # End of file: this offset ends the scan.
                ends.append(offset)
                break
            if line.startswith('From '):
                if len(ends) < len(begins):
                    # Close the previous message, excluding the line
                    # separator that precedes this 'From ' line.
                    ends.append(offset - separator_size)
                begins.append(offset)
        toc = {}
        for index, span in enumerate(zip(begins, ends)):
            toc[index] = span
        self._toc = toc
        self._next_key = len(toc)
736
737
class MMDF(_mboxMMDF):
    """An MMDF mailbox.

    Every message is enclosed between two lines of four Control-A
    characters.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize an MMDF mailbox."""
        # Must be set before the base initializer runs.
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        opening = '\001\001\001\001' + os.linesep
        f.write(opening)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        closing = os.linesep + '\001\001\001\001' + os.linesep
        f.write(closing)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        marker = '\001\001\001\001' + os.linesep
        separator_size = len(os.linesep)
        begins = []
        ends = []
        mailfile = self._file
        mailfile.seek(0)
        while True:
            line = mailfile.readline()
            if line == '':
                break
            if not line.startswith(marker):
                continue
            # The message begins right after the opening marker line.
            position = mailfile.tell()
            begins.append(position)
            while True:
                line_start = position
                line = mailfile.readline()
                position = mailfile.tell()
                if line == marker:
                    # Exclude the separator written before the marker.
                    ends.append(line_start - separator_size)
                    break
                if line == '':
                    # End of file before a closing marker was seen.
                    ends.append(line_start)
                    break
        toc = {}
        for index, span in enumerate(zip(begins, ends)):
            toc[index] = span
        self._toc = toc
        self._next_key = len(toc)
779
780
781class MH(Mailbox):
782 """An MH mailbox."""
783
784 def __init__(self, path, factory=None, create=True):
785 """Initialize an MH instance."""
786 Mailbox.__init__(self, path, factory, create)
787 if not os.path.exists(self._path):
788 if create:
789 os.mkdir(self._path, 0700)
790 os.close(os.open(os.path.join(self._path, '.mh_sequences'),
791 os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0600))
792 else:
793 raise NoSuchMailboxError(self._path)
794 self._locked = False
795
def add(self, message):
    """Add message and return assigned key.

    The new key is one more than the largest existing key, or 1 for an
    empty mailbox.
    """
    existing = self.keys()
    new_key = 1
    if existing:
        new_key = max(existing) + 1
    target = os.path.join(self._path, str(new_key))
    f = _create_carefully(target)
    try:
        # Only lock the new file if the mailbox itself is locked.
        if self._locked:
            _lock_file(f)
        try:
            self._dump_message(message, f)
            if isinstance(message, MHMessage):
                self._dump_sequences(message, new_key)
        finally:
            if self._locked:
                _unlock_file(f)
    finally:
        _sync_close(f)
    return new_key
818
819 def remove(self, key):
820 """Remove the keyed message; raise KeyError if it doesn't exist."""
821 path = os.path.join(self._path, str(key))
822 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000823 f = open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000824 except IOError, e:
825 if e.errno == errno.ENOENT:
826 raise KeyError('No message with key: %s' % key)
827 else:
828 raise
829 try:
830 if self._locked:
831 _lock_file(f)
832 try:
833 f.close()
834 os.remove(os.path.join(self._path, str(key)))
835 finally:
836 if self._locked:
837 _unlock_file(f)
838 finally:
839 f.close()
840
841 def __setitem__(self, key, message):
842 """Replace the keyed message; raise KeyError if it doesn't exist."""
843 path = os.path.join(self._path, str(key))
844 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000845 f = open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000846 except IOError, e:
847 if e.errno == errno.ENOENT:
848 raise KeyError('No message with key: %s' % key)
849 else:
850 raise
851 try:
852 if self._locked:
853 _lock_file(f)
854 try:
855 os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
856 self._dump_message(message, f)
857 if isinstance(message, MHMessage):
858 self._dump_sequences(message, key)
859 finally:
860 if self._locked:
861 _unlock_file(f)
862 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000863 _sync_close(f)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000864
865 def get_message(self, key):
866 """Return a Message representation or raise a KeyError."""
867 try:
868 if self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000869 f = open(os.path.join(self._path, str(key)), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000870 else:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000871 f = open(os.path.join(self._path, str(key)), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000872 except IOError, e:
873 if e.errno == errno.ENOENT:
874 raise KeyError('No message with key: %s' % key)
875 else:
876 raise
877 try:
878 if self._locked:
879 _lock_file(f)
880 try:
881 msg = MHMessage(f)
882 finally:
883 if self._locked:
884 _unlock_file(f)
885 finally:
886 f.close()
887 for name, key_list in self.get_sequences():
888 if key in key_list:
889 msg.add_sequence(name)
890 return msg
891
892 def get_string(self, key):
893 """Return a string representation or raise a KeyError."""
894 try:
895 if self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000896 f = open(os.path.join(self._path, str(key)), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000897 else:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000898 f = open(os.path.join(self._path, str(key)), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000899 except IOError, e:
900 if e.errno == errno.ENOENT:
901 raise KeyError('No message with key: %s' % key)
902 else:
903 raise
904 try:
905 if self._locked:
906 _lock_file(f)
907 try:
908 return f.read()
909 finally:
910 if self._locked:
911 _unlock_file(f)
912 finally:
913 f.close()
914
915 def get_file(self, key):
916 """Return a file-like representation or raise a KeyError."""
917 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000918 f = open(os.path.join(self._path, str(key)), 'rb')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000919 except IOError, e:
920 if e.errno == errno.ENOENT:
921 raise KeyError('No message with key: %s' % key)
922 else:
923 raise
924 return _ProxyFile(f)
925
def iterkeys(self):
    """Return an iterator over keys.

    Keys are the all-digit entry names of the mailbox directory, as
    integers in ascending order.
    """
    numbers = []
    for entry in os.listdir(self._path):
        if entry.isdigit():
            numbers.append(int(entry))
    numbers.sort()
    return iter(numbers)
930
def has_key(self, key):
    """Return True if the keyed message exists, False otherwise."""
    message_path = os.path.join(self._path, str(key))
    return os.path.exists(message_path)
934
935 def __len__(self):
936 """Return a count of messages in the mailbox."""
937 return len(list(self.iterkeys()))
938
def lock(self):
    """Lock the mailbox unless it is already locked.

    The lock is taken on the '.mh_sequences' file, which stays open in
    self._file until unlock() is called.
    """
    if self._locked:
        return
    sequences_path = os.path.join(self._path, '.mh_sequences')
    self._file = open(sequences_path, 'rb+')
    _lock_file(self._file)
    self._locked = True
945
def unlock(self):
    """Unlock the mailbox if it is locked."""
    if not self._locked:
        return
    held = self._file
    _unlock_file(held)
    _sync_close(held)
    del self._file
    self._locked = False
953
def flush(self):
    """Write any pending changes to the disk.

    This implementation does nothing.
    """
    return None
957
def close(self):
    """Flush and close the mailbox.

    All this implementation does is release the lock if one is held.
    """
    if not self._locked:
        return
    self.unlock()
962
963 def list_folders(self):
964 """Return a list of folder names."""
965 result = []
966 for entry in os.listdir(self._path):
967 if os.path.isdir(os.path.join(self._path, entry)):
968 result.append(entry)
969 return result
970
971 def get_folder(self, folder):
972 """Return an MH instance for the named folder."""
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +0000973 return MH(os.path.join(self._path, folder),
974 factory=self._factory, create=False)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000975
976 def add_folder(self, folder):
977 """Create a folder and return an MH instance representing it."""
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +0000978 return MH(os.path.join(self._path, folder),
979 factory=self._factory)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000980
981 def remove_folder(self, folder):
982 """Delete the named folder, which must be empty."""
983 path = os.path.join(self._path, folder)
984 entries = os.listdir(path)
985 if entries == ['.mh_sequences']:
986 os.remove(os.path.join(path, '.mh_sequences'))
987 elif entries == []:
988 pass
989 else:
990 raise NotEmptyError('Folder not empty: %s' % self._path)
991 os.rmdir(path)
992
993 def get_sequences(self):
994 """Return a name-to-key-list dictionary to define each sequence."""
995 results = {}
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000996 f = open(os.path.join(self._path, '.mh_sequences'), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000997 try:
998 all_keys = set(self.keys())
999 for line in f:
1000 try:
1001 name, contents = line.split(':')
1002 keys = set()
1003 for spec in contents.split():
1004 if spec.isdigit():
1005 keys.add(int(spec))
1006 else:
1007 start, stop = (int(x) for x in spec.split('-'))
1008 keys.update(range(start, stop + 1))
1009 results[name] = [key for key in sorted(keys) \
1010 if key in all_keys]
1011 if len(results[name]) == 0:
1012 del results[name]
1013 except ValueError:
1014 raise FormatError('Invalid sequence specification: %s' %
1015 line.rstrip())
1016 finally:
1017 f.close()
1018 return results
1019
1020 def set_sequences(self, sequences):
1021 """Set sequences using the given name-to-key-list dictionary."""
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001022 f = open(os.path.join(self._path, '.mh_sequences'), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001023 try:
1024 os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
1025 for name, keys in sequences.iteritems():
1026 if len(keys) == 0:
1027 continue
1028 f.write('%s:' % name)
1029 prev = None
1030 completing = False
1031 for key in sorted(set(keys)):
1032 if key - 1 == prev:
1033 if not completing:
1034 completing = True
1035 f.write('-')
1036 elif completing:
1037 completing = False
1038 f.write('%s %s' % (prev, key))
1039 else:
1040 f.write(' %s' % key)
1041 prev = key
1042 if completing:
1043 f.write(str(prev) + '\n')
1044 else:
1045 f.write('\n')
1046 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +00001047 _sync_close(f)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001048
    def pack(self):
        """Re-name messages to eliminate numbering gaps. Invalidates keys.

        Messages are visited in ascending key order and renamed so that the
        keys become 1, 2, 3, ...  Every (old, new) rename is afterwards
        applied to the key lists obtained from get_sequences() and the
        result is stored with set_sequences().
        """
        sequences = self.get_sequences()
        prev = 0        # Key held by the previously visited message.
        changes = []    # (old key, new key) for every renamed message.
        for key in self.iterkeys():
            if key - 1 != prev:
                # There is a gap before this message: move it to prev + 1.
                changes.append((key, prev + 1))
                f = open(os.path.join(self._path, str(key)), 'r+')
                try:
                    if self._locked:
                        _lock_file(f)
                    try:
                        if hasattr(os, 'link'):
                            # Link the new name first, then drop the old one.
                            os.link(os.path.join(self._path, str(key)),
                                    os.path.join(self._path, str(prev + 1)))
                            if sys.platform == 'os2emx':
                                # cannot unlink an open file on OS/2
                                f.close()
                            os.unlink(os.path.join(self._path, str(key)))
                        else:
                            # No hard links available: close, then rename.
                            f.close()
                            os.rename(os.path.join(self._path, str(key)),
                                      os.path.join(self._path, str(prev + 1)))
                    finally:
                        if self._locked:
                            _unlock_file(f)
                finally:
                    f.close()
            prev += 1
        self._next_key = prev + 1
        if len(changes) == 0:
            return
        # Rewrite the sequences so that they refer to the new keys.
        for name, key_list in sequences.items():
            for old, new in changes:
                if old in key_list:
                    key_list[key_list.index(old)] = new
        self.set_sequences(sequences)
1087
1088 def _dump_sequences(self, message, key):
1089 """Inspect a new MHMessage and update sequences appropriately."""
1090 pending_sequences = message.get_sequences()
1091 all_sequences = self.get_sequences()
1092 for name, key_list in all_sequences.iteritems():
1093 if name in pending_sequences:
1094 key_list.append(key)
1095 elif key in key_list:
1096 del key_list[key_list.index(key)]
1097 for sequence in pending_sequences:
1098 if sequence not in all_sequences:
1099 all_sequences[sequence] = [key]
1100 self.set_sequences(all_sequences)
1101
1102
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox.

    Besides the table of contents kept by the base class, the mailbox keeps
    self._labels, a dictionary mapping message keys to lists of labels.
    """

    # Labels that are written in the first (special) part of a message's
    # label line; all other labels are treated as user-defined.
    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        self._labels = {}

    def add(self, message):
        """Add message and return assigned key.

        Labels of a BabylMessage are remembered under the new key.
        """
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The result is a BabylMessage built from the original headers and the
        body, with the visible headers and any stored labels attached.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        # Original headers run up to the '*** EOOH ***' marker line.
        original_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or line == '':
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        # Visible headers run up to the next blank line.
        visible_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == os.linesep or line == '':
                break
            visible_headers.write(line.replace(os.linesep, '\n'))
        body = self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError.

        The string consists of the original headers followed by the body;
        the label line and the visible headers are left out.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or line == '':
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        # Skip over the visible headers.
        while True:
            line = self._file.readline()
            if line == os.linesep or line == '':
                break
        return original_headers.getvalue() + \
               self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return StringIO.StringIO(self.get_string(key).replace('\n',
                                                              os.linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents.

        Also rebuilds self._labels from the label line that follows each
        message separator.
        """
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == '\037\014' + os.linesep:
                # Separator: ends the previous message, starts a new one.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
                starts.append(next_pos)
                labels = [label.strip() for label
                                        in self._file.readline()[1:].split(',')
                                        if label.strip() != '']
                label_lists.append(labels)
            elif line == '\037' or line == '\037' + os.linesep:
                # Terminator without a following message.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
            elif line == '':
                stops.append(line_pos - len(os.linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        f.write('BABYL OPTIONS:%sVersion: 5%sLabels:%s%s\037' %
                (os.linesep, os.linesep, ','.join(self.get_labels()),
                 os.linesep))

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\014' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        The on-disk layout of one message is: a label line, the original
        headers, a '*** EOOH ***' line, the visible headers, a blank line
        and the body.  `message` may be an email Message (a BabylMessage
        additionally supplies labels and visible headers), a string, or an
        object with a readline() method; anything else raises TypeError.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write('1')
            for label in special_labels:
                self._file.write(', ' + label)
            self._file.write(',,')
            for label in labels:
                self._file.write(' ' + label + ',')
            self._file.write(os.linesep)
        else:
            self._file.write('1,,' + os.linesep)
        if isinstance(message, email.Message.Message):
            orig_buffer = StringIO.StringIO()
            orig_generator = email.Generator.Generator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            # Original headers, including the blank line that ends them.
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or line == '':
                    break
            self._file.write('*** EOOH ***' + os.linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = StringIO.StringIO()
                vis_generator = email.Generator.Generator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # flatten() leaves the buffer positioned at its end; rewind
                # it, otherwise nothing is read back and neither the visible
                # headers nor the blank line that ends them gets written.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or line == '':
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or line == '':
                        break
            # orig_buffer is now positioned at the start of the body.
            while True:
                buffer = orig_buffer.read(4096) # Buffer size is arbitrary.
                if buffer == '':
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        elif isinstance(message, str):
            body_start = message.find('\n\n') + 2
            if body_start - 2 != -1:
                # Headers are written twice: as original and as visible.
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write('*** EOOH ***' + os.linesep)
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write(message[body_start:].replace('\n',
                                                              os.linesep))
            else:
                # No blank line found: treat the whole string as the body.
                self._file.write('*** EOOH ***' + os.linesep + os.linesep)
                self._file.write(message.replace('\n', os.linesep))
        elif hasattr(message, 'readline'):
            original_pos = message.tell()
            first_pass = True
            # The headers are copied twice: the first pass writes the
            # original headers, the second pass the visible headers.
            while True:
                line = message.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or line == '':
                    if first_pass:
                        first_pass = False
                        # The marker belongs between the two header copies
                        # only; writing it after the second pass as well
                        # would put a stray marker in front of the body.
                        self._file.write('*** EOOH ***' + os.linesep)
                        message.seek(original_pos)
                    else:
                        break
            while True:
                buffer = message.read(4096)     # Buffer size is arbitrary.
                if buffer == '':
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1320
1321
1322class Message(email.Message.Message):
1323 """Message with mailbox-format-specific properties."""
1324
1325 def __init__(self, message=None):
1326 """Initialize a Message instance."""
1327 if isinstance(message, email.Message.Message):
1328 self._become_message(copy.deepcopy(message))
1329 if isinstance(message, Message):
1330 message._explain_to(self)
1331 elif isinstance(message, str):
1332 self._become_message(email.message_from_string(message))
1333 elif hasattr(message, "read"):
1334 self._become_message(email.message_from_file(message))
1335 elif message is None:
1336 email.Message.Message.__init__(self)
1337 else:
1338 raise TypeError('Invalid message type: %s' % type(message))
1339
1340 def _become_message(self, message):
1341 """Assume the non-format-specific state of message."""
1342 for name in ('_headers', '_unixfrom', '_payload', '_charset',
1343 'preamble', 'epilogue', 'defects', '_default_type'):
1344 self.__dict__[name] = message.__dict__[name]
1345
1346 def _explain_to(self, message):
1347 """Copy format-specific state to message insofar as possible."""
1348 if isinstance(message, Message):
1349 return # There's nothing format-specific to explain.
1350 else:
1351 raise TypeError('Cannot convert to specified type')
1352
1353
class MaildirMessage(Message):
    """Message with Maildir-specific properties."""

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance.

        Defaults (subdir 'new', empty info, current time as date) are set
        before the base initializer runs.
        """
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set subdir to 'new' or 'cur'; raise ValueError otherwise."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return as a string the flags that are set.

        Flags are only present when the info string starts with '2,'.
        """
        if not self._info.startswith('2,'):
            return ''
        return self._info[2:]

    def set_flags(self, flags):
        """Set the given flags and unset all others."""
        self._info = '2,' + ''.join(sorted(flags))

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags())
        combined.update(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        current = self.get_flags()
        if current == '':
            return
        self.set_flags(''.join(set(current).difference(flag)))

    def get_date(self):
        """Return delivery date of message, in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set delivery date of message, in seconds since the epoch."""
        try:
            seconds = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)
        self._date = seconds

    def get_info(self):
        """Get the message's "info" as a string."""
        return self._info

    def set_info(self, info):
        """Set the message's "info" string; raise TypeError if not a str."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Copy Maildir-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
        elif isinstance(message, _mboxMMDFMessage):
            flags = set(self.get_flags())
            if 'S' in flags:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            # (Maildir flag, mbox/MMDF flag)
            for own, theirs in (('T', 'D'), ('F', 'F'), ('R', 'A')):
                if own in flags:
                    message.add_flag(theirs)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_sequence('unseen')
            # (Maildir flag, MH sequence)
            for own, sequence in (('R', 'replied'), ('F', 'flagged')):
                if own in flags:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_label('unseen')
            # (Maildir flag, Babyl label)
            for own, label in (('T', 'deleted'), ('R', 'answered'),
                               ('P', 'forwarded')):
                if own in flags:
                    message.add_label(label)
        elif not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1459
1460
class _mboxMMDFMessage(Message):
    """Message with mbox- or MMDF-specific properties."""

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance.

        The "From " line defaults to 'MAILER-DAEMON' plus the current time;
        it is taken from the unixfrom of `message` when that starts with
        'From '.
        """
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.Message.Message):
            envelope = message.get_unixfrom()
            if envelope is not None and envelope.startswith('From '):
                self.set_from(envelope[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return contents of "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set "From " line, formatting and appending time_ if specified.

        Passing True as time_ stands for the current time (UTC).
        """
        if time_ is True:
            time_ = time.gmtime()
        if time_ is not None:
            from_ += ' ' + time.asctime(time_)
        self._from = from_

    def get_flags(self):
        """Return as a string the flags that are set."""
        return self.get('Status', '') + self.get('X-Status', '')

    def set_flags(self, flags):
        """Set the given flags and unset all others.

        'R' and 'O' go into the Status header; 'D', 'F', 'A' and then any
        remaining flags (sorted) go into the X-Status header.
        """
        pending = set(flags)
        status_flags = ''.join([flag for flag in ('R', 'O')
                                if flag in pending])
        xstatus_flags = ''.join([flag for flag in ('D', 'F', 'A')
                                 if flag in pending])
        pending.difference_update(('R', 'O', 'D', 'F', 'A'))
        xstatus_flags += ''.join(sorted(pending))
        for header, value in (('Status', status_flags),
                              ('X-Status', xstatus_flags)):
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) without changing others."""
        combined = set(self.get_flags())
        combined.update(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given string flag(s) without changing others."""
        if 'Status' in self or 'X-Status' in self:
            remaining = set(self.get_flags()).difference(flag)
            self.set_flags(''.join(remaining))

    def _explain_to(self, message):
        """Copy mbox- or MMDF-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            flags = set(self.get_flags())
            if 'O' in flags:
                message.set_subdir('cur')
            # (mbox/MMDF flag, Maildir flag)
            for own, theirs in (('F', 'F'), ('A', 'R'), ('R', 'S'),
                                ('D', 'T')):
                if own in flags:
                    message.add_flag(theirs)
            del message['status']
            del message['x-status']
            # The date, if any, is the last five fields of the "From " line.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
        elif isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_sequence('unseen')
            # (mbox/MMDF flag, MH sequence)
            for own, sequence in (('A', 'replied'), ('F', 'flagged')):
                if own in flags:
                    message.add_sequence(sequence)
            del message['status']
            del message['x-status']
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_label('unseen')
            # (mbox/MMDF flag, Babyl label)
            for own, label in (('D', 'deleted'), ('A', 'answered')):
                if own in flags:
                    message.add_label(label)
            del message['status']
            del message['x-status']
        elif not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1570
1571
class mboxMessage(_mboxMMDFMessage):
    """Message with mbox-specific properties.

    All behaviour is inherited from _mboxMMDFMessage; this class adds
    nothing of its own.
    """
1574
1575
class MHMessage(Message):
    """Message with MH-specific properties."""

    def __init__(self, message=None):
        """Initialize an MHMessage instance with no sequences."""
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a list of sequences that include the message."""
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Set the list of sequences that include the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence to list of sequences including the message.

        Raises TypeError when `sequence` is not a str; adding a sequence
        that is already present has no effect.
        """
        if not isinstance(sequence, str):
            raise TypeError('sequence must be a string: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove sequence from the list of sequences including the message."""
        try:
            self._sequences.remove(sequence)
        except ValueError:
            pass

    def _explain_to(self, message):
        """Copy MH-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            sequences = set(self.get_sequences())
            # The subdir is 'cur' whether or not the message was seen.
            message.set_subdir('cur')
            if 'unseen' not in sequences:
                message.add_flag('S')
            # (MH sequence, Maildir flag)
            for own, flag in (('flagged', 'F'), ('replied', 'R')):
                if own in sequences:
                    message.add_flag(flag)
        elif isinstance(message, _mboxMMDFMessage):
            sequences = set(self.get_sequences())
            if 'unseen' in sequences:
                message.add_flag('O')
            else:
                message.add_flag('RO')
            # (MH sequence, mbox/MMDF flag)
            for own, flag in (('flagged', 'F'), ('replied', 'A')):
                if own in sequences:
                    message.add_flag(flag)
        elif isinstance(message, MHMessage):
            for sequence in self.get_sequences():
                message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            sequences = set(self.get_sequences())
            # (MH sequence, Babyl label)
            for own, label in (('unseen', 'unseen'), ('replied', 'answered')):
                if own in sequences:
                    message.add_label(label)
        elif not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1644
1645
class BabylMessage(Message):
    """Message with Babyl-specific properties."""

    def __init__(self, message=None):
        """Initialize an BabylMessage instance.

        The message starts without labels and with an empty set of visible
        headers.
        """
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a list of labels on the message."""
        return list(self._labels)

    def set_labels(self, labels):
        """Set the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label to list of labels on the message.

        Raises TypeError when `label` is not a str; adding a label that is
        already present has no effect.
        """
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove label from the list of labels on the message."""
        try:
            self._labels.remove(label)
        except ValueError:
            pass

    def get_visible(self):
        """Return a Message representation of visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Set the Message representation of visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Update and/or sensibly generate a set of visible headers.

        Visible headers that still exist on the message are refreshed, the
        others are dropped; afterwards a fixed set of common headers is
        copied over where the message has them and they are not yet visible.
        """
        visible = self._visible
        for header in visible.keys():
            if header in self:
                visible.replace_header(header, self[header])
            else:
                del visible[header]
        for header in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if header in self and header not in visible:
                visible[header] = self[header]

    def _explain_to(self, message):
        """Copy Babyl-specific state to message insofar as possible."""
        if isinstance(message, MaildirMessage):
            labels = set(self.get_labels())
            # The subdir is 'cur' whether or not the message was seen.
            message.set_subdir('cur')
            if 'unseen' not in labels:
                message.add_flag('S')
            if 'forwarded' in labels or 'resent' in labels:
                message.add_flag('P')
            # (Babyl label, Maildir flag)
            for own, flag in (('answered', 'R'), ('deleted', 'T')):
                if own in labels:
                    message.add_flag(flag)
        elif isinstance(message, _mboxMMDFMessage):
            labels = set(self.get_labels())
            if 'unseen' in labels:
                message.add_flag('O')
            else:
                message.add_flag('RO')
            # (Babyl label, mbox/MMDF flag)
            for own, flag in (('deleted', 'D'), ('answered', 'A')):
                if own in labels:
                    message.add_flag(flag)
        elif isinstance(message, MHMessage):
            labels = set(self.get_labels())
            # (Babyl label, MH sequence)
            for own, sequence in (('unseen', 'unseen'),
                                  ('answered', 'replied')):
                if own in labels:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
        elif not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1737
1738
class MMDFMessage(_mboxMMDFMessage):
    """Message with MMDF-specific properties.

    All behaviour is inherited from _mboxMMDFMessage; this class adds
    nothing of its own.
    """
1741
1742
1743class _ProxyFile:
1744 """A read-only wrapper of a file."""
1745
1746 def __init__(self, f, pos=None):
1747 """Initialize a _ProxyFile."""
1748 self._file = f
1749 if pos is None:
1750 self._pos = f.tell()
1751 else:
1752 self._pos = pos
1753
1754 def read(self, size=None):
1755 """Read bytes."""
1756 return self._read(size, self._file.read)
1757
1758 def readline(self, size=None):
1759 """Read a line."""
1760 return self._read(size, self._file.readline)
1761
1762 def readlines(self, sizehint=None):
1763 """Read multiple lines."""
1764 result = []
1765 for line in self:
1766 result.append(line)
1767 if sizehint is not None:
1768 sizehint -= len(line)
1769 if sizehint <= 0:
1770 break
1771 return result
1772
1773 def __iter__(self):
1774 """Iterate over lines."""
1775 return iter(self.readline, "")
1776
1777 def tell(self):
1778 """Return the position."""
1779 return self._pos
1780
1781 def seek(self, offset, whence=0):
1782 """Change position."""
1783 if whence == 1:
1784 self._file.seek(self._pos)
1785 self._file.seek(offset, whence)
1786 self._pos = self._file.tell()
1787
1788 def close(self):
1789 """Close the file."""
1790 del self._file
1791
1792 def _read(self, size, read_method):
1793 """Read size bytes using read_method."""
1794 if size is None:
1795 size = -1
1796 self._file.seek(self._pos)
1797 result = read_method(size)
1798 self._pos = self._file.tell()
1799 return result
1800
1801
class _PartialFile(_ProxyFile):
    """A read-only wrapper of part of a file.

    Positions reported by tell() and accepted by seek() are relative to the
    start of the wrapped region; reads never go beyond its stop offset.
    """

    def __init__(self, f, start=None, stop=None):
        """Initialize a _PartialFile.

        `start` and `stop` are offsets into `f`.  When `start` is omitted
        the region begins at the current position of `f`; when `stop` is
        omitted the region is not limited at its end.
        """
        _ProxyFile.__init__(self, f, start)
        # _ProxyFile falls back to f.tell() when start is None, so _pos is
        # a usable start offset in either case.
        self._start = self._pos
        self._stop = stop

    def tell(self):
        """Return the position with respect to start."""
        return _ProxyFile.tell(self) - self._start

    def seek(self, offset, whence=0):
        """Change position, possibly with respect to start or stop."""
        if whence == 0:
            self._pos = self._start
            whence = 1
        elif whence == 2:
            if self._stop is None:
                # Unbounded region: its end is the end of the file.
                self._file.seek(0, 2)
                self._pos = self._file.tell()
            else:
                self._pos = self._stop
            whence = 1
        # Absolute and end-relative seeks have been turned into seeks
        # relative to the position chosen above.
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, honoring start and stop."""
        if self._stop is not None:
            remaining = self._stop - self._pos
            if remaining <= 0:
                return ''
            if size is None or size < 0 or size > remaining:
                size = remaining
        return _ProxyFile._read(self, size, read_method)
1833
1834
def _lock_file(f, dotlock=True):
    """Lock file f using lockf and dot locking.

    The lockf lock is taken when the fcntl module is available; the dot
    lock (a file named f.name + '.lock') is taken when `dotlock` is true.
    Raises ExternalClashError when either lock is unavailable.  Whenever an
    exception leaves the function, the locks obtained so far are released
    again before it propagates.
    """
    dotlock_done = False    # True once the '.lock' file is in place.
    try:
        if fcntl:
            try:
                # Non-blocking: fail right away if the lock is unavailable.
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except IOError, e:
                if e.errno in (errno.EAGAIN, errno.EACCES):
                    raise ExternalClashError('lockf: lock unavailable: %s' %
                                             f.name)
                else:
                    raise
        if dotlock:
            try:
                # Create a uniquely named file first; it is then linked (or
                # renamed) to the real lock name below.
                pre_lock = _create_temporary(f.name + '.lock')
                pre_lock.close()
            except IOError, e:
                if e.errno == errno.EACCES:
                    return  # Without write access, just skip dotlocking.
                else:
                    raise
            try:
                if hasattr(os, 'link'):
                    os.link(pre_lock.name, f.name + '.lock')
                    dotlock_done = True
                    os.unlink(pre_lock.name)
                else:
                    os.rename(pre_lock.name, f.name + '.lock')
                    dotlock_done = True
            except OSError, e:
                if e.errno == errno.EEXIST or \
                  (os.name == 'os2' and e.errno == errno.EACCES):
                    # The lock name is taken: discard the temporary file.
                    os.remove(pre_lock.name)
                    raise ExternalClashError('dot lock unavailable: %s' %
                                             f.name)
                else:
                    raise
    except:
        # Roll back before re-raising whatever went wrong.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if dotlock_done:
            os.remove(f.name + '.lock')
        raise
1879
1880def _unlock_file(f):
Andrew M. Kuchling55732592006-06-26 13:12:16 +00001881 """Unlock file f using lockf and dot locking."""
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001882 if fcntl:
1883 fcntl.lockf(f, fcntl.LOCK_UN)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001884 if os.path.exists(f.name + '.lock'):
1885 os.remove(f.name + '.lock')
1886
1887def _create_carefully(path):
1888 """Create a file if it doesn't exist and open for reading and writing."""
1889 fd = os.open(path, os.O_CREAT | os.O_EXCL | os.O_RDWR)
1890 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001891 return open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001892 finally:
1893 os.close(fd)
1894
def _create_temporary(path):
    """Create a temp file based on path and open for reading and writing.

    The file name is `path` followed by the current time in whole seconds,
    the host name and the process id, separated by dots.
    """
    name_parts = (path, int(time.time()), socket.gethostname(), os.getpid())
    return _create_carefully('%s.%s.%s.%s' % name_parts)
1900
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +00001901def _sync_flush(f):
1902 """Ensure changes to file f are physically on disk."""
1903 f.flush()
1904 os.fsync(f.fileno())
1905
def _sync_close(f):
    """Close file f, ensuring all changes are physically on disk.

    The file is synced with _sync_flush() before it is closed.
    """
    _sync_flush(f)
    f.close()
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001910
1911## Start: classes from the original module (for backward compatibility).
1912
1913# Note that the Maildir class, whose name is unchanged, itself offers a next()
1914# method for backward compatibility.
Skip Montanaro17ab1232001-01-24 06:27:27 +00001915
class _Mailbox:
    """Forward-only message reader shared by the legacy mailbox classes.

    Subclasses provide _search_start(), which positions self.fp at the
    beginning of the next message or raises EOFError when there is none,
    and _search_end(), which positions self.fp just past that message.
    """

    def __init__(self, fp, factory=rfc822.Message):
        self.factory = factory
        self.fp = fp
        # Offset in fp at which the next call to next() resumes scanning.
        self.seekp = 0

    def __iter__(self):
        # Two-argument iter(): call next() repeatedly until it returns None.
        return iter(self.next, None)

    def next(self):
        """Return the next message as built by the factory, or None."""
        while True:
            self.fp.seek(self.seekp)
            try:
                self._search_start()
            except EOFError:
                # Remember the end of file so later calls stay there.
                self.seekp = self.fp.tell()
                return None
            start = self.fp.tell()
            self._search_end()
            stop = self.fp.tell()
            self.seekp = stop
            if start == stop:
                # Zero-length message: skip it and look for the next one.
                continue
            return self.factory(_PartialFile(self.fp, start, stop))
Guido van Rossumc7b68821994-04-28 09:53:33 +00001940
Barry Warsawffd05ee2002-03-01 22:39:14 +00001941# Recommended to use PortableUnixMailbox instead!
class UnixMailbox(_Mailbox):
    """Legacy reader for Unix mailbox files, split on "From " lines."""

    def _search_start(self):
        # Scan forward to the next From_ line and leave the file positioned
        # at its first character; EOFError means there are no more messages.
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                raise EOFError
            if text[:5] == 'From ' and self._isrealfromline(text):
                break
        self.fp.seek(here)

    def _search_end(self):
        # The first line is this message's own From_ line; discard it.
        self.fp.readline()
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                # End of file also ends the message.
                return
            if text[:5] == 'From ' and self._isrealfromline(text):
                # Rewind so the next message starts at its From_ line.
                self.fp.seek(here)
                return

    # Whether a line really is a From_ line is decided by _isrealfromline().
    # To customise the test, either supply a different regular expression in
    # _fromlinepattern or replace _isrealfromline() altogether.  The method
    # is only ever called for lines that begin with the 5 characters "From ".
    #
    # BAW: According to
    # http://home.netscape.com/eng/mozilla/2.0/relnotes/demo/content-length.html
    # the only portable, reliable way to find message delimiters in a BSD
    # (i.e. Unix mailbox) style folder is to search for "\n\nFrom .*\n" or,
    # at the beginning of the file, "^From .*\n".  While _fromlinepattern
    # below seems like a good idea, in practice there are too many variations
    # for stricter parsing of the line to be completely accurate.
    #
    # _strict_isrealfromline() is the old version, which attempts the
    # stricter parsing of the From_ line.  _portable_isrealfromline() simply
    # returns true, which is safe because it is never called unless the line
    # already starts with "From ".
    #
    # This algorithm, and the way it interacts with _search_start() and
    # _search_end(), may not be completely correct: it does not check that
    # the two characters preceding "From " are \n\n or the beginning of the
    # file.  Fixing that would need a more extensive rewrite than is
    # warranted.  For convenience there is a PortableUnixMailbox class, which
    # uses the lenient _portable_isrealfromline() test instead.

    _fromlinepattern = (r"From \s*[^\s]+\s+\w\w\w\s+\w\w\w\s+\d?\d\s+"
                        r"\d?\d:\d\d(:\d\d)?(\s+[^\s]+)?\s+\d\d\d\d\s*$")
    _regexp = None

    def _strict_isrealfromline(self, line):
        matcher = self._regexp
        if not matcher:
            # Compile on first use and cache the result on the instance.
            import re
            matcher = self._regexp = re.compile(self._fromlinepattern)
        return matcher.match(line)

    def _portable_isrealfromline(self, line):
        return True

    _isrealfromline = _strict_isrealfromline
2004
2005
class PortableUnixMailbox(UnixMailbox):
    """UnixMailbox variant that accepts every line starting with "From "."""

    # Use the always-true test in place of the strict regular expression.
    _isrealfromline = UnixMailbox._portable_isrealfromline
2008
Guido van Rossumfbe63de1998-04-03 16:04:05 +00002009
class MmdfMailbox(_Mailbox):
    """Legacy reader for files delimited by lines of four \\001 characters."""

    def _search_start(self):
        # Read up to and including the next delimiter line, so the file is
        # left positioned on the line that follows it.
        while True:
            text = self.fp.readline()
            if not text:
                raise EOFError
            if text[:5] == '\001\001\001\001\n':
                break

    def _search_end(self):
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                # End of file also ends the message.
                return
            if text == '\001\001\001\001\n':
                # Step back so the delimiter itself is not consumed.
                self.fp.seek(here)
                return
Guido van Rossumc7b68821994-04-28 09:53:33 +00002029
Guido van Rossumc7b68821994-04-28 09:53:33 +00002030
class MHMailbox:
    """Legacy forward-only reader for a directory of numbered message files.

    The messages are the entries of dirname whose names are decimal numbers
    without a leading zero.  next() returns them in ascending numeric order,
    each one passed through factory as an open file object.
    """

    def __init__(self, dirname, factory=rfc822.Message):
        import re
        is_msgno = re.compile('^[1-9][0-9]*$').match
        self.dirname = dirname
        # Convert to numbers so the sort is numeric ('10' after '9') rather
        # than lexicographic.
        numbers = [long(name) for name in os.listdir(dirname)
                   if is_msgno(name)]
        numbers.sort()
        # Keep the names in descending order so that next() can pop() the
        # lowest remaining number off the end of the list.
        numbers.reverse()
        # This only works in Python 1.6 or later;
        # before that str() added 'L':
        self.boxes = [str(number) for number in numbers]
        self.factory = factory

    def __iter__(self):
        # Two-argument iter(): call next() repeatedly until it returns None.
        return iter(self.next, None)

    def next(self):
        """Return the next message, or None when none are left."""
        if not self.boxes:
            return None
        fn = self.boxes.pop()
        fp = open(os.path.join(self.dirname, fn))
        try:
            msg = self.factory(fp)
        except:
            # Do not leak the open file when the factory fails.
            fp.close()
            raise
        try:
            msg._mh_msgno = fn
        except (AttributeError, TypeError):
            # Some factory results do not accept new attributes; the
            # message number is then simply not recorded.
            pass
        return msg
Guido van Rossum8ca84201998-03-26 20:56:10 +00002063
Guido van Rossum9a4d6371998-12-23 22:05:42 +00002064
class BabylMailbox(_Mailbox):
    """Legacy reader for Babyl files."""

    def _search_start(self):
        # Read up to and including the next '*** EOOH ***' line, so the file
        # is left positioned on the line that follows it.
        while True:
            text = self.fp.readline()
            if not text:
                raise EOFError
            if text == '*** EOOH ***\n':
                break

    def _search_end(self):
        while True:
            here = self.fp.tell()
            text = self.fp.readline()
            if not text:
                # End of file also ends the message.
                return
            # A bare '\037' is a final line with no newline after it.
            if text in ('\037\014\n', '\037'):
                # Step back so the terminator itself is not consumed.
                self.fp.seek(here)
                return
Guido van Rossumfdf58fe1997-05-15 14:33:09 +00002084
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00002085## End: classes from the original module (for backward compatibility).
Guido van Rossum62448671996-09-17 21:33:15 +00002086
2087
class Error(Exception):
    """Base class for the errors that are specific to this module."""
2090
class NoSuchMailboxError(Error):
    """Raised when the requested mailbox is missing and won't be created."""
2093
class NotEmptyError(Error):
    """Raised when deletion is requested for a mailbox that is not empty."""
2096
class ExternalClashError(Error):
    """Raised when an action fails because of another process."""
2099
class FormatError(Error):
    """Raised when a file does not appear to be in a valid format."""