blob: 305b2d2449241c4229c712e59238fa84699a3ee7 [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum62448671996-09-17 21:33:15 +00002
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
# Notes for authors of new mailbox subclasses:
#
# Remember to fsync() changes to disk before closing a modified file
# or returning from a flush() method.  See functions _sync_flush() and
# _sync_close().
10
Martin v. Löwis08041d52006-05-04 14:27:52 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000013import time
14import calendar
15import socket
16import errno
17import copy
18import email
Georg Brandl5a096e12007-01-22 19:40:21 +000019import email.message
20import email.generator
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000021import rfc822
22import StringIO
23try:
Andrew MacIntyreafa358f2006-07-23 13:04:00 +000024 if sys.platform == 'os2emx':
25 # OS/2 EMX fcntl() not adequate
26 raise ImportError
Andrew M. Kuchlinga7ee9eb2006-06-26 13:08:24 +000027 import fcntl
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000028except ImportError:
29 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000030
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000031__all__ = [ 'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
32 'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
33 'BabylMessage', 'MMDFMessage', 'UnixMailbox',
34 'PortableUnixMailbox', 'MmdfMailbox', 'MHMailbox', 'BabylMailbox' ]
35
class Mailbox:
    """A group of messages in a particular place.

    This base class builds the dictionary-like convenience methods (get,
    pop, popitem, update, iteration, ...) on top of a handful of
    primitives.  Each primitive here raises NotImplementedError and must
    be overridden by a concrete mailbox format.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded and made absolute.  factory, when true, is
        called by __getitem__() with a file-like object to build each
        message.  create is accepted for the benefit of subclasses; this
        base class does not use it.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Support ``del mailbox[key]`` by delegating to remove()."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist."""
        if self._factory:
            # A custom factory is fed the file-like form of the message.
            return self._factory(self.get_file(key))
        return self.get_message(key)

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages.

        Keys whose message has disappeared by the time it is fetched
        (KeyError) are silently skipped.
        """
        for key in self.iterkeys():
            try:
                message = self[key]
            except KeyError:
                continue
            yield message

    def __iter__(self):
        """Iterate over messages (not keys)."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples.

        Keys whose message has disappeared by the time it is fetched
        (KeyError) are silently skipped.
        """
        for key in self.iterkeys():
            try:
                message = self[key]
            except KeyError:
                continue
            yield (key, message)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def has_key(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __contains__(self, key):
        """Support ``key in mailbox`` by delegating to has_key()."""
        return self.has_key(key)

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        # Iterate over a snapshot of the keys: discarding while walking a
        # live key iterator can fail if the subclass's iterator is backed
        # by the container being modified.
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            message = self[key]
        except KeyError:
            return default
        self.discard(key)
        return message

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError if the mailbox is empty.
        """
        for key in self.iterkeys():
            # Only the first key is ever used.
            return (key, self.pop(key))
        raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be a mapping (anything with iteritems() or items()) or an
        iterable of (key, message) pairs.  Calling update() with no
        argument is a no-op.  Every pair is attempted; if any key does
        not exist a single KeyError is raised after the loop finishes.
        """
        if arg is None:
            # The signature advertises arg as optional; iterating None
            # would raise TypeError, so treat it as "nothing to update".
            return
        if hasattr(arg, 'iteritems'):
            pairs = arg.iteritems()
        elif hasattr(arg, 'items'):
            pairs = arg.items()
        else:
            pairs = arg
        missing_key = False
        for key, message in pairs:
            try:
                self[key] = message
            except KeyError:
                missing_key = True
        if missing_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _dump_message(self, message, target, mangle_from_=False):
        """Dump message contents to target file.

        message may be an email.message.Message, a str, or an object with
        a readline() method (detected via a 'read' attribute).  When
        mangle_from_ is true, body lines starting with 'From ' are
        escaped as '>From '.  Any other message type raises TypeError.
        """
        # Most files are opened in binary mode to allow predictable seeking.
        # To get native line endings on disk, the user-friendly \n line
        # endings used in strings and by email.Message are translated here.
        if isinstance(message, email.message.Message):
            flattened = StringIO.StringIO()
            email.generator.Generator(flattened, mangle_from_, 0).flatten(
                message)
            flattened.seek(0)
            target.write(flattened.read().replace('\n', os.linesep))
        elif isinstance(message, str):
            if mangle_from_:
                message = message.replace('\nFrom ', '\n>From ')
            target.write(message.replace('\n', os.linesep))
        elif hasattr(message, 'read'):
            # readline() returns '' at end of file.
            for line in iter(message.readline, ''):
                if mangle_from_ and line.startswith('From '):
                    line = '>From ' + line[5:]
                target.write(line.replace('\n', os.linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
221
222
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages live as individual files under the 'new' and 'cur'
    subdirectories; 'tmp' holds files that are still being written.
    Keys are the unique part of a file name (everything before `colon`).
    """

    # Separator between a message's unique name and its info suffix.
    colon = ':'

    def __init__(self, dirname, factory=rfc822.Message, create=True):
        """Initialize a Maildir instance.

        If the directory does not exist it is created (with tmp/new/cur
        subdirectories) when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        if not os.path.exists(self._path):
            if not create:
                raise NoSuchMailboxError(self._path)
            os.mkdir(self._path, 0o700)
            for subdir in ('tmp', 'new', 'cur'):
                os.mkdir(os.path.join(self._path, subdir), 0o700)
        self._toc = {}
        self._last_read = None  # Records last time we read cur/new

    def add(self, message):
        """Add message and return assigned key.

        The message is written to a fresh file in tmp/ and then moved
        into its destination subdirectory.  Raises ExternalClashError if
        the destination name already exists.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        except BaseException:
            # Do not leave a half-written file behind in tmp/ when the
            # message could not be dumped.
            tmp_file.close()
            os.remove(tmp_file.name)
            raise
        _sync_close(tmp_file)
        is_maildir_message = isinstance(message, MaildirMessage)
        if is_maildir_message:
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                suffix = ''
        else:
            subdir, suffix = 'new', ''
        uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        try:
            if hasattr(os, 'link'):
                # link() fails if dest exists, so nothing is overwritten.
                os.link(tmp_file.name, dest)
                os.remove(tmp_file.name)
            else:
                os.rename(tmp_file.name, dest)
        except OSError as e:
            os.remove(tmp_file.name)
            if e.errno == errno.EEXIST:
                raise ExternalClashError('Name clash with existing message: %s'
                                         % dest)
            raise
        if is_maildir_message:
            os.utime(dest, (os.path.getatime(dest), message.get_date()))
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        os.remove(os.path.join(self._path, self._lookup(key)))

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass:
        # the file may also vanish between lookup and removal (ENOENT).
        try:
            self.remove(key)
        except KeyError:
            pass
        except OSError as e:
            if e.errno != errno.ENOENT:
                raise

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        is_maildir_message = isinstance(message, MaildirMessage)
        if is_maildir_message:
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        else:
            suffix = ''
        self.discard(key)
        new_path = os.path.join(self._path, subdir, key + suffix)
        os.rename(os.path.join(self._path, temp_subpath), new_path)
        if is_maildir_message:
            os.utime(new_path, (os.path.getatime(new_path),
                                message.get_date()))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The returned message has its subdir, info and date set from the
        file's location, name suffix and modification time.
        """
        subpath = self._lookup(key)
        full_path = os.path.join(self._path, subpath)
        f = open(full_path, 'r')
        try:
            if self._factory:
                msg = self._factory(f)
            else:
                msg = MaildirMessage(f)
        finally:
            f.close()
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(full_path))
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        f = open(os.path.join(self._path, self._lookup(key)), 'r')
        try:
            return f.read()
        finally:
            f.close()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        f = open(os.path.join(self._path, self._lookup(key)), 'rb')
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                # The message disappeared since the table was built.
                continue
            yield key

    def has_key(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        return  # Maildir changes are always written immediately.

    def lock(self):
        """Lock the mailbox (a no-op for Maildir)."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked (a no-op for Maildir)."""
        return

    def close(self):
        """Flush and close the mailbox (a no-op for Maildir)."""
        return

    def list_folders(self):
        """Return a list of folder names.

        Folders are subdirectories whose name starts with a dot; the
        leading dot is stripped from the returned names.
        """
        return [entry[1:] for entry in os.listdir(self._path)
                if len(entry) > 1 and entry[0] == '.' and
                os.path.isdir(os.path.join(self._path, entry))]

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        return Maildir(os.path.join(self._path, '.' + folder),
                       factory=self._factory,
                       create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it."""
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        maildirfolder_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(maildirfolder_path):
            # Create the empty 'maildirfolder' marker file.
            os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY,
                             0o666))
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        Raises NotEmptyError if new/ or cur/ holds a non-dot entry or if
        the folder contains a subdirectory other than new, cur and tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        entries = (os.listdir(os.path.join(path, 'new')) +
                   os.listdir(os.path.join(path, 'cur')))
        for entry in entries:
            if not entry.startswith('.'):
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry not in ('new', 'cur', 'tmp') and \
               os.path.isdir(os.path.join(path, entry)):
                # The quoted name is the offending subdirectory; the
                # folder name follows the colon as in the message above.
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (entry, folder))
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp"."""
        now = time.time()
        tmp_dir = os.path.join(self._path, 'tmp')
        for entry in os.listdir(tmp_dir):
            path = os.path.join(tmp_dir, entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        Raises ExternalClashError if the generated name already exists.
        """
        now = time.time()
        # '/' and ':' cannot appear in the file name; escape them.
        hostname = socket.gethostname()
        hostname = hostname.replace('/', r'\057').replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except OSError as stat_error:
            if stat_error.errno != errno.ENOENT:
                raise
            Maildir._count += 1
            try:
                return _create_carefully(path)
            except OSError as create_error:
                if create_error.errno != errno.EEXIST:
                    raise

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping."""
        if self._last_read is not None:
            for subdir in ('new', 'cur'):
                mtime = os.path.getmtime(os.path.join(self._path, subdir))
                if mtime > self._last_read:
                    break
            else:
                # Neither directory changed since the last scan.
                return

        # We record the current time - 1sec so that, if _refresh() is called
        # again in the same second, we will always re-read the mailbox
        # just in case it's been modified.  (os.path.mtime() only has
        # 1sec resolution.)  This results in a few unnecessary re-reads
        # when _refresh() is called multiple times in the same second,
        # but once the clock ticks over, we will only re-read as needed.
        now = time.time() - 1

        self._toc = {}
        for subdir in ('new', 'cur'):
            dir_path = os.path.join(self._path, subdir)
            for entry in os.listdir(dir_path):
                if os.path.isdir(os.path.join(dir_path, entry)):
                    continue
                uniq = entry.split(self.colon)[0]
                self._toc[uniq] = os.path.join(subdir, entry)

        self._last_read = now

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        try:
            if os.path.exists(os.path.join(self._path, self._toc[key])):
                return self._toc[key]
        except KeyError:
            pass
        # Unknown key or stale path: rescan the directories and retry.
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration."""
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = self.iterkeys()
        while True:
            try:
                return self[self._onetime_keys.next()]
            except StopIteration:
                return None
            except KeyError:
                continue
521
522
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    Messages are tracked in self._toc, a mapping from integer key to
    the (start, stop) byte offsets of the message in self._file.
    Subclasses provide _generate_toc() and _install_message().
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        A missing file is created when create is true, otherwise
        NoSuchMailboxError is raised.  If the file cannot be opened for
        updating (EACCES) it is opened read-only instead.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            f = open(self._path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                if not create:
                    raise NoSuchMailboxError(self._path)
                f = open(self._path, 'wb+')
            elif e.errno == errno.EACCES:
                f = open(self._path, 'rb')
            else:
                raise
        self._file = f
        self._toc = None
        self._next_key = 0
        self._pending = False   # No changes require rewriting the file.
        self._locked = False
        self._file_length = None    # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        key = self._next_key
        self._toc[key] = self._append_message(message)
        self._next_key = key + 1
        self._pending = True
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        for key in self._toc.keys():
            yield key

    def has_key(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        The surviving messages are copied, in key order, into a
        temporary file which then replaces the mailbox file.  Raises
        ExternalClashError if the mailbox file's size differs from the
        size recorded when it was last scanned or appended to.
        """
        if not self._pending:
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc.keys()):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                while True:
                    # Copy in 4 KiB chunks without reading past `stop`.
                    chunk = self._file.read(min(4096,
                                                stop - self._file.tell()))
                    if not chunk:
                        break
                    new_file.write(chunk)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
            # Size of the rewritten mailbox, recorded below so that the
            # clash check in the next flush() compares against the file
            # we actually wrote rather than the one we replaced.
            new_length = new_file.tell()
        except:
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        try:
            os.rename(new_file.name, self._path)
        except OSError as e:
            if e.errno == errno.EEXIST or \
               (os.name == 'os2' and e.errno == errno.EACCES):
                # Rename refused to overwrite: remove the target first.
                os.remove(self._path)
                os.rename(new_file.name, self._path)
            else:
                raise
        self._file = open(self._path, 'rb+')
        self._toc = new_toc
        self._file_length = new_length
        self._pending = False
        if self._locked:
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox."""
        self.flush()
        if self._locked:
            self.unlock()
        self._file.close()  # Sync has been done by self.flush() above.

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        Generates the table of contents on first use.  With key=None
        nothing is looked up and None is returned.
        """
        if self._toc is None:
            self._generate_toc()
        if key is not None:
            try:
                return self._toc[key]
            except KeyError:
                raise KeyError('No message with key: %s' % key)

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets."""
        self._file.seek(0, 2)
        self._pre_message_hook(self._file)
        offsets = self._install_message(message)
        self._post_message_hook(self._file)
        self._file.flush()
        self._file_length = self._file.tell()  # Record current length of mailbox
        return offsets
692
693
694
class _mboxMMDF(_singlefileMailbox):
    """An mbox or MMDF mailbox.

    Each stored message starts with a 'From ' line; subclasses set
    self._message_factory to the message class to instantiate.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        start, stop = self._lookup(key)
        self._file.seek(start)
        from_line = self._file.readline().replace(os.linesep, '')
        body = self._file.read(stop - self._file.tell())
        msg = self._message_factory(body.replace(os.linesep, '\n'))
        # Drop the leading 'From ' (5 characters) from the envelope line.
        msg.set_from(from_line[5:])
        return msg

    def get_string(self, key, from_=False):
        """Return a string representation or raise a KeyError.

        The 'From ' line is included only when from_ is true.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        if not from_:
            self._file.readline()
        text = self._file.read(stop - self._file.tell())
        return text.replace(os.linesep, '\n')

    def get_file(self, key, from_=False):
        """Return a file-like representation or raise a KeyError.

        The 'From ' line is included only when from_ is true.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        if not from_:
            self._file.readline()
        return _PartialFile(self._file, self._file.tell(), stop)

    def _install_message(self, message):
        """Format a message and blindly write to self._file."""
        from_line = None
        if isinstance(message, str) and message.startswith('From '):
            # Split the envelope line off the front of the string; with
            # no newline the whole string is the envelope line.
            from_line, _, message = message.partition('\n')
        elif isinstance(message, _mboxMMDFMessage):
            from_line = 'From ' + message.get_from()
        elif isinstance(message, email.message.Message):
            from_line = message.get_unixfrom()  # May be None.
        if from_line is None:
            from_line = 'From MAILER-DAEMON %s' % time.asctime(time.gmtime())
        start = self._file.tell()
        self._file.write(from_line + os.linesep)
        self._dump_message(message, self._file, self._mangle_from_)
        return (start, self._file.tell())
749
750
class mbox(_mboxMMDF):
    """A classic mbox mailbox."""

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Initialize an mbox mailbox."""
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        # Separate messages with a blank line, except at the very start.
        if f.tell() != 0:
            f.write(os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        starts = []
        stops = []
        separator_len = len(os.linesep)
        self._file.seek(0)
        while True:
            offset = self._file.tell()
            line = self._file.readline()
            if line.startswith('From '):
                if len(stops) < len(starts):
                    # Close the previous message, excluding the blank
                    # separator line that precedes this 'From ' line.
                    stops.append(offset - separator_len)
                starts.append(offset)
            elif line == '':
                # End of file also ends the last message.
                stops.append(offset)
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._next_key = len(self._toc)
        self._file_length = self._file.tell()
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000783
784
class MMDF(_mboxMMDF):
    """An MMDF mailbox."""

    def __init__(self, path, factory=None, create=True):
        """Initialize an MMDF mailbox."""
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\001\001\001\001' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\001\001\001\001' + os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        delimiter = '\001\001\001\001' + os.linesep
        starts = []
        stops = []
        self._file.seek(0)
        while True:
            line = self._file.readline()
            after_line = self._file.tell()
            if line.startswith(delimiter):
                # Opening delimiter: the message begins right after it.
                starts.append(after_line)
                while True:
                    before_line = after_line
                    line = self._file.readline()
                    after_line = self._file.tell()
                    if line == delimiter:
                        # Closing delimiter; exclude the line separator
                        # written in front of it.
                        stops.append(before_line - len(os.linesep))
                        break
                    elif line == '':
                        # File ended without a closing delimiter.
                        stops.append(before_line)
                        break
            elif line == '':
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000828
829
830class MH(Mailbox):
831 """An MH mailbox."""
832
833 def __init__(self, path, factory=None, create=True):
834 """Initialize an MH instance."""
835 Mailbox.__init__(self, path, factory, create)
836 if not os.path.exists(self._path):
837 if create:
838 os.mkdir(self._path, 0700)
839 os.close(os.open(os.path.join(self._path, '.mh_sequences'),
840 os.O_CREAT | os.O_EXCL | os.O_WRONLY, 0600))
841 else:
842 raise NoSuchMailboxError(self._path)
843 self._locked = False
844
845 def add(self, message):
846 """Add message and return assigned key."""
847 keys = self.keys()
848 if len(keys) == 0:
849 new_key = 1
850 else:
851 new_key = max(keys) + 1
852 new_path = os.path.join(self._path, str(new_key))
853 f = _create_carefully(new_path)
854 try:
855 if self._locked:
856 _lock_file(f)
857 try:
858 self._dump_message(message, f)
859 if isinstance(message, MHMessage):
860 self._dump_sequences(message, new_key)
861 finally:
862 if self._locked:
863 _unlock_file(f)
864 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000865 _sync_close(f)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000866 return new_key
867
868 def remove(self, key):
869 """Remove the keyed message; raise KeyError if it doesn't exist."""
870 path = os.path.join(self._path, str(key))
871 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000872 f = open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000873 except IOError, e:
874 if e.errno == errno.ENOENT:
875 raise KeyError('No message with key: %s' % key)
876 else:
877 raise
878 try:
879 if self._locked:
880 _lock_file(f)
881 try:
882 f.close()
883 os.remove(os.path.join(self._path, str(key)))
884 finally:
885 if self._locked:
886 _unlock_file(f)
887 finally:
888 f.close()
889
890 def __setitem__(self, key, message):
891 """Replace the keyed message; raise KeyError if it doesn't exist."""
892 path = os.path.join(self._path, str(key))
893 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000894 f = open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000895 except IOError, e:
896 if e.errno == errno.ENOENT:
897 raise KeyError('No message with key: %s' % key)
898 else:
899 raise
900 try:
901 if self._locked:
902 _lock_file(f)
903 try:
904 os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
905 self._dump_message(message, f)
906 if isinstance(message, MHMessage):
907 self._dump_sequences(message, key)
908 finally:
909 if self._locked:
910 _unlock_file(f)
911 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000912 _sync_close(f)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000913
914 def get_message(self, key):
915 """Return a Message representation or raise a KeyError."""
916 try:
917 if self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000918 f = open(os.path.join(self._path, str(key)), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000919 else:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000920 f = open(os.path.join(self._path, str(key)), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000921 except IOError, e:
922 if e.errno == errno.ENOENT:
923 raise KeyError('No message with key: %s' % key)
924 else:
925 raise
926 try:
927 if self._locked:
928 _lock_file(f)
929 try:
930 msg = MHMessage(f)
931 finally:
932 if self._locked:
933 _unlock_file(f)
934 finally:
935 f.close()
R. David Murray52720c52009-04-02 14:05:35 +0000936 for name, key_list in self.get_sequences().iteritems():
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000937 if key in key_list:
938 msg.add_sequence(name)
939 return msg
940
941 def get_string(self, key):
942 """Return a string representation or raise a KeyError."""
943 try:
944 if self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000945 f = open(os.path.join(self._path, str(key)), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000946 else:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000947 f = open(os.path.join(self._path, str(key)), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000948 except IOError, e:
949 if e.errno == errno.ENOENT:
950 raise KeyError('No message with key: %s' % key)
951 else:
952 raise
953 try:
954 if self._locked:
955 _lock_file(f)
956 try:
957 return f.read()
958 finally:
959 if self._locked:
960 _unlock_file(f)
961 finally:
962 f.close()
963
964 def get_file(self, key):
965 """Return a file-like representation or raise a KeyError."""
966 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000967 f = open(os.path.join(self._path, str(key)), 'rb')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000968 except IOError, e:
969 if e.errno == errno.ENOENT:
970 raise KeyError('No message with key: %s' % key)
971 else:
972 raise
973 return _ProxyFile(f)
974
975 def iterkeys(self):
976 """Return an iterator over keys."""
977 return iter(sorted(int(entry) for entry in os.listdir(self._path)
978 if entry.isdigit()))
979
980 def has_key(self, key):
981 """Return True if the keyed message exists, False otherwise."""
982 return os.path.exists(os.path.join(self._path, str(key)))
983
984 def __len__(self):
985 """Return a count of messages in the mailbox."""
986 return len(list(self.iterkeys()))
987
988 def lock(self):
989 """Lock the mailbox."""
990 if not self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000991 self._file = open(os.path.join(self._path, '.mh_sequences'), 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000992 _lock_file(self._file)
993 self._locked = True
994
995 def unlock(self):
996 """Unlock the mailbox if it is locked."""
997 if self._locked:
998 _unlock_file(self._file)
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000999 _sync_close(self._file)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001000 del self._file
1001 self._locked = False
1002
1003 def flush(self):
1004 """Write any pending changes to the disk."""
1005 return
1006
1007 def close(self):
1008 """Flush and close the mailbox."""
1009 if self._locked:
1010 self.unlock()
1011
1012 def list_folders(self):
1013 """Return a list of folder names."""
1014 result = []
1015 for entry in os.listdir(self._path):
1016 if os.path.isdir(os.path.join(self._path, entry)):
1017 result.append(entry)
1018 return result
1019
1020 def get_folder(self, folder):
1021 """Return an MH instance for the named folder."""
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +00001022 return MH(os.path.join(self._path, folder),
1023 factory=self._factory, create=False)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001024
1025 def add_folder(self, folder):
1026 """Create a folder and return an MH instance representing it."""
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +00001027 return MH(os.path.join(self._path, folder),
1028 factory=self._factory)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001029
1030 def remove_folder(self, folder):
1031 """Delete the named folder, which must be empty."""
1032 path = os.path.join(self._path, folder)
1033 entries = os.listdir(path)
1034 if entries == ['.mh_sequences']:
1035 os.remove(os.path.join(path, '.mh_sequences'))
1036 elif entries == []:
1037 pass
1038 else:
1039 raise NotEmptyError('Folder not empty: %s' % self._path)
1040 os.rmdir(path)
1041
1042 def get_sequences(self):
1043 """Return a name-to-key-list dictionary to define each sequence."""
1044 results = {}
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001045 f = open(os.path.join(self._path, '.mh_sequences'), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001046 try:
1047 all_keys = set(self.keys())
1048 for line in f:
1049 try:
1050 name, contents = line.split(':')
1051 keys = set()
1052 for spec in contents.split():
1053 if spec.isdigit():
1054 keys.add(int(spec))
1055 else:
1056 start, stop = (int(x) for x in spec.split('-'))
1057 keys.update(range(start, stop + 1))
1058 results[name] = [key for key in sorted(keys) \
1059 if key in all_keys]
1060 if len(results[name]) == 0:
1061 del results[name]
1062 except ValueError:
1063 raise FormatError('Invalid sequence specification: %s' %
1064 line.rstrip())
1065 finally:
1066 f.close()
1067 return results
1068
1069 def set_sequences(self, sequences):
1070 """Set sequences using the given name-to-key-list dictionary."""
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001071 f = open(os.path.join(self._path, '.mh_sequences'), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001072 try:
1073 os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
1074 for name, keys in sequences.iteritems():
1075 if len(keys) == 0:
1076 continue
1077 f.write('%s:' % name)
1078 prev = None
1079 completing = False
1080 for key in sorted(set(keys)):
1081 if key - 1 == prev:
1082 if not completing:
1083 completing = True
1084 f.write('-')
1085 elif completing:
1086 completing = False
1087 f.write('%s %s' % (prev, key))
1088 else:
1089 f.write(' %s' % key)
1090 prev = key
1091 if completing:
1092 f.write(str(prev) + '\n')
1093 else:
1094 f.write('\n')
1095 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +00001096 _sync_close(f)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001097
1098 def pack(self):
1099 """Re-name messages to eliminate numbering gaps. Invalidates keys."""
1100 sequences = self.get_sequences()
1101 prev = 0
1102 changes = []
1103 for key in self.iterkeys():
1104 if key - 1 != prev:
1105 changes.append((key, prev + 1))
Andrew M. Kuchling8c456f32006-11-17 13:30:25 +00001106 if hasattr(os, 'link'):
1107 os.link(os.path.join(self._path, str(key)),
1108 os.path.join(self._path, str(prev + 1)))
1109 os.unlink(os.path.join(self._path, str(key)))
1110 else:
1111 os.rename(os.path.join(self._path, str(key)),
1112 os.path.join(self._path, str(prev + 1)))
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001113 prev += 1
1114 self._next_key = prev + 1
1115 if len(changes) == 0:
1116 return
1117 for name, key_list in sequences.items():
1118 for old, new in changes:
1119 if old in key_list:
1120 key_list[key_list.index(old)] = new
1121 self.set_sequences(sequences)
1122
1123 def _dump_sequences(self, message, key):
1124 """Inspect a new MHMessage and update sequences appropriately."""
1125 pending_sequences = message.get_sequences()
1126 all_sequences = self.get_sequences()
1127 for name, key_list in all_sequences.iteritems():
1128 if name in pending_sequences:
1129 key_list.append(key)
1130 elif key in key_list:
1131 del key_list[key_list.index(key)]
1132 for sequence in pending_sequences:
1133 if sequence not in all_sequences:
1134 all_sequences[sequence] = [key]
1135 self.set_sequences(all_sequences)
1136
1137
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox.

    Besides the table of contents kept by _singlefileMailbox, the mailbox
    keeps self._labels, a dictionary mapping message keys to label lists.
    """

    # Labels with a predefined meaning; get_labels() leaves them out and
    # _install_message() writes them ahead of the user-defined labels.
    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        self._labels = {}

    def add(self, message):
        """Add message and return assigned key.

        The labels of a BabylMessage are remembered under the new key.
        """
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The result is a BabylMessage built from the original headers and the
        body, carrying the stored visible headers and any labels known for
        key.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or line == '':
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        visible_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == os.linesep or line == '':
                break
            visible_headers.write(line.replace(os.linesep, '\n'))
        body = self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError.

        The string consists of the original headers followed by the body;
        the visible-headers section is skipped.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or line == '':
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        # Skip the visible headers, up to and including the blank line.
        while True:
            line = self._file.readline()
            if line == os.linesep or line == '':
                break
        return original_headers.getvalue() + \
               self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError.

        The result is an in-memory StringIO using os.linesep line endings.
        """
        return StringIO.StringIO(self.get_string(key).replace('\n',
                                                              os.linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox."""
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents.

        Also rebuilds self._labels from each message's label line and records
        the next key and the file length.
        """
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == '\037\014' + os.linesep:
                # End of the previous section and start of a new message.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
                starts.append(next_pos)
                labels = [label.strip() for label
                                        in self._file.readline()[1:].split(',')
                                        if label.strip() != '']
                label_lists.append(labels)
            elif line == '\037' or line == '\037' + os.linesep:
                # Terminator without a following message.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
            elif line == '':
                # End of file.
                stops.append(line_pos - len(os.linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        f.write('BABYL OPTIONS:%sVersion: 5%sLabels:%s%s\037' %
                (os.linesep, os.linesep, ','.join(self.get_labels()),
                 os.linesep))

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\014' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        message may be an email.message.Message (including BabylMessage), a
        string, or an object with a readline() method; anything else raises
        TypeError.  The label line comes first, then the original headers,
        the '*** EOOH ***' marker, the visible headers and finally the body.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write('1')
            for label in special_labels:
                self._file.write(', ' + label)
            self._file.write(',,')
            for label in labels:
                self._file.write(' ' + label + ',')
            self._file.write(os.linesep)
        else:
            self._file.write('1,,' + os.linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = StringIO.StringIO()
            orig_generator = email.generator.Generator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or line == '':
                    break
            self._file.write('*** EOOH ***' + os.linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = StringIO.StringIO()
                vis_generator = email.generator.Generator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # Rewind before reading: flatten() leaves the position at the
                # end of the buffer, so without this the loop below would see
                # an empty read at once and write no visible headers at all.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or line == '':
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or line == '':
                        break
            while True:
                chunk = orig_buffer.read(4096) # Buffer size is arbitrary.
                if chunk == '':
                    break
                self._file.write(chunk.replace('\n', os.linesep))
        elif isinstance(message, str):
            body_start = message.find('\n\n') + 2
            if body_start - 2 != -1:
                # Headers are written twice: as original and as visible.
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write('*** EOOH ***' + os.linesep)
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write(message[body_start:].replace('\n',
                                                              os.linesep))
            else:
                # No blank line found: treat the whole string as the body.
                self._file.write('*** EOOH ***' + os.linesep + os.linesep)
                self._file.write(message.replace('\n', os.linesep))
        elif hasattr(message, 'readline'):
            original_pos = message.tell()
            first_pass = True
            while True:
                line = message.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or line == '':
                    self._file.write('*** EOOH ***' + os.linesep)
                    if first_pass:
                        # Read the headers a second time.
                        first_pass = False
                        message.seek(original_pos)
                    else:
                        break
            while True:
                chunk = message.read(4096)     # Buffer size is arbitrary.
                if chunk == '':
                    break
                self._file.write(chunk.replace('\n', os.linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1357
1358
class Message(email.message.Message):
    """An email message that can carry mailbox-format-specific state."""

    def __init__(self, message=None):
        """Build a Message from another message, a string, a file, or nothing.

        An email.message.Message is deep-copied; if it is also a Message from
        this module it is asked to transfer its format-specific state.  A
        string or an object with a read() method is parsed with the email
        package.  Any other non-None value raises TypeError.
        """
        if message is None:
            email.message.Message.__init__(self)
        elif isinstance(message, email.message.Message):
            self._become_message(copy.deepcopy(message))
            if isinstance(message, Message):
                message._explain_to(self)
        elif isinstance(message, str):
            self._become_message(email.message_from_string(message))
        elif hasattr(message, "read"):
            self._become_message(email.message_from_file(message))
        else:
            raise TypeError('Invalid message type: %s' % type(message))

    def _become_message(self, message):
        """Take over the generic email state held in message's __dict__."""
        shared = ('_headers', '_unixfrom', '_payload', '_charset',
                  'preamble', 'epilogue', 'defects', '_default_type')
        for attribute in shared:
            self.__dict__[attribute] = message.__dict__[attribute]

    def _explain_to(self, message):
        """Copy format-specific state to message insofar as possible.

        A plain Message has none, so this only checks the target's type.
        """
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
        # There's nothing format-specific to explain.
        return
1389
1390
class MaildirMessage(Message):
    """Message carrying Maildir state: subdirectory, info string and date."""

    def __init__(self, message=None):
        """Initialize a MaildirMessage instance.

        Defaults are subdirectory 'new', an empty info string and the current
        time as delivery date; they are set before message is processed.
        """
        self._subdir, self._info = 'new', ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return the subdirectory name, 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set the subdirectory; raise ValueError unless 'new' or 'cur'."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return the flags as a string ('' unless info starts with '2,')."""
        if not self._info.startswith('2,'):
            return ''
        return self._info[2:]

    def set_flags(self, flags):
        """Replace all flags with the given ones, stored in sorted order."""
        ordered = sorted(flags)
        self._info = '2,' + ''.join(ordered)

    def add_flag(self, flag):
        """Set the given flag(s) while keeping those already set."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given flag(s) while keeping the others."""
        current = self.get_flags()
        if current != '':
            self.set_flags(''.join(set(current) - set(flag)))

    def get_date(self):
        """Return the delivery date in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set the delivery date in seconds since the epoch.

        Raises TypeError if date cannot be converted to a float.
        """
        try:
            self._date = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)

    def get_info(self):
        """Return the raw "info" string."""
        return self._info

    def set_info(self, info):
        """Set the raw "info" string; raise TypeError if it is not a str."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Copy Maildir-specific state to message insofar as possible.

        Flags, subdirectory and date are translated to whatever equivalent
        the target type offers; a plain Message receives nothing.  Raises
        TypeError for any other target.
        """
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
        elif isinstance(message, _mboxMMDFMessage):
            flags = set(self.get_flags())
            if 'S' in flags:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            for maildir_flag, mbox_flag in (('T', 'D'), ('F', 'F'),
                                            ('R', 'A')):
                if maildir_flag in flags:
                    message.add_flag(mbox_flag)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_sequence('unseen')
            for maildir_flag, sequence in (('R', 'replied'),
                                           ('F', 'flagged')):
                if maildir_flag in flags:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'S' not in flags:
                message.add_label('unseen')
            for maildir_flag, label in (('T', 'deleted'), ('R', 'answered'),
                                        ('P', 'forwarded')):
                if maildir_flag in flags:
                    message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1496
1497
class _mboxMMDFMessage(Message):
    """Message with the state shared by mbox and MMDF: "From " line, flags."""

    def __init__(self, message=None):
        """Initialize an mboxMMDFMessage instance.

        The "From " line defaults to 'MAILER-DAEMON' plus the current time.
        If message is an email message whose unixfrom starts with 'From ',
        the remainder of that line is used instead.
        """
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()
            if envelope is not None and envelope.startswith('From '):
                self.set_from(envelope[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return the contents of the "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set the "From " line.

        If time_ is given it is formatted with time.asctime() and appended
        after a space; True stands for the current time.
        """
        if time_ is not None:
            stamp = time.gmtime() if time_ is True else time_
            from_ += ' ' + time.asctime(stamp)
        self._from = from_

    def get_flags(self):
        """Return the flags: the Status header followed by X-Status."""
        return self.get('Status', '') + self.get('X-Status', '')

    def set_flags(self, flags):
        """Set the given flags and unset all others.

        'R' and 'O' are stored in the Status header; 'D', 'F', 'A' and any
        other flags (sorted) in X-Status.  Both headers are always written.
        """
        remaining = set(flags)
        status_flags = ''.join(f for f in ('R', 'O') if f in remaining)
        xstatus_flags = ''.join(f for f in ('D', 'F', 'A') if f in remaining)
        remaining.difference_update('RODFA')
        xstatus_flags += ''.join(sorted(remaining))
        for header, value in (('Status', status_flags),
                              ('X-Status', xstatus_flags)):
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Set the given flag(s) while keeping those already set."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Unset the given flag(s); no-op when neither header is present."""
        if 'Status' in self or 'X-Status' in self:
            kept = set(self.get_flags()) - set(flag)
            self.set_flags(''.join(kept))

    def _explain_to(self, message):
        """Copy mbox- or MMDF-specific state to message insofar as possible.

        Flags are translated to the target's equivalents and, for targets of
        another format, the Status and X-Status headers are deleted from the
        target.  Raises TypeError for an unsupported target.
        """
        if isinstance(message, MaildirMessage):
            flags = set(self.get_flags())
            if 'O' in flags:
                message.set_subdir('cur')
            for mbox_flag, maildir_flag in (('F', 'F'), ('A', 'R'),
                                            ('R', 'S'), ('D', 'T')):
                if mbox_flag in flags:
                    message.add_flag(maildir_flag)
            del message['status']
            del message['x-status']
            # The last five words of the "From " line may be an asctime()
            # date; if they don't parse, the target's date is left alone.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
        elif isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
        elif isinstance(message, MHMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_sequence('unseen')
            for mbox_flag, sequence in (('A', 'replied'), ('F', 'flagged')):
                if mbox_flag in flags:
                    message.add_sequence(sequence)
            del message['status']
            del message['x-status']
        elif isinstance(message, BabylMessage):
            flags = set(self.get_flags())
            if 'R' not in flags:
                message.add_label('unseen')
            for mbox_flag, label in (('D', 'deleted'), ('A', 'answered')):
                if mbox_flag in flags:
                    message.add_label(label)
            del message['status']
            del message['x-status']
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1607
1608
class mboxMessage(_mboxMMDFMessage):
    """Message with mbox-specific properties.

    All behavior is inherited from _mboxMMDFMessage.
    """
1611
1612
class MHMessage(Message):
    """Message that remembers the names of the MH sequences it belongs to."""

    def __init__(self, message=None):
        """Initialize an MHMessage instance with no sequences."""
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a copy of the list of sequence names."""
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Replace the sequence names with a copy of sequences."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add a sequence name unless already present.

        Raises TypeError if sequence is not a str.
        """
        if not isinstance(sequence, str):
            raise TypeError('sequence must be a string: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Remove a sequence name; silently ignore names that are absent."""
        try:
            self._sequences.remove(sequence)
        except ValueError:
            pass

    def _explain_to(self, message):
        """Copy MH-specific state to message insofar as possible.

        Sequence membership is translated to the target's flags or labels;
        a plain Message receives nothing.  Raises TypeError for any other
        target.
        """
        if isinstance(message, MaildirMessage):
            sequences = set(self.get_sequences())
            # The subdirectory is 'cur' either way; only messages outside
            # 'unseen' get the S flag.
            message.set_subdir('cur')
            if 'unseen' not in sequences:
                message.add_flag('S')
            if 'flagged' in sequences:
                message.add_flag('F')
            if 'replied' in sequences:
                message.add_flag('R')
        elif isinstance(message, _mboxMMDFMessage):
            sequences = set(self.get_sequences())
            if 'unseen' in sequences:
                message.add_flag('O')
            else:
                message.add_flag('RO')
            if 'flagged' in sequences:
                message.add_flag('F')
            if 'replied' in sequences:
                message.add_flag('A')
        elif isinstance(message, MHMessage):
            for name in self.get_sequences():
                message.add_sequence(name)
        elif isinstance(message, BabylMessage):
            sequences = set(self.get_sequences())
            for name, label in (('unseen', 'unseen'),
                                ('replied', 'answered')):
                if name in sequences:
                    message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1681
1682
class BabylMessage(Message):
    """Message carrying Babyl state: a label list and visible headers."""

    def __init__(self, message=None):
        """Initialize a BabylMessage with no labels and empty visible headers."""
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a copy of the list of labels."""
        return list(self._labels)

    def set_labels(self, labels):
        """Replace the labels with a copy of labels."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add a label unless already present.

        Raises TypeError if label is not a str.
        """
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Remove a label; silently ignore labels that are absent."""
        try:
            self._labels.remove(label)
        except ValueError:
            pass

    def get_visible(self):
        """Return a new Message built from the visible headers."""
        return Message(self._visible)

    def set_visible(self, visible):
        """Store a new Message built from visible as the visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Bring the visible headers in line with the message's own headers.

        Visible headers still present in the message take its current value;
        the rest are deleted.  Then Date, From, Reply-To, To, CC and Subject
        are copied over when the message has them and they are not yet
        visible.
        """
        for header in self._visible.keys():
            if header not in self:
                del self._visible[header]
            else:
                self._visible.replace_header(header, self[header])
        for header in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if header in self and header not in self._visible:
                self._visible[header] = self[header]

    def _explain_to(self, message):
        """Copy Babyl-specific state to message insofar as possible.

        Labels are translated to the target's flags or sequences; a plain
        Message receives nothing.  Raises TypeError for any other target.
        """
        if isinstance(message, MaildirMessage):
            labels = set(self.get_labels())
            # The subdirectory is 'cur' either way; only messages not
            # labelled 'unseen' get the S flag.
            message.set_subdir('cur')
            if 'unseen' not in labels:
                message.add_flag('S')
            if 'forwarded' in labels or 'resent' in labels:
                message.add_flag('P')
            if 'answered' in labels:
                message.add_flag('R')
            if 'deleted' in labels:
                message.add_flag('T')
        elif isinstance(message, _mboxMMDFMessage):
            labels = set(self.get_labels())
            if 'unseen' in labels:
                message.add_flag('O')
            else:
                message.add_flag('RO')
            if 'deleted' in labels:
                message.add_flag('D')
            if 'answered' in labels:
                message.add_flag('A')
        elif isinstance(message, MHMessage):
            labels = set(self.get_labels())
            for label, sequence in (('unseen', 'unseen'),
                                    ('answered', 'replied')):
                if label in labels:
                    message.add_sequence(sequence)
        elif isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for label in self.get_labels():
                message.add_label(label)
        elif isinstance(message, Message):
            pass
        else:
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1774
1775
class MMDFMessage(_mboxMMDFMessage):
    """Message with MMDF-specific properties.

    All behavior is inherited from _mboxMMDFMessage.
    """
1778
1779
class _ProxyFile:
    """A read-only wrapper of a file.

    The proxy tracks its own position and seeks the wrapped file to that
    position before every read, so its reads do not depend on where the
    wrapped file's own position happens to be.
    """

    def __init__(self, f, pos=None):
        """Initialize a _ProxyFile.

        f is the file object to wrap.  pos is the proxy's initial position;
        when omitted, the current position of f is used.
        """
        self._file = f
        if pos is None:
            self._pos = f.tell()
        else:
            self._pos = pos

    def read(self, size=None):
        """Read up to size bytes (everything remaining if size is None)."""
        return self._read(size, self._file.read)

    def readline(self, size=None):
        """Read one line, or at most size bytes of it."""
        return self._read(size, self._file.readline)

    def readlines(self, sizehint=None):
        """Read multiple lines.

        When sizehint is given, reading stops after the first line that
        brings the total length read up to sizehint.
        """
        result = []
        for line in self:
            result.append(line)
            if sizehint is not None:
                sizehint -= len(line)
                if sizehint <= 0:
                    break
        return result

    def __iter__(self):
        """Iterate over lines until readline() returns an empty string."""
        return iter(self.readline, "")

    def tell(self):
        """Return the proxy's position."""
        return self._pos

    def seek(self, offset, whence=0):
        """Change position; offset and whence are as for file.seek()."""
        if whence == 1:
            # A relative seek must start from the proxy's position, not
            # from wherever the wrapped file currently is.
            self._file.seek(self._pos)
        self._file.seek(offset, whence)
        self._pos = self._file.tell()

    def close(self):
        """Drop the reference to the wrapped file without closing it.

        Calling close() more than once is harmless.
        """
        if hasattr(self, '_file'):
            del self._file

    def _read(self, size, read_method):
        """Read size bytes using read_method and record the new position."""
        if size is None:
            size = -1
        self._file.seek(self._pos)
        result = read_method(size)
        self._pos = self._file.tell()
        return result
1837
1838
class _PartialFile(_ProxyFile):
    """A read-only wrapper of part of a file.

    Positions reported by tell() and accepted by seek() are relative to
    the start of the wrapped region, and reads never go past its stop.
    """

    def __init__(self, f, start=None, stop=None):
        """Initialize a _PartialFile.

        start and stop are offsets into f.  If start is None the region
        begins at f's current position; if stop is None the region has no
        upper bound.
        """
        _ProxyFile.__init__(self, f, start)
        # _ProxyFile.__init__ has already resolved start=None to f.tell(),
        # so take the resolved value rather than storing None.
        self._start = self._pos
        self._stop = stop

    def tell(self):
        """Return the position with respect to start."""
        return _ProxyFile.tell(self) - self._start

    def seek(self, offset, whence=0):
        """Change position, possibly with respect to start or stop."""
        # Absolute and from-end seeks are turned into relative seeks from
        # the region's start or stop respectively.
        if whence == 0:
            self._pos = self._start
            whence = 1
        elif whence == 2:
            if self._stop is None:
                # Unbounded region: its end is the end of the file.
                self._file.seek(0, 2)
                self._pos = self._file.tell()
            else:
                self._pos = self._stop
            whence = 1
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, honoring start and stop."""
        if self._stop is None:
            return _ProxyFile._read(self, size, read_method)
        remaining = self._stop - self._pos
        if remaining <= 0:
            return ''
        if size is None or size < 0 or size > remaining:
            size = remaining
        return _ProxyFile._read(self, size, read_method)
1870
1871
1872def _lock_file(f, dotlock=True):
Andrew M. Kuchling55732592006-06-26 13:12:16 +00001873 """Lock file f using lockf and dot locking."""
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001874 dotlock_done = False
1875 try:
1876 if fcntl:
1877 try:
1878 fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
1879 except IOError, e:
Neal Norwitz7983c722006-06-28 05:03:22 +00001880 if e.errno in (errno.EAGAIN, errno.EACCES):
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001881 raise ExternalClashError('lockf: lock unavailable: %s' %
1882 f.name)
1883 else:
1884 raise
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001885 if dotlock:
1886 try:
1887 pre_lock = _create_temporary(f.name + '.lock')
1888 pre_lock.close()
1889 except IOError, e:
1890 if e.errno == errno.EACCES:
1891 return # Without write access, just skip dotlocking.
1892 else:
1893 raise
1894 try:
1895 if hasattr(os, 'link'):
1896 os.link(pre_lock.name, f.name + '.lock')
1897 dotlock_done = True
1898 os.unlink(pre_lock.name)
1899 else:
1900 os.rename(pre_lock.name, f.name + '.lock')
1901 dotlock_done = True
1902 except OSError, e:
Andrew MacIntyreafa358f2006-07-23 13:04:00 +00001903 if e.errno == errno.EEXIST or \
1904 (os.name == 'os2' and e.errno == errno.EACCES):
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001905 os.remove(pre_lock.name)
Tim Peters6d7cd7d2006-04-22 05:52:59 +00001906 raise ExternalClashError('dot lock unavailable: %s' %
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001907 f.name)
1908 else:
1909 raise
1910 except:
1911 if fcntl:
1912 fcntl.lockf(f, fcntl.LOCK_UN)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001913 if dotlock_done:
1914 os.remove(f.name + '.lock')
1915 raise
1916
1917def _unlock_file(f):
Andrew M. Kuchling55732592006-06-26 13:12:16 +00001918 """Unlock file f using lockf and dot locking."""
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001919 if fcntl:
1920 fcntl.lockf(f, fcntl.LOCK_UN)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001921 if os.path.exists(f.name + '.lock'):
1922 os.remove(f.name + '.lock')
1923
1924def _create_carefully(path):
1925 """Create a file if it doesn't exist and open for reading and writing."""
Andrew M. Kuchling70a6dbd2008-08-04 01:43:43 +00001926 fd = os.open(path, os.O_CREAT | os.O_EXCL | os.O_RDWR, 0666)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001927 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001928 return open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001929 finally:
1930 os.close(fd)
1931
def _create_temporary(path):
    """Create a temp file based on path and open for reading and writing.

    The file name is path followed by the current time in whole seconds,
    the host name and the process id, separated by dots.
    """
    timestamp = int(time.time())
    hostname = socket.gethostname()
    pid = os.getpid()
    temp_path = '%s.%s.%s.%s' % (path, timestamp, hostname, pid)
    return _create_carefully(temp_path)
1937
def _sync_flush(f):
    """Ensure changes to file f are physically on disk.

    Flushes f's buffers and, where the platform provides os.fsync(),
    calls it on f's file descriptor.
    """
    f.flush()
    fsync = getattr(os, 'fsync', None)
    if fsync is not None:
        fsync(f.fileno())
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +00001943
def _sync_close(f):
    """Close file f, ensuring all changes are physically on disk.

    f is closed even if flushing or syncing fails; the failure still
    propagates to the caller.
    """
    try:
        _sync_flush(f)
    finally:
        f.close()
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001948
1949## Start: classes from the original module (for backward compatibility).
1950
1951# Note that the Maildir class, whose name is unchanged, itself offers a next()
1952# method for backward compatibility.
Skip Montanaro17ab1232001-01-24 06:27:27 +00001953
class _Mailbox:
    """Base class of the old-style, read-only, single-file mailbox readers.

    Subclasses supply _search_start() and _search_end(), which position
    self.fp at the beginning and the end of the next message.
    """

    def __init__(self, fp, factory=rfc822.Message):
        """Read messages from file object fp, building each with factory."""
        self.fp = fp
        self.seekp = 0
        self.factory = factory

    def __iter__(self):
        """Iterate over messages until next() returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the next non-empty message, or None when none is left."""
        while True:
            self.fp.seek(self.seekp)
            try:
                self._search_start()
            except EOFError:
                # No further message: remember where the scan ended.
                self.seekp = self.fp.tell()
                return None
            start = self.fp.tell()
            self._search_end()
            stop = self.fp.tell()
            self.seekp = stop
            if start != stop:
                return self.factory(_PartialFile(self.fp, start, stop))
Guido van Rossumc7b68821994-04-28 09:53:33 +00001978
Barry Warsawffd05ee2002-03-01 22:39:14 +00001979# Recommended to use PortableUnixMailbox instead!
class UnixMailbox(_Mailbox):
    """Old-style reader for Unix mbox files, delimited by 'From ' lines."""

    def _search_start(self):
        """Leave self.fp at the next From_ line; raise EOFError if none."""
        while True:
            line_start = self.fp.tell()
            line = self.fp.readline()
            if not line:
                raise EOFError
            if line.startswith('From ') and self._isrealfromline(line):
                self.fp.seek(line_start)
                return

    def _search_end(self):
        """Leave self.fp at the following From_ line or at end of file."""
        self.fp.readline()      # Throw away header line
        while True:
            line_start = self.fp.tell()
            line = self.fp.readline()
            if not line:
                return
            if line.startswith('From ') and self._isrealfromline(line):
                self.fp.seek(line_start)
                return

    # An overridable mechanism to test for From-line-ness.  You can either
    # specify a different regular expression or define a whole new
    # _isrealfromline() method.  Note that this only gets called for lines
    # starting with the 5 characters "From ".
    #
    # BAW: According to
    #http://home.netscape.com/eng/mozilla/2.0/relnotes/demo/content-length.html
    # the only portable, reliable way to find message delimiters in a BSD (i.e.
    # Unix mailbox) style folder is to search for "\n\nFrom .*\n", or at the
    # beginning of the file, "^From .*\n".  While _fromlinepattern below seems
    # like a good idea, in practice, there are too many variations for more
    # strict parsing of the line to be completely accurate.
    #
    # _strict_isrealfromline() is the old version which tries to do stricter
    # parsing of the From_ line.  _portable_isrealfromline() simply returns
    # true, since it's never called if the line doesn't already start with
    # "From ".
    #
    # This algorithm, and the way it interacts with _search_start() and
    # _search_end() may not be completely correct, because it doesn't check
    # that the two characters preceding "From " are \n\n or the beginning of
    # the file.  Fixing this would require a more extensive rewrite than is
    # necessary.  For convenience, we've added a PortableUnixMailbox class
    # which does no checking of the format of the 'From' line.

    _fromlinepattern = (r"From \s*[^\s]+\s+\w\w\w\s+\w\w\w\s+\d?\d\s+"
                        r"\d?\d:\d\d(:\d\d)?(\s+[^\s]+)?\s+\d\d\d\d\s*"
                        r"[^\s]*\s*"
                        "$")
    _regexp = None

    def _strict_isrealfromline(self, line):
        """Match line against _fromlinepattern, compiling it on first use."""
        compiled = self._regexp
        if not compiled:
            import re
            compiled = self._regexp = re.compile(self._fromlinepattern)
        return compiled.match(line)

    def _portable_isrealfromline(self, line):
        """Accept any line; the caller has already checked for 'From '."""
        return True

    _isrealfromline = _strict_isrealfromline
2044
2045
class PortableUnixMailbox(UnixMailbox):
    """UnixMailbox that treats every line starting with 'From ' as a
    message delimiter, without checking the rest of the line."""
    _isrealfromline = UnixMailbox._portable_isrealfromline
2048
Guido van Rossumfbe63de1998-04-03 16:04:05 +00002049
class MmdfMailbox(_Mailbox):
    """Old-style reader for MMDF files, delimited by lines of four ^A."""

    def _search_start(self):
        """Consume lines up to and including the next delimiter line.

        Raises EOFError if the end of the file is reached first.
        """
        line = self.fp.readline()
        while line:
            if line.startswith('\001\001\001\001\n'):
                return
            line = self.fp.readline()
        raise EOFError

    def _search_end(self):
        """Leave self.fp at the next delimiter line or at end of file."""
        while True:
            line_start = self.fp.tell()
            line = self.fp.readline()
            if not line:
                break
            if line == '\001\001\001\001\n':
                self.fp.seek(line_start)
                break
Guido van Rossumc7b68821994-04-28 09:53:33 +00002069
Guido van Rossumc7b68821994-04-28 09:53:33 +00002070
class MHMailbox:
    """Old-style reader for an MH folder: a directory of numbered files."""

    def __init__(self, dirname, factory=rfc822.Message):
        """Collect the message numbers found in directory dirname.

        Only entries whose names are positive decimal integers without
        leading zeros are treated as messages.
        """
        import re
        numeric_name = re.compile('^[1-9][0-9]*$')
        self.dirname = dirname
        numbers = [long(name) for name in os.listdir(self.dirname)
                   if numeric_name.match(name)]
        numbers.sort()
        # Stored highest first, so that next() can pop() the lowest
        # remaining number off the end.
        numbers.reverse()
        self.boxes = [str(number) for number in numbers]
        self.factory = factory

    def __iter__(self):
        """Iterate over messages until next() returns None."""
        return iter(self.next, None)

    def next(self):
        """Return the next message in numeric order, or None when done."""
        if not self.boxes:
            return None
        number = self.boxes.pop()
        message_file = open(os.path.join(self.dirname, number))
        message = self.factory(message_file)
        try:
            message._mh_msgno = number
        except (AttributeError, TypeError):
            # The factory's result does not accept new attributes.
            pass
        return message
Guido van Rossum8ca84201998-03-26 20:56:10 +00002103
Guido van Rossum9a4d6371998-12-23 22:05:42 +00002104
class BabylMailbox(_Mailbox):
    """Old-style reader for Babyl files."""

    def _search_start(self):
        """Consume lines up to and including the next '*** EOOH ***' line.

        Raises EOFError if the end of the file is reached first.
        """
        line = self.fp.readline()
        while line:
            if line == '*** EOOH ***\n':
                return
            line = self.fp.readline()
        raise EOFError

    def _search_end(self):
        """Leave self.fp at the next message terminator or at end of file."""
        while True:
            line_start = self.fp.tell()
            line = self.fp.readline()
            if not line:
                break
            if line in ('\037\014\n', '\037'):
                self.fp.seek(line_start)
                break
Guido van Rossumfdf58fe1997-05-15 14:33:09 +00002124
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00002125## End: classes from the original module (for backward compatibility).
Guido van Rossum62448671996-09-17 21:33:15 +00002126
2127
class Error(Exception):
    """Raised for module-specific errors.

    Base class of the other exceptions defined below.
    """

class NoSuchMailboxError(Error):
    """The specified mailbox does not exist and won't be created."""

class NotEmptyError(Error):
    """The specified mailbox is not empty and deletion was requested."""

class ExternalClashError(Error):
    """Another process caused an action to fail.

    Raised by _lock_file() when the lockf() lock or the dot lock is
    unavailable.
    """

class FormatError(Error):
    """A file appears to have an invalid format."""
2141 """A file appears to have an invalid format."""