blob: b74eeb531cb3e5eb2a94c585cb2422122171f2d9 [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum62448671996-09-17 21:33:15 +00002
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00003"""Read/write support for Maildir, mbox, MH, Babyl, and MMDF mailboxes."""
Guido van Rossum62448671996-09-17 21:33:15 +00004
# Notes for authors of new mailbox subclasses:
#
# Remember to fsync() changes to disk before closing a modified file
# or returning from a flush() method.  See functions _sync_flush() and
# _sync_close().
10
Martin v. Löwis08041d52006-05-04 14:27:52 +000011import sys
Jack Jansen97157791995-10-23 13:59:53 +000012import os
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000013import time
14import calendar
15import socket
16import errno
17import copy
18import email
Georg Brandl5a096e12007-01-22 19:40:21 +000019import email.message
20import email.generator
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000021import StringIO
22try:
Andrew MacIntyreafa358f2006-07-23 13:04:00 +000023 if sys.platform == 'os2emx':
24 # OS/2 EMX fcntl() not adequate
25 raise ImportError
Andrew M. Kuchlinga7ee9eb2006-06-26 13:08:24 +000026 import fcntl
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000027except ImportError:
28 fcntl = None
Guido van Rossumc7b68821994-04-28 09:53:33 +000029
Antoine Pitroub9d49632010-01-04 23:22:44 +000030import warnings
31with warnings.catch_warnings():
32 if sys.py3kwarning:
33 warnings.filterwarnings("ignore", ".*rfc822 has been removed",
34 DeprecationWarning)
35 import rfc822
36
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +000037__all__ = [ 'Mailbox', 'Maildir', 'mbox', 'MH', 'Babyl', 'MMDF',
38 'Message', 'MaildirMessage', 'mboxMessage', 'MHMessage',
39 'BabylMessage', 'MMDFMessage', 'UnixMailbox',
40 'PortableUnixMailbox', 'MmdfMailbox', 'MHMailbox', 'BabylMailbox' ]
41
class Mailbox:
    """A group of messages in a particular place.

    This is the abstract base for every mailbox format.  Subclasses supply
    the storage primitives (add, remove, __setitem__, get_message,
    get_string, get_file, iterkeys, has_key, __len__, flush, lock, unlock
    and close); the dictionary-style conveniences defined here are built
    on top of those primitives.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a Mailbox instance.

        path is user-expanded ("~") and made absolute.  factory, when set,
        is called by __getitem__ with a file-like object to build each
        message.  create is accepted for the benefit of subclasses; the
        base class itself does not use it.
        """
        self._path = os.path.abspath(os.path.expanduser(path))
        self._factory = factory

    def add(self, message):
        """Add message and return assigned key."""
        raise NotImplementedError('Method must be implemented by subclass')

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __delitem__(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self.remove(key)

    def discard(self, key):
        """If the keyed message exists, remove it."""
        try:
            self.remove(key)
        except KeyError:
            pass

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get(self, key, default=None):
        """Return the keyed message, or default if it doesn't exist."""
        try:
            return self.__getitem__(key)
        except KeyError:
            return default

    def __getitem__(self, key):
        """Return the keyed message; raise KeyError if it doesn't exist.

        Without a factory the subclass's get_message() result is returned;
        with one, the factory is applied to get_file(key).
        """
        if not self._factory:
            return self.get_message(key)
        else:
            return self._factory(self.get_file(key))

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        raise NotImplementedError('Method must be implemented by subclass')

    def iterkeys(self):
        """Return an iterator over keys."""
        raise NotImplementedError('Method must be implemented by subclass')

    def keys(self):
        """Return a list of keys."""
        return list(self.iterkeys())

    def itervalues(self):
        """Return an iterator over all messages."""
        for key in self.iterkeys():
            try:
                value = self[key]
            except KeyError:
                # The message vanished between listing and reading; skip it.
                continue
            yield value

    def __iter__(self):
        """Iterate over the messages (not the keys) of the mailbox."""
        return self.itervalues()

    def values(self):
        """Return a list of messages. Memory intensive."""
        return list(self.itervalues())

    def iteritems(self):
        """Return an iterator over (key, message) tuples."""
        for key in self.iterkeys():
            try:
                value = self[key]
            except KeyError:
                # The message vanished between listing and reading; skip it.
                continue
            yield (key, value)

    def items(self):
        """Return a list of (key, message) tuples. Memory intensive."""
        return list(self.iteritems())

    def has_key(self, key):
        """Return True if the keyed message exists, False otherwise."""
        raise NotImplementedError('Method must be implemented by subclass')

    def __contains__(self, key):
        """Return True if the keyed message exists, False otherwise."""
        return self.has_key(key)

    def __len__(self):
        """Return a count of messages in the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def clear(self):
        """Delete all messages."""
        # Take a snapshot of the keys first: discard() modifies the mailbox,
        # and a subclass's iterkeys() may be a live view of the very
        # container being emptied.
        for key in self.keys():
            self.discard(key)

    def pop(self, key, default=None):
        """Delete the keyed message and return it, or default."""
        try:
            result = self[key]
        except KeyError:
            return default
        self.discard(key)
        return result

    def popitem(self):
        """Delete an arbitrary (key, message) pair and return it.

        Raises KeyError if the mailbox holds no messages.
        """
        for key in self.iterkeys():
            return (key, self.pop(key))     # This is only run once.
        else:
            raise KeyError('No messages in mailbox')

    def update(self, arg=None):
        """Change the messages that correspond to certain keys.

        arg may be a mapping (anything with iteritems() or items()) or an
        iterable of (key, message) pairs.  Calling update() with no argument
        is a no-op.  Every pair is attempted; if any key was unknown a
        single KeyError is raised once all pairs have been processed.
        """
        if arg is None:
            # Nothing to apply; iterating over None would raise TypeError.
            return
        if hasattr(arg, 'iteritems'):
            source = arg.iteritems()
        elif hasattr(arg, 'items'):
            source = arg.items()
        else:
            source = arg
        bad_key = False
        for key, message in source:
            try:
                self[key] = message
            except KeyError:
                bad_key = True
        if bad_key:
            raise KeyError('No message with key(s)')

    def flush(self):
        """Write any pending changes to the disk."""
        raise NotImplementedError('Method must be implemented by subclass')

    def lock(self):
        """Lock the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        raise NotImplementedError('Method must be implemented by subclass')

    def close(self):
        """Flush and close the mailbox."""
        raise NotImplementedError('Method must be implemented by subclass')

    def _dump_message(self, message, target, mangle_from_=False):
        """Dump message contents to target file.

        message may be an email.message.Message, a string, or an object
        with read()/readline().  When mangle_from_ is true, "From " lines
        are escaped as ">From ".  Raises TypeError for any other type.
        """
        # Most files are opened in binary mode to allow predictable seeking.
        # To get native line endings on disk, the user-friendly \n line
        # endings used in strings and by email.Message are translated here.
        if isinstance(message, email.message.Message):
            buffer = StringIO.StringIO()
            gen = email.generator.Generator(buffer, mangle_from_, 0)
            gen.flatten(message)
            buffer.seek(0)
            target.write(buffer.read().replace('\n', os.linesep))
        elif isinstance(message, str):
            if mangle_from_:
                message = message.replace('\nFrom ', '\n>From ')
            message = message.replace('\n', os.linesep)
            target.write(message)
        elif hasattr(message, 'read'):
            while True:
                line = message.readline()
                if line == '':
                    break
                if mangle_from_ and line.startswith('From '):
                    line = '>From ' + line[5:]
                line = line.replace('\n', os.linesep)
                target.write(line)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
227
228
class Maildir(Mailbox):
    """A qmail-style Maildir mailbox.

    Messages live as individual files under the "new" and "cur"
    subdirectories of the mailbox path; "tmp" is used while a message is
    being written.  self._toc maps each message key (the unique part of the
    file name, before the colon) to its path relative to the mailbox.
    """

    # Separator between a message's unique name and its info suffix.
    colon = ':'

    def __init__(self, dirname, factory=rfc822.Message, create=True):
        """Initialize a Maildir instance.

        If dirname does not exist it is created together with its tmp, new
        and cur subdirectories when create is true; otherwise
        NoSuchMailboxError is raised.
        """
        Mailbox.__init__(self, dirname, factory, create)
        if not os.path.exists(self._path):
            if create:
                os.mkdir(self._path, 0o700)
                os.mkdir(os.path.join(self._path, 'tmp'), 0o700)
                os.mkdir(os.path.join(self._path, 'new'), 0o700)
                os.mkdir(os.path.join(self._path, 'cur'), 0o700)
            else:
                raise NoSuchMailboxError(self._path)
        self._toc = {}
        self._last_read = None          # Records last time we read cur/new
        # NOTE: we manually invalidate _last_read each time we do any
        # modifications ourselves, otherwise we might get tripped up by
        # bogus mtime behaviour on some systems (see issue #6896).

    def add(self, message):
        """Add message and return assigned key.

        The message is written to a fresh file in tmp and then linked (or
        renamed, where os.link is unavailable) into its destination
        subdirectory.  Raises ExternalClashError if the destination name is
        already taken.
        """
        tmp_file = self._create_tmp()
        try:
            self._dump_message(message, tmp_file)
        except BaseException:
            tmp_file.close()
            os.remove(tmp_file.name)
            raise
        _sync_close(tmp_file)
        if isinstance(message, MaildirMessage):
            subdir = message.get_subdir()
            suffix = self.colon + message.get_info()
            if suffix == self.colon:
                suffix = ''
        else:
            subdir = 'new'
            suffix = ''
        uniq = os.path.basename(tmp_file.name).split(self.colon)[0]
        dest = os.path.join(self._path, subdir, uniq + suffix)
        if isinstance(message, MaildirMessage):
            # Stamp the delivery date while the file is still private to us.
            # Nothing may touch the file once it sits at its final location:
            # another program could rename it there at any moment, which
            # would make a later os.utime(dest, ...) fail.
            try:
                os.utime(tmp_file.name,
                         (os.path.getatime(tmp_file.name),
                          message.get_date()))
            except BaseException:
                os.remove(tmp_file.name)
                raise
        try:
            if hasattr(os, 'link'):
                os.link(tmp_file.name, dest)
                os.remove(tmp_file.name)
            else:
                os.rename(tmp_file.name, dest)
        except OSError as e:
            os.remove(tmp_file.name)
            if e.errno == errno.EEXIST:
                raise ExternalClashError('Name clash with existing message: %s'
                                         % dest)
            else:
                raise
        # Invalidate cached toc
        self._last_read = None
        return uniq

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        os.remove(os.path.join(self._path, self._lookup(key)))
        # Invalidate cached toc (only on success)
        self._last_read = None

    def discard(self, key):
        """If the keyed message exists, remove it."""
        # This overrides an inapplicable implementation in the superclass:
        # a file that disappeared underneath us (ENOENT) also counts as
        # "already gone".
        try:
            self.remove(key)
        except KeyError:
            pass
        except OSError as e:
            if e.errno != errno.ENOENT:
                raise

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist.

        The replacement is first added under a temporary key and then
        renamed over the old key.  A MaildirMessage dictates the subdir and
        info suffix; for any other message type those of the message being
        replaced are kept.
        """
        old_subpath = self._lookup(key)
        temp_key = self.add(message)
        temp_subpath = self._lookup(temp_key)
        if isinstance(message, MaildirMessage):
            # temp's subdir and suffix were specified by message.
            dominant_subpath = temp_subpath
        else:
            # temp's subdir and suffix were defaults from add().
            dominant_subpath = old_subpath
        subdir = os.path.dirname(dominant_subpath)
        if self.colon in dominant_subpath:
            suffix = self.colon + dominant_subpath.split(self.colon)[-1]
        else:
            suffix = ''
        self.discard(key)
        tmp_path = os.path.join(self._path, temp_subpath)
        new_path = os.path.join(self._path, subdir, key + suffix)
        if isinstance(message, MaildirMessage):
            os.utime(tmp_path,
                     (os.path.getatime(tmp_path), message.get_date()))
        # No file modification should be done after the file is moved to its
        # final position, to avoid racing with other programs that may
        # rename it from there.
        os.rename(tmp_path, new_path)
        # Invalidate cached toc
        self._last_read = None

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The message's subdir, info and date are filled in from the file's
        location, name suffix and modification time respectively.
        """
        subpath = self._lookup(key)
        with open(os.path.join(self._path, subpath), 'r') as f:
            if self._factory:
                msg = self._factory(f)
            else:
                msg = MaildirMessage(f)
        subdir, name = os.path.split(subpath)
        msg.set_subdir(subdir)
        if self.colon in name:
            msg.set_info(name.split(self.colon)[-1])
        msg.set_date(os.path.getmtime(os.path.join(self._path, subpath)))
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError."""
        with open(os.path.join(self._path, self._lookup(key)), 'r') as f:
            return f.read()

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        f = open(os.path.join(self._path, self._lookup(key)), 'rb')
        return _ProxyFile(f)

    def iterkeys(self):
        """Return an iterator over keys."""
        self._refresh()
        for key in self._toc:
            try:
                self._lookup(key)
            except KeyError:
                # Listed a moment ago but no longer present; skip it.
                continue
            yield key

    def has_key(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._refresh()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._refresh()
        return len(self._toc)

    def flush(self):
        """Write any pending changes to disk."""
        # Maildir changes are always written immediately, so there's nothing
        # to do except invalidate our cached toc.
        self._last_read = None

    def lock(self):
        """Lock the mailbox."""
        return

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        return

    def close(self):
        """Flush and close the mailbox."""
        return

    def list_folders(self):
        """Return a list of folder names."""
        result = []
        for entry in os.listdir(self._path):
            # Folders are subdirectories whose name starts with a dot.
            if len(entry) > 1 and entry[0] == '.' and \
               os.path.isdir(os.path.join(self._path, entry)):
                result.append(entry[1:])
        return result

    def get_folder(self, folder):
        """Return a Maildir instance for the named folder."""
        return Maildir(os.path.join(self._path, '.' + folder),
                       factory=self._factory,
                       create=False)

    def add_folder(self, folder):
        """Create a folder and return a Maildir instance representing it."""
        path = os.path.join(self._path, '.' + folder)
        result = Maildir(path, factory=self._factory)
        maildirfolder_path = os.path.join(path, 'maildirfolder')
        if not os.path.exists(maildirfolder_path):
            # Create the empty "maildirfolder" marker file.
            os.close(os.open(maildirfolder_path, os.O_CREAT | os.O_WRONLY,
                             0o666))
        return result

    def remove_folder(self, folder):
        """Delete the named folder, which must be empty.

        Raises NotEmptyError if new/ or cur/ hold any non-dot entry, or if
        the folder contains a subdirectory other than new, cur and tmp.
        """
        path = os.path.join(self._path, '.' + folder)
        for entry in os.listdir(os.path.join(path, 'new')) + \
                     os.listdir(os.path.join(path, 'cur')):
            if len(entry) < 1 or entry[0] != '.':
                raise NotEmptyError('Folder contains message(s): %s' % folder)
        for entry in os.listdir(path):
            if entry != 'new' and entry != 'cur' and entry != 'tmp' and \
               os.path.isdir(os.path.join(path, entry)):
                raise NotEmptyError("Folder contains subdirectory '%s': %s" %
                                    (folder, entry))
        # Bottom-up walk so every directory is empty by the time it is
        # removed.
        for root, dirs, files in os.walk(path, topdown=False):
            for entry in files:
                os.remove(os.path.join(root, entry))
            for entry in dirs:
                os.rmdir(os.path.join(root, entry))
        os.rmdir(path)

    def clean(self):
        """Delete old files in "tmp"."""
        now = time.time()
        for entry in os.listdir(os.path.join(self._path, 'tmp')):
            path = os.path.join(self._path, 'tmp', entry)
            if now - os.path.getatime(path) > 129600:   # 60 * 60 * 36
                os.remove(path)

    _count = 1  # This is used to generate unique file names.

    def _create_tmp(self):
        """Create a file in the tmp subdirectory and open and return it.

        Raises ExternalClashError if the generated name already exists.
        """
        now = time.time()
        hostname = socket.gethostname()
        # '/' and ':' are replaced by their octal escapes in the file name.
        if '/' in hostname:
            hostname = hostname.replace('/', r'\057')
        if ':' in hostname:
            hostname = hostname.replace(':', r'\072')
        uniq = "%s.M%sP%sQ%s.%s" % (int(now), int(now % 1 * 1e6), os.getpid(),
                                    Maildir._count, hostname)
        path = os.path.join(self._path, 'tmp', uniq)
        try:
            os.stat(path)
        except OSError as stat_error:
            if stat_error.errno == errno.ENOENT:
                Maildir._count += 1
                try:
                    return _create_carefully(path)
                except OSError as create_error:
                    if create_error.errno != errno.EEXIST:
                        raise
            else:
                raise

        # Fall through to here if stat succeeded or open raised EEXIST.
        raise ExternalClashError('Name clash prevented file creation: %s' %
                                 path)

    def _refresh(self):
        """Update table of contents mapping.

        The directories are re-read only when no read has been recorded yet
        (or the record was invalidated) or when new/ or cur/ has an mtime
        later than the recorded read time.
        """
        if self._last_read is not None:
            for subdir in ('new', 'cur'):
                mtime = os.path.getmtime(os.path.join(self._path, subdir))
                if mtime > self._last_read:
                    break
            else:
                return

        # We record the current time - 1sec so that, if _refresh() is called
        # again in the same second, we will always re-read the mailbox
        # just in case it's been modified.  (os.path.getmtime() only has
        # 1sec resolution.)  This results in a few unnecessary re-reads
        # when _refresh() is called multiple times in the same second,
        # but once the clock ticks over, we will only re-read as needed.
        now = time.time() - 1

        self._toc = {}

        def update_dir(subdir):
            path = os.path.join(self._path, subdir)
            for entry in os.listdir(path):
                p = os.path.join(path, entry)
                if os.path.isdir(p):
                    continue
                uniq = entry.split(self.colon)[0]
                self._toc[uniq] = os.path.join(subdir, entry)

        update_dir('new')
        update_dir('cur')

        self._last_read = now

    def _lookup(self, key):
        """Use TOC to return subpath for given key, or raise a KeyError."""
        try:
            if os.path.exists(os.path.join(self._path, self._toc[key])):
                return self._toc[key]
        except KeyError:
            pass
        # Unknown key or stale path: re-read the directories and retry once.
        self._refresh()
        try:
            return self._toc[key]
        except KeyError:
            raise KeyError('No message with key: %s' % key)

    # This method is for backward compatibility only.
    def next(self):
        """Return the next message in a one-time iteration.

        Returns None once the keys are exhausted.
        """
        if not hasattr(self, '_onetime_keys'):
            self._onetime_keys = self.iterkeys()
        while True:
            try:
                return self[next(self._onetime_keys)]
            except StopIteration:
                return None
            except KeyError:
                continue
541
542
class _singlefileMailbox(Mailbox):
    """A single-file mailbox.

    All messages live in one file.  self._toc maps each integer key to the
    (start, stop) byte offsets of its message and is built lazily by the
    subclass's _generate_toc().  Additions are appended to the file right
    away; removals and replacements only change the table of contents
    until flush() rewrites the file.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize a single-file mailbox.

        The file is opened read/write.  If it does not exist it is created
        when create is true, otherwise NoSuchMailboxError is raised.  If it
        cannot be opened for writing (EACCES/EROFS) it is opened read-only.
        """
        Mailbox.__init__(self, path, factory, create)
        try:
            f = open(self._path, 'rb+')
        except IOError as e:
            if e.errno == errno.ENOENT:
                if create:
                    f = open(self._path, 'wb+')
                else:
                    raise NoSuchMailboxError(self._path)
            elif e.errno in (errno.EACCES, errno.EROFS):
                f = open(self._path, 'rb')
            else:
                raise
        self._file = f
        self._toc = None
        self._next_key = 0
        self._pending = False   # No changes require rewriting the file.
        self._locked = False
        self._file_length = None        # Used to record mailbox size

    def add(self, message):
        """Add message and return assigned key."""
        self._lookup()
        self._toc[self._next_key] = self._append_message(message)
        self._next_key += 1
        self._pending = True
        return self._next_key - 1

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        del self._toc[key]
        self._pending = True

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        self._lookup(key)
        self._toc[key] = self._append_message(message)
        self._pending = True

    def iterkeys(self):
        """Return an iterator over keys."""
        self._lookup()
        for key in self._toc.keys():
            yield key

    def has_key(self, key):
        """Return True if the keyed message exists, False otherwise."""
        self._lookup()
        return key in self._toc

    def __len__(self):
        """Return a count of messages in the mailbox."""
        self._lookup()
        return len(self._toc)

    def lock(self):
        """Lock the mailbox."""
        if not self._locked:
            _lock_file(self._file)
            self._locked = True

    def unlock(self):
        """Unlock the mailbox if it is locked."""
        if self._locked:
            _unlock_file(self._file)
            self._locked = False

    def flush(self):
        """Write any pending changes to disk.

        The surviving messages are copied, in key order, into a temporary
        file which then replaces the mailbox file.  Raises
        ExternalClashError if the mailbox file's size differs from the size
        recorded when it was last scanned or appended to.
        """
        if not self._pending:
            return

        # In order to be writing anything out at all, self._toc must
        # already have been generated (and presumably has been modified
        # by adding or deleting an item).
        assert self._toc is not None

        # Check length of self._file; if it's changed, some other process
        # has modified the mailbox since we scanned it.
        self._file.seek(0, 2)
        cur_len = self._file.tell()
        if cur_len != self._file_length:
            raise ExternalClashError('Size of mailbox file changed '
                                     '(expected %i, found %i)' %
                                     (self._file_length, cur_len))

        new_file = _create_temporary(self._path)
        try:
            new_toc = {}
            self._pre_mailbox_hook(new_file)
            for key in sorted(self._toc.keys()):
                start, stop = self._toc[key]
                self._file.seek(start)
                self._pre_message_hook(new_file)
                new_start = new_file.tell()
                while True:
                    chunk = self._file.read(min(4096,
                                                stop - self._file.tell()))
                    if not chunk:
                        break
                    new_file.write(chunk)
                new_toc[key] = (new_start, new_file.tell())
                self._post_message_hook(new_file)
            # Size of the rewritten mailbox; recorded below so that the
            # next flush() compares against the file we are about to
            # install rather than the one being replaced.
            new_length = new_file.tell()
        except BaseException:
            new_file.close()
            os.remove(new_file.name)
            raise
        _sync_close(new_file)
        # Give the replacement the same mode as the file it replaces; the
        # temporary file was created with default permissions.
        try:
            mode = os.stat(self._path).st_mode
        except OSError:
            mode = None         # Original is gone; there is no mode to copy.
        if mode is not None:
            os.chmod(new_file.name, mode)
        # self._file is about to get replaced, so no need to sync.
        self._file.close()
        try:
            os.rename(new_file.name, self._path)
        except OSError as e:
            if e.errno == errno.EEXIST or \
               (os.name == 'os2' and e.errno == errno.EACCES):
                os.remove(self._path)
                os.rename(new_file.name, self._path)
            else:
                raise
        self._file = open(self._path, 'rb+')
        self._toc = new_toc
        self._file_length = new_length
        self._pending = False
        if self._locked:
            _lock_file(self._file, dotlock=False)

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        return

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        return

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        return

    def close(self):
        """Flush and close the mailbox.

        The lock is released and the file closed even if flush() raises.
        """
        try:
            self.flush()
        finally:
            try:
                if self._locked:
                    self.unlock()
            finally:
                # Sync has been done by self.flush() above.
                self._file.close()

    def _lookup(self, key=None):
        """Return (start, stop) or raise KeyError.

        Builds the table of contents on first use.  With key left as None
        nothing is looked up and None is returned.
        """
        if self._toc is None:
            self._generate_toc()
        if key is not None:
            try:
                return self._toc[key]
            except KeyError:
                raise KeyError('No message with key: %s' % key)

    def _append_message(self, message):
        """Append message to mailbox and return (start, stop) offsets."""
        self._file.seek(0, 2)
        before = self._file.tell()
        try:
            self._pre_message_hook(self._file)
            offsets = self._install_message(message)
            self._post_message_hook(self._file)
        except BaseException:
            # Drop whatever was partially written.
            self._file.truncate(before)
            raise
        self._file.flush()
        self._file_length = self._file.tell()  # Record current length of mailbox
        return offsets
717
718
719
class _mboxMMDF(_singlefileMailbox):
    """An mbox or MMDF mailbox.

    Each stored message begins with a "From " envelope line followed by
    the message text; this class reads and writes that layout.
    """

    _mangle_from_ = True

    def get_message(self, key):
        """Return a Message representation or raise a KeyError."""
        begin, end = self._lookup(key)
        self._file.seek(begin)
        # First line is the envelope; the rest up to `end` is the message.
        envelope = self._file.readline().replace(os.linesep, '')
        remaining = end - self._file.tell()
        text = self._file.read(remaining).replace(os.linesep, '\n')
        result = self._message_factory(text)
        result.set_from(envelope[5:])   # Strip the leading "From ".
        return result

    def get_string(self, key, from_=False):
        """Return a string representation or raise a KeyError."""
        begin, end = self._lookup(key)
        self._file.seek(begin)
        if not from_:
            # Caller does not want the envelope line: skip past it.
            self._file.readline()
        remaining = end - self._file.tell()
        return self._file.read(remaining).replace(os.linesep, '\n')

    def get_file(self, key, from_=False):
        """Return a file-like representation or raise a KeyError."""
        begin, end = self._lookup(key)
        self._file.seek(begin)
        if not from_:
            # Caller does not want the envelope line: skip past it.
            self._file.readline()
        body_start = self._file.tell()
        return _PartialFile(self._file, body_start, end)

    def _install_message(self, message):
        """Format a message and blindly write to self._file."""
        envelope = None
        if isinstance(message, str) and message.startswith('From '):
            # Split the envelope off the text; without a newline the whole
            # string is the envelope and the message text is empty.
            envelope, _, message = message.partition('\n')
        elif isinstance(message, _mboxMMDFMessage):
            envelope = 'From ' + message.get_from()
        elif isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()   # May be None.
        if envelope is None:
            envelope = 'From MAILER-DAEMON %s' % time.asctime(time.gmtime())
        begin = self._file.tell()
        self._file.write(envelope + os.linesep)
        self._dump_message(message, self._file, self._mangle_from_)
        return (begin, self._file.tell())
774
775
class mbox(_mboxMMDF):
    """A classic mbox mailbox."""

    _mangle_from_ = True

    def __init__(self, path, factory=None, create=True):
        """Initialize an mbox mailbox."""
        # Must be set before the base initializer runs.
        self._message_factory = mboxMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        if f.tell() == 0:
            return
        # Not at the very start of the file: emit a separating line ending.
        f.write(os.linesep)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        begins, ends = [], []
        handle = self._file
        handle.seek(0)
        while True:
            offset = handle.tell()
            line = handle.readline()
            if line == '':
                # End of file also terminates the last message.
                ends.append(offset)
                break
            if line.startswith('From '):
                if len(ends) < len(begins):
                    # Close the previous message just before the line
                    # ending that precedes this envelope line.
                    ends.append(offset - len(os.linesep))
                begins.append(offset)
        toc = {}
        for index, span in enumerate(zip(begins, ends)):
            toc[index] = span
        self._toc = toc
        self._next_key = len(toc)
        self._file_length = handle.tell()
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000808
809
class MMDF(_mboxMMDF):
    """An MMDF mailbox.

    Every message is bracketed by lines consisting of four \\001
    characters.
    """

    def __init__(self, path, factory=None, create=True):
        """Initialize an MMDF mailbox."""
        # Must be set before the base initializer runs.
        self._message_factory = MMDFMessage
        _mboxMMDF.__init__(self, path, factory, create)

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        opening = '\001\001\001\001' + os.linesep
        f.write(opening)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        closing = os.linesep + '\001\001\001\001' + os.linesep
        f.write(closing)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents."""
        delimiter = '\001\001\001\001' + os.linesep
        begins, ends = [], []
        handle = self._file
        handle.seek(0)
        while True:
            line = handle.readline()
            position = handle.tell()
            if line == '':
                break
            if not line.startswith(delimiter):
                continue
            # A delimiter opens a message that starts right after it.
            begins.append(position)
            while True:
                previous = position
                line = handle.readline()
                position = handle.tell()
                if line == delimiter:
                    # Exclude the line ending written ahead of the
                    # closing delimiter.
                    ends.append(previous - len(os.linesep))
                    break
                if line == '':
                    # Unterminated final message: it runs to end of file.
                    ends.append(previous)
                    break
        toc = {}
        for index, span in enumerate(zip(begins, ends)):
            toc[index] = span
        self._toc = toc
        self._next_key = len(toc)
        handle.seek(0, 2)
        self._file_length = handle.tell()
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000853
854
855class MH(Mailbox):
856 """An MH mailbox."""
857
def __init__(self, path, factory=None, create=True):
    """Initialize an MH instance.

    A missing mailbox directory is created, along with an empty
    .mh_sequences file, when create is true; otherwise
    NoSuchMailboxError is raised.
    """
    Mailbox.__init__(self, path, factory, create)
    if not os.path.exists(self._path):
        if not create:
            raise NoSuchMailboxError(self._path)
        os.mkdir(self._path, 0o700)
        sequences_path = os.path.join(self._path, '.mh_sequences')
        open_flags = os.O_CREAT | os.O_EXCL | os.O_WRONLY
        os.close(os.open(sequences_path, open_flags, 0o600))
    self._locked = False
869
def add(self, message):
    """Add message and return assigned key.

    The new key is one more than the largest existing key, or 1 for an
    empty mailbox; the message is written to a new file named after it.
    """
    existing = self.keys()
    new_key = max(existing) + 1 if existing else 1
    new_path = os.path.join(self._path, str(new_key))
    handle = _create_carefully(new_path)
    already_closed = False
    try:
        if self._locked:
            _lock_file(handle)
        try:
            try:
                self._dump_message(message, handle)
            except BaseException:
                # Unlock and close so it can be deleted on Windows
                if self._locked:
                    _unlock_file(handle)
                _sync_close(handle)
                already_closed = True
                os.remove(new_path)
                raise
            if isinstance(message, MHMessage):
                self._dump_sequences(message, new_key)
        finally:
            if self._locked:
                _unlock_file(handle)
    finally:
        if not already_closed:
            _sync_close(handle)
    return new_key
903
904 def remove(self, key):
905 """Remove the keyed message; raise KeyError if it doesn't exist."""
906 path = os.path.join(self._path, str(key))
907 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000908 f = open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000909 except IOError, e:
910 if e.errno == errno.ENOENT:
911 raise KeyError('No message with key: %s' % key)
912 else:
913 raise
Andrew M. Kuchlingb72b0eb2010-02-22 18:42:07 +0000914 else:
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000915 f.close()
Andrew M. Kuchlingb72b0eb2010-02-22 18:42:07 +0000916 os.remove(path)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000917
918 def __setitem__(self, key, message):
919 """Replace the keyed message; raise KeyError if it doesn't exist."""
920 path = os.path.join(self._path, str(key))
921 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000922 f = open(path, 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000923 except IOError, e:
924 if e.errno == errno.ENOENT:
925 raise KeyError('No message with key: %s' % key)
926 else:
927 raise
928 try:
929 if self._locked:
930 _lock_file(f)
931 try:
932 os.close(os.open(path, os.O_WRONLY | os.O_TRUNC))
933 self._dump_message(message, f)
934 if isinstance(message, MHMessage):
935 self._dump_sequences(message, key)
936 finally:
937 if self._locked:
938 _unlock_file(f)
939 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +0000940 _sync_close(f)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000941
942 def get_message(self, key):
943 """Return a Message representation or raise a KeyError."""
944 try:
945 if self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000946 f = open(os.path.join(self._path, str(key)), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000947 else:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000948 f = open(os.path.join(self._path, str(key)), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000949 except IOError, e:
950 if e.errno == errno.ENOENT:
951 raise KeyError('No message with key: %s' % key)
952 else:
953 raise
954 try:
955 if self._locked:
956 _lock_file(f)
957 try:
958 msg = MHMessage(f)
959 finally:
960 if self._locked:
961 _unlock_file(f)
962 finally:
963 f.close()
R. David Murray52720c52009-04-02 14:05:35 +0000964 for name, key_list in self.get_sequences().iteritems():
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000965 if key in key_list:
966 msg.add_sequence(name)
967 return msg
968
969 def get_string(self, key):
970 """Return a string representation or raise a KeyError."""
971 try:
972 if self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000973 f = open(os.path.join(self._path, str(key)), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000974 else:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000975 f = open(os.path.join(self._path, str(key)), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000976 except IOError, e:
977 if e.errno == errno.ENOENT:
978 raise KeyError('No message with key: %s' % key)
979 else:
980 raise
981 try:
982 if self._locked:
983 _lock_file(f)
984 try:
985 return f.read()
986 finally:
987 if self._locked:
988 _unlock_file(f)
989 finally:
990 f.close()
991
992 def get_file(self, key):
993 """Return a file-like representation or raise a KeyError."""
994 try:
Andrew M. Kuchling214db632006-05-02 21:44:33 +0000995 f = open(os.path.join(self._path, str(key)), 'rb')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +0000996 except IOError, e:
997 if e.errno == errno.ENOENT:
998 raise KeyError('No message with key: %s' % key)
999 else:
1000 raise
1001 return _ProxyFile(f)
1002
1003 def iterkeys(self):
1004 """Return an iterator over keys."""
1005 return iter(sorted(int(entry) for entry in os.listdir(self._path)
1006 if entry.isdigit()))
1007
1008 def has_key(self, key):
1009 """Return True if the keyed message exists, False otherwise."""
1010 return os.path.exists(os.path.join(self._path, str(key)))
1011
1012 def __len__(self):
1013 """Return a count of messages in the mailbox."""
1014 return len(list(self.iterkeys()))
1015
1016 def lock(self):
1017 """Lock the mailbox."""
1018 if not self._locked:
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001019 self._file = open(os.path.join(self._path, '.mh_sequences'), 'rb+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001020 _lock_file(self._file)
1021 self._locked = True
1022
1023 def unlock(self):
1024 """Unlock the mailbox if it is locked."""
1025 if self._locked:
1026 _unlock_file(self._file)
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +00001027 _sync_close(self._file)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001028 del self._file
1029 self._locked = False
1030
1031 def flush(self):
1032 """Write any pending changes to the disk."""
1033 return
1034
1035 def close(self):
1036 """Flush and close the mailbox."""
1037 if self._locked:
1038 self.unlock()
1039
1040 def list_folders(self):
1041 """Return a list of folder names."""
1042 result = []
1043 for entry in os.listdir(self._path):
1044 if os.path.isdir(os.path.join(self._path, entry)):
1045 result.append(entry)
1046 return result
1047
1048 def get_folder(self, folder):
1049 """Return an MH instance for the named folder."""
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +00001050 return MH(os.path.join(self._path, folder),
1051 factory=self._factory, create=False)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001052
1053 def add_folder(self, folder):
1054 """Create a folder and return an MH instance representing it."""
Andrew M. Kuchlinga3e5d372006-11-09 13:27:07 +00001055 return MH(os.path.join(self._path, folder),
1056 factory=self._factory)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001057
1058 def remove_folder(self, folder):
1059 """Delete the named folder, which must be empty."""
1060 path = os.path.join(self._path, folder)
1061 entries = os.listdir(path)
1062 if entries == ['.mh_sequences']:
1063 os.remove(os.path.join(path, '.mh_sequences'))
1064 elif entries == []:
1065 pass
1066 else:
1067 raise NotEmptyError('Folder not empty: %s' % self._path)
1068 os.rmdir(path)
1069
1070 def get_sequences(self):
1071 """Return a name-to-key-list dictionary to define each sequence."""
1072 results = {}
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001073 f = open(os.path.join(self._path, '.mh_sequences'), 'r')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001074 try:
1075 all_keys = set(self.keys())
1076 for line in f:
1077 try:
1078 name, contents = line.split(':')
1079 keys = set()
1080 for spec in contents.split():
1081 if spec.isdigit():
1082 keys.add(int(spec))
1083 else:
1084 start, stop = (int(x) for x in spec.split('-'))
1085 keys.update(range(start, stop + 1))
1086 results[name] = [key for key in sorted(keys) \
1087 if key in all_keys]
1088 if len(results[name]) == 0:
1089 del results[name]
1090 except ValueError:
1091 raise FormatError('Invalid sequence specification: %s' %
1092 line.rstrip())
1093 finally:
1094 f.close()
1095 return results
1096
1097 def set_sequences(self, sequences):
1098 """Set sequences using the given name-to-key-list dictionary."""
Andrew M. Kuchling214db632006-05-02 21:44:33 +00001099 f = open(os.path.join(self._path, '.mh_sequences'), 'r+')
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001100 try:
1101 os.close(os.open(f.name, os.O_WRONLY | os.O_TRUNC))
1102 for name, keys in sequences.iteritems():
1103 if len(keys) == 0:
1104 continue
1105 f.write('%s:' % name)
1106 prev = None
1107 completing = False
1108 for key in sorted(set(keys)):
1109 if key - 1 == prev:
1110 if not completing:
1111 completing = True
1112 f.write('-')
1113 elif completing:
1114 completing = False
1115 f.write('%s %s' % (prev, key))
1116 else:
1117 f.write(' %s' % key)
1118 prev = key
1119 if completing:
1120 f.write(str(prev) + '\n')
1121 else:
1122 f.write('\n')
1123 finally:
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +00001124 _sync_close(f)
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001125
1126 def pack(self):
1127 """Re-name messages to eliminate numbering gaps. Invalidates keys."""
1128 sequences = self.get_sequences()
1129 prev = 0
1130 changes = []
1131 for key in self.iterkeys():
1132 if key - 1 != prev:
1133 changes.append((key, prev + 1))
Andrew M. Kuchling8c456f32006-11-17 13:30:25 +00001134 if hasattr(os, 'link'):
1135 os.link(os.path.join(self._path, str(key)),
1136 os.path.join(self._path, str(prev + 1)))
1137 os.unlink(os.path.join(self._path, str(key)))
1138 else:
1139 os.rename(os.path.join(self._path, str(key)),
1140 os.path.join(self._path, str(prev + 1)))
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001141 prev += 1
1142 self._next_key = prev + 1
1143 if len(changes) == 0:
1144 return
1145 for name, key_list in sequences.items():
1146 for old, new in changes:
1147 if old in key_list:
1148 key_list[key_list.index(old)] = new
1149 self.set_sequences(sequences)
1150
1151 def _dump_sequences(self, message, key):
1152 """Inspect a new MHMessage and update sequences appropriately."""
1153 pending_sequences = message.get_sequences()
1154 all_sequences = self.get_sequences()
1155 for name, key_list in all_sequences.iteritems():
1156 if name in pending_sequences:
1157 key_list.append(key)
1158 elif key in key_list:
1159 del key_list[key_list.index(key)]
1160 for sequence in pending_sequences:
1161 if sequence not in all_sequences:
1162 all_sequences[sequence] = [key]
1163 self.set_sequences(all_sequences)
1164
1165
class Babyl(_singlefileMailbox):
    """An Rmail-style Babyl mailbox.

    Besides the table of contents handled by the base class, a mapping of
    message key to label list is kept in self._labels.
    """

    _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered',
                                 'forwarded', 'edited', 'resent'))

    def __init__(self, path, factory=None, create=True):
        """Initialize a Babyl mailbox."""
        _singlefileMailbox.__init__(self, path, factory, create)
        self._labels = {}

    def add(self, message):
        """Add message and return assigned key."""
        key = _singlefileMailbox.add(self, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()
        return key

    def remove(self, key):
        """Remove the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.remove(self, key)
        if key in self._labels:
            del self._labels[key]

    def __setitem__(self, key, message):
        """Replace the keyed message; raise KeyError if it doesn't exist."""
        _singlefileMailbox.__setitem__(self, key, message)
        if isinstance(message, BabylMessage):
            self._labels[key] = message.get_labels()

    def get_message(self, key):
        """Return a Message representation or raise a KeyError.

        The result is a BabylMessage built from the original headers and
        the body, with the visible headers and any stored labels attached.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or line == '':
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        visible_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == os.linesep or line == '':
                break
            visible_headers.write(line.replace(os.linesep, '\n'))
        body = self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')
        msg = BabylMessage(original_headers.getvalue() + body)
        msg.set_visible(visible_headers.getvalue())
        if key in self._labels:
            msg.set_labels(self._labels[key])
        return msg

    def get_string(self, key):
        """Return a string representation or raise a KeyError.

        The string consists of the original headers followed by the body;
        the visible headers are skipped.
        """
        start, stop = self._lookup(key)
        self._file.seek(start)
        self._file.readline()   # Skip '1,' line specifying labels.
        original_headers = StringIO.StringIO()
        while True:
            line = self._file.readline()
            if line == '*** EOOH ***' + os.linesep or line == '':
                break
            original_headers.write(line.replace(os.linesep, '\n'))
        # Read past the visible headers without keeping them.
        while True:
            line = self._file.readline()
            if line == os.linesep or line == '':
                break
        return original_headers.getvalue() + \
               self._file.read(stop - self._file.tell()).replace(os.linesep,
                                                                 '\n')

    def get_file(self, key):
        """Return a file-like representation or raise a KeyError."""
        return StringIO.StringIO(self.get_string(key).replace('\n',
                                                              os.linesep))

    def get_labels(self):
        """Return a list of user-defined labels in the mailbox.

        Labels listed in _special_labels are excluded.
        """
        # NOTE(review): presumably called for its side effect of making
        # sure the table of contents (and self._labels) is loaded -- confirm
        # against _singlefileMailbox._lookup.
        self._lookup()
        labels = set()
        for label_list in self._labels.values():
            labels.update(label_list)
        labels.difference_update(self._special_labels)
        return list(labels)

    def _generate_toc(self):
        """Generate key-to-(start, stop) table of contents.

        Also rebuilds self._labels from the label line that follows each
        message delimiter, and records the file length.
        """
        starts, stops = [], []
        self._file.seek(0)
        next_pos = 0
        label_lists = []
        while True:
            line_pos = next_pos
            line = self._file.readline()
            next_pos = self._file.tell()
            if line == '\037\014' + os.linesep:
                # End of the previous message (if one is open) and start of
                # the next one.
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
                starts.append(next_pos)
                labels = [label.strip() for label
                          in self._file.readline()[1:].split(',')
                          if label.strip() != '']
                label_lists.append(labels)
            elif line == '\037' or line == '\037' + os.linesep:
                if len(stops) < len(starts):
                    stops.append(line_pos - len(os.linesep))
            elif line == '':
                # A surplus stop recorded here is discarded by zip() below.
                stops.append(line_pos - len(os.linesep))
                break
        self._toc = dict(enumerate(zip(starts, stops)))
        self._labels = dict(enumerate(label_lists))
        self._next_key = len(self._toc)
        self._file.seek(0, 2)
        self._file_length = self._file.tell()

    def _pre_mailbox_hook(self, f):
        """Called before writing the mailbox to file f."""
        f.write('BABYL OPTIONS:%sVersion: 5%sLabels:%s%s\037' %
                (os.linesep, os.linesep, ','.join(self.get_labels()),
                 os.linesep))

    def _pre_message_hook(self, f):
        """Called before writing each message to file f."""
        f.write('\014' + os.linesep)

    def _post_message_hook(self, f):
        """Called after writing each message to file f."""
        f.write(os.linesep + '\037')

    def _install_message(self, message):
        """Write message contents and return (start, stop).

        The layout written is: a label line, the original headers, the
        '*** EOOH ***' marker, the visible headers and finally the body.
        message may be an email.message.Message (including BabylMessage),
        a string, or a file-like object with readline(); anything else
        raises TypeError.
        """
        start = self._file.tell()
        if isinstance(message, BabylMessage):
            special_labels = []
            labels = []
            for label in message.get_labels():
                if label in self._special_labels:
                    special_labels.append(label)
                else:
                    labels.append(label)
            self._file.write('1')
            for label in special_labels:
                self._file.write(', ' + label)
            self._file.write(',,')
            for label in labels:
                self._file.write(' ' + label + ',')
            self._file.write(os.linesep)
        else:
            self._file.write('1,,' + os.linesep)
        if isinstance(message, email.message.Message):
            orig_buffer = StringIO.StringIO()
            orig_generator = email.generator.Generator(orig_buffer, False, 0)
            orig_generator.flatten(message)
            orig_buffer.seek(0)
            while True:
                line = orig_buffer.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or line == '':
                    break
            self._file.write('*** EOOH ***' + os.linesep)
            if isinstance(message, BabylMessage):
                vis_buffer = StringIO.StringIO()
                vis_generator = email.generator.Generator(vis_buffer, False, 0)
                vis_generator.flatten(message.get_visible())
                # Rewind before reading back: after flatten() the buffer
                # position is at the end, so without this nothing would be
                # read and the visible headers would never be written.
                vis_buffer.seek(0)
                while True:
                    line = vis_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or line == '':
                        break
            else:
                # No separate visible headers: repeat the original ones.
                orig_buffer.seek(0)
                while True:
                    line = orig_buffer.readline()
                    self._file.write(line.replace('\n', os.linesep))
                    if line == '\n' or line == '':
                        break
            while True:
                buffer = orig_buffer.read(4096) # Buffer size is arbitrary.
                if buffer == '':
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        elif isinstance(message, str):
            body_start = message.find('\n\n') + 2
            if body_start - 2 != -1:
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write('*** EOOH ***' + os.linesep)
                self._file.write(message[:body_start].replace('\n',
                                                              os.linesep))
                self._file.write(message[body_start:].replace('\n',
                                                              os.linesep))
            else:
                # No header/body separator: treat everything as body.
                self._file.write('*** EOOH ***' + os.linesep + os.linesep)
                self._file.write(message.replace('\n', os.linesep))
        elif hasattr(message, 'readline'):
            original_pos = message.tell()
            first_pass = True
            while True:
                line = message.readline()
                self._file.write(line.replace('\n', os.linesep))
                if line == '\n' or line == '':
                    if first_pass:
                        # The marker belongs only between the original and
                        # the visible headers; writing it after the second
                        # pass as well would put a stray marker ahead of
                        # the body.
                        first_pass = False
                        self._file.write('*** EOOH ***' + os.linesep)
                        message.seek(original_pos)
                    else:
                        break
            while True:
                buffer = message.read(4096)     # Buffer size is arbitrary.
                if buffer == '':
                    break
                self._file.write(buffer.replace('\n', os.linesep))
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        stop = self._file.tell()
        return (start, stop)
1385
1386
class Message(email.message.Message):
    """An email message that can carry mailbox-format-specific state."""

    def __init__(self, message=None):
        """Build a Message from another message, a string, a file or None.

        An email.message.Message is deep-copied; if it is also a Message,
        it is asked to transfer its format-specific state to the new
        instance.  A string or an object with a read attribute is parsed.
        Any other non-None argument raises TypeError.
        """
        if message is None:
            email.message.Message.__init__(self)
            return
        if isinstance(message, email.message.Message):
            self._become_message(copy.deepcopy(message))
            if isinstance(message, Message):
                message._explain_to(self)
            return
        if isinstance(message, str):
            parsed = email.message_from_string(message)
        elif hasattr(message, "read"):
            parsed = email.message_from_file(message)
        else:
            raise TypeError('Invalid message type: %s' % type(message))
        self._become_message(parsed)

    def _become_message(self, message):
        """Adopt the generic (non-format-specific) attributes of message."""
        donor_state = message.__dict__
        own_state = self.__dict__
        for attribute in ('_headers', '_unixfrom', '_payload', '_charset',
                          'preamble', 'epilogue', 'defects', '_default_type'):
            own_state[attribute] = donor_state[attribute]

    def _explain_to(self, message):
        """Transfer format-specific state to message where possible.

        The base class has no such state, so this only verifies that the
        target is a Message and raises TypeError otherwise.
        """
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type')
1417
1418
class MaildirMessage(Message):
    """A message carrying Maildir state: subdirectory, info and date."""

    def __init__(self, message=None):
        """Create a MaildirMessage in 'new' with no info, dated now."""
        self._subdir = 'new'
        self._info = ''
        self._date = time.time()
        Message.__init__(self, message)

    def get_subdir(self):
        """Return the subdirectory name, 'new' or 'cur'."""
        return self._subdir

    def set_subdir(self, subdir):
        """Set the subdirectory; anything but 'new'/'cur' is a ValueError."""
        if subdir not in ('new', 'cur'):
            raise ValueError("subdir must be 'new' or 'cur': %s" % subdir)
        self._subdir = subdir

    def get_flags(self):
        """Return the set flags as a string ('' unless info is '2,...')."""
        info = self._info
        return info[2:] if info.startswith('2,') else ''

    def set_flags(self, flags):
        """Replace all flags with the given ones, stored in sorted order."""
        ordered = sorted(flags)
        self._info = '2,' + ''.join(ordered)

    def add_flag(self, flag):
        """Turn on the given flag(s), leaving the others untouched."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Turn off the given flag(s), leaving the others untouched."""
        current = self.get_flags()
        if current == '':
            return
        self.set_flags(''.join(set(current) - set(flag)))

    def get_date(self):
        """Return the delivery date in seconds since the epoch."""
        return self._date

    def set_date(self, date):
        """Set the delivery date (seconds since the epoch) as a float.

        A value float() rejects with ValueError is reported as TypeError.
        """
        try:
            converted = float(date)
        except ValueError:
            raise TypeError("can't convert to float: %s" % date)
        self._date = converted

    def get_info(self):
        """Return the raw "info" string of the message."""
        return self._info

    def set_info(self, info):
        """Set the raw "info" string; a non-string raises TypeError."""
        if not isinstance(info, str):
            raise TypeError('info must be a string: %s' % type(info))
        self._info = info

    def _explain_to(self, message):
        """Translate Maildir state into the target message's own terms."""
        if isinstance(message, MaildirMessage):
            message.set_flags(self.get_flags())
            message.set_subdir(self.get_subdir())
            message.set_date(self.get_date())
            return
        if isinstance(message, _mboxMMDFMessage):
            present = set(self.get_flags())
            if 'S' in present:
                message.add_flag('R')
            if self.get_subdir() == 'cur':
                message.add_flag('O')
            for maildir_flag, mbox_flag in (('T', 'D'), ('F', 'F'),
                                            ('R', 'A')):
                if maildir_flag in present:
                    message.add_flag(mbox_flag)
            message.set_from('MAILER-DAEMON', time.gmtime(self.get_date()))
            return
        if isinstance(message, MHMessage):
            present = set(self.get_flags())
            if 'S' not in present:
                message.add_sequence('unseen')
            for maildir_flag, sequence in (('R', 'replied'),
                                           ('F', 'flagged')):
                if maildir_flag in present:
                    message.add_sequence(sequence)
            return
        if isinstance(message, BabylMessage):
            present = set(self.get_flags())
            if 'S' not in present:
                message.add_label('unseen')
            for maildir_flag, label in (('T', 'deleted'), ('R', 'answered'),
                                        ('P', 'forwarded')):
                if maildir_flag in present:
                    message.add_label(label)
            return
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1524
1525
class _mboxMMDFMessage(Message):
    """A message carrying mbox/MMDF state: "From " line and status flags."""

    def __init__(self, message=None):
        """Create the message, taking the "From " line from message if any.

        The line defaults to 'MAILER-DAEMON' plus the current time; it is
        replaced by the unixfrom of an email message that has one starting
        with 'From '.
        """
        self.set_from('MAILER-DAEMON', True)
        if isinstance(message, email.message.Message):
            envelope = message.get_unixfrom()
            if envelope is not None and envelope.startswith('From '):
                self.set_from(envelope[5:])
        Message.__init__(self, message)

    def get_from(self):
        """Return the contents of the "From " line."""
        return self._from

    def set_from(self, from_, time_=None):
        """Set the "From " line, appending a formatted time_ if given.

        time_ may be True, meaning the current time.
        """
        if time_ is True:
            time_ = time.gmtime()
        if time_ is not None:
            from_ = from_ + (' ' + time.asctime(time_))
        self._from = from_

    def get_flags(self):
        """Return the set flags: Status followed by X-Status contents."""
        status = self.get('Status', '')
        xstatus = self.get('X-Status', '')
        return status + xstatus

    def set_flags(self, flags):
        """Replace all flags with the given ones.

        'R' and 'O' go into the Status header; 'D', 'F', 'A' and then any
        remaining flags (sorted) go into X-Status.
        """
        pending = set(flags)
        status_flags = ''.join(f for f in ('R', 'O') if f in pending)
        xstatus_flags = ''.join(f for f in ('D', 'F', 'A') if f in pending)
        pending.difference_update(('R', 'O', 'D', 'F', 'A'))
        xstatus_flags += ''.join(sorted(pending))
        for header, value in (('Status', status_flags),
                              ('X-Status', xstatus_flags)):
            try:
                self.replace_header(header, value)
            except KeyError:
                self.add_header(header, value)

    def add_flag(self, flag):
        """Turn on the given flag(s), leaving the others untouched."""
        combined = set(self.get_flags()) | set(flag)
        self.set_flags(''.join(combined))

    def remove_flag(self, flag):
        """Turn off the given flag(s), leaving the others untouched."""
        if not ('Status' in self or 'X-Status' in self):
            return
        self.set_flags(''.join(set(self.get_flags()) - set(flag)))

    def _explain_to(self, message):
        """Translate mbox/MMDF state into the target message's own terms."""
        if isinstance(message, MaildirMessage):
            present = set(self.get_flags())
            if 'O' in present:
                message.set_subdir('cur')
            for mbox_flag, maildir_flag in (('F', 'F'), ('A', 'R'),
                                            ('R', 'S'), ('D', 'T')):
                if mbox_flag in present:
                    message.add_flag(maildir_flag)
            del message['status']
            del message['x-status']
            # The last five words of the "From " line may be an asctime
            # date; if they are not, the date of message is left alone.
            maybe_date = ' '.join(self.get_from().split()[-5:])
            try:
                parsed = time.strptime(maybe_date, '%a %b %d %H:%M:%S %Y')
                message.set_date(calendar.timegm(parsed))
            except (ValueError, OverflowError):
                pass
            return
        if isinstance(message, _mboxMMDFMessage):
            message.set_flags(self.get_flags())
            message.set_from(self.get_from())
            return
        if isinstance(message, MHMessage):
            present = set(self.get_flags())
            if 'R' not in present:
                message.add_sequence('unseen')
            for mbox_flag, sequence in (('A', 'replied'), ('F', 'flagged')):
                if mbox_flag in present:
                    message.add_sequence(sequence)
            del message['status']
            del message['x-status']
            return
        if isinstance(message, BabylMessage):
            present = set(self.get_flags())
            if 'R' not in present:
                message.add_label('unseen')
            for mbox_flag, label in (('D', 'deleted'), ('A', 'answered')):
                if mbox_flag in present:
                    message.add_label(label)
            del message['status']
            del message['x-status']
            return
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1635
1636
class mboxMessage(_mboxMMDFMessage):
    """An mbox message; all behavior comes from _mboxMMDFMessage."""
1639
1640
class MHMessage(Message):
    """A message carrying MH state: the sequences that include it."""

    def __init__(self, message=None):
        """Create an MHMessage that belongs to no sequence yet."""
        self._sequences = []
        Message.__init__(self, message)

    def get_sequences(self):
        """Return a copy of the list of sequences including the message."""
        return list(self._sequences)

    def set_sequences(self, sequences):
        """Replace the list of sequences including the message."""
        self._sequences = list(sequences)

    def add_sequence(self, sequence):
        """Add sequence unless already present; non-strings are rejected."""
        if not isinstance(sequence, str):
            raise TypeError('sequence must be a string: %s' % type(sequence))
        if sequence not in self._sequences:
            self._sequences.append(sequence)

    def remove_sequence(self, sequence):
        """Drop sequence from the list; silently ignore it if absent."""
        if sequence in self._sequences:
            self._sequences.remove(sequence)

    def _explain_to(self, message):
        """Translate MH sequences into the target message's own terms."""
        if isinstance(message, MaildirMessage):
            member_of = set(self.get_sequences())
            # Either way the message lands in 'cur'; only a message outside
            # the 'unseen' sequence additionally gets the S flag.
            message.set_subdir('cur')
            if 'unseen' not in member_of:
                message.add_flag('S')
            if 'flagged' in member_of:
                message.add_flag('F')
            if 'replied' in member_of:
                message.add_flag('R')
            return
        if isinstance(message, _mboxMMDFMessage):
            member_of = set(self.get_sequences())
            message.add_flag('O' if 'unseen' in member_of else 'RO')
            if 'flagged' in member_of:
                message.add_flag('F')
            if 'replied' in member_of:
                message.add_flag('A')
            return
        if isinstance(message, MHMessage):
            for name in self.get_sequences():
                message.add_sequence(name)
            return
        if isinstance(message, BabylMessage):
            member_of = set(self.get_sequences())
            if 'unseen' in member_of:
                message.add_label('unseen')
            if 'replied' in member_of:
                message.add_label('answered')
            return
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1709
1710
class BabylMessage(Message):
    """A message carrying Babyl state: labels and visible headers."""

    def __init__(self, message=None):
        """Create a BabylMessage with no labels and empty visible headers."""
        self._labels = []
        self._visible = Message()
        Message.__init__(self, message)

    def get_labels(self):
        """Return a copy of the list of labels on the message."""
        return list(self._labels)

    def set_labels(self, labels):
        """Replace the list of labels on the message."""
        self._labels = list(labels)

    def add_label(self, label):
        """Add label unless already present; non-strings are rejected."""
        if not isinstance(label, str):
            raise TypeError('label must be a string: %s' % type(label))
        if label not in self._labels:
            self._labels.append(label)

    def remove_label(self, label):
        """Drop label from the list; silently ignore it if absent."""
        if label in self._labels:
            self._labels.remove(label)

    def get_visible(self):
        """Return a new Message holding the visible headers."""
        snapshot = Message(self._visible)
        return snapshot

    def set_visible(self, visible):
        """Store a Message built from visible as the visible headers."""
        self._visible = Message(visible)

    def update_visible(self):
        """Bring the visible headers in line with the message's headers.

        Visible headers that the message still has are refreshed, the
        others are dropped, and a default set of common headers is added
        when the message has them.
        """
        shown = self._visible
        for name in shown.keys():
            if name not in self:
                del shown[name]
            else:
                shown.replace_header(name, self[name])
        for name in ('Date', 'From', 'Reply-To', 'To', 'CC', 'Subject'):
            if name in self and name not in shown:
                shown[name] = self[name]

    def _explain_to(self, message):
        """Translate Babyl labels into the target message's own terms."""
        if isinstance(message, MaildirMessage):
            attached = set(self.get_labels())
            # Either way the message lands in 'cur'; only a message without
            # the 'unseen' label additionally gets the S flag.
            message.set_subdir('cur')
            if 'unseen' not in attached:
                message.add_flag('S')
            if 'forwarded' in attached or 'resent' in attached:
                message.add_flag('P')
            if 'answered' in attached:
                message.add_flag('R')
            if 'deleted' in attached:
                message.add_flag('T')
            return
        if isinstance(message, _mboxMMDFMessage):
            attached = set(self.get_labels())
            message.add_flag('O' if 'unseen' in attached else 'RO')
            if 'deleted' in attached:
                message.add_flag('D')
            if 'answered' in attached:
                message.add_flag('A')
            return
        if isinstance(message, MHMessage):
            attached = set(self.get_labels())
            if 'unseen' in attached:
                message.add_sequence('unseen')
            if 'answered' in attached:
                message.add_sequence('replied')
            return
        if isinstance(message, BabylMessage):
            message.set_visible(self.get_visible())
            for name in self.get_labels():
                message.add_label(name)
            return
        if not isinstance(message, Message):
            raise TypeError('Cannot convert to specified type: %s' %
                            type(message))
1802
1803
class MMDFMessage(_mboxMMDFMessage):
    """MMDF message type; adds nothing on top of _mboxMMDFMessage."""
1806
1807
class _ProxyFile:
    """A read-only wrapper of a file.

    The proxy tracks its own position in self._pos and seeks the wrapped
    file there before every read, so reads through the proxy do not depend
    on where the wrapped file's own position was left.
    """

    def __init__(self, f, pos=None):
        """Wrap file f, starting at pos (default: f's current position)."""
        self._file = f
        if pos is None:
            self._pos = f.tell()
        else:
            self._pos = pos

    def read(self, size=None):
        """Read up to size bytes (everything when size is None)."""
        return self._read(size, self._file.read)

    def readline(self, size=None):
        """Read a single line, limited to size bytes when size is given."""
        return self._read(size, self._file.readline)

    def readlines(self, sizehint=None):
        """Return a list of lines.

        When sizehint is given, reading stops after the line that brings
        the total length read up to at least sizehint.
        """
        result = []
        for line in self:
            result.append(line)
            if sizehint is not None:
                sizehint -= len(line)
                if sizehint <= 0:
                    break
        return result

    def __iter__(self):
        """Iterate over lines until readline() returns an empty string."""
        return iter(self.readline, "")

    def tell(self):
        """Return the proxy's position."""
        return self._pos

    def seek(self, offset, whence=0):
        """Change the proxy's position."""
        if whence == 1:
            # A relative seek must start from the proxy's position, not
            # from wherever the wrapped file currently is.
            self._file.seek(self._pos)
        self._file.seek(offset, whence)
        self._pos = self._file.tell()

    def close(self):
        """Drop the reference to the wrapped file.

        The wrapped file itself is not closed.  Calling close() again is a
        no-op rather than an AttributeError.
        """
        if hasattr(self, '_file'):
            del self._file

    def _read(self, size, read_method):
        """Read size bytes using read_method and record the new position."""
        if size is None:
            size = -1
        self._file.seek(self._pos)
        result = read_method(size)
        self._pos = self._file.tell()
        return result
1865
1866
class _PartialFile(_ProxyFile):
    """A read-only wrapper of the part of a file between start and stop."""

    def __init__(self, f, start=None, stop=None):
        """Wrap file f, exposing only the region from start up to stop."""
        _ProxyFile.__init__(self, f, start)
        self._start, self._stop = start, stop

    def tell(self):
        """Return the position measured from start."""
        absolute = _ProxyFile.tell(self)
        return absolute - self._start

    def seek(self, offset, whence=0):
        """Change position; whence 0 is relative to start, 2 to stop."""
        if whence in (0, 2):
            # Re-express the request as a relative seek from the matching
            # boundary of the exposed region.
            self._pos = self._start if whence == 0 else self._stop
            whence = 1
        _ProxyFile.seek(self, offset, whence)

    def _read(self, size, read_method):
        """Read size bytes using read_method, never reading past stop."""
        remaining = self._stop - self._pos
        if remaining <= 0:
            return ''
        unbounded = size is None or size < 0
        if unbounded or size > remaining:
            size = remaining
        return _ProxyFile._read(self, size, read_method)
1898
1899
def _lock_file(f, dotlock=True):
    """Lock file f using lockf and dot locking.

    When the fcntl module is available, a non-blocking exclusive lockf()
    lock is taken on f.  When dotlock is true, the lock file
    f.name + '.lock' is then created by making a uniquely named temporary
    file and hard-linking it (or renaming it where os.link is missing) to
    the lock name.

    Raises ExternalClashError when the lockf() lock is unavailable or the
    dot lock already exists.  If the temporary file cannot be created for
    lack of write access (EACCES or EROFS), dot locking is skipped and any
    lockf() lock is kept.  On any other failure the lockf() lock is
    released, a dot lock created here is removed, and the error is
    re-raised.
    """
    dotlock_done = False
    try:
        if fcntl:
            try:
                fcntl.lockf(f, fcntl.LOCK_EX | fcntl.LOCK_NB)
            except IOError as e:
                if e.errno in (errno.EAGAIN, errno.EACCES, errno.EROFS):
                    raise ExternalClashError('lockf: lock unavailable: %s' %
                                             f.name)
                raise
        if dotlock:
            lock_path = f.name + '.lock'
            try:
                pre_lock = _create_temporary(lock_path)
                pre_lock.close()
            except (IOError, OSError) as e:
                # _create_temporary() goes through os.open(), which reports
                # failures as OSError, and through open(), which reports
                # them as IOError; both must be recognised here.
                if e.errno in (errno.EACCES, errno.EROFS):
                    return  # Without write access, just skip dotlocking.
                raise
            try:
                if hasattr(os, 'link'):
                    os.link(pre_lock.name, lock_path)
                    dotlock_done = True
                    os.unlink(pre_lock.name)
                else:
                    os.rename(pre_lock.name, lock_path)
                    dotlock_done = True
            except OSError as e:
                if e.errno == errno.EEXIST or \
                   (os.name == 'os2' and e.errno == errno.EACCES):
                    os.remove(pre_lock.name)
                    raise ExternalClashError('dot lock unavailable: %s' %
                                             f.name)
                raise
    except:
        # Deliberately catches everything: undo whatever was acquired and
        # re-raise the original exception unchanged.
        if fcntl:
            fcntl.lockf(f, fcntl.LOCK_UN)
        if dotlock_done:
            os.remove(f.name + '.lock')
        raise
1944
def _unlock_file(f):
    """Unlock file f using lockf and dot locking.

    Releases the lockf() lock when the fcntl module is available, then
    removes the dot lock file f.name + '.lock'.  A dot lock that does not
    exist is ignored; any other removal error is raised.
    """
    if fcntl:
        fcntl.lockf(f, fcntl.LOCK_UN)
    # Remove directly instead of testing for existence first: the lock file
    # may disappear between such a test and the removal.
    try:
        os.remove(f.name + '.lock')
    except OSError as e:
        if e.errno not in (errno.ENOENT, errno.ENOTDIR):
            raise
1951
def _create_carefully(path):
    """Create path, which must not exist yet, and open it for read/write.

    The file is created with O_CREAT | O_EXCL so that an existing file
    makes os.open() fail instead of being reused; it is then reopened in
    'rb+' mode and that file object is returned.
    """
    flags = os.O_CREAT | os.O_EXCL | os.O_RDWR
    fd = os.open(path, flags, 0o666)
    try:
        stream = open(path, 'rb+')
    finally:
        # The descriptor was only needed for the exclusive creation.
        os.close(fd)
    return stream
1959
def _create_temporary(path):
    """Create and open a temporary file whose name is derived from path.

    The name is path followed by the current time in whole seconds, the
    host name and the process id, separated by dots.
    """
    stamp = int(time.time())
    host = socket.gethostname()
    pid = os.getpid()
    return _create_carefully('%s.%s.%s.%s' % (path, stamp, host, pid))
1965
def _sync_flush(f):
    """Flush file f and, where os.fsync exists, force it to disk."""
    f.flush()
    fsync = getattr(os, 'fsync', None)
    if fsync is not None:
        fsync(f.fileno())
Andrew M. Kuchlingb5686da2006-11-09 13:51:14 +00001971
def _sync_close(f):
    """Push pending changes to file f out via _sync_flush(), then close it."""
    _sync_flush(f)
    f.close()
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00001976
1977## Start: classes from the original module (for backward compatibility).
1978
1979# Note that the Maildir class, whose name is unchanged, itself offers a next()
1980# method for backward compatibility.
Skip Montanaro17ab1232001-01-24 06:27:27 +00001981
class _Mailbox:
    """Base class for the legacy readers that scan one file for messages.

    Subclasses supply _search_start() and _search_end(), which move self.fp
    to the beginning and the end of the next message respectively.
    """

    def __init__(self, fp, factory=rfc822.Message):
        self.factory = factory
        self.fp = fp
        self.seekp = 0      # where the search for the next message starts

    def __iter__(self):
        # next() signals exhaustion by returning None.
        return iter(self.next, None)

    def next(self):
        """Return the next non-empty message, or None when none is left."""
        while True:
            self.fp.seek(self.seekp)
            try:
                self._search_start()
            except EOFError:
                self.seekp = self.fp.tell()
                return None
            start = self.fp.tell()
            self._search_end()
            stop = self.fp.tell()
            self.seekp = stop
            if start != stop:
                # Empty regions are skipped; anything else is handed to
                # the factory as a file restricted to the message.
                return self.factory(_PartialFile(self.fp, start, stop))
Guido van Rossumc7b68821994-04-28 09:53:33 +00002006
Barry Warsawffd05ee2002-03-01 22:39:14 +00002007# Recommended to use PortableUnixMailbox instead!
class UnixMailbox(_Mailbox):
    """Legacy reader for files whose messages start with a "From " line."""

    def _search_start(self):
        """Position fp at the next accepted "From " line.

        Raises EOFError when the end of the file is reached first.
        """
        fp = self.fp
        while True:
            pos = fp.tell()
            line = fp.readline()
            if not line:
                raise EOFError
            if line.startswith('From ') and self._isrealfromline(line):
                fp.seek(pos)
                return

    def _search_end(self):
        """Position fp at the following "From " line or at end of file."""
        fp = self.fp
        fp.readline()       # Throw away header line
        while True:
            pos = fp.tell()
            line = fp.readline()
            if not line:
                return
            if line.startswith('From ') and self._isrealfromline(line):
                fp.seek(pos)
                return

    # An overridable mechanism to test for From-line-ness.  You can either
    # specify a different regular expression or define a whole new
    # _isrealfromline() method.  Note that this only gets called for lines
    # starting with the 5 characters "From ".
    #
    # BAW: According to
    #http://home.netscape.com/eng/mozilla/2.0/relnotes/demo/content-length.html
    # the only portable, reliable way to find message delimiters in a BSD
    # (i.e. Unix mailbox) style folder is to search for "\n\nFrom .*\n", or
    # at the beginning of the file, "^From .*\n".  While _fromlinepattern
    # below seems like a good idea, in practice there are too many
    # variations for stricter parsing of the line to be completely accurate.
    #
    # _strict_isrealfromline() is the old version, which tries to parse the
    # From_ line more strictly.  _portable_isrealfromline() simply returns
    # true, since it is never called unless the line already starts with
    # "From ".
    #
    # This algorithm, and the way it interacts with _search_start() and
    # _search_end(), may not be completely correct, because it doesn't check
    # that the two characters preceding "From " are \n\n or the beginning of
    # the file.  Fixing this would require a more extensive rewrite than is
    # necessary.  For convenience, we've added a PortableUnixMailbox class
    # which does no checking of the format of the 'From' line.

    _fromlinepattern = (r"From \s*[^\s]+\s+\w\w\w\s+\w\w\w\s+\d?\d\s+"
                        r"\d?\d:\d\d(:\d\d)?(\s+[^\s]+)?\s+\d\d\d\d\s*"
                        r"[^\s]*\s*"
                        "$")
    _regexp = None          # compiled lazily from _fromlinepattern

    def _strict_isrealfromline(self, line):
        """Match line against _fromlinepattern, compiling it on first use."""
        pattern = self._regexp
        if not pattern:
            import re
            pattern = self._regexp = re.compile(self._fromlinepattern)
        return pattern.match(line)

    def _portable_isrealfromline(self, line):
        """Accept every line without inspecting it."""
        return True

    _isrealfromline = _strict_isrealfromline
2072
2073
class PortableUnixMailbox(UnixMailbox):
    """UnixMailbox that uses the portable (always true) From-line test."""

    _isrealfromline = UnixMailbox._portable_isrealfromline
2076
Guido van Rossumfbe63de1998-04-03 16:04:05 +00002077
class MmdfMailbox(_Mailbox):
    """Legacy reader for files delimited by lines of four \\001 bytes."""

    def _search_start(self):
        """Consume lines up to and including the next delimiter line.

        Raises EOFError when the end of the file is reached first.
        """
        delimiter = '\001\001\001\001\n'
        while True:
            line = self.fp.readline()
            if not line:
                raise EOFError
            if line[:5] == delimiter:
                return

    def _search_end(self):
        """Position fp at the next delimiter line or at end of file."""
        delimiter = '\001\001\001\001\n'
        while True:
            pos = self.fp.tell()
            line = self.fp.readline()
            if not line:
                return
            if line == delimiter:
                # Leave the delimiter unread.
                self.fp.seek(pos)
                return
Guido van Rossumc7b68821994-04-28 09:53:33 +00002097
Guido van Rossumc7b68821994-04-28 09:53:33 +00002098
class MHMailbox:
    """Legacy reader for a directory of numerically named message files."""

    def __init__(self, dirname, factory=rfc822.Message):
        import re
        numeric = re.compile('^[1-9][0-9]*$')
        self.dirname = dirname
        # Keep only the numerically named entries and order them by value,
        # not by their text.
        numbers = [long(entry) for entry in os.listdir(self.dirname)
                   if numeric.match(entry)]
        # Stored highest first so that next() can pop() the lowest number
        # off the end of the list.
        numbers.sort(reverse=True)
        self.boxes = [str(number) for number in numbers]
        self.factory = factory

    def __iter__(self):
        # next() signals exhaustion by returning None.
        return iter(self.next, None)

    def next(self):
        """Return the next message in numeric order, or None at the end."""
        if not self.boxes:
            return None
        msgno = self.boxes.pop()
        stream = open(os.path.join(self.dirname, msgno))
        message = self.factory(stream)
        # Record the message number on the result when it accepts
        # attribute assignment.
        try:
            message._mh_msgno = msgno
        except (AttributeError, TypeError):
            pass
        return message
Guido van Rossum8ca84201998-03-26 20:56:10 +00002131
Guido van Rossum9a4d6371998-12-23 22:05:42 +00002132
class BabylMailbox(_Mailbox):
    """Legacy reader for files whose messages follow '*** EOOH ***' lines."""

    def _search_start(self):
        """Consume lines up to and including the next '*** EOOH ***' line.

        Raises EOFError when the end of the file is reached first.
        """
        while True:
            line = self.fp.readline()
            if not line:
                raise EOFError
            if line == '*** EOOH ***\n':
                return

    def _search_end(self):
        """Position fp at the next terminator line or at end of file."""
        terminators = ('\037\014\n', '\037')
        while True:
            pos = self.fp.tell()
            line = self.fp.readline()
            if not line:
                return
            if line in terminators:
                # Leave the terminator unread.
                self.fp.seek(pos)
                return
Guido van Rossumfdf58fe1997-05-15 14:33:09 +00002152
Andrew M. Kuchling1da4a942006-04-22 02:32:43 +00002153## End: classes from the original module (for backward compatibility).
Guido van Rossum62448671996-09-17 21:33:15 +00002154
2155
class Error(Exception):
    """Base class of the exceptions specific to this module."""
2158
class NoSuchMailboxError(Error):
    """The requested mailbox does not exist and will not be created."""
2161
class NotEmptyError(Error):
    """Deletion was requested for a mailbox that is not empty."""
2164
class ExternalClashError(Error):
    """An action failed because of another process."""
2167
class FormatError(Error):
    """A file does not appear to have a valid format."""