blob: afd9a55760007fd70c901a44cceb74c1dc025eae [file] [log] [blame]
Guido van Rossumf06ee5f1996-11-27 19:52:01 +00001#! /usr/bin/env python
Guido van Rossum62448671996-09-17 21:33:15 +00002
"""Classes to handle Unix style, MMDF style, MH style, Maildir (qmail) style, and Babyl style mailboxes."""
4
5
Guido van Rossumc7b68821994-04-28 09:53:33 +00006import rfc822
Jack Jansen97157791995-10-23 13:59:53 +00007import os
Guido van Rossumc7b68821994-04-28 09:53:33 +00008
9class _Mailbox:
Fred Drakedbbf76b2000-07-09 16:44:26 +000010 def __init__(self, fp):
11 self.fp = fp
12 self.seekp = 0
Guido van Rossum8ca84201998-03-26 20:56:10 +000013
Fred Drakedbbf76b2000-07-09 16:44:26 +000014 def seek(self, pos, whence=0):
15 if whence==1: # Relative to current position
16 self.pos = self.pos + pos
17 if whence==2: # Relative to file's end
18 self.pos = self.stop + pos
19 else: # Default - absolute position
20 self.pos = self.start + pos
Guido van Rossumc7b68821994-04-28 09:53:33 +000021
Fred Drakedbbf76b2000-07-09 16:44:26 +000022 def next(self):
23 while 1:
24 self.fp.seek(self.seekp)
25 try:
26 self._search_start()
27 except EOFError:
28 self.seekp = self.fp.tell()
29 return None
30 start = self.fp.tell()
31 self._search_end()
32 self.seekp = stop = self.fp.tell()
33 if start <> stop:
34 break
35 return rfc822.Message(_Subfile(self.fp, start, stop))
Guido van Rossumc7b68821994-04-28 09:53:33 +000036
Guido van Rossumc7b68821994-04-28 09:53:33 +000037
38class _Subfile:
Fred Drakedbbf76b2000-07-09 16:44:26 +000039 def __init__(self, fp, start, stop):
40 self.fp = fp
41 self.start = start
42 self.stop = stop
43 self.pos = self.start
Guido van Rossum8ca84201998-03-26 20:56:10 +000044
Fred Drakedbbf76b2000-07-09 16:44:26 +000045 def read(self, length = None):
46 if self.pos >= self.stop:
47 return ''
48 remaining = self.stop - self.pos
49 if length is None or length < 0:
50 length = remaining
51 elif length > remaining:
52 length = remaining
53 self.fp.seek(self.pos)
54 data = self.fp.read(length)
55 self.pos = self.fp.tell()
56 return data
Guido van Rossumc7b68821994-04-28 09:53:33 +000057
Fred Drakedbbf76b2000-07-09 16:44:26 +000058 def readline(self, length = None):
59 if self.pos >= self.stop:
60 return ''
61 if length is None:
62 length = self.stop - self.pos
63 self.fp.seek(self.pos)
64 data = self.fp.readline(length)
65 self.pos = self.fp.tell()
66 return data
Guido van Rossumc7b68821994-04-28 09:53:33 +000067
Fred Drakedbbf76b2000-07-09 16:44:26 +000068 def readlines(self, sizehint = -1):
69 lines = []
70 while 1:
71 line = self.readline()
72 if not line:
73 break
74 lines.append(line)
75 if sizehint >= 0:
76 sizehint = sizehint - len(line)
77 if sizehint <= 0:
78 break
79 return lines
Guido van Rossumc7b68821994-04-28 09:53:33 +000080
Fred Drakedbbf76b2000-07-09 16:44:26 +000081 def tell(self):
82 return self.pos - self.start
Guido van Rossume256a0f1999-03-24 16:20:45 +000083
Fred Drakedbbf76b2000-07-09 16:44:26 +000084 def seek(self, pos, whence=0):
85 if whence == 0:
86 self.pos = self.start + pos
87 elif whence == 1:
88 self.pos = self.pos + pos
89 elif whence == 2:
90 self.pos = self.stop + pos
Guido van Rossumc7b68821994-04-28 09:53:33 +000091
Fred Drakedbbf76b2000-07-09 16:44:26 +000092 def close(self):
93 del self.fp
Guido van Rossumc7b68821994-04-28 09:53:33 +000094
Guido van Rossumc7b68821994-04-28 09:53:33 +000095
class UnixMailbox(_Mailbox):
    """Mailbox whose messages each begin with a 'From ' separator line."""

    # An overridable mechanism to test for From-line-ness.
    # Subclasses may either supply a different regular expression in
    # _fromlinepattern or replace _isrealfromline() altogether.
    # _isrealfromline() is only ever called for lines that start with
    # the 5 characters "From ".
    _fromlinepattern = r"From \s*[^\s]+\s+\w\w\w\s+\w\w\w\s+\d?\d\s+" \
                       r"\d?\d:\d\d(:\d\d)?(\s+[^\s]+)?\s+\d\d\d\d\s*$"
    _regexp = None

    def _search_start(self):
        """Leave fp at the start of the next From line; EOFError if none."""
        if not self._skip_to_from_line():
            raise EOFError

    def _search_end(self):
        """Leave fp at the start of the following From line, or at EOF."""
        self.fp.readline()      # Step over this message's own From line
        self._skip_to_from_line()

    def _skip_to_from_line(self):
        """Advance fp line by line until a real From line is found.

        Returns 1 with fp rewound to the beginning of that line, or 0 when
        end of file is reached first.
        """
        while 1:
            mark = self.fp.tell()
            text = self.fp.readline()
            if not text:
                return 0
            if text[:5] == 'From ' and self._isrealfromline(text):
                self.fp.seek(mark)
                return 1

    def _isrealfromline(self, line):
        """Return a match object if *line* matches _fromlinepattern, else None.

        The pattern is compiled on first use and cached on the instance.
        """
        compiled = self._regexp
        if not compiled:
            import re
            compiled = self._regexp = re.compile(self._fromlinepattern)
        return compiled.match(line)
Guido van Rossumfbe63de1998-04-03 16:04:05 +0000133
Guido van Rossumfbe63de1998-04-03 16:04:05 +0000134
class MmdfMailbox(_Mailbox):
    """Mailbox whose messages are delimited by lines of four Ctrl-A characters."""

    def _search_start(self):
        """Read up to and including the next delimiter line.

        Raises EOFError if the file ends before a delimiter is seen.
        """
        line = self.fp.readline()
        while line:
            if line[:5] == '\001\001\001\001\n':
                return
            line = self.fp.readline()
        raise EOFError

    def _search_end(self):
        """Read until the next delimiter line and leave fp just before it.

        If the file ends first, fp is simply left at end of file.
        """
        mark = self.fp.tell()
        line = self.fp.readline()
        while line:
            if line == '\001\001\001\001\n':
                # Rewind so the delimiter itself is not part of the message.
                self.fp.seek(mark)
                return
            mark = self.fp.tell()
            line = self.fp.readline()
Guido van Rossumc7b68821994-04-28 09:53:33 +0000153
Guido van Rossumc7b68821994-04-28 09:53:33 +0000154
class MHMailbox:
    """Directory mailbox with one message per numerically named file."""

    def __init__(self, dirname):
        """Collect the message files in *dirname*, ordered by number.

        Only directory entries whose names are decimal numbers without a
        leading zero are treated as messages; everything else is ignored.
        ``self.boxes`` holds the names (as strings) still to be returned
        by ``next()``.
        """
        import re
        numbered = re.compile('^[1-9][0-9]*$')
        self.dirname = dirname
        names = [name for name in os.listdir(self.dirname)
                 if numbered.match(name)]
        # Order by numeric value, not lexically, so that '10' follows '9'.
        names.sort(key=int)
        self.boxes = names

    def next(self):
        """Return the next message as an rfc822.Message, or None when done.

        The message file is opened here and handed to the Message object.
        """
        if not self.boxes:
            return None
        fn = self.boxes.pop(0)
        fp = open(os.path.join(self.dirname, fn))
        return rfc822.Message(fp)
Guido van Rossum8ca84201998-03-26 20:56:10 +0000178
Guido van Rossum9a4d6371998-12-23 22:05:42 +0000179
class Maildir:
    """Qmail directory mailbox: messages live in 'new' and 'cur' subdirectories."""

    def __init__(self, dirname):
        """Collect the message files found under *dirname*.

        ``self.boxes`` receives the path (already including *dirname*) of
        every entry in 'new', followed by every entry in 'cur', whose name
        contains at least two dots.
        """
        self.dirname = dirname
        self.boxes = []

        # New mail first, then the mail already seen.
        for subdir in ('new', 'cur'):
            folder = os.path.join(self.dirname, subdir)
            for name in os.listdir(folder):
                if name.count('.') >= 2:
                    self.boxes.append(os.path.join(folder, name))

    def next(self):
        """Return the next message as an rfc822.Message, or None when done.

        The message file is opened here and handed to the Message object.
        """
        if not self.boxes:
            return None
        fn = self.boxes.pop(0)
        # The entries in boxes already start with dirname.  Joining dirname
        # onto them a second time only worked for absolute dirnames; with a
        # relative dirname it produced 'dir/dir/new/...' and open() failed.
        fp = open(fn)
        return rfc822.Message(fp)
Guido van Rossum9a4d6371998-12-23 22:05:42 +0000207
Guido van Rossum9a4d6371998-12-23 22:05:42 +0000208
class BabylMailbox(_Mailbox):
    """Mailbox whose messages follow an EOOH marker line and end at a ^_^L line."""

    def _search_start(self):
        """Read up to and including the next '*** EOOH ***' line.

        Raises EOFError if the file ends before such a line is seen.
        """
        header_end = '*** EOOH ***\n'
        line = self.fp.readline()
        while line and line != header_end:
            line = self.fp.readline()
        if not line:
            raise EOFError

    def _search_end(self):
        """Read until the message terminator line and leave fp just before it.

        If the file ends first, fp is simply left at end of file.
        """
        terminator = '\037\014\n'
        while 1:
            mark = self.fp.tell()
            line = self.fp.readline()
            if line == terminator:
                # Rewind so the terminator is not part of the message.
                self.fp.seek(mark)
                break
            if not line:
                break
Guido van Rossumfdf58fe1997-05-15 14:33:09 +0000227
228
def _test():
    """Command-line self-test: list a mailbox or print one message body.

    ``sys.argv[1]``, if given, names the mailbox; otherwise the first of
    $MAILDIR, $MAIL, $LOGNAME and $USER that is set is used.  A name that
    starts with '+' is looked up under $HOME/Mail/, and a name without any
    '/' under /usr/mail/.  A directory containing 'cur' is read as a
    Maildir, any other directory as an MH folder, and a plain file as a
    Unix mailbox.

    ``sys.argv[2]``, if given, is the 1-based number of the message whose
    body is written to stdout; without it a from/date/subject summary of
    every message is printed.
    """
    import sys
    import os

    args = sys.argv[1:]
    if not args:
        for key in 'MAILDIR', 'MAIL', 'LOGNAME', 'USER':
            if key in os.environ:
                mbox = os.environ[key]
                break
        else:
            print("$MAILDIR, $MAIL, $LOGNAME nor $USER set -- who are you?")
            return
    else:
        mbox = args[0]
    if mbox[:1] == '+':
        mbox = os.environ['HOME'] + '/Mail/' + mbox[1:]
    elif not '/' in mbox:
        mbox = '/usr/mail/' + mbox
    if os.path.isdir(mbox):
        if os.path.isdir(os.path.join(mbox, 'cur')):
            mb = Maildir(mbox)
        else:
            mb = MHMailbox(mbox)
    else:
        fp = open(mbox, 'r')
        mb = UnixMailbox(fp)

    msgs = []
    while 1:
        msg = mb.next()
        if msg is None:
            break
        msgs.append(msg)
        if len(args) <= 1:
            # Only headers are needed for the summary; drop the file
            # reference so it is not kept around for every message.
            msg.fp = None
    if len(args) > 1:
        num = int(args[1])
        # Reject 0 and out-of-range numbers explicitly: msgs[num-1] would
        # silently wrap around to the last message for 0, or raise.
        if not 1 <= num <= len(msgs):
            print('No message %d: mailbox %s has %d messages'
                  % (num, mbox, len(msgs)))
            return
        print('Message %d body:' % num)
        msg = msgs[num-1]
        msg.rewindbody()
        sys.stdout.write(msg.fp.read())
    else:
        print('Mailbox %s has %d messages:' % (mbox, len(msgs)))
        for msg in msgs:
            f = msg.getheader('from') or ""
            s = msg.getheader('subject') or ""
            d = msg.getheader('date') or ""
            print('%20.20s %18.18s %-30.30s' % (f, d[5:], s))
Guido van Rossum62448671996-09-17 21:33:15 +0000280
281
# Run the command-line self-test when this file is executed as a script.
if __name__ == '__main__':
    _test()