blob: ce84087a5eea5cea7845fd96071ed1c1f122cecb [file] [log] [blame]
Guido van Rossum741c81a1992-07-13 14:40:45 +00001# A class that makes each part of a multipart message "feel" like an
2# ordinary file, as long as you use fp.readline(). Allows recursive
3# use, for nested multipart messages. Probably best used together
4# with module mimetools.
5#
6# Suggested use:
7#
8# real_fp = open(...)
Guido van Rossum7bc817d1993-12-17 15:25:27 +00009# fp = MultiFile(real_fp)
Guido van Rossum741c81a1992-07-13 14:40:45 +000010#
11# "read some lines from fp"
12# fp.push(separator)
13# while 1:
14# "read lines from fp until it returns an empty string" (A)
15# if not fp.next(): break
16# fp.pop()
17# "read remaining lines from fp until it returns an empty string"
18#
19# The latter sequence may be used recursively at (A).
20# It is also allowed to use multiple push()...pop() sequences.
Guido van Rossum4d40b0a1998-06-23 14:20:27 +000021#
22# If seekable is given as 0, the class code will not do the bookeeping
23# it normally attempts in order to make seeks relative to the beginning of the
24# current file part. This may be useful when using MultiFile with a non-
25# seekable stream object.
Guido van Rossum741c81a1992-07-13 14:40:45 +000026
27import sys
28import string
29
Guido van Rossum741c81a1992-07-13 14:40:45 +000030Error = 'multifile.Error'
31
32class MultiFile:
33 #
Guido van Rossum4d40b0a1998-06-23 14:20:27 +000034 seekable = 0
Guido van Rossum3ad9dd51998-06-29 17:56:06 +000035 #
Guido van Rossum4d40b0a1998-06-23 14:20:27 +000036 def __init__(self, fp, seekable=1):
Guido van Rossum741c81a1992-07-13 14:40:45 +000037 self.fp = fp
38 self.stack = [] # Grows down
39 self.level = 0
40 self.last = 0
Guido van Rossum4d40b0a1998-06-23 14:20:27 +000041 if seekable:
42 self.seekable = 1
43 self.start = self.fp.tell()
44 self.posstack = [] # Grows down
Guido van Rossum741c81a1992-07-13 14:40:45 +000045 #
46 def tell(self):
47 if self.level > 0:
48 return self.lastpos
49 return self.fp.tell() - self.start
50 #
Guido van Rossum69c70a21998-03-25 16:25:26 +000051 def seek(self, pos, whence=0):
Guido van Rossum8ca84201998-03-26 20:56:10 +000052 here = self.tell()
53 if whence:
54 if whence == 1:
55 pos = pos + here
56 elif whence == 2:
57 if self.level > 0:
58 pos = pos + self.lastpos
59 else:
60 raise Error, "can't use whence=2 yet"
Guido van Rossum69c70a21998-03-25 16:25:26 +000061 if not 0 <= pos <= here or \
Guido van Rossum741c81a1992-07-13 14:40:45 +000062 self.level > 0 and pos > self.lastpos:
63 raise Error, 'bad MultiFile.seek() call'
64 self.fp.seek(pos + self.start)
65 self.level = 0
66 self.last = 0
67 #
68 def readline(self):
Guido van Rossum3ad9dd51998-06-29 17:56:06 +000069 if self.level > 0:
70 return ''
Guido van Rossum741c81a1992-07-13 14:40:45 +000071 line = self.fp.readline()
Guido van Rossum3ad9dd51998-06-29 17:56:06 +000072 # Real EOF?
Guido van Rossum741c81a1992-07-13 14:40:45 +000073 if not line:
74 self.level = len(self.stack)
75 self.last = (self.level > 0)
76 if self.last:
Guido van Rossum3ad9dd51998-06-29 17:56:06 +000077 raise Error, 'sudden EOF in MultiFile.readline()'
Guido van Rossum741c81a1992-07-13 14:40:45 +000078 return ''
Guido van Rossum3ad9dd51998-06-29 17:56:06 +000079 assert self.level == 0
80 # Fast check to see if this is just data
81 if self.is_data(line):
82 return line
83 else:
84 # Ignore trailing whitespace on marker lines
85 k = len(line) - 1;
86 while line[k] in string.whitespace:
87 k = k - 1
88 marker = line[:k+1]
89 # No? OK, try to match a boundary.
90 # Return the line (unstripped) if we don't.
Guido van Rossum741c81a1992-07-13 14:40:45 +000091 for i in range(len(self.stack)):
92 sep = self.stack[i]
Guido van Rossum3ad9dd51998-06-29 17:56:06 +000093 if marker == self.section_divider(sep):
Guido van Rossum741c81a1992-07-13 14:40:45 +000094 self.last = 0
95 break
Guido van Rossum3ad9dd51998-06-29 17:56:06 +000096 elif marker == self.end_marker(sep):
Guido van Rossum741c81a1992-07-13 14:40:45 +000097 self.last = 1
98 break
99 else:
100 return line
Guido van Rossum3ad9dd51998-06-29 17:56:06 +0000101 # We only get here if we see a section divider or EOM line
Guido van Rossum4d40b0a1998-06-23 14:20:27 +0000102 if self.seekable:
103 self.lastpos = self.tell() - len(line)
Guido van Rossum741c81a1992-07-13 14:40:45 +0000104 self.level = i+1
105 if self.level > 1:
Guido van Rossum3ad9dd51998-06-29 17:56:06 +0000106 raise Error,'Missing endmarker in MultiFile.readline()'
Guido van Rossum741c81a1992-07-13 14:40:45 +0000107 return ''
108 #
Guido van Rossumb6775db1994-08-01 11:34:53 +0000109 def readlines(self):
110 list = []
111 while 1:
112 line = self.readline()
113 if not line: break
114 list.append(line)
115 return list
116 #
117 def read(self): # Note: no size argument -- read until EOF only!
118 return string.joinfields(self.readlines(), '')
119 #
Guido van Rossum741c81a1992-07-13 14:40:45 +0000120 def next(self):
121 while self.readline(): pass
122 if self.level > 1 or self.last:
123 return 0
124 self.level = 0
125 self.last = 0
Guido van Rossum4d40b0a1998-06-23 14:20:27 +0000126 if self.seekable:
127 self.start = self.fp.tell()
Guido van Rossum741c81a1992-07-13 14:40:45 +0000128 return 1
129 #
130 def push(self, sep):
131 if self.level > 0:
132 raise Error, 'bad MultiFile.push() call'
133 self.stack.insert(0, sep)
Guido van Rossum716b7841998-06-29 17:58:43 +0000134 if self.seekable:
135 self.posstack.insert(0, self.start)
136 self.start = self.fp.tell()
Guido van Rossum741c81a1992-07-13 14:40:45 +0000137 #
138 def pop(self):
139 if self.stack == []:
140 raise Error, 'bad MultiFile.pop() call'
141 if self.level <= 1:
142 self.last = 0
143 else:
144 abslastpos = self.lastpos + self.start
145 self.level = max(0, self.level - 1)
146 del self.stack[0]
Guido van Rossum4d40b0a1998-06-23 14:20:27 +0000147 if self.seekable:
148 self.start = self.posstack[0]
149 del self.posstack[0]
150 if self.level > 0:
151 self.lastpos = abslastpos - self.start
Guido van Rossum741c81a1992-07-13 14:40:45 +0000152 #
Guido van Rossum3ad9dd51998-06-29 17:56:06 +0000153 def is_data(self, line):
154 return line[:2] <> '--'
155 #
156 def section_divider(self, str):
157 return "--" + str
158 #
159 def end_marker(self, str):
160 return "--" + str + "--"