blob: cc88e9de4d8f8af4b6f893af5e2ea7179a09891d [file] [log] [blame]
"""File-like objects that read from or write to a string buffer.

This implements (nearly) all stdio methods.

f = StringIO()       # ready for writing
f = StringIO(buf)    # ready for reading
f.close()            # explicitly release resources held
flag = f.isatty()    # always false
pos = f.tell()       # get current position
f.seek(pos)          # set current position
f.seek(pos, mode)    # mode 0: absolute; 1: relative; 2: relative to EOF
buf = f.read()       # read until EOF
buf = f.read(n)      # read up to n bytes
buf = f.readline()   # read until end of line ('\n') or EOF
list = f.readlines() # list of f.readline() results until EOF
f.truncate([size])   # truncate file to at most size (default: current pos)
f.write(buf)         # write at current position
f.writelines(list)   # for line in list: f.write(line)
f.getvalue()         # return whole file's contents as a string

Notes:
- Using a real file is often faster (but less convenient).
- There's also a much faster implementation in C, called cStringIO, but
  it's not subclassable.
- fileno() is left unimplemented so that code which uses it triggers
  an exception early.
- Seeking far beyond EOF and then writing will insert real null
  bytes that occupy space in the buffer.
- There's a simple test set (see end of this file).
"""
Marc-André Lemburgf853be92002-01-06 17:15:05 +000031import types
Barry Warsawc7ed0e32000-12-12 23:12:23 +000032try:
Barry Warsawc1401312000-12-12 23:16:51 +000033 from errno import EINVAL
Barry Warsawc7ed0e32000-12-12 23:12:23 +000034except ImportError:
Barry Warsawc1401312000-12-12 23:16:51 +000035 EINVAL = 22
Barry Warsawc7ed0e32000-12-12 23:12:23 +000036
Skip Montanaroe99d5ea2001-01-20 19:54:20 +000037__all__ = ["StringIO"]
38
class StringIO:
    """In-memory file-like object backed by a string buffer.

    State kept on the instance:
      buf       -- the consolidated contents written so far
      buflist   -- pieces written since the last consolidation; they are
                   joined onto buf lazily, the next time the contents are
                   needed
      len       -- total length of the contents (buf plus buflist)
      pos       -- current read/write position
      closed    -- true once close() has been called
      softspace -- initialised to 0; not otherwise used by this class

    Most methods raise ValueError("I/O operation on closed file") once
    the object is closed; getvalue() and close() do not perform that check.
    """

    # Type whose instances are stored without being passed through str().
    # types.UnicodeType does not exist on every interpreter, so fall back
    # to str instead of failing with AttributeError.
    _unicode_type = getattr(types, 'UnicodeType', str)

    def __init__(self, buf = ''):
        """Create the object, optionally pre-loaded with the contents buf.

        buf is converted with str() unless it is already a unicode object.
        The position starts at 0, so an initial buf is ready for reading.
        """
        # Force self.buf to be a string or unicode
        if not isinstance(buf, self._unicode_type):
            buf = str(buf)
        self.buf = buf
        self.len = len(buf)
        self.buflist = []
        self.pos = 0
        self.closed = 0
        self.softspace = 0

    def _check_open(self):
        """Raise ValueError if the object has been closed."""
        if self.closed:
            raise ValueError("I/O operation on closed file")

    def _merge_pending(self):
        """Join any pieces queued in buflist onto buf and empty the queue."""
        if self.buflist:
            self.buf += ''.join(self.buflist)
            self.buflist = []

    def __iter__(self):
        """Iterate over lines by calling readline() until it returns ''."""
        return iter(self.readline, '')

    def close(self):
        """Mark the object closed and drop the buffer and position.

        Calling close() more than once is harmless.
        """
        if not self.closed:
            self.closed = 1
            del self.buf, self.pos

    def isatty(self):
        """Return False; raises ValueError if closed."""
        self._check_open()
        return False

    def seek(self, pos, mode = 0):
        """Set the current position.

        mode 0 treats pos as absolute, mode 1 as relative to the current
        position and mode 2 as relative to the end of the contents.  The
        resulting position is clamped at 0 but may lie beyond the end.
        Raises ValueError if closed.
        """
        self._check_open()
        self._merge_pending()
        if mode == 1:
            pos += self.pos
        elif mode == 2:
            pos += self.len
        self.pos = max(0, pos)

    def tell(self):
        """Return the current position; raises ValueError if closed."""
        self._check_open()
        return self.pos

    def read(self, n = -1):
        """Read and return up to n characters from the current position.

        A negative n (the default) or None reads up to the end of the
        contents.  Raises ValueError if closed.
        """
        self._check_open()
        self._merge_pending()
        # None is handled explicitly rather than relying on how None
        # compares with 0.
        if n is None or n < 0:
            newpos = self.len
        else:
            newpos = min(self.pos+n, self.len)
        r = self.buf[self.pos:newpos]
        self.pos = newpos
        return r

    def readline(self, length=None):
        """Read and return one line, including its trailing newline if any.

        If length is given and non-negative, at most that many characters
        are returned.  A negative length means "no limit".  Returns ''
        when nothing is left to read.  Raises ValueError if closed.
        """
        self._check_open()
        self._merge_pending()
        i = self.buf.find('\n', self.pos)
        if i < 0:
            newpos = self.len
        else:
            newpos = i+1
        # Ignore negative limits: applying one would move the position
        # backwards and return '' even though data remains.
        if length is not None and length >= 0:
            if self.pos + length < newpos:
                newpos = self.pos + length
        r = self.buf[self.pos:newpos]
        self.pos = newpos
        return r

    def readlines(self, sizehint = 0):
        """Return a list of the remaining lines.

        If sizehint is positive, reading stops after the first line that
        brings the total number of characters read to sizehint or more.
        Raises ValueError (from readline) if closed.
        """
        total = 0
        lines = []
        line = self.readline()
        while line:
            lines.append(line)
            total += len(line)
            if 0 < sizehint <= total:
                break
            line = self.readline()
        return lines

    def truncate(self, size=None):
        """Cut the contents down to at most size characters.

        size defaults to the current position.  If the position lies
        beyond an explicitly given size it is moved back to size.  Raises
        IOError(EINVAL) for a negative size and ValueError if closed.
        """
        self._check_open()
        if size is None:
            size = self.pos
        elif size < 0:
            raise IOError(EINVAL, "Negative size not allowed")
        elif size < self.pos:
            self.pos = size
        self.buf = self.getvalue()[:size]
        # Keep the recorded length in step with the shortened buffer;
        # seek(), read(), readline() and write() all rely on self.len.
        self.len = len(self.buf)

    def write(self, s):
        """Write s at the current position and advance past it.

        s is converted with str() unless it is a unicode object; a false
        value (such as '') writes nothing.  Writing in the middle
        overwrites existing characters; writing beyond the end first pads
        the gap with null characters.  Raises ValueError if closed.
        """
        self._check_open()
        if not s:
            return
        # Force s to be a string or unicode
        if not isinstance(s, self._unicode_type):
            s = str(s)
        if self.pos > self.len:
            # Position was moved past the end: fill the gap with nulls.
            self.buflist.append('\0'*(self.pos - self.len))
            self.len = self.pos
        newpos = self.pos + len(s)
        if self.pos < self.len:
            # Overwrite in place: splice s between the text before the
            # position and whatever survives after the overwritten span.
            self._merge_pending()
            self.buflist = [self.buf[:self.pos], s, self.buf[newpos:]]
            self.buf = ''
            if newpos > self.len:
                self.len = newpos
        else:
            # Plain append: just queue the piece for a later join.
            self.buflist.append(s)
            self.len = newpos
        self.pos = newpos

    def writelines(self, list):
        """Write the concatenation of the strings in list."""
        self.write(''.join(list))

    def flush(self):
        """Do nothing, except raise ValueError if closed."""
        self._check_open()

    def getvalue(self):
        """Return the entire contents, regardless of the current position.

        No closed-file check is made here; the buffer itself is deleted
        by close().
        """
        self._merge_pending()
        return self.buf
Guido van Rossum85d89451994-06-23 11:53:27 +0000172
173
174# A little test suite
175
def test():
    """Exercise StringIO against the contents of a real text file.

    The file named by the first command-line argument (default
    '/etc/passwd') is copied into a StringIO, then read back through
    seek(), tell(), read(), readline() and readlines().  Progress is
    printed to standard output; RuntimeError is raised on the first
    mismatch.  The indexing below (lines[0], lines[1], and the last of
    the remaining lines) assumes the file has enough lines for each
    lookup to succeed.
    """
    import sys
    if sys.argv[1:]:
        path = sys.argv[1]
    else:
        path = '/etc/passwd'
    # Read the file once and close it explicitly instead of leaving two
    # open handles for the garbage collector.
    source = open(path, 'r')
    try:
        lines = source.readlines()
    finally:
        source.close()
    # Joining the lines reproduces exactly what read() would have returned.
    text = ''.join(lines)
    f = StringIO()
    # Cover both write paths: write() for most lines, writelines() for
    # the last two.
    for line in lines[:-2]:
        f.write(line)
    f.writelines(lines[-2:])
    if f.getvalue() != text:
        raise RuntimeError('write failed')
    length = f.tell()
    print('File length = %s' % (length,))
    # Overwrite the second line with itself to exercise in-place writes.
    f.seek(len(lines[0]))
    f.write(lines[1])
    f.seek(0)
    print('First line = %r' % (f.readline(),))
    print('Position = %s' % (f.tell(),))
    line = f.readline()
    print('Second line = %r' % (line,))
    # Step back over the line just read and fetch it again with read().
    f.seek(-len(line), 1)
    line2 = f.read(len(line))
    if line != line2:
        raise RuntimeError('bad result after seek back')
    f.seek(len(line2), 1)
    rest = f.readlines()
    line = rest[-1]
    # Re-read the final line by seeking back from the end.
    f.seek(f.tell() - len(line))
    line2 = f.read()
    if line != line2:
        raise RuntimeError('bad result after seek back from EOF')
    print('Read %s more lines' % (len(rest),))
    print('File length = %s' % (f.tell(),))
    if f.tell() != length:
        raise RuntimeError('bad length')
    f.close()
Guido van Rossum85d89451994-06-23 11:53:27 +0000215
# Run the self-test only when this file is executed as a script;
# importing the module does not trigger it.
if __name__ == '__main__':
    test()