blob: a9d2fa6a3a38ce2c6a55c3ea86969bee9c9161f5 [file] [log] [blame]
'''
Tests for fileinput module.
Nick Mathewson
'''
5
Guido van Rossumd8faa362007-04-27 19:54:29 +00006import unittest
7from test.test_support import verbose, TESTFN, run_unittest
8from test.test_support import unlink as safe_unlink
Tim Peters3230d5c2001-07-11 22:21:17 +00009import sys, os, re
Guido van Rossum34d19282007-08-09 01:03:29 +000010from io import StringIO
Georg Brandlc98eeed2006-02-19 14:57:47 +000011from fileinput import FileInput, hook_encoded
Tim Peters3230d5c2001-07-11 22:21:17 +000012
# The fileinput module has 2 interfaces: the FileInput class which does
# all the work, and a few functions (input, etc.) that use a global _state
# variable.  We only test the FileInput class, since the other functions
# only provide a thin facade over FileInput.
17
# Write lines (a list of lines) to temp file number i, and return the
# temp file's name.
def writeTmp(i, lines, mode='w'):  # opening in text mode is the default
    """Write *lines* to temp file number *i* and return the file's name.

    The name is TESTFN with str(i) appended.  *lines* is an iterable of
    chunks that are written back to back with nothing inserted between them;
    *mode* is handed unchanged to open(), so binary modes need bytes chunks.
    """
    name = TESTFN + str(i)
    # The with-statement closes the file even when a write raises, so a
    # failing write does not leak the open file object.
    with open(name, mode) as f:
        f.writelines(lines)
    return name
27
def remove_tempfiles(*names):
    """Hand each of the given file names, in order, to safe_unlink."""
    for path in names:
        safe_unlink(path)
Tim Peters3230d5c2001-07-11 22:21:17 +000031
class BufferSizesTests(unittest.TestCase):
    """Run FileInput over four temp files with the default and a tiny bufsize.

    NOTE(review): later fileinput releases dropped the ``bufsize`` argument;
    confirm the interpreter under test still accepts it.
    """

    def test_buffer_sizes(self):
        """Create the four fixture files and run the checks for each bufsize."""
        # First, run the tests with default and teeny buffer size.
        for round, bs in (0, 0), (1, 30):
            # Only names that were really created are recorded, so the
            # cleanup below never trips over an unbound local (and never
            # hides the original error) when writeTmp itself fails.
            names = []
            try:
                for number, count in (1, 15), (2, 10), (3, 5), (4, 1):
                    names.append(writeTmp(
                        number,
                        ["Line %s of file %s\n" % (i+1, number)
                         for i in range(count)]))
                t1, t2, t3, t4 = names
                self.buffer_size_test(t1, t2, t3, t4, bs, round)
            finally:
                remove_tempfiles(*names)

    def buffer_size_test(self, t1, t2, t3, t4, bs=0, round=0):
        """Check iteration, status calls, stdin, boundaries and inplace mode.

        t1..t4 name the files written by test_buffer_sizes (15, 10, 5 and 1
        lines).  bs is passed to FileInput as bufsize; round only offsets the
        step numbers printed in verbose mode.  Every FileInput created here
        is closed again, even when an assertion fails.
        """
        pat = re.compile(r'LINE (\d+) OF FILE (\d+)')

        start = 1 + round*6
        if verbose:
            print('%s. Simple iteration (bs=%s)' % (start+0, bs))
        fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
        try:
            lines = list(fi)
        finally:
            fi.close()
        self.assertEqual(len(lines), 31)
        self.assertEqual(lines[4], 'Line 5 of file 1\n')
        self.assertEqual(lines[30], 'Line 1 of file 4\n')
        # The counters are queried after close() on purpose, as before.
        self.assertEqual(fi.lineno(), 31)
        self.assertEqual(fi.filename(), t4)

        if verbose:
            print('%s. Status variables (bs=%s)' % (start+1, bs))
        fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
        try:
            s = "x"
            while s and s != 'Line 6 of file 2\n':
                s = fi.readline()
            self.assertEqual(fi.filename(), t2)
            self.assertEqual(fi.lineno(), 21)
            self.assertEqual(fi.filelineno(), 6)
            self.assertFalse(fi.isfirstline())
            self.assertFalse(fi.isstdin())

            # The next step continues with the same, partly consumed object.
            if verbose:
                print('%s. Nextfile (bs=%s)' % (start+2, bs))
            fi.nextfile()
            self.assertEqual(fi.readline(), 'Line 1 of file 3\n')
            self.assertEqual(fi.lineno(), 22)
        finally:
            fi.close()

        if verbose:
            print('%s. Stdin (bs=%s)' % (start+3, bs))
        fi = FileInput(files=(t1, t2, t3, t4, '-'), bufsize=bs)
        savestdin = sys.stdin
        try:
            # '-' makes FileInput read sys.stdin, so substitute a fake one.
            sys.stdin = StringIO("Line 1 of stdin\nLine 2 of stdin\n")
            lines = list(fi)
            self.assertEqual(len(lines), 33)
            self.assertEqual(lines[32], 'Line 2 of stdin\n')
            self.assertEqual(fi.filename(), '<stdin>')
            fi.nextfile()
        finally:
            sys.stdin = savestdin
            fi.close()

        if verbose:
            print('%s. Boundary conditions (bs=%s)' % (start+4, bs))
        fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
        try:
            # Nothing has been read yet, before and after skipping a file.
            self.assertEqual(fi.lineno(), 0)
            self.assertEqual(fi.filename(), None)
            fi.nextfile()
            self.assertEqual(fi.lineno(), 0)
            self.assertEqual(fi.filename(), None)
        finally:
            fi.close()

        if verbose:
            print('%s. Inplace (bs=%s)' % (start+5, bs))
        savestdout = sys.stdout
        try:
            fi = FileInput(files=(t1, t2, t3, t4), inplace=1, bufsize=bs)
            try:
                # print() output is what ends up in the files here:
                # every line is rewritten in upper case.
                for line in fi:
                    line = line[:-1].upper()
                    print(line)
            finally:
                fi.close()
        finally:
            sys.stdout = savestdout

        # Read the files back and check that the rewrite really happened.
        fi = FileInput(files=(t1, t2, t3, t4), bufsize=bs)
        try:
            for line in fi:
                self.assertEqual(line[-1], '\n')
                m = pat.match(line[:-1])
                self.assertNotEqual(m, None)
                self.assertEqual(int(m.group(1)), fi.filelineno())
        finally:
            fi.close()
Georg Brandle4662172006-02-19 09:51:27 +0000121
class FileInputTests(unittest.TestCase):
    """Behavioural tests for FileInput that do not depend on bufsize.

    Each test records the temp files it has actually created in ``names`` so
    that the cleanup in ``finally`` works even when writeTmp fails part-way,
    and closes its FileInput before the files are removed.
    """

    def test_zero_byte_files(self):
        """Empty files are skipped but still show up in filename()."""
        names = []
        fi = None
        try:
            names.append(writeTmp(1, [""]))
            names.append(writeTmp(2, [""]))
            names.append(writeTmp(3, ["The only line there is.\n"]))
            names.append(writeTmp(4, [""]))
            t1, t2, t3, t4 = names
            fi = FileInput(files=(t1, t2, t3, t4))

            line = fi.readline()
            self.assertEqual(line, 'The only line there is.\n')
            self.assertEqual(fi.lineno(), 1)
            self.assertEqual(fi.filelineno(), 1)
            self.assertEqual(fi.filename(), t3)

            # A second read runs into the empty fourth file and returns ''.
            line = fi.readline()
            self.assertFalse(line)
            self.assertEqual(fi.lineno(), 1)
            self.assertEqual(fi.filelineno(), 0)
            self.assertEqual(fi.filename(), t4)
        finally:
            if fi is not None:
                fi.close()
            remove_tempfiles(*names)

    def test_files_that_dont_end_with_newline(self):
        """A missing final newline does not merge lines across files."""
        names = []
        fi = None
        try:
            names.append(writeTmp(1, ["A\nB\nC"]))
            names.append(writeTmp(2, ["D\nE\nF"]))
            t1, t2 = names
            fi = FileInput(files=(t1, t2))
            lines = list(fi)
            self.assertEqual(lines, ["A\n", "B\n", "C", "D\n", "E\n", "F"])
            self.assertEqual(fi.filelineno(), 3)
            self.assertEqual(fi.lineno(), 6)
        finally:
            if fi is not None:
                fi.close()
            remove_tempfiles(*names)

##    def test_unicode_filenames(self):
##        # XXX A unicode string is always returned by writeTmp.
##        #     So is this needed?
##        try:
##            t1 = writeTmp(1, ["A\nB"])
##            encoding = sys.getfilesystemencoding()
##            if encoding is None:
##                encoding = 'ascii'
##            fi = FileInput(files=str(t1, encoding))
##            lines = list(fi)
##            self.assertEqual(lines, ["A\n", "B"])
##        finally:
##            remove_tempfiles(t1)

    def test_fileno(self):
        """fileno() is -1 unless a file is currently open for reading."""
        names = []
        fi = None
        try:
            names.append(writeTmp(1, ["A\nB"]))
            names.append(writeTmp(2, ["C\nD"]))
            t1, t2 = names
            fi = FileInput(files=(t1, t2))
            self.assertEqual(fi.fileno(), -1)
            next(fi)        # reading one line opens the first file
            self.assertNotEqual(fi.fileno(), -1)
            fi.nextfile()
            self.assertEqual(fi.fileno(), -1)
            list(fi)        # drain whatever is left
            self.assertEqual(fi.fileno(), -1)
        finally:
            if fi is not None:
                fi.close()
            remove_tempfiles(*names)

    def test_opening_mode(self):
        """Invalid modes are rejected; mode "U" translates line endings."""
        try:
            # invalid mode, should raise ValueError
            FileInput(mode="w")
        except ValueError:
            pass
        else:
            self.fail("FileInput should reject invalid mode argument")

        names = []
        fi = None
        try:
            # try opening in universal newline mode
            # The fixture is opened with "wb", so it has to be given bytes;
            # writing a str to a binary file raises TypeError.
            names.append(writeTmp(1, [b"A\nB\r\nC\rD"], mode="wb"))
            t1 = names[0]
            # NOTE(review): recent fileinput versions may reject mode "U";
            # confirm against the interpreter under test.
            fi = FileInput(files=t1, mode="U")
            lines = list(fi)
            self.assertEqual(lines, ["A\n", "B\n", "C\n", "D"])
        finally:
            if fi is not None:
                fi.close()
            remove_tempfiles(*names)

##    def test_file_opening_hook(self):
##        # XXX The rot13 codec was removed.
##        #     So this test needs to be changed to use something else.
##        try:
##            # cannot use openhook and inplace mode
##            fi = FileInput(inplace=1, openhook=lambda f, m: None)
##            self.fail("FileInput should raise if both inplace "
##                             "and openhook arguments are given")
##        except ValueError:
##            pass
##        try:
##            fi = FileInput(openhook=1)
##            self.fail("FileInput should check openhook for being callable")
##        except ValueError:
##            pass
##        try:
##            t1 = writeTmp(1, ["A\nB"], mode="wb")
##            fi = FileInput(files=t1, openhook=hook_encoded("rot13"))
##            lines = list(fi)
##            self.assertEqual(lines, ["N\n", "O"])
##        finally:
##            remove_tempfiles(t1)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000225
def test_main():
    """Pass both test case classes of this module to run_unittest."""
    cases = (BufferSizesTests, FileInputTests)
    run_unittest(*cases)
228
if __name__ == "__main__":
    # Executed as a script: run the whole suite.
    test_main()