blob: a6b99091ff6e0e5ac5dc57ff1d17f3103ba00873 [file] [log] [blame]
Jack Jansen518d2612002-04-14 20:17:18 +00001# Tests universal newline support for both reading and parsing files.
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +00002import io
3import _pyio as pyio
Jack Jansen518d2612002-04-14 20:17:18 +00004import unittest
Jack Jansen518d2612002-04-14 20:17:18 +00005import os
6import sys
Benjamin Petersonee8712c2008-05-20 21:35:26 +00007from test import support
Jack Jansen518d2612002-04-14 20:17:18 +00008
Jack Jansen518d2612002-04-14 20:17:18 +00009if not hasattr(sys.stdin, 'newlines'):
Benjamin Petersonee8712c2008-05-20 21:35:26 +000010 raise support.TestSkipped(
Collin Winter3add4d72007-08-29 23:37:32 +000011 "This Python does not have universal newline support")
Jack Jansen518d2612002-04-14 20:17:18 +000012
Tim Petersea572b22002-04-21 06:12:02 +000013FATX = 'x' * (2**14)
14
15DATA_TEMPLATE = [
16 "line1=1",
Guido van Rossum8358db22007-08-18 21:39:55 +000017 "line2='this is a very long line designed to go past any default " +
18 "buffer limits that exist in io.py but we also want to test " +
Tim Petersea572b22002-04-21 06:12:02 +000019 "the uncommon case, naturally.'",
20 "def line3():pass",
21 "line4 = '%s'" % FATX,
22 ]
23
24DATA_LF = "\n".join(DATA_TEMPLATE) + "\n"
25DATA_CR = "\r".join(DATA_TEMPLATE) + "\r"
26DATA_CRLF = "\r\n".join(DATA_TEMPLATE) + "\r\n"
27
28# Note that DATA_MIXED also tests the ability to recognize a lone \r
29# before end-of-file.
30DATA_MIXED = "\n".join(DATA_TEMPLATE) + "\r"
31DATA_SPLIT = [x + "\n" for x in DATA_TEMPLATE]
Tim Petersea572b22002-04-21 06:12:02 +000032
Jack Jansen518d2612002-04-14 20:17:18 +000033class TestGenericUnivNewlines(unittest.TestCase):
34 # use a class variable DATA to define the data to write to the file
35 # and a class variable NEWLINE to set the expected newlines value
Guido van Rossum8358db22007-08-18 21:39:55 +000036 READMODE = 'r'
Jack Jansen518d2612002-04-14 20:17:18 +000037 WRITEMODE = 'wb'
38
39 def setUp(self):
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000040 fp = self.open(support.TESTFN, self.WRITEMODE)
Guido van Rossum9c627722007-08-27 18:31:48 +000041 data = self.DATA
42 if "b" in self.WRITEMODE:
43 data = data.encode("ascii")
44 fp.write(data)
Jack Jansen518d2612002-04-14 20:17:18 +000045 fp.close()
46
47 def tearDown(self):
48 try:
Benjamin Petersonee8712c2008-05-20 21:35:26 +000049 os.unlink(support.TESTFN)
Jack Jansen518d2612002-04-14 20:17:18 +000050 except:
51 pass
Tim Peters863ac442002-04-16 01:38:40 +000052
Jack Jansen518d2612002-04-14 20:17:18 +000053 def test_read(self):
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000054 fp = self.open(support.TESTFN, self.READMODE)
Jack Jansen518d2612002-04-14 20:17:18 +000055 data = fp.read()
56 self.assertEqual(data, DATA_LF)
Walter Dörwald70a6b492004-02-12 17:35:32 +000057 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000058
Jack Jansen518d2612002-04-14 20:17:18 +000059 def test_readlines(self):
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000060 fp = self.open(support.TESTFN, self.READMODE)
Jack Jansen518d2612002-04-14 20:17:18 +000061 data = fp.readlines()
62 self.assertEqual(data, DATA_SPLIT)
Walter Dörwald70a6b492004-02-12 17:35:32 +000063 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Jack Jansen518d2612002-04-14 20:17:18 +000064
65 def test_readline(self):
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000066 fp = self.open(support.TESTFN, self.READMODE)
Jack Jansen518d2612002-04-14 20:17:18 +000067 data = []
68 d = fp.readline()
69 while d:
70 data.append(d)
71 d = fp.readline()
72 self.assertEqual(data, DATA_SPLIT)
Walter Dörwald70a6b492004-02-12 17:35:32 +000073 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000074
Jack Jansen518d2612002-04-14 20:17:18 +000075 def test_seek(self):
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000076 fp = self.open(support.TESTFN, self.READMODE)
Jack Jansen518d2612002-04-14 20:17:18 +000077 fp.readline()
78 pos = fp.tell()
79 data = fp.readlines()
80 self.assertEqual(data, DATA_SPLIT[1:])
81 fp.seek(pos)
82 data = fp.readlines()
83 self.assertEqual(data, DATA_SPLIT[1:])
Tim Peters863ac442002-04-16 01:38:40 +000084
Jack Jansen518d2612002-04-14 20:17:18 +000085
Jack Jansen518d2612002-04-14 20:17:18 +000086class TestCRNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000087 NEWLINE = '\r'
88 DATA = DATA_CR
Tim Peters863ac442002-04-16 01:38:40 +000089
Jack Jansen518d2612002-04-14 20:17:18 +000090class TestLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000091 NEWLINE = '\n'
92 DATA = DATA_LF
Tim Peters863ac442002-04-16 01:38:40 +000093
Jack Jansen518d2612002-04-14 20:17:18 +000094class TestCRLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000095 NEWLINE = '\r\n'
96 DATA = DATA_CRLF
Tim Peters863ac442002-04-16 01:38:40 +000097
Guido van Rossum8ce8a782007-11-01 19:42:39 +000098 def test_tell(self):
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +000099 fp = self.open(support.TESTFN, self.READMODE)
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000100 self.assertEqual(repr(fp.newlines), repr(None))
101 data = fp.readline()
102 pos = fp.tell()
103 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
104
Jack Jansen518d2612002-04-14 20:17:18 +0000105class TestMixedNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +0000106 NEWLINE = ('\r', '\n')
107 DATA = DATA_MIXED
Tim Peters863ac442002-04-16 01:38:40 +0000108
Jack Jansen518d2612002-04-14 20:17:18 +0000109
110def test_main():
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +0000111 base_tests = (TestCRNewlines,
112 TestLFNewlines,
113 TestCRLFNewlines,
114 TestMixedNewlines)
115 tests = []
116 # Test the C and Python implementations.
117 for test in base_tests:
118 class CTest(test):
119 open = io.open
120 CTest.__name__ = "C" + test.__name__
121 class PyTest(test):
122 open = staticmethod(pyio.open)
123 PyTest.__name__ = "Py" + test.__name__
124 tests.append(CTest)
125 tests.append(PyTest)
126 support.run_unittest(*tests)
Jack Jansen518d2612002-04-14 20:17:18 +0000127
128if __name__ == '__main__':
129 test_main()