blob: 1f7352aa818f0261f5351ec858c2ade69d068d32 [file] [log] [blame]
Jack Jansen518d2612002-04-14 20:17:18 +00001# Tests universal newline support for both reading and parsing files.
Antoine Pitrou19690592009-06-12 20:14:08 +00002
3from __future__ import print_function
4from __future__ import unicode_literals
5
6import io
7import _pyio as pyio
Jack Jansen518d2612002-04-14 20:17:18 +00008import unittest
Jack Jansen518d2612002-04-14 20:17:18 +00009import os
10import sys
Antoine Pitrou19690592009-06-12 20:14:08 +000011from test import test_support as support
Jack Jansen518d2612002-04-14 20:17:18 +000012
Jack Jansen518d2612002-04-14 20:17:18 +000013if not hasattr(sys.stdin, 'newlines'):
Antoine Pitrou19690592009-06-12 20:14:08 +000014 raise unittest.SkipTest(
15 "This Python does not have universal newline support")
Jack Jansen518d2612002-04-14 20:17:18 +000016
Tim Petersea572b22002-04-21 06:12:02 +000017FATX = 'x' * (2**14)
18
19DATA_TEMPLATE = [
20 "line1=1",
Antoine Pitrou19690592009-06-12 20:14:08 +000021 "line2='this is a very long line designed to go past any default " +
22 "buffer limits that exist in io.py but we also want to test " +
Tim Petersea572b22002-04-21 06:12:02 +000023 "the uncommon case, naturally.'",
24 "def line3():pass",
25 "line4 = '%s'" % FATX,
26 ]
27
28DATA_LF = "\n".join(DATA_TEMPLATE) + "\n"
29DATA_CR = "\r".join(DATA_TEMPLATE) + "\r"
30DATA_CRLF = "\r\n".join(DATA_TEMPLATE) + "\r\n"
31
32# Note that DATA_MIXED also tests the ability to recognize a lone \r
33# before end-of-file.
34DATA_MIXED = "\n".join(DATA_TEMPLATE) + "\r"
35DATA_SPLIT = [x + "\n" for x in DATA_TEMPLATE]
Tim Petersea572b22002-04-21 06:12:02 +000036
Jack Jansen518d2612002-04-14 20:17:18 +000037class TestGenericUnivNewlines(unittest.TestCase):
38 # use a class variable DATA to define the data to write to the file
39 # and a class variable NEWLINE to set the expected newlines value
Antoine Pitrou19690592009-06-12 20:14:08 +000040 READMODE = 'r'
Jack Jansen518d2612002-04-14 20:17:18 +000041 WRITEMODE = 'wb'
42
43 def setUp(self):
Antoine Pitrou19690592009-06-12 20:14:08 +000044 data = self.DATA
45 if "b" in self.WRITEMODE:
46 data = data.encode("ascii")
47 with self.open(support.TESTFN, self.WRITEMODE) as fp:
48 fp.write(data)
Jack Jansen518d2612002-04-14 20:17:18 +000049
50 def tearDown(self):
51 try:
Antoine Pitrou19690592009-06-12 20:14:08 +000052 os.unlink(support.TESTFN)
Jack Jansen518d2612002-04-14 20:17:18 +000053 except:
54 pass
Tim Peters863ac442002-04-16 01:38:40 +000055
Jack Jansen518d2612002-04-14 20:17:18 +000056 def test_read(self):
Antoine Pitrou19690592009-06-12 20:14:08 +000057 with self.open(support.TESTFN, self.READMODE) as fp:
Philip Jenvey6a111022009-05-28 05:58:44 +000058 data = fp.read()
Jack Jansen518d2612002-04-14 20:17:18 +000059 self.assertEqual(data, DATA_LF)
Antoine Pitrou19690592009-06-12 20:14:08 +000060 self.assertEqual(set(fp.newlines), set(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000061
Jack Jansen518d2612002-04-14 20:17:18 +000062 def test_readlines(self):
Antoine Pitrou19690592009-06-12 20:14:08 +000063 with self.open(support.TESTFN, self.READMODE) as fp:
Philip Jenvey6a111022009-05-28 05:58:44 +000064 data = fp.readlines()
Jack Jansen518d2612002-04-14 20:17:18 +000065 self.assertEqual(data, DATA_SPLIT)
Antoine Pitrou19690592009-06-12 20:14:08 +000066 self.assertEqual(set(fp.newlines), set(self.NEWLINE))
Jack Jansen518d2612002-04-14 20:17:18 +000067
68 def test_readline(self):
Antoine Pitrou19690592009-06-12 20:14:08 +000069 with self.open(support.TESTFN, self.READMODE) as fp:
Philip Jenvey6a111022009-05-28 05:58:44 +000070 data = []
Jack Jansen518d2612002-04-14 20:17:18 +000071 d = fp.readline()
Philip Jenvey6a111022009-05-28 05:58:44 +000072 while d:
73 data.append(d)
74 d = fp.readline()
Jack Jansen518d2612002-04-14 20:17:18 +000075 self.assertEqual(data, DATA_SPLIT)
Antoine Pitrou19690592009-06-12 20:14:08 +000076 self.assertEqual(set(fp.newlines), set(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000077
Jack Jansen518d2612002-04-14 20:17:18 +000078 def test_seek(self):
Antoine Pitrou19690592009-06-12 20:14:08 +000079 with self.open(support.TESTFN, self.READMODE) as fp:
Philip Jenvey6a111022009-05-28 05:58:44 +000080 fp.readline()
81 pos = fp.tell()
82 data = fp.readlines()
83 self.assertEqual(data, DATA_SPLIT[1:])
84 fp.seek(pos)
85 data = fp.readlines()
Jack Jansen518d2612002-04-14 20:17:18 +000086 self.assertEqual(data, DATA_SPLIT[1:])
Tim Peters863ac442002-04-16 01:38:40 +000087
Tim Peters863ac442002-04-16 01:38:40 +000088
Jack Jansen518d2612002-04-14 20:17:18 +000089class TestCRNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000090 NEWLINE = '\r'
91 DATA = DATA_CR
Tim Peters863ac442002-04-16 01:38:40 +000092
Jack Jansen518d2612002-04-14 20:17:18 +000093class TestLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000094 NEWLINE = '\n'
95 DATA = DATA_LF
Tim Peters863ac442002-04-16 01:38:40 +000096
Jack Jansen518d2612002-04-14 20:17:18 +000097class TestCRLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000098 NEWLINE = '\r\n'
99 DATA = DATA_CRLF
Tim Peters863ac442002-04-16 01:38:40 +0000100
Guido van Rossumad8fb0d2007-09-22 20:18:03 +0000101 def test_tell(self):
Antoine Pitrou19690592009-06-12 20:14:08 +0000102 with self.open(support.TESTFN, self.READMODE) as fp:
Philip Jenvey6a111022009-05-28 05:58:44 +0000103 self.assertEqual(repr(fp.newlines), repr(None))
104 data = fp.readline()
105 pos = fp.tell()
Guido van Rossumad8fb0d2007-09-22 20:18:03 +0000106 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
107
Jack Jansen518d2612002-04-14 20:17:18 +0000108class TestMixedNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +0000109 NEWLINE = ('\r', '\n')
110 DATA = DATA_MIXED
Tim Peters863ac442002-04-16 01:38:40 +0000111
Jack Jansen518d2612002-04-14 20:17:18 +0000112
113def test_main():
Antoine Pitrou19690592009-06-12 20:14:08 +0000114 base_tests = (TestCRNewlines,
115 TestLFNewlines,
116 TestCRLFNewlines,
117 TestMixedNewlines)
118 tests = []
119 # Test the C and Python implementations.
120 for test in base_tests:
121 class CTest(test):
122 open = io.open
123 CTest.__name__ = str("C" + test.__name__)
124 class PyTest(test):
125 open = staticmethod(pyio.open)
126 PyTest.__name__ = str("Py" + test.__name__)
127 tests.append(CTest)
128 tests.append(PyTest)
129 support.run_unittest(*tests)
Jack Jansen518d2612002-04-14 20:17:18 +0000130
131if __name__ == '__main__':
132 test_main()