blob: b905491878001c0634c9b7c1bbf778d049d9cd37 [file] [log] [blame]
Jack Jansen518d2612002-04-14 20:17:18 +00001# Tests universal newline support for both reading and parsing files.
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +00002import io
3import _pyio as pyio
Jack Jansen518d2612002-04-14 20:17:18 +00004import unittest
Jack Jansen518d2612002-04-14 20:17:18 +00005import os
6import sys
Benjamin Petersonee8712c2008-05-20 21:35:26 +00007from test import support
Hai Shi883bc632020-07-06 17:12:49 +08008from test.support import os_helper
9
Jack Jansen518d2612002-04-14 20:17:18 +000010
Jack Jansen518d2612002-04-14 20:17:18 +000011if not hasattr(sys.stdin, 'newlines'):
Benjamin Petersone549ead2009-03-28 21:42:05 +000012 raise unittest.SkipTest(
13 "This Python does not have universal newline support")
Jack Jansen518d2612002-04-14 20:17:18 +000014
Tim Petersea572b22002-04-21 06:12:02 +000015FATX = 'x' * (2**14)
16
17DATA_TEMPLATE = [
18 "line1=1",
Guido van Rossum8358db22007-08-18 21:39:55 +000019 "line2='this is a very long line designed to go past any default " +
20 "buffer limits that exist in io.py but we also want to test " +
Tim Petersea572b22002-04-21 06:12:02 +000021 "the uncommon case, naturally.'",
22 "def line3():pass",
23 "line4 = '%s'" % FATX,
24 ]
25
26DATA_LF = "\n".join(DATA_TEMPLATE) + "\n"
27DATA_CR = "\r".join(DATA_TEMPLATE) + "\r"
28DATA_CRLF = "\r\n".join(DATA_TEMPLATE) + "\r\n"
29
30# Note that DATA_MIXED also tests the ability to recognize a lone \r
31# before end-of-file.
32DATA_MIXED = "\n".join(DATA_TEMPLATE) + "\r"
33DATA_SPLIT = [x + "\n" for x in DATA_TEMPLATE]
Tim Petersea572b22002-04-21 06:12:02 +000034
Ezio Melotti28b0d9d2013-06-09 00:07:06 +030035class CTest:
36 open = io.open
37
38class PyTest:
39 open = staticmethod(pyio.open)
40
41class TestGenericUnivNewlines:
Jack Jansen518d2612002-04-14 20:17:18 +000042 # use a class variable DATA to define the data to write to the file
43 # and a class variable NEWLINE to set the expected newlines value
Guido van Rossum8358db22007-08-18 21:39:55 +000044 READMODE = 'r'
Jack Jansen518d2612002-04-14 20:17:18 +000045 WRITEMODE = 'wb'
46
47 def setUp(self):
Guido van Rossum9c627722007-08-27 18:31:48 +000048 data = self.DATA
49 if "b" in self.WRITEMODE:
50 data = data.encode("ascii")
Hai Shi883bc632020-07-06 17:12:49 +080051 with self.open(os_helper.TESTFN, self.WRITEMODE) as fp:
Philip Jenveya27c5bd2009-05-28 06:09:08 +000052 fp.write(data)
Jack Jansen518d2612002-04-14 20:17:18 +000053
54 def tearDown(self):
55 try:
Hai Shi883bc632020-07-06 17:12:49 +080056 os.unlink(os_helper.TESTFN)
Jack Jansen518d2612002-04-14 20:17:18 +000057 except:
58 pass
Tim Peters863ac442002-04-16 01:38:40 +000059
Jack Jansen518d2612002-04-14 20:17:18 +000060 def test_read(self):
Hai Shi883bc632020-07-06 17:12:49 +080061 with self.open(os_helper.TESTFN, self.READMODE) as fp:
Philip Jenveya27c5bd2009-05-28 06:09:08 +000062 data = fp.read()
Jack Jansen518d2612002-04-14 20:17:18 +000063 self.assertEqual(data, DATA_LF)
Walter Dörwald70a6b492004-02-12 17:35:32 +000064 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000065
Jack Jansen518d2612002-04-14 20:17:18 +000066 def test_readlines(self):
Hai Shi883bc632020-07-06 17:12:49 +080067 with self.open(os_helper.TESTFN, self.READMODE) as fp:
Philip Jenveya27c5bd2009-05-28 06:09:08 +000068 data = fp.readlines()
Jack Jansen518d2612002-04-14 20:17:18 +000069 self.assertEqual(data, DATA_SPLIT)
Walter Dörwald70a6b492004-02-12 17:35:32 +000070 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Jack Jansen518d2612002-04-14 20:17:18 +000071
72 def test_readline(self):
Hai Shi883bc632020-07-06 17:12:49 +080073 with self.open(os_helper.TESTFN, self.READMODE) as fp:
Philip Jenveya27c5bd2009-05-28 06:09:08 +000074 data = []
Jack Jansen518d2612002-04-14 20:17:18 +000075 d = fp.readline()
Philip Jenveya27c5bd2009-05-28 06:09:08 +000076 while d:
77 data.append(d)
78 d = fp.readline()
Jack Jansen518d2612002-04-14 20:17:18 +000079 self.assertEqual(data, DATA_SPLIT)
Walter Dörwald70a6b492004-02-12 17:35:32 +000080 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000081
Jack Jansen518d2612002-04-14 20:17:18 +000082 def test_seek(self):
Hai Shi883bc632020-07-06 17:12:49 +080083 with self.open(os_helper.TESTFN, self.READMODE) as fp:
Philip Jenveya27c5bd2009-05-28 06:09:08 +000084 fp.readline()
85 pos = fp.tell()
86 data = fp.readlines()
87 self.assertEqual(data, DATA_SPLIT[1:])
88 fp.seek(pos)
89 data = fp.readlines()
Jack Jansen518d2612002-04-14 20:17:18 +000090 self.assertEqual(data, DATA_SPLIT[1:])
Tim Peters863ac442002-04-16 01:38:40 +000091
Jack Jansen518d2612002-04-14 20:17:18 +000092
Jack Jansen518d2612002-04-14 20:17:18 +000093class TestCRNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000094 NEWLINE = '\r'
95 DATA = DATA_CR
Ezio Melotti28b0d9d2013-06-09 00:07:06 +030096class CTestCRNewlines(CTest, TestCRNewlines, unittest.TestCase): pass
97class PyTestCRNewlines(PyTest, TestCRNewlines, unittest.TestCase): pass
Tim Peters863ac442002-04-16 01:38:40 +000098
Jack Jansen518d2612002-04-14 20:17:18 +000099class TestLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +0000100 NEWLINE = '\n'
101 DATA = DATA_LF
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300102class CTestLFNewlines(CTest, TestLFNewlines, unittest.TestCase): pass
103class PyTestLFNewlines(PyTest, TestLFNewlines, unittest.TestCase): pass
Tim Peters863ac442002-04-16 01:38:40 +0000104
Jack Jansen518d2612002-04-14 20:17:18 +0000105class TestCRLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +0000106 NEWLINE = '\r\n'
107 DATA = DATA_CRLF
Tim Peters863ac442002-04-16 01:38:40 +0000108
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000109 def test_tell(self):
Hai Shi883bc632020-07-06 17:12:49 +0800110 with self.open(os_helper.TESTFN, self.READMODE) as fp:
Philip Jenveya27c5bd2009-05-28 06:09:08 +0000111 self.assertEqual(repr(fp.newlines), repr(None))
112 data = fp.readline()
113 pos = fp.tell()
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000114 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300115class CTestCRLFNewlines(CTest, TestCRLFNewlines, unittest.TestCase): pass
116class PyTestCRLFNewlines(PyTest, TestCRLFNewlines, unittest.TestCase): pass
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000117
Jack Jansen518d2612002-04-14 20:17:18 +0000118class TestMixedNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +0000119 NEWLINE = ('\r', '\n')
120 DATA = DATA_MIXED
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300121class CTestMixedNewlines(CTest, TestMixedNewlines, unittest.TestCase): pass
122class PyTestMixedNewlines(PyTest, TestMixedNewlines, unittest.TestCase): pass
Jack Jansen518d2612002-04-14 20:17:18 +0000123
124if __name__ == '__main__':
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300125 unittest.main()