Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 1 | # Tests universal newline support for both reading and parsing files. |
Benjamin Peterson | 4fa88fa | 2009-03-04 00:14:51 +0000 | [diff] [blame] | 2 | import io |
| 3 | import _pyio as pyio |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 4 | import unittest |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 5 | import os |
| 6 | import sys |
Benjamin Peterson | ee8712c | 2008-05-20 21:35:26 +0000 | [diff] [blame] | 7 | from test import support |
Hai Shi | 883bc63 | 2020-07-06 17:12:49 +0800 | [diff] [blame^] | 8 | from test.support import os_helper |
| 9 | |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 10 | |
# Every test below inspects the ``newlines`` attribute of a text stream, so
# skip the whole module when the interpreter's stdin does not expose one.
if not hasattr(sys.stdin, 'newlines'):
    raise unittest.SkipTest("This Python does not have universal newline support")
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 14 | |
# Filler for one very long line (2**14 characters).
FATX = 'x' * 16384

# The logical lines of the test file, without any line terminators.
DATA_TEMPLATE = [
    "line1=1",
    (
        "line2='this is a very long line designed to go past any default "
        "buffer limits that exist in io.py but we also want to test "
        "the uncommon case, naturally.'"
    ),
    "def line3():pass",
    f"line4 = '{FATX}'",
]

# The same lines with every line (including the last) terminated by one
# particular newline convention.
DATA_LF = "".join(line + "\n" for line in DATA_TEMPLATE)
DATA_CR = "".join(line + "\r" for line in DATA_TEMPLATE)
DATA_CRLF = "".join(line + "\r\n" for line in DATA_TEMPLATE)

# Note that DATA_MIXED also tests the ability to recognize a lone \r
# before end-of-file.
DATA_MIXED = "\n".join(DATA_TEMPLATE) + "\r"

# The lines as they are expected back from readline()/readlines(): each one
# terminated by a single "\n".
DATA_SPLIT = [f"{line}\n" for line in DATA_TEMPLATE]
Tim Peters | ea572b2 | 2002-04-21 06:12:02 +0000 | [diff] [blame] | 34 | |
class CTest:
    """Mixin that makes ``self.open`` resolve to ``io.open``."""

    # Wrapped in staticmethod so the callable is never bound to the instance
    # when it is looked up as ``self.open``.
    open = staticmethod(io.open)
| 37 | |
class PyTest:
    """Mixin that makes ``self.open`` resolve to ``_pyio.open``."""

    # staticmethod keeps the plain Python function from being turned into a
    # bound method when it is looked up as ``self.open``.
    open = staticmethod(pyio.open)
| 40 | |
| 41 | class TestGenericUnivNewlines: |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 42 | # use a class variable DATA to define the data to write to the file |
| 43 | # and a class variable NEWLINE to set the expected newlines value |
Guido van Rossum | 8358db2 | 2007-08-18 21:39:55 +0000 | [diff] [blame] | 44 | READMODE = 'r' |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 45 | WRITEMODE = 'wb' |
| 46 | |
| 47 | def setUp(self): |
Guido van Rossum | 9c62772 | 2007-08-27 18:31:48 +0000 | [diff] [blame] | 48 | data = self.DATA |
| 49 | if "b" in self.WRITEMODE: |
| 50 | data = data.encode("ascii") |
Hai Shi | 883bc63 | 2020-07-06 17:12:49 +0800 | [diff] [blame^] | 51 | with self.open(os_helper.TESTFN, self.WRITEMODE) as fp: |
Philip Jenvey | a27c5bd | 2009-05-28 06:09:08 +0000 | [diff] [blame] | 52 | fp.write(data) |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 53 | |
| 54 | def tearDown(self): |
| 55 | try: |
Hai Shi | 883bc63 | 2020-07-06 17:12:49 +0800 | [diff] [blame^] | 56 | os.unlink(os_helper.TESTFN) |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 57 | except: |
| 58 | pass |
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 59 | |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 60 | def test_read(self): |
Hai Shi | 883bc63 | 2020-07-06 17:12:49 +0800 | [diff] [blame^] | 61 | with self.open(os_helper.TESTFN, self.READMODE) as fp: |
Philip Jenvey | a27c5bd | 2009-05-28 06:09:08 +0000 | [diff] [blame] | 62 | data = fp.read() |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 63 | self.assertEqual(data, DATA_LF) |
Walter Dörwald | 70a6b49 | 2004-02-12 17:35:32 +0000 | [diff] [blame] | 64 | self.assertEqual(repr(fp.newlines), repr(self.NEWLINE)) |
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 65 | |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 66 | def test_readlines(self): |
Hai Shi | 883bc63 | 2020-07-06 17:12:49 +0800 | [diff] [blame^] | 67 | with self.open(os_helper.TESTFN, self.READMODE) as fp: |
Philip Jenvey | a27c5bd | 2009-05-28 06:09:08 +0000 | [diff] [blame] | 68 | data = fp.readlines() |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 69 | self.assertEqual(data, DATA_SPLIT) |
Walter Dörwald | 70a6b49 | 2004-02-12 17:35:32 +0000 | [diff] [blame] | 70 | self.assertEqual(repr(fp.newlines), repr(self.NEWLINE)) |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 71 | |
| 72 | def test_readline(self): |
Hai Shi | 883bc63 | 2020-07-06 17:12:49 +0800 | [diff] [blame^] | 73 | with self.open(os_helper.TESTFN, self.READMODE) as fp: |
Philip Jenvey | a27c5bd | 2009-05-28 06:09:08 +0000 | [diff] [blame] | 74 | data = [] |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 75 | d = fp.readline() |
Philip Jenvey | a27c5bd | 2009-05-28 06:09:08 +0000 | [diff] [blame] | 76 | while d: |
| 77 | data.append(d) |
| 78 | d = fp.readline() |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 79 | self.assertEqual(data, DATA_SPLIT) |
Walter Dörwald | 70a6b49 | 2004-02-12 17:35:32 +0000 | [diff] [blame] | 80 | self.assertEqual(repr(fp.newlines), repr(self.NEWLINE)) |
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 81 | |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 82 | def test_seek(self): |
Hai Shi | 883bc63 | 2020-07-06 17:12:49 +0800 | [diff] [blame^] | 83 | with self.open(os_helper.TESTFN, self.READMODE) as fp: |
Philip Jenvey | a27c5bd | 2009-05-28 06:09:08 +0000 | [diff] [blame] | 84 | fp.readline() |
| 85 | pos = fp.tell() |
| 86 | data = fp.readlines() |
| 87 | self.assertEqual(data, DATA_SPLIT[1:]) |
| 88 | fp.seek(pos) |
| 89 | data = fp.readlines() |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 90 | self.assertEqual(data, DATA_SPLIT[1:]) |
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 91 | |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 92 | |
class TestCRNewlines(TestGenericUnivNewlines):
    # Scratch file uses a lone CR after every line.
    DATA = DATA_CR
    NEWLINE = '\r'
class CTestCRNewlines(CTest, TestCRNewlines, unittest.TestCase):
    """Run the ``TestCRNewlines`` tests with the ``open`` from ``CTest``."""
class PyTestCRNewlines(PyTest, TestCRNewlines, unittest.TestCase):
    """Run the ``TestCRNewlines`` tests with the ``open`` from ``PyTest``."""
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 98 | |
class TestLFNewlines(TestGenericUnivNewlines):
    # Scratch file uses a lone LF after every line.
    DATA = DATA_LF
    NEWLINE = '\n'
class CTestLFNewlines(CTest, TestLFNewlines, unittest.TestCase):
    """Run the ``TestLFNewlines`` tests with the ``open`` from ``CTest``."""
class PyTestLFNewlines(PyTest, TestLFNewlines, unittest.TestCase):
    """Run the ``TestLFNewlines`` tests with the ``open`` from ``PyTest``."""
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 104 | |
class TestCRLFNewlines(TestGenericUnivNewlines):
    # Scratch file uses CR LF after every line.
    DATA = DATA_CRLF
    NEWLINE = '\r\n'

    def test_tell(self):
        # newlines is None before anything has been read, and holds the
        # expected value after a readline() followed by a tell().
        with self.open(os_helper.TESTFN, self.READMODE) as stream:
            newlines_before_read = repr(stream.newlines)
            self.assertEqual(newlines_before_read, repr(None))
            # Both calls are made for their effect on the stream only;
            # their return values are not needed.
            stream.readline()
            stream.tell()
        self.assertEqual(repr(stream.newlines), repr(self.NEWLINE))
class CTestCRLFNewlines(CTest, TestCRLFNewlines, unittest.TestCase):
    """Run the ``TestCRLFNewlines`` tests with the ``open`` from ``CTest``."""
class PyTestCRLFNewlines(PyTest, TestCRLFNewlines, unittest.TestCase):
    """Run the ``TestCRLFNewlines`` tests with the ``open`` from ``PyTest``."""
Guido van Rossum | 8ce8a78 | 2007-11-01 19:42:39 +0000 | [diff] [blame] | 117 | |
class TestMixedNewlines(TestGenericUnivNewlines):
    # Scratch file separates lines with LF but ends with a lone CR, so both
    # kinds of terminator are expected to be reported.
    DATA = DATA_MIXED
    NEWLINE = ('\r', '\n')
class CTestMixedNewlines(CTest, TestMixedNewlines, unittest.TestCase):
    """Run the ``TestMixedNewlines`` tests with the ``open`` from ``CTest``."""
class PyTestMixedNewlines(PyTest, TestMixedNewlines, unittest.TestCase):
    """Run the ``TestMixedNewlines`` tests with the ``open`` from ``PyTest``."""
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 123 | |
# Allow the file to be executed directly as a script.
if __name__ == "__main__":
    unittest.main()