| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 1 | # Tests universal newline support for both reading and parsing files. | 
| Benjamin Peterson | 4fa88fa | 2009-03-04 00:14:51 +0000 | [diff] [blame] | 2 | import io | 
 | 3 | import _pyio as pyio | 
| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 4 | import unittest | 
| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 5 | import os | 
 | 6 | import sys | 
| Benjamin Peterson | ee8712c | 2008-05-20 21:35:26 +0000 | [diff] [blame] | 7 | from test import support | 
| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 8 |  | 
# Skip the whole module when text streams do not expose a ``newlines``
# attribute; every test below relies on it.
try:
    sys.stdin.newlines
except AttributeError:
    raise unittest.SkipTest(
        "This Python does not have universal newline support")
| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 12 |  | 
# A run of 2**14 'x' characters, spliced into the last template line.
FATX = 'x' * (1 << 14)

# The logical lines of the test file, without any line terminator.
DATA_TEMPLATE = [
    "line1=1",
    ("line2='this is a very long line designed to go past any default "
     "buffer limits that exist in io.py but we also want to test "
     "the uncommon case, naturally.'"),
    "def line3():pass",
    "line4 = '{}'".format(FATX),
]

# The template with every line terminated by a single newline convention.
DATA_LF = "".join(line + "\n" for line in DATA_TEMPLATE)
DATA_CR = "".join(line + "\r" for line in DATA_TEMPLATE)
DATA_CRLF = "".join(line + "\r\n" for line in DATA_TEMPLATE)

# Note that DATA_MIXED also tests the ability to recognize a lone \r
# before end-of-file: it is DATA_LF with the final \n swapped for \r.
DATA_MIXED = DATA_LF[:-1] + "\r"

# The per-line list the tests compare readlines()/readline() output against:
# every template line ending in "\n".
DATA_SPLIT = DATA_LF.splitlines(True)
| Tim Peters | ea572b2 | 2002-04-21 06:12:02 +0000 | [diff] [blame] | 32 |  | 
class TestGenericUnivNewlines(unittest.TestCase):
    """Shared newline-translation tests, parameterised by class attributes.

    Concrete subclasses must provide:

    * ``DATA``    -- the text written to the test file in setUp().
    * ``NEWLINE`` -- the value ``fp.newlines`` is expected to report after
      the file has been read.
    * ``open``    -- the callable used to open the file (test_main() injects
      ``io.open`` or ``_pyio.open``).
    """
    # use a class variable DATA to define the data to write to the file
    # and a class variable NEWLINE to set the expected newlines value
    READMODE = 'r'
    WRITEMODE = 'wb'

    def setUp(self):
        # Create the test file holding self.DATA.
        data = self.DATA
        if "b" in self.WRITEMODE:
            # A binary write mode needs bytes, so encode the text first.
            data = data.encode("ascii")
        with self.open(support.TESTFN, self.WRITEMODE) as fp:
            fp.write(data)

    def tearDown(self):
        # Best-effort cleanup: a missing or undeletable file must not fail
        # the test, but unrelated exceptions (KeyboardInterrupt, programming
        # errors) are no longer swallowed.
        try:
            os.unlink(support.TESTFN)
        except OSError:
            pass

    def test_read(self):
        # read() must return the content with LF-only line endings.
        with self.open(support.TESTFN, self.READMODE) as fp:
            data = fp.read()
        self.assertEqual(data, DATA_LF)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_readlines(self):
        # readlines() must return one "\n"-terminated string per line.
        with self.open(support.TESTFN, self.READMODE) as fp:
            data = fp.readlines()
        self.assertEqual(data, DATA_SPLIT)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_readline(self):
        # Repeated readline() calls must yield the same lines as
        # readlines(); an empty string marks end-of-file.
        with self.open(support.TESTFN, self.READMODE) as fp:
            data = list(iter(fp.readline, ''))
        self.assertEqual(data, DATA_SPLIT)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_seek(self):
        # A position obtained from tell() after the first line must bring
        # seek() back to exactly the start of the second line.
        with self.open(support.TESTFN, self.READMODE) as fp:
            fp.readline()
            pos = fp.tell()
            data = fp.readlines()
            self.assertEqual(data, DATA_SPLIT[1:])
            fp.seek(pos)
            data = fp.readlines()
        self.assertEqual(data, DATA_SPLIT[1:])
| Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 83 |  | 
| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 84 |  | 
class TestCRNewlines(TestGenericUnivNewlines):
    # Every line of the file ends with a lone carriage return.
    DATA = DATA_CR
    NEWLINE = '\r'
| Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 88 |  | 
class TestLFNewlines(TestGenericUnivNewlines):
    # Every line of the file ends with a line feed.
    DATA = DATA_LF
    NEWLINE = '\n'
| Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 92 |  | 
class TestCRLFNewlines(TestGenericUnivNewlines):
    # Every line of the file ends with a carriage return + line feed pair.
    NEWLINE = '\r\n'
    DATA = DATA_CRLF

    def test_tell(self):
        # Before anything is read no newline kind has been seen; after one
        # readline() followed by tell() the stream must report '\r\n'.
        with self.open(support.TESTFN, self.READMODE) as fp:
            self.assertEqual(repr(fp.newlines), repr(None))
            # Both calls are made only for their effect on the stream; their
            # return values are not needed.
            # NOTE(review): presumably tell() is exercised here because it
            # must not disturb the recorded newline state -- confirm.
            fp.readline()
            fp.tell()
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
 | 103 |  | 
class TestMixedNewlines(TestGenericUnivNewlines):
    # The file mixes terminators, so both kinds are expected in newlines.
    DATA = DATA_MIXED
    NEWLINE = ('\r', '\n')
| Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 107 |  | 
| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 108 |  | 
 | 109 | def test_main(): | 
| Benjamin Peterson | 4fa88fa | 2009-03-04 00:14:51 +0000 | [diff] [blame] | 110 |     base_tests = (TestCRNewlines, | 
 | 111 |                   TestLFNewlines, | 
 | 112 |                   TestCRLFNewlines, | 
 | 113 |                   TestMixedNewlines) | 
 | 114 |     tests = [] | 
 | 115 |     # Test the C and Python implementations. | 
 | 116 |     for test in base_tests: | 
 | 117 |         class CTest(test): | 
 | 118 |             open = io.open | 
 | 119 |         CTest.__name__ = "C" + test.__name__ | 
 | 120 |         class PyTest(test): | 
 | 121 |             open = staticmethod(pyio.open) | 
 | 122 |         PyTest.__name__ = "Py" + test.__name__ | 
 | 123 |         tests.append(CTest) | 
 | 124 |         tests.append(PyTest) | 
 | 125 |     support.run_unittest(*tests) | 
| Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 126 |  | 
 | 127 | if __name__ == '__main__': | 
 | 128 |     test_main() |