# Tests universal newline support for both reading and parsing files.
import os
import sys
import unittest

from test import test_support
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 6 | |
# Skip the whole module when file objects expose no ``newlines``
# attribute, i.e. the interpreter lacks universal newline support.
if not hasattr(sys.stdin, 'newlines'):
    # The call form of ``raise`` parses on both Python 2 and Python 3;
    # the older ``raise Class, "message"`` spelling is Python 2 only.
    raise unittest.SkipTest(
        "This Python does not have universal newline support")
| 10 | |
# Payload for line4: a single run of 2**14 characters.
FATX = 'x' * (2**14)

# Logical lines of a small Python program, without line terminators.
# The tests both read the file back and execute it, so every entry has
# to be valid Python source.
DATA_TEMPLATE = [
    "line1=1",
    ("line2='this is a very long line designed to go past the magic "
     "hundred character limit that is inside fileobject.c and which "
     "is meant to speed up the common case, but we also want to test "
     "the uncommon case, naturally.'"),
    "def line3():pass",
    "line4 = '%s'" % FATX,
]

# The same program, terminated with each newline convention in turn.
DATA_LF = "\n".join(DATA_TEMPLATE) + "\n"
DATA_CR = "\r".join(DATA_TEMPLATE) + "\r"
DATA_CRLF = "\r\n".join(DATA_TEMPLATE) + "\r\n"

# Note that DATA_MIXED also tests the ability to recognize a lone \r
# before end-of-file.
DATA_MIXED = "\n".join(DATA_TEMPLATE) + "\r"

# The template lines, each terminated with "\n".
# A generator expression is used instead of a list comprehension so the
# loop variable never reaches the module namespace on any Python
# version; the former ``del x`` cleanup only worked where list
# comprehensions leak their variable (Python 2) and raises NameError
# elsewhere.
DATA_SPLIT = list(line + "\n" for line in DATA_TEMPLATE)
| 32 | |
class TestGenericUnivNewlines(unittest.TestCase):
    # Shared test body for every newline flavour.  Subclasses provide:
    #   DATA     - the string written to the scratch file in setUp()
    #   NEWLINE  - the value fp.newlines must report after reading
    # and may override READMODE / WRITEMODE.  This base class defines
    # neither DATA nor NEWLINE, so it is not meant to be run by itself.
    #
    # The tests are described with comments rather than docstrings so
    # that unittest keeps reporting them by method name.
    READMODE = 'U'
    WRITEMODE = 'wb'

    def setUp(self):
        # Create the scratch file holding this flavour's data.
        with open(test_support.TESTFN, self.WRITEMODE) as fp:
            fp.write(self.DATA)

    def tearDown(self):
        # Best-effort removal of the scratch file.  Only OS-level
        # failures (e.g. the file is already gone) are ignored; a bare
        # ``except`` would also hide KeyboardInterrupt and SystemExit.
        try:
            os.unlink(test_support.TESTFN)
        except OSError:
            pass

    def test_read(self):
        # read() must return the data with every terminator seen as "\n".
        with open(test_support.TESTFN, self.READMODE) as fp:
            data = fp.read()
        self.assertEqual(data, DATA_LF)
        # repr() is compared so the assertion works for None, strings
        # and tuples alike.
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_readlines(self):
        # readlines() must split into "\n"-terminated lines.
        with open(test_support.TESTFN, self.READMODE) as fp:
            data = fp.readlines()
        self.assertEqual(data, DATA_SPLIT)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_readline(self):
        # Repeated readline() calls must yield the same lines; an empty
        # string marks end-of-file.
        with open(test_support.TESTFN, self.READMODE) as fp:
            data = []
            line = fp.readline()
            while line:
                data.append(line)
                line = fp.readline()
        self.assertEqual(data, DATA_SPLIT)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_seek(self):
        # A position taken with tell() after the first line must bring
        # seek() back to the start of the second line.
        with open(test_support.TESTFN, self.READMODE) as fp:
            fp.readline()
            pos = fp.tell()
            data = fp.readlines()
            self.assertEqual(data, DATA_SPLIT[1:])
            fp.seek(pos)
            data = fp.readlines()
        self.assertEqual(data, DATA_SPLIT[1:])

    def test_execfile(self):
        # Executing the file must work whatever its line endings are,
        # and line numbers must count logical lines.
        namespace = {}
        execfile(test_support.TESTFN, namespace)
        func = namespace['line3']
        # ``def line3()`` is the third entry of DATA_TEMPLATE.
        self.assertEqual(func.func_code.co_firstlineno, 3)
        self.assertEqual(namespace['line4'], FATX)
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 87 | |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 88 | |
class TestNativeNewlines(TestGenericUnivNewlines):
    # LF data written with mode 'w' and read back with mode 'r' instead
    # of the 'wb' / 'U' defaults; fp.newlines is expected to stay None.
    WRITEMODE = 'w'
    READMODE = 'r'
    DATA = DATA_LF
    NEWLINE = None
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 94 | |
class TestCRNewlines(TestGenericUnivNewlines):
    # Every line of the file ends in a lone "\r".
    DATA = DATA_CR
    NEWLINE = '\r'
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 98 | |
class TestLFNewlines(TestGenericUnivNewlines):
    # Every line of the file ends in "\n".
    DATA = DATA_LF
    NEWLINE = '\n'
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 102 | |
class TestCRLFNewlines(TestGenericUnivNewlines):
    # Every line of the file ends in the two-character "\r\n" sequence.
    NEWLINE = '\r\n'
    DATA = DATA_CRLF

    def test_tell(self):
        # fp.newlines must report "\r\n" once one line has been read and
        # tell() has been called.
        with open(test_support.TESTFN, self.READMODE) as fp:
            # Nothing has been read yet, so no newline style is recorded.
            self.assertEqual(repr(fp.newlines), repr(None))
            # The returned line and position are not inspected, so they
            # are not bound to names.
            # NOTE(review): the tell() call itself appears to be what is
            # under test here -- confirm before removing it.
            fp.readline()
            fp.tell()
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
| 113 | |
class TestMixedNewlines(TestGenericUnivNewlines):
    # "\n" between lines and a lone "\r" before end-of-file, so both
    # styles are expected in fp.newlines.
    DATA = DATA_MIXED
    NEWLINE = ('\r', '\n')
Tim Peters | 863ac44 | 2002-04-16 01:38:40 +0000 | [diff] [blame] | 117 | |
Jack Jansen | 518d261 | 2002-04-14 20:17:18 +0000 | [diff] [blame] | 118 | |
def test_main():
    """Run every concrete newline test case through test_support."""
    # Only the subclasses are listed; the generic base class carries no
    # DATA/NEWLINE of its own.
    cases = (
        TestNativeNewlines,
        TestCRNewlines,
        TestLFNewlines,
        TestCRLFNewlines,
        TestMixedNewlines,
    )
    test_support.run_unittest(*cases)


# Allow running this file directly as a script.
if __name__ == '__main__':
    test_main()