blob: 63c6fe8240fe839425c234beada55789b9b478bd [file] [log] [blame]
# Tests universal newline support for both reading and parsing files.
2import unittest
Jack Jansen518d2612002-04-14 20:17:18 +00003import os
4import sys
Barry Warsaw04f357c2002-07-23 19:04:11 +00005from test import test_support
Jack Jansen518d2612002-04-14 20:17:18 +00006
# Universal newline support is detected through the ``newlines`` attribute of
# the standard input file object; without it nothing below can be tested, so
# the whole module is skipped.
if not hasattr(sys.stdin, 'newlines'):
    # Call form of raise: same behaviour as ``raise Class, "message"`` but
    # not tied to the old statement-only syntax.
    raise unittest.SkipTest(
        "This Python does not have universal newline support")
10
# Payload for line4: 2**14 'x' characters, giving the file one line that is
# far longer than all the others.
FATX = 'x' * (2**14)

# The lines of a small Python program, without line terminators.  The test
# cases both read this text back and execute it, so every entry must remain
# valid Python source.
DATA_TEMPLATE = [
    "line1=1",
    ("line2='this is a very long line designed to go past the magic "
     "hundred character limit that is inside fileobject.c and which "
     "is meant to speed up the common case, but we also want to test "
     "the uncommon case, naturally.'"),
    "def line3():pass",
    "line4 = '%s'" % FATX,
]

# The same program rendered with each newline convention.
DATA_LF = "\n".join(DATA_TEMPLATE) + "\n"
DATA_CR = "\r".join(DATA_TEMPLATE) + "\r"
DATA_CRLF = "\r\n".join(DATA_TEMPLATE) + "\r\n"

# Note that DATA_MIXED also tests the ability to recognize a lone \r
# before end-of-file.
DATA_MIXED = "\n".join(DATA_TEMPLATE) + "\r"

# Expected result of reading any of the variants line by line: every line
# terminated by a single "\n".  A generator expression is used (rather than
# a list comprehension followed by ``del``) so that no loop variable is ever
# bound at module level, whichever comprehension scoping rules apply.
DATA_SPLIT = list(line + "\n" for line in DATA_TEMPLATE)
32
class TestGenericUnivNewlines(unittest.TestCase):
    """Read/parse checks shared by every newline convention.

    Concrete subclasses provide two class attributes:

    DATA    -- the text setUp() writes to the scratch file
    NEWLINE -- the value ``fp.newlines`` must report once the file is read

    READMODE and WRITEMODE may be overridden too.  By default the file is
    written in binary mode and read back in universal-newline mode ('U').
    """
    # use a class variable DATA to define the data to write to the file
    # and a class variable NEWLINE to set the expected newlines value
    READMODE = 'U'
    WRITEMODE = 'wb'

    def setUp(self):
        # Create the scratch file holding this test case's DATA.
        with open(test_support.TESTFN, self.WRITEMODE) as fp:
            fp.write(self.DATA)

    def tearDown(self):
        # Best-effort removal of the scratch file.  Only a failure of the
        # unlink itself is ignored; anything else (KeyboardInterrupt, a
        # programming error, ...) is allowed to propagate.
        try:
            os.unlink(test_support.TESTFN)
        except OSError:
            pass

    def test_read(self):
        # Reading the whole file at once must yield "\n"-terminated text.
        with open(test_support.TESTFN, self.READMODE) as fp:
            data = fp.read()
        self.assertEqual(data, DATA_LF)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_readlines(self):
        # readlines() must split on, and translate, every terminator.
        with open(test_support.TESTFN, self.READMODE) as fp:
            data = fp.readlines()
        self.assertEqual(data, DATA_SPLIT)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_readline(self):
        # Repeated readline() calls, up to the empty string returned at
        # end-of-file, must produce the same lines as readlines().
        with open(test_support.TESTFN, self.READMODE) as fp:
            data = list(iter(fp.readline, ''))
        self.assertEqual(data, DATA_SPLIT)
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))

    def test_seek(self):
        # A position obtained from tell() after the first line must be
        # usable with seek() to re-read the remaining lines.
        with open(test_support.TESTFN, self.READMODE) as fp:
            fp.readline()
            pos = fp.tell()
            data = fp.readlines()
            self.assertEqual(data, DATA_SPLIT[1:])
            fp.seek(pos)
            data = fp.readlines()
        self.assertEqual(data, DATA_SPLIT[1:])

    def test_execfile(self):
        # The file must also be executable as Python source, whatever its
        # newline convention, with line numbers counted correctly.
        namespace = {}
        execfile(test_support.TESTFN, namespace)
        func = namespace['line3']
        self.assertEqual(func.func_code.co_firstlineno, 3)
        self.assertEqual(namespace['line4'], FATX)
Tim Peters863ac442002-04-16 01:38:40 +000087
Jack Jansen518d2612002-04-14 20:17:18 +000088
class TestNativeNewlines(TestGenericUnivNewlines):
    """Generic checks using plain text modes instead of universal newlines.

    The file is written with mode 'w' and read back with mode 'r'; in that
    configuration ``fp.newlines`` is expected to remain None.
    """
    WRITEMODE = 'w'
    READMODE = 'r'
    DATA = DATA_LF
    NEWLINE = None
Tim Peters863ac442002-04-16 01:38:40 +000094
class TestCRNewlines(TestGenericUnivNewlines):
    """Generic checks against data terminated by carriage returns only."""
    DATA = DATA_CR
    NEWLINE = '\r'
Tim Peters863ac442002-04-16 01:38:40 +000098
class TestLFNewlines(TestGenericUnivNewlines):
    """Generic checks against data terminated by line feeds only."""
    DATA = DATA_LF
    NEWLINE = '\n'
Tim Peters863ac442002-04-16 01:38:40 +0000102
class TestCRLFNewlines(TestGenericUnivNewlines):
    """Generic checks against CR+LF terminated data, plus a tell() check."""
    NEWLINE = '\r\n'
    DATA = DATA_CRLF

    def test_tell(self):
        # fp.newlines must be None before anything is read, and must report
        # the CR+LF pair after one readline() followed by tell().
        with open(test_support.TESTFN, self.READMODE) as fp:
            self.assertEqual(repr(fp.newlines), repr(None))
            # Both calls are made for their effect on the file object; the
            # values they return are not part of the check.
            fp.readline()
            fp.tell()
        self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
113
class TestMixedNewlines(TestGenericUnivNewlines):
    """Generic checks against data mixing line feeds with a final lone CR.

    Both terminators appear in the file, so ``fp.newlines`` is expected to
    be a tuple naming each of them.
    """
    DATA = DATA_MIXED
    NEWLINE = ('\r', '\n')
Tim Peters863ac442002-04-16 01:38:40 +0000117
Jack Jansen518d2612002-04-14 20:17:18 +0000118
def test_main():
    """Run every concrete newline test case through test_support."""
    # The generic base class is deliberately absent: it defines neither
    # DATA nor NEWLINE and only makes sense through its subclasses.
    cases = (
        TestNativeNewlines,
        TestCRNewlines,
        TestLFNewlines,
        TestCRLFNewlines,
        TestMixedNewlines,
    )
    test_support.run_unittest(*cases)


if __name__ == '__main__':
    test_main()