blob: fd07539fb60fdeeb9d08b55dd0f7b0d0021a9bca [file] [log] [blame]
Jack Jansen518d2612002-04-14 20:17:18 +00001# Tests universal newline support for both reading and parsing files.
Benjamin Peterson4fa88fa2009-03-04 00:14:51 +00002import io
3import _pyio as pyio
Jack Jansen518d2612002-04-14 20:17:18 +00004import unittest
Jack Jansen518d2612002-04-14 20:17:18 +00005import os
6import sys
Benjamin Petersonee8712c2008-05-20 21:35:26 +00007from test import support
Jack Jansen518d2612002-04-14 20:17:18 +00008
Jack Jansen518d2612002-04-14 20:17:18 +00009if not hasattr(sys.stdin, 'newlines'):
Benjamin Petersone549ead2009-03-28 21:42:05 +000010 raise unittest.SkipTest(
11 "This Python does not have universal newline support")
Jack Jansen518d2612002-04-14 20:17:18 +000012
Tim Petersea572b22002-04-21 06:12:02 +000013FATX = 'x' * (2**14)
14
15DATA_TEMPLATE = [
16 "line1=1",
Guido van Rossum8358db22007-08-18 21:39:55 +000017 "line2='this is a very long line designed to go past any default " +
18 "buffer limits that exist in io.py but we also want to test " +
Tim Petersea572b22002-04-21 06:12:02 +000019 "the uncommon case, naturally.'",
20 "def line3():pass",
21 "line4 = '%s'" % FATX,
22 ]
23
24DATA_LF = "\n".join(DATA_TEMPLATE) + "\n"
25DATA_CR = "\r".join(DATA_TEMPLATE) + "\r"
26DATA_CRLF = "\r\n".join(DATA_TEMPLATE) + "\r\n"
27
28# Note that DATA_MIXED also tests the ability to recognize a lone \r
29# before end-of-file.
30DATA_MIXED = "\n".join(DATA_TEMPLATE) + "\r"
31DATA_SPLIT = [x + "\n" for x in DATA_TEMPLATE]
Tim Petersea572b22002-04-21 06:12:02 +000032
Ezio Melotti28b0d9d2013-06-09 00:07:06 +030033class CTest:
34 open = io.open
35
36class PyTest:
37 open = staticmethod(pyio.open)
38
39class TestGenericUnivNewlines:
Jack Jansen518d2612002-04-14 20:17:18 +000040 # use a class variable DATA to define the data to write to the file
41 # and a class variable NEWLINE to set the expected newlines value
Guido van Rossum8358db22007-08-18 21:39:55 +000042 READMODE = 'r'
Jack Jansen518d2612002-04-14 20:17:18 +000043 WRITEMODE = 'wb'
44
45 def setUp(self):
Guido van Rossum9c627722007-08-27 18:31:48 +000046 data = self.DATA
47 if "b" in self.WRITEMODE:
48 data = data.encode("ascii")
Philip Jenveya27c5bd2009-05-28 06:09:08 +000049 with self.open(support.TESTFN, self.WRITEMODE) as fp:
50 fp.write(data)
Jack Jansen518d2612002-04-14 20:17:18 +000051
52 def tearDown(self):
53 try:
Benjamin Petersonee8712c2008-05-20 21:35:26 +000054 os.unlink(support.TESTFN)
Jack Jansen518d2612002-04-14 20:17:18 +000055 except:
56 pass
Tim Peters863ac442002-04-16 01:38:40 +000057
Jack Jansen518d2612002-04-14 20:17:18 +000058 def test_read(self):
Philip Jenveya27c5bd2009-05-28 06:09:08 +000059 with self.open(support.TESTFN, self.READMODE) as fp:
60 data = fp.read()
Jack Jansen518d2612002-04-14 20:17:18 +000061 self.assertEqual(data, DATA_LF)
Walter Dörwald70a6b492004-02-12 17:35:32 +000062 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000063
Jack Jansen518d2612002-04-14 20:17:18 +000064 def test_readlines(self):
Philip Jenveya27c5bd2009-05-28 06:09:08 +000065 with self.open(support.TESTFN, self.READMODE) as fp:
66 data = fp.readlines()
Jack Jansen518d2612002-04-14 20:17:18 +000067 self.assertEqual(data, DATA_SPLIT)
Walter Dörwald70a6b492004-02-12 17:35:32 +000068 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Jack Jansen518d2612002-04-14 20:17:18 +000069
70 def test_readline(self):
Philip Jenveya27c5bd2009-05-28 06:09:08 +000071 with self.open(support.TESTFN, self.READMODE) as fp:
72 data = []
Jack Jansen518d2612002-04-14 20:17:18 +000073 d = fp.readline()
Philip Jenveya27c5bd2009-05-28 06:09:08 +000074 while d:
75 data.append(d)
76 d = fp.readline()
Jack Jansen518d2612002-04-14 20:17:18 +000077 self.assertEqual(data, DATA_SPLIT)
Walter Dörwald70a6b492004-02-12 17:35:32 +000078 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Tim Peters863ac442002-04-16 01:38:40 +000079
Jack Jansen518d2612002-04-14 20:17:18 +000080 def test_seek(self):
Philip Jenveya27c5bd2009-05-28 06:09:08 +000081 with self.open(support.TESTFN, self.READMODE) as fp:
82 fp.readline()
83 pos = fp.tell()
84 data = fp.readlines()
85 self.assertEqual(data, DATA_SPLIT[1:])
86 fp.seek(pos)
87 data = fp.readlines()
Jack Jansen518d2612002-04-14 20:17:18 +000088 self.assertEqual(data, DATA_SPLIT[1:])
Tim Peters863ac442002-04-16 01:38:40 +000089
Jack Jansen518d2612002-04-14 20:17:18 +000090
Jack Jansen518d2612002-04-14 20:17:18 +000091class TestCRNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000092 NEWLINE = '\r'
93 DATA = DATA_CR
Ezio Melotti28b0d9d2013-06-09 00:07:06 +030094class CTestCRNewlines(CTest, TestCRNewlines, unittest.TestCase): pass
95class PyTestCRNewlines(PyTest, TestCRNewlines, unittest.TestCase): pass
Tim Peters863ac442002-04-16 01:38:40 +000096
Jack Jansen518d2612002-04-14 20:17:18 +000097class TestLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +000098 NEWLINE = '\n'
99 DATA = DATA_LF
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300100class CTestLFNewlines(CTest, TestLFNewlines, unittest.TestCase): pass
101class PyTestLFNewlines(PyTest, TestLFNewlines, unittest.TestCase): pass
Tim Peters863ac442002-04-16 01:38:40 +0000102
Jack Jansen518d2612002-04-14 20:17:18 +0000103class TestCRLFNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +0000104 NEWLINE = '\r\n'
105 DATA = DATA_CRLF
Tim Peters863ac442002-04-16 01:38:40 +0000106
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000107 def test_tell(self):
Philip Jenveya27c5bd2009-05-28 06:09:08 +0000108 with self.open(support.TESTFN, self.READMODE) as fp:
109 self.assertEqual(repr(fp.newlines), repr(None))
110 data = fp.readline()
111 pos = fp.tell()
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000112 self.assertEqual(repr(fp.newlines), repr(self.NEWLINE))
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300113class CTestCRLFNewlines(CTest, TestCRLFNewlines, unittest.TestCase): pass
114class PyTestCRLFNewlines(PyTest, TestCRLFNewlines, unittest.TestCase): pass
Guido van Rossum8ce8a782007-11-01 19:42:39 +0000115
Jack Jansen518d2612002-04-14 20:17:18 +0000116class TestMixedNewlines(TestGenericUnivNewlines):
Tim Petersea572b22002-04-21 06:12:02 +0000117 NEWLINE = ('\r', '\n')
118 DATA = DATA_MIXED
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300119class CTestMixedNewlines(CTest, TestMixedNewlines, unittest.TestCase): pass
120class PyTestMixedNewlines(PyTest, TestMixedNewlines, unittest.TestCase): pass
Jack Jansen518d2612002-04-14 20:17:18 +0000121
122if __name__ == '__main__':
Ezio Melotti28b0d9d2013-06-09 00:07:06 +0300123 unittest.main()