| # |
| # This file is for everybody to add tests for bugs that aren't |
| # fixed yet. Please add a test case and appropriate bug description. |
| # |
| # When you fix one of the bugs, please move the test to the correct |
| # test_ module. |
| # |
| |
| import unittest |
| from test import test_support |
| |
| # |
| # One test case for outstanding bugs at the moment: |
| # |
| |
| class TestDifflibLongestMatch(unittest.TestCase): |
| # From Patch #1678339: |
| # The find_longest_match method in the difflib's SequenceMatcher has a bug. |
| |
| # The bug is in turn caused by a problem with creating a b2j mapping which |
| # should contain a list of indices for each of the list elements in b. |
| # However, when the b2j mapping is being created (this is being done in |
| # __chain_b method in the SequenceMatcher) the mapping becomes broken. The |
| # cause of this is that for the frequently used elements the list of indices |
| # is removed and the element is being enlisted in the populardict mapping. |
| |
| # The test case tries to match two strings like: |
| # abbbbbb.... and ...bbbbbbc |
| |
| # The number of b is equal and the find_longest_match should have returned |
| # the proper amount. However, in case the number of "b"s is large enough, the |
| # method reports that the length of the longest common substring is 0. It |
| # simply can't find it. |
| |
| # A bug was raised some time ago on this matter. It's ID is 1528074. |
| |
| def test_find_longest_match(self): |
| import difflib |
| for i in (190, 200, 210): |
| text1 = "a" + "b"*i |
| text2 = "b"*i + "c" |
| m = difflib.SequenceMatcher(None, text1, text2) |
| (aptr, bptr, l) = m.find_longest_match(0, len(text1), 0, len(text2)) |
| self.assertEquals(i, l) |
| self.assertEquals(aptr, 1) |
| self.assertEquals(bptr, 0) |
| |
| # test_io |
| import io |
| class TextIOWrapperTest(unittest.TestCase): |
| |
| def setUp(self): |
| self.testdata = b"AAA\r\nBBB\rCCC\r\nDDD\nEEE\r\n" |
| self.normalized = b"AAA\nBBB\nCCC\nDDD\nEEE\n".decode("ASCII") |
| |
| def tearDown(self): |
| test_support.unlink(test_support.TESTFN) |
| |
| |
| def test_issue1395_1(self): |
| txt = io.TextIOWrapper(io.BytesIO(self.testdata), encoding="ASCII") |
| |
| # read one char at a time |
| reads = "" |
| while True: |
| c = txt.read(1) |
| if not c: |
| break |
| reads += c |
| self.assertEquals(reads, self.normalized) |
| |
| def test_issue1395_2(self): |
| txt = io.TextIOWrapper(io.BytesIO(self.testdata), encoding="ASCII") |
| txt._CHUNK_SIZE = 4 |
| |
| reads = "" |
| while True: |
| c = txt.read(4) |
| if not c: |
| break |
| reads += c |
| self.assertEquals(reads, self.normalized) |
| |
| def test_issue1395_3(self): |
| txt = io.TextIOWrapper(io.BytesIO(self.testdata), encoding="ASCII") |
| txt._CHUNK_SIZE = 4 |
| |
| reads = txt.read(4) |
| reads += txt.read(4) |
| reads += txt.readline() |
| reads += txt.readline() |
| reads += txt.readline() |
| self.assertEquals(reads, self.normalized) |
| |
| def test_issue1395_4(self): |
| txt = io.TextIOWrapper(io.BytesIO(self.testdata), encoding="ASCII") |
| txt._CHUNK_SIZE = 4 |
| |
| reads = txt.read(4) |
| reads += txt.read() |
| self.assertEquals(reads, self.normalized) |
| |
| def test_issue1395_5(self): |
| txt = io.TextIOWrapper(io.BytesIO(self.testdata), encoding="ASCII") |
| txt._CHUNK_SIZE = 4 |
| |
| reads = txt.read(4) |
| pos = txt.tell() |
| txt.seek(0) |
| txt.seek(pos) |
| self.assertEquals(txt.read(4), "BBB\n") |
| |
| |
| |
| def test_main(): |
| test_support.run_unittest( |
| TestDifflibLongestMatch, |
| TextIOWrapperTest) |
| |
| if __name__ == "__main__": |
| test_main() |