#
# This file is for everybody to add tests for bugs that aren't
# fixed yet. Please add a test case and an appropriate bug description.
#
# When you fix one of the bugs, please move the test to the correct
# test_ module.
#
|
|
|
|
import unittest
|
|
from test import test_support
|
|
|
|
#
# Test cases for outstanding bugs at the moment:
#
|
|
|
|
class TestDifflibLongestMatch(unittest.TestCase):
|
|
# From Patch #1678339:
|
|
# The find_longest_match method in the difflib's SequenceMatcher has a bug.
|
|
|
|
# The bug is in turn caused by a problem with creating a b2j mapping which
|
|
# should contain a list of indices for each of the list elements in b.
|
|
# However, when the b2j mapping is being created (this is being done in
|
|
# __chain_b method in the SequenceMatcher) the mapping becomes broken. The
|
|
# cause of this is that for the frequently used elements the list of indices
|
|
# is removed and the element is being enlisted in the populardict mapping.
|
|
|
|
# The test case tries to match two strings like:
|
|
# abbbbbb.... and ...bbbbbbc
|
|
|
|
# The number of b is equal and the find_longest_match should have returned
|
|
# the proper amount. However, in case the number of "b"s is large enough, the
|
|
# method reports that the length of the longest common substring is 0. It
|
|
# simply can't find it.
|
|
|
|
# A bug was raised some time ago on this matter. It's ID is 1528074.
|
|
|
|
def test_find_longest_match(self):
|
|
import difflib
|
|
for i in (190, 200, 210):
|
|
text1 = "a" + "b"*i
|
|
text2 = "b"*i + "c"
|
|
m = difflib.SequenceMatcher(None, text1, text2)
|
|
(aptr, bptr, l) = m.find_longest_match(0, len(text1), 0, len(text2))
|
|
self.assertEquals(i, l)
|
|
self.assertEquals(aptr, 1)
|
|
self.assertEquals(bptr, 0)
|
|
|
|
# test_io
|
|
import io
|
|
class TextIOWrapperTest(unittest.TestCase):
    """Outstanding-bug tests for issue 1395 (io.TextIOWrapper reads).

    Each test wraps the same byte string, which mixes "\\r\\n", "\\r" and
    "\\n" line endings, and checks that the text read back through
    different read patterns equals the "\\n"-only form of that data.
    """

    def setUp(self):
        # Raw input mixing the three line-ending conventions.
        self.testdata = b"AAA\r\nBBB\rCCC\r\nDDD\nEEE\r\n"
        # The text the wrapper is expected to hand back.
        self.normalized = b"AAA\nBBB\nCCC\nDDD\nEEE\n".decode("ASCII")

    def tearDown(self):
        # None of the tests visible here creates TESTFN; the unlink is kept
        # from the original so any leftover file is still cleaned up.
        test_support.unlink(test_support.TESTFN)

    def _make_wrapper(self, chunk_size=None):
        """Return an ASCII TextIOWrapper over a fresh copy of the test data.

        When *chunk_size* is given, the wrapper's private ``_CHUNK_SIZE``
        is set to it so that reads cross internal chunk boundaries.
        """
        txt = io.TextIOWrapper(io.BytesIO(self.testdata), encoding="ASCII")
        if chunk_size is not None:
            txt._CHUNK_SIZE = chunk_size
        return txt

    def _read_until_eof(self, txt, size):
        """Read *txt* in pieces of at most *size* chars; return all text."""
        # read() returns an empty string at end of input, which stops iter().
        return "".join(iter(lambda: txt.read(size), ""))

    def test_issue1395_1(self):
        """Read one character at a time with the default chunk size."""
        txt = self._make_wrapper()
        reads = self._read_until_eof(txt, 1)
        self.assertEqual(reads, self.normalized)

    def test_issue1395_2(self):
        """Read four characters at a time with a four-byte chunk size."""
        txt = self._make_wrapper(chunk_size=4)
        reads = self._read_until_eof(txt, 4)
        self.assertEqual(reads, self.normalized)

    def test_issue1395_3(self):
        """Mix two read(4) calls with three readline() calls."""
        txt = self._make_wrapper(chunk_size=4)

        reads = txt.read(4)
        reads += txt.read(4)
        reads += txt.readline()
        reads += txt.readline()
        reads += txt.readline()
        self.assertEqual(reads, self.normalized)

    def test_issue1395_4(self):
        """Follow a read(4) with an unbounded read()."""
        txt = self._make_wrapper(chunk_size=4)

        reads = txt.read(4)
        reads += txt.read()
        self.assertEqual(reads, self.normalized)

    def test_issue1395_5(self):
        """A tell()/seek() round trip must resume at the same position."""
        txt = self._make_wrapper(chunk_size=4)

        # Consume the first line; only the resulting position matters.
        txt.read(4)
        pos = txt.tell()
        txt.seek(0)
        txt.seek(pos)
        self.assertEqual(txt.read(4), "BBB\n")
|
|
|
|
|
|
|
|
def test_main():
    """Run every outstanding-bug test case defined in this module."""
    outstanding_cases = (
        TestDifflibLongestMatch,
        TextIOWrapperTest,
    )
    test_support.run_unittest(*outstanding_cases)


# Allow the module to be executed directly as a script.
if __name__ == "__main__":
    test_main()
|