# Codec encoding tests for ISO 2022 encodings. from test import multibytecodec_support import unittest COMMON_CODEC_TESTS = ( # invalid bytes (b'ab\xFFcd', 'replace', 'ab\uFFFDcd'), (b'ab\x1Bdef', 'replace', 'ab\x1Bdef'), (b'ab\x1B$def', 'replace', 'ab\uFFFD'), ) class Test_ISO2022_JP(multibytecodec_support.TestBase, unittest.TestCase): encoding = 'iso2022_jp' tstring = multibytecodec_support.load_teststring('iso2022_jp') codectests = COMMON_CODEC_TESTS + ( (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'), ) class Test_ISO2022_JP2(multibytecodec_support.TestBase, unittest.TestCase): encoding = 'iso2022_jp_2' tstring = multibytecodec_support.load_teststring('iso2022_jp') codectests = COMMON_CODEC_TESTS + ( (b'ab\x1BNdef', 'replace', 'abdef'), ) class Test_ISO2022_JP3(multibytecodec_support.TestBase, unittest.TestCase): encoding = 'iso2022_jp_3' tstring = multibytecodec_support.load_teststring('iso2022_jp') codectests = COMMON_CODEC_TESTS + ( (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'), (b'\x1B$(O\x2E\x23\x1B(B', 'strict', '\u3402' ), (b'\x1B$(O\x2E\x22\x1B(B', 'strict', '\U0002000B' ), (b'\x1B$(O\x24\x77\x1B(B', 'strict', '\u304B\u309A'), (b'\x1B$(P\x21\x22\x1B(B', 'strict', '\u4E02' ), (b'\x1B$(P\x7E\x76\x1B(B', 'strict', '\U0002A6B2' ), ('\u3402', 'strict', b'\x1B$(O\x2E\x23\x1B(B'), ('\U0002000B', 'strict', b'\x1B$(O\x2E\x22\x1B(B'), ('\u304B\u309A', 'strict', b'\x1B$(O\x24\x77\x1B(B'), ('\u4E02', 'strict', b'\x1B$(P\x21\x22\x1B(B'), ('\U0002A6B2', 'strict', b'\x1B$(P\x7E\x76\x1B(B'), (b'ab\x1B$(O\x2E\x21\x1B(Bdef', 'replace', 'ab\uFFFDdef'), ('ab\u4FF1def', 'replace', b'ab?def'), ) xmlcharnametest = ( '\xAB\u211C\xBB = \u2329\u1234\u232A', b'\x1B$(O\x29\x28\x1B(Bℜ\x1B$(O\x29\x32\x1B(B = ⟨ሴ⟩' ) class Test_ISO2022_JP2004(multibytecodec_support.TestBase, unittest.TestCase): encoding = 'iso2022_jp_2004' tstring = multibytecodec_support.load_teststring('iso2022_jp') codectests = COMMON_CODEC_TESTS + ( (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'), (b'\x1B$(Q\x2E\x23\x1B(B', 'strict', '\u3402' ), (b'\x1B$(Q\x2E\x22\x1B(B', 'strict', '\U0002000B' ), (b'\x1B$(Q\x24\x77\x1B(B', 'strict', '\u304B\u309A'), (b'\x1B$(P\x21\x22\x1B(B', 'strict', '\u4E02' ), (b'\x1B$(P\x7E\x76\x1B(B', 'strict', '\U0002A6B2' ), ('\u3402', 'strict', b'\x1B$(Q\x2E\x23\x1B(B'), ('\U0002000B', 'strict', b'\x1B$(Q\x2E\x22\x1B(B'), ('\u304B\u309A', 'strict', b'\x1B$(Q\x24\x77\x1B(B'), ('\u4E02', 'strict', b'\x1B$(P\x21\x22\x1B(B'), ('\U0002A6B2', 'strict', b'\x1B$(P\x7E\x76\x1B(B'), (b'ab\x1B$(Q\x2E\x21\x1B(Bdef', 'replace', 'ab\u4FF1def'), ('ab\u4FF1def', 'replace', b'ab\x1B$(Q\x2E\x21\x1B(Bdef'), ) xmlcharnametest = ( '\xAB\u211C\xBB = \u2329\u1234\u232A', b'\x1B$(Q\x29\x28\x1B(Bℜ\x1B$(Q\x29\x32\x1B(B = ⟨ሴ⟩' ) class Test_ISO2022_KR(multibytecodec_support.TestBase, unittest.TestCase): encoding = 'iso2022_kr' tstring = multibytecodec_support.load_teststring('iso2022_kr') codectests = COMMON_CODEC_TESTS + ( (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'), ) # iso2022_kr.txt cannot be used to test "chunk coding": the escape # sequence is only written on the first line @unittest.skip('iso2022_kr.txt cannot be used to test "chunk coding"') def test_chunkcoding(self): pass if __name__ == "__main__": unittest.main()