# Codec encoding tests for ISO 2022 encodings.
| |
| from test import multibytecodec_support |
| import unittest |
| |
# Cases that every ISO 2022 test class in this file prepends to its own
# ``codectests`` tuple.  Each entry reads as
# (input, error handler name, expected result); all three inputs are
# malformed byte strings run through the 'replace' handler.
COMMON_CODEC_TESTS = (
    # invalid bytes
    # 0xFF is expected to come back as U+FFFD.
    (b'ab\xFFcd', 'replace', 'ab\uFFFDcd'),
    # ESC followed by an ordinary letter is expected to pass through as-is.
    (b'ab\x1Bdef', 'replace', 'ab\x1Bdef'),
    # ESC '$' followed by 'def' is expected to collapse to a single U+FFFD.
    (b'ab\x1B$def', 'replace', 'ab\uFFFD'),
)
| |
class Test_ISO2022_JP(multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the ``iso2022_jp`` encoding."""

    encoding = 'iso2022_jp'
    tstring = multibytecodec_support.load_teststring('iso2022_jp')
    # Shared cases from COMMON_CODEC_TESTS plus one codec-specific case:
    # the expected value shows ESC 'N' surviving decoding unchanged.
    codectests = COMMON_CODEC_TESTS + (
        (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'),
    )
| |
class Test_ISO2022_JP2(multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the ``iso2022_jp_2`` encoding."""

    encoding = 'iso2022_jp_2'
    # Reuses the 'iso2022_jp' sample text rather than a codec-specific one.
    tstring = multibytecodec_support.load_teststring('iso2022_jp')
    # Shared cases from COMMON_CODEC_TESTS plus one codec-specific case:
    # here the expected value shows ESC 'N' being dropped from the output,
    # unlike the other classes in this file where it is passed through.
    codectests = COMMON_CODEC_TESTS + (
        (b'ab\x1BNdef', 'replace', 'abdef'),
    )
| |
class Test_ISO2022_JP3(multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the ``iso2022_jp_3`` encoding."""

    encoding = 'iso2022_jp_3'
    # Reuses the 'iso2022_jp' sample text rather than a codec-specific one.
    tstring = multibytecodec_support.load_teststring('iso2022_jp')
    # Entries read as (input, error handler name, expected result).
    # NOTE(review): bytes inputs are presumably decoded and str inputs
    # encoded by TestBase -- confirm in multibytecodec_support.
    codectests = COMMON_CODEC_TESTS + (
        (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'),
        # bytes -> str, using the ESC $ ( O and ESC $ ( P designations
        (b'\x1B$(O\x2E\x23\x1B(B', 'strict', '\u3402'),
        (b'\x1B$(O\x2E\x22\x1B(B', 'strict', '\U0002000B'),
        (b'\x1B$(O\x24\x77\x1B(B', 'strict', '\u304B\u309A'),
        (b'\x1B$(P\x21\x22\x1B(B', 'strict', '\u4E02'),
        (b'\x1B$(P\x7E\x76\x1B(B', 'strict', '\U0002A6B2'),
        # str -> bytes, the mirror image of the five cases above
        ('\u3402', 'strict', b'\x1B$(O\x2E\x23\x1B(B'),
        ('\U0002000B', 'strict', b'\x1B$(O\x2E\x22\x1B(B'),
        ('\u304B\u309A', 'strict', b'\x1B$(O\x24\x77\x1B(B'),
        ('\u4E02', 'strict', b'\x1B$(P\x21\x22\x1B(B'),
        ('\U0002A6B2', 'strict', b'\x1B$(P\x7E\x76\x1B(B'),
        # \x2E\x21 / U+4FF1 is expected to be rejected in both directions
        # here (replacement character when decoding, '?' when encoding).
        (b'ab\x1B$(O\x2E\x21\x1B(Bdef', 'replace', 'ab\uFFFDdef'),
        ('ab\u4FF1def', 'replace', b'ab?def'),
    )
    # (input text, expected bytes).  The characters that are not emitted via
    # an escape sequence are spelled as XML references in the expected
    # bytes: U+211C as &real;, U+2329 / U+232A as &lang; / &rang;, and
    # U+1234 as &#4660; (0x1234 == 4660).  These must stay as ASCII entity
    # text: a bytes literal cannot contain the decoded non-ASCII characters.
    xmlcharnametest = (
        '\xAB\u211C\xBB = \u2329\u1234\u232A',
        b'\x1B$(O\x29\x28\x1B(B&real;\x1B$(O\x29\x32\x1B(B = &lang;&#4660;&rang;'
    )
| |
class Test_ISO2022_JP2004(multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the ``iso2022_jp_2004`` encoding."""

    encoding = 'iso2022_jp_2004'
    # Reuses the 'iso2022_jp' sample text rather than a codec-specific one.
    tstring = multibytecodec_support.load_teststring('iso2022_jp')
    # Entries read as (input, error handler name, expected result).
    # NOTE(review): bytes inputs are presumably decoded and str inputs
    # encoded by TestBase -- confirm in multibytecodec_support.
    codectests = COMMON_CODEC_TESTS + (
        (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'),
        # bytes -> str, using the ESC $ ( Q and ESC $ ( P designations
        (b'\x1B$(Q\x2E\x23\x1B(B', 'strict', '\u3402'),
        (b'\x1B$(Q\x2E\x22\x1B(B', 'strict', '\U0002000B'),
        (b'\x1B$(Q\x24\x77\x1B(B', 'strict', '\u304B\u309A'),
        (b'\x1B$(P\x21\x22\x1B(B', 'strict', '\u4E02'),
        (b'\x1B$(P\x7E\x76\x1B(B', 'strict', '\U0002A6B2'),
        # str -> bytes, the mirror image of the five cases above
        ('\u3402', 'strict', b'\x1B$(Q\x2E\x23\x1B(B'),
        ('\U0002000B', 'strict', b'\x1B$(Q\x2E\x22\x1B(B'),
        ('\u304B\u309A', 'strict', b'\x1B$(Q\x24\x77\x1B(B'),
        ('\u4E02', 'strict', b'\x1B$(P\x21\x22\x1B(B'),
        ('\U0002A6B2', 'strict', b'\x1B$(P\x7E\x76\x1B(B'),
        # \x2E\x21 <-> U+4FF1 is expected to round-trip under this codec.
        (b'ab\x1B$(Q\x2E\x21\x1B(Bdef', 'replace', 'ab\u4FF1def'),
        ('ab\u4FF1def', 'replace', b'ab\x1B$(Q\x2E\x21\x1B(Bdef'),
    )
    # (input text, expected bytes).  The characters that are not emitted via
    # an escape sequence are spelled as XML references in the expected
    # bytes: U+211C as &real;, U+2329 / U+232A as &lang; / &rang;, and
    # U+1234 as &#4660; (0x1234 == 4660).  These must stay as ASCII entity
    # text: a bytes literal cannot contain the decoded non-ASCII characters.
    xmlcharnametest = (
        '\xAB\u211C\xBB = \u2329\u1234\u232A',
        b'\x1B$(Q\x29\x28\x1B(B&real;\x1B$(Q\x29\x32\x1B(B = &lang;&#4660;&rang;'
    )
| |
class Test_ISO2022_KR(multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the ``iso2022_kr`` encoding."""

    encoding = 'iso2022_kr'
    tstring = multibytecodec_support.load_teststring('iso2022_kr')
    # Shared cases from COMMON_CODEC_TESTS plus one codec-specific case:
    # the expected value shows ESC 'N' surviving decoding unchanged.
    codectests = COMMON_CODEC_TESTS + (
        (b'ab\x1BNdef', 'replace', 'ab\x1BNdef'),
    )

    # iso2022_kr.txt cannot be used to test "chunk coding": the escape
    # sequence is only written on the first line
    # (No docstring on purpose: the method only exists to carry the skip.)
    @unittest.skip('iso2022_kr.txt cannot be used to test "chunk coding"')
    def test_chunkcoding(self):
        pass
| |
# Run the tests in this module when the file is executed as a script.
if __name__ == "__main__":
    unittest.main()