#!/usr/bin/env python3
#
# test_codecencodings_kr.py
#   Codec encoding tests for ROK encodings.
#
Hye-Shik Chang | 3e2a306 | 2004-01-17 14:29:29 +0000 | [diff] [blame] | 6 | |
Benjamin Peterson | ee8712c | 2008-05-20 21:35:26 +0000 | [diff] [blame] | 7 | from test import support |
R David Murray | 75d9aca | 2012-04-09 09:37:52 -0400 | [diff] [blame] | 8 | from test import multibytecodec_support |
Hye-Shik Chang | 3e2a306 | 2004-01-17 14:29:29 +0000 | [diff] [blame] | 9 | import unittest |
| 10 | |
class Test_CP949(multibytecodec_support.TestBase, unittest.TestCase):
    """Decoding fixtures for the ``cp949`` codec.

    The attributes below are presumably consumed by
    ``multibytecodec_support.TestBase`` (not visible in this file).
    Each ``codectests`` entry appears to be
    ``(input bytes, error-handler name, expected text)``, with ``None``
    in the last slot where no decoded text is expected -- TODO confirm
    against ``TestBase``.
    """

    encoding = 'cp949'
    tstring = multibytecodec_support.load_teststring('cp949')
    codectests = (
        # invalid bytes
        (b"abc\x80\x80\xc1\xc4", "strict", None),
        (b"abc\xc8", "strict", None),
        (b"abc\x80\x80\xc1\xc4", "replace", "abc\ufffd\ufffd\uc894"),
        (b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\uc894\ufffd"),
        (b"abc\x80\x80\xc1\xc4", "ignore", "abc\uc894"),
    )
| 22 | |
class Test_EUCKR(multibytecodec_support.TestBase, unittest.TestCase):
    """Decoding fixtures for the ``euc_kr`` codec.

    The attributes below are presumably consumed by
    ``multibytecodec_support.TestBase`` (not visible in this file).
    Each ``codectests`` entry appears to be
    ``(input bytes, error-handler name, expected text)``, with ``None``
    in the last slot where no decoded text is expected -- TODO confirm
    against ``TestBase``.
    """

    encoding = 'euc_kr'
    tstring = multibytecodec_support.load_teststring('euc_kr')
    codectests = (
        # invalid bytes
        (b"abc\x80\x80\xc1\xc4", "strict", None),
        (b"abc\xc8", "strict", None),
        (b"abc\x80\x80\xc1\xc4", "replace", 'abc\ufffd\ufffd\uc894'),
        (b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\uc894\ufffd"),
        (b"abc\x80\x80\xc1\xc4", "ignore", "abc\uc894"),

        # composed make-up sequence errors
        # The first six inputs are successively longer prefixes of the
        # eight-byte sequence that the seventh entry decodes to "\uc4d4".
        (b"\xa4\xd4", "strict", None),
        (b"\xa4\xd4\xa4", "strict", None),
        (b"\xa4\xd4\xa4\xb6", "strict", None),
        (b"\xa4\xd4\xa4\xb6\xa4", "strict", None),
        (b"\xa4\xd4\xa4\xb6\xa4\xd0", "strict", None),
        (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4", "strict", None),
        (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xd4", "strict", "\uc4d4"),
        (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xd4x", "strict", "\uc4d4x"),
        (b"a\xa4\xd4\xa4\xb6\xa4", "replace", 'a\ufffd'),
        # Same eight-byte shape, but one 0xa4 lead byte swapped for 0xa3.
        (b"\xa4\xd4\xa3\xb6\xa4\xd0\xa4\xd4", "strict", None),
        (b"\xa4\xd4\xa4\xb6\xa3\xd0\xa4\xd4", "strict", None),
        (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa3\xd4", "strict", None),
        # Same shape with a 0xff byte substituted or inserted.
        (b"\xa4\xd4\xa4\xff\xa4\xd0\xa4\xd4", "replace", '\ufffd\u6e21\ufffd\u3160\ufffd'),
        (b"\xa4\xd4\xa4\xb6\xa4\xff\xa4\xd4", "replace", '\ufffd\u6e21\ub544\ufffd\ufffd'),
        (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xff", "replace", '\ufffd\u6e21\ub544\u572d\ufffd'),
        (b"\xa4\xd4\xff\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xd4", "replace", '\ufffd\ufffd\ufffd\uc4d4'),
        (b"\xc1\xc4", "strict", "\uc894"),
    )
| 53 | |
class Test_JOHAB(multibytecodec_support.TestBase, unittest.TestCase):
    """Decoding fixtures for the ``johab`` codec.

    The attributes below are presumably consumed by
    ``multibytecodec_support.TestBase`` (not visible in this file).
    Each ``codectests`` entry appears to be
    ``(input bytes, error-handler name, expected text)``, with ``None``
    in the last slot where no decoded text is expected -- TODO confirm
    against ``TestBase``.
    """

    encoding = 'johab'
    tstring = multibytecodec_support.load_teststring('johab')
    codectests = (
        # invalid bytes
        (b"abc\x80\x80\xc1\xc4", "strict", None),
        (b"abc\xc8", "strict", None),
        (b"abc\x80\x80\xc1\xc4", "replace", "abc\ufffd\ufffd\ucd27"),
        (b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\ucd27\ufffd"),
        (b"abc\x80\x80\xc1\xc4", "ignore", "abc\ucd27"),
        # In each expected value below, the ASCII characters of the input
        # appear unchanged after the U+FFFD replacement character(s).
        (b"\xD8abc", "replace", "\uFFFDabc"),
        (b"\xD8\xFFabc", "replace", "\uFFFD\uFFFDabc"),
        (b"\x84bxy", "replace", "\uFFFDbxy"),
        (b"\x8CBxy", "replace", "\uFFFDBxy"),
    )
| 69 | |
def test_main():
    """Pass this module's name to ``support.run_unittest``."""
    support.run_unittest(__name__)
Hye-Shik Chang | 3e2a306 | 2004-01-17 14:29:29 +0000 | [diff] [blame] | 72 | |
# Run the tests when this file is executed directly as a script.
if __name__ == "__main__":
    test_main()