Home | History | Annotate | Download | only in test
      1 #
      2 # test_codecencodings_kr.py
      3 #   Codec encoding tests for ROK encodings.
      4 #
      5 
      6 from test import multibytecodec_support
      7 import unittest
      8 
      9 class Test_CP949(multibytecodec_support.TestBase, unittest.TestCase):
     10     encoding = 'cp949'
     11     tstring = multibytecodec_support.load_teststring('cp949')
     12     codectests = (
     13         # invalid bytes
     14         (b"abc\x80\x80\xc1\xc4", "strict",  None),
     15         (b"abc\xc8", "strict",  None),
     16         (b"abc\x80\x80\xc1\xc4", "replace", "abc\ufffd\ufffd\uc894"),
     17         (b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\uc894\ufffd"),
     18         (b"abc\x80\x80\xc1\xc4", "ignore",  "abc\uc894"),
     19     )
     20 
     21 class Test_EUCKR(multibytecodec_support.TestBase, unittest.TestCase):
     22     encoding = 'euc_kr'
     23     tstring = multibytecodec_support.load_teststring('euc_kr')
     24     codectests = (
     25         # invalid bytes
     26         (b"abc\x80\x80\xc1\xc4", "strict",  None),
     27         (b"abc\xc8", "strict",  None),
     28         (b"abc\x80\x80\xc1\xc4", "replace", 'abc\ufffd\ufffd\uc894'),
     29         (b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\uc894\ufffd"),
     30         (b"abc\x80\x80\xc1\xc4", "ignore",  "abc\uc894"),
     31 
     32         # composed make-up sequence errors
     33         (b"\xa4\xd4", "strict", None),
     34         (b"\xa4\xd4\xa4", "strict", None),
     35         (b"\xa4\xd4\xa4\xb6", "strict", None),
     36         (b"\xa4\xd4\xa4\xb6\xa4", "strict", None),
     37         (b"\xa4\xd4\xa4\xb6\xa4\xd0", "strict", None),
     38         (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4", "strict", None),
     39         (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xd4", "strict", "\uc4d4"),
     40         (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xd4x", "strict", "\uc4d4x"),
     41         (b"a\xa4\xd4\xa4\xb6\xa4", "replace", 'a\ufffd'),
     42         (b"\xa4\xd4\xa3\xb6\xa4\xd0\xa4\xd4", "strict", None),
     43         (b"\xa4\xd4\xa4\xb6\xa3\xd0\xa4\xd4", "strict", None),
     44         (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa3\xd4", "strict", None),
     45         (b"\xa4\xd4\xa4\xff\xa4\xd0\xa4\xd4", "replace", '\ufffd\u6e21\ufffd\u3160\ufffd'),
     46         (b"\xa4\xd4\xa4\xb6\xa4\xff\xa4\xd4", "replace", '\ufffd\u6e21\ub544\ufffd\ufffd'),
     47         (b"\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xff", "replace", '\ufffd\u6e21\ub544\u572d\ufffd'),
     48         (b"\xa4\xd4\xff\xa4\xd4\xa4\xb6\xa4\xd0\xa4\xd4", "replace", '\ufffd\ufffd\ufffd\uc4d4'),
     49         (b"\xc1\xc4", "strict", "\uc894"),
     50     )
     51 
     52 class Test_JOHAB(multibytecodec_support.TestBase, unittest.TestCase):
     53     encoding = 'johab'
     54     tstring = multibytecodec_support.load_teststring('johab')
     55     codectests = (
     56         # invalid bytes
     57         (b"abc\x80\x80\xc1\xc4", "strict",  None),
     58         (b"abc\xc8", "strict",  None),
     59         (b"abc\x80\x80\xc1\xc4", "replace", "abc\ufffd\ufffd\ucd27"),
     60         (b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\ucd27\ufffd"),
     61         (b"abc\x80\x80\xc1\xc4", "ignore",  "abc\ucd27"),
     62         (b"\xD8abc", "replace",  "\uFFFDabc"),
     63         (b"\xD8\xFFabc", "replace",  "\uFFFD\uFFFDabc"),
     64         (b"\x84bxy", "replace",  "\uFFFDbxy"),
     65         (b"\x8CBxy", "replace",  "\uFFFDBxy"),
     66     )
     67 
     68 if __name__ == "__main__":
     69     unittest.main()
     70