diff options
Diffstat (limited to 'lib/python2.7/test/test_codecencodings_jp.py')
-rw-r--r-- | lib/python2.7/test/test_codecencodings_jp.py | 105 |
1 files changed, 105 insertions, 0 deletions
#!/usr/bin/env python
#
# test_codecencodings_jp.py
#   Codec encoding tests for Japanese encodings.
#
# Layout of the data tables below:
#   * Each ``codectests`` entry is a 3-tuple of
#     (source string, error-handler name, expected result).
#     Judging by the entries, a byte-string source is paired with a unicode
#     expectation (and vice versa), and ``None`` marks input that is expected
#     to be rejected -- confirm against test_multibytecodec_support.TestBase,
#     which is what actually interprets these tuples.
#   * ``xmlcharnametest`` is a (unicode input, expected byte-string output)
#     pair; presumably also consumed by TestBase.
#
# NOTE: this module has no source-encoding declaration, so every literal must
# stay pure ASCII (use \x / \u escapes and spelled-out character references).

from test import test_support
from test import test_multibytecodec_support
import unittest


class Test_CP932(test_multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the 'cp932' encoding."""

    encoding = 'cp932'
    # cp932 reuses the 'shift_jis' test string.
    tstring = test_multibytecodec_support.load_teststring('shift_jis')
    codectests = (
        # invalid bytes
        ("abc\x81\x00\x81\x00\x82\x84", "strict", None),
        ("abc\xf8", "strict", None),
        ("abc\x81\x00\x82\x84", "replace", u"abc\ufffd\uff44"),
        ("abc\x81\x00\x82\x84\x88", "replace", u"abc\ufffd\uff44\ufffd"),
        ("abc\x81\x00\x82\x84", "ignore", u"abc\uff44"),
        # sjis vs cp932
        ("\\\x7e", "replace", u"\\\x7e"),
        ("\x81\x5f\x81\x61\x81\x7c", "replace", u"\uff3c\u2225\uff0d"),
    )


class Test_EUC_JISX0213(test_multibytecodec_support.TestBase,
                        unittest.TestCase):
    """Codec tests for the 'euc_jisx0213' encoding."""

    encoding = 'euc_jisx0213'
    tstring = test_multibytecodec_support.load_teststring('euc_jisx0213')
    codectests = (
        # invalid bytes
        ("abc\x80\x80\xc1\xc4", "strict", None),
        ("abc\xc8", "strict", None),
        ("abc\x80\x80\xc1\xc4", "replace", u"abc\ufffd\u7956"),
        ("abc\x80\x80\xc1\xc4\xc8", "replace", u"abc\ufffd\u7956\ufffd"),
        ("abc\x80\x80\xc1\xc4", "ignore", u"abc\u7956"),
        ("abc\x8f\x83\x83", "replace", u"abc\ufffd"),
        ("\xc1\x64", "strict", None),
        ("\xa1\xc0", "strict", u"\uff3c"),
    )
    # The expected output mixes codec bytes with ASCII character references
    # (&real;, &lang;, &#4660;, &rang;).  Keep the references spelled out:
    # a raw non-ASCII character here would be rejected at compile time
    # (no coding declaration) and would not equal the reference text anyway.
    xmlcharnametest = (
        u"\xab\u211c\xbb = \u2329\u1234\u232a",
        "\xa9\xa8&real;\xa9\xb2 = &lang;&#4660;&rang;"
    )


# Cases shared by the EUC-JP test class below, which appends its own extras.
eucjp_commontests = (
    ("abc\x80\x80\xc1\xc4", "strict", None),
    ("abc\xc8", "strict", None),
    ("abc\x80\x80\xc1\xc4", "replace", u"abc\ufffd\u7956"),
    ("abc\x80\x80\xc1\xc4\xc8", "replace", u"abc\ufffd\u7956\ufffd"),
    ("abc\x80\x80\xc1\xc4", "ignore", u"abc\u7956"),
    ("abc\x8f\x83\x83", "replace", u"abc\ufffd"),
    ("\xc1\x64", "strict", None),
)


class Test_EUC_JP_COMPAT(test_multibytecodec_support.TestBase,
                         unittest.TestCase):
    """Codec tests for the 'euc_jp' encoding."""

    encoding = 'euc_jp'
    tstring = test_multibytecodec_support.load_teststring('euc_jp')
    codectests = eucjp_commontests + (
        ("\xa1\xc0\\", "strict", u"\uff3c\\"),
        # These two entries go the other way: unicode source, byte expectation.
        (u"\xa5", "strict", "\x5c"),
        (u"\u203e", "strict", "\x7e"),
    )


# Cases shared by the Shift_JIS test class below, which appends its own extras.
shiftjis_commonenctests = (
    ("abc\x80\x80\x82\x84", "strict", None),
    ("abc\xf8", "strict", None),
    ("abc\x80\x80\x82\x84", "replace", u"abc\ufffd\uff44"),
    ("abc\x80\x80\x82\x84\x88", "replace", u"abc\ufffd\uff44\ufffd"),
    ("abc\x80\x80\x82\x84def", "ignore", u"abc\uff44def"),
)


class Test_SJIS_COMPAT(test_multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the 'shift_jis' encoding."""

    encoding = 'shift_jis'
    tstring = test_multibytecodec_support.load_teststring('shift_jis')
    codectests = shiftjis_commonenctests + (
        ("\\\x7e", "strict", u"\\\x7e"),
        ("\x81\x5f\x81\x61\x81\x7c", "strict", u"\uff3c\u2016\u2212"),
    )


class Test_SJISX0213(test_multibytecodec_support.TestBase, unittest.TestCase):
    """Codec tests for the 'shift_jisx0213' encoding."""

    encoding = 'shift_jisx0213'
    tstring = test_multibytecodec_support.load_teststring('shift_jisx0213')
    codectests = (
        # invalid bytes
        ("abc\x80\x80\x82\x84", "strict", None),
        ("abc\xf8", "strict", None),
        ("abc\x80\x80\x82\x84", "replace", u"abc\ufffd\uff44"),
        ("abc\x80\x80\x82\x84\x88", "replace", u"abc\ufffd\uff44\ufffd"),
        ("abc\x80\x80\x82\x84def", "ignore", u"abc\uff44def"),
        # sjis vs cp932
        ("\\\x7e", "replace", u"\xa5\u203e"),
        ("\x81\x5f\x81\x61\x81\x7c", "replace", u"\x5c\u2016\u2212"),
    )
    # Same shape as the EUC-JISX0213 pair: codec bytes plus ASCII character
    # references.  The references must stay spelled out in ASCII (see the
    # note at the top of this module).
    xmlcharnametest = (
        u"\xab\u211c\xbb = \u2329\u1234\u232a",
        "\x85G&real;\x85Q = &lang;&#4660;&rang;"
    )


def test_main():
    """Run every test case defined in this module through test_support."""
    test_support.run_unittest(__name__)


if __name__ == "__main__":
    test_main()