summary refs log tree commit diff
path: root/sys/lib/python/test/test_codecencodings_jp.py
diff options
context:
space:
mode:
author cinap_lenrek <cinap_lenrek@localhost> 2011-05-03 11:25:13 +0000
committer cinap_lenrek <cinap_lenrek@localhost> 2011-05-03 11:25:13 +0000
commit 458120dd40db6b4df55a4e96b650e16798ef06a0 (patch)
tree 8f82685be24fef97e715c6f5ca4c68d34d5074ee /sys/lib/python/test/test_codecencodings_jp.py
parent 3a742c699f6806c1145aea5149bf15de15a0afd7 (diff)
add hg and python
Diffstat (limited to 'sys/lib/python/test/test_codecencodings_jp.py')
-rw-r--r-- sys/lib/python/test/test_codecencodings_jp.py 111
1 files changed, 111 insertions, 0 deletions
diff --git a/sys/lib/python/test/test_codecencodings_jp.py b/sys/lib/python/test/test_codecencodings_jp.py
new file mode 100644
index 000000000..558598a95
--- /dev/null
+++ b/sys/lib/python/test/test_codecencodings_jp.py
@@ -0,0 +1,111 @@
+#!/usr/bin/env python
+#
+# test_codecencodings_jp.py
+# Codec encoding tests for Japanese encodings.
+#
+
+from test import test_support
+from test import test_multibytecodec_support
+import unittest
+
+class Test_CP932(test_multibytecodec_support.TestBase, unittest.TestCase):  # data-only case for the 'cp932' codec; no test methods are defined in this class body
+ encoding = 'cp932'
+ tstring = test_multibytecodec_support.load_teststring('shift_jis')  # NOTE(review): loads the 'shift_jis' sample text, not a cp932-specific one -- presumably shared on purpose; confirm
+ codectests = (  # each entry is (input, error-handler name, expected output or None)
+ # invalid bytes (presumably None marks input that is expected to be rejected -- confirm against TestBase)
+ ("abc\x81\x00\x81\x00\x82\x84", "strict", None),
+ ("abc\xf8", "strict", None),
+ ("abc\x81\x00\x82\x84", "replace", u"abc\ufffd\uff44"),  # U+FFFD REPLACEMENT CHARACTER, then U+FF44 FULLWIDTH LATIN SMALL LETTER D
+ ("abc\x81\x00\x82\x84\x88", "replace", u"abc\ufffd\uff44\ufffd"),  # trailing lone 0x88 yields a second U+FFFD
+ ("abc\x81\x00\x82\x84", "ignore", u"abc\uff44"),  # same input as the first "replace" case, without the U+FFFD
+ # sjis vs cp932: same inputs as in Test_SJIS_COMPAT; the expected values for the second input differ there
+ ("\\\x7e", "replace", u"\\\x7e"),  # 0x5c and 0x7e come back unchanged
+ ("\x81\x5f\x81\x61\x81\x7c", "replace", u"\uff3c\u2225\uff0d"),  # U+FF3C FULLWIDTH REVERSE SOLIDUS, U+2225 PARALLEL TO, U+FF0D FULLWIDTH HYPHEN-MINUS
+ )
+
+class Test_EUC_JISX0213(test_multibytecodec_support.TestBase,  # data-only case for the 'euc_jisx0213' codec
+ unittest.TestCase):
+ encoding = 'euc_jisx0213'
+ tstring = test_multibytecodec_support.load_teststring('euc_jisx0213')
+ codectests = (  # each entry is (input, error-handler name, expected output or None)
+ # invalid bytes (presumably None marks input that is expected to be rejected -- confirm against TestBase)
+ ("abc\x80\x80\xc1\xc4", "strict", None),
+ ("abc\xc8", "strict", None),
+ ("abc\x80\x80\xc1\xc4", "replace", u"abc\ufffd\u7956"),  # U+FFFD REPLACEMENT CHARACTER, then the CJK ideograph U+7956
+ ("abc\x80\x80\xc1\xc4\xc8", "replace", u"abc\ufffd\u7956\ufffd"),  # trailing lone 0xc8 yields a second U+FFFD
+ ("abc\x80\x80\xc1\xc4", "ignore", u"abc\u7956"),  # same input as the first "replace" case, without the U+FFFD
+ ("abc\x8f\x83\x83", "replace", u"abc\ufffd"),  # three bytes after "abc" map to a single U+FFFD
+ ("\xc1\x64", "strict", None),
+ ("\xa1\xc0", "strict", u"\uff3c"),  # U+FF3C FULLWIDTH REVERSE SOLIDUS
+ )
+ xmlcharnametest = (  # pair of (unicode text, byte string that uses XML entity names)
+ u"\xab\u211c\xbb = \u2329\u1234\u232a",
+ "\xa9\xa8&real;\xa9\xb2 = &lang;&#4660;&rang;"  # &#4660; is decimal for U+1234; presumably consumed by an entity-name error-handler test in TestBase -- confirm
+ )
+
+eucjp_commontests = (  # shared (input, error-handler name, expected or None) entries; prepended to Test_EUC_JP_COMPAT.codectests below
+ ("abc\x80\x80\xc1\xc4", "strict", None),  # these seven entries match the first seven in Test_EUC_JISX0213.codectests
+ ("abc\xc8", "strict", None),
+ ("abc\x80\x80\xc1\xc4", "replace", u"abc\ufffd\u7956"),  # U+FFFD REPLACEMENT CHARACTER, then the CJK ideograph U+7956
+ ("abc\x80\x80\xc1\xc4\xc8", "replace", u"abc\ufffd\u7956\ufffd"),
+ ("abc\x80\x80\xc1\xc4", "ignore", u"abc\u7956"),
+ ("abc\x8f\x83\x83", "replace", u"abc\ufffd"),
+ ("\xc1\x64", "strict", None),
+)
+
+class Test_EUC_JP_COMPAT(test_multibytecodec_support.TestBase,  # data-only case for the 'euc_jp' codec
+ unittest.TestCase):
+ encoding = 'euc_jp'
+ tstring = test_multibytecodec_support.load_teststring('euc_jp')
+ codectests = eucjp_commontests + (  # shared entries first, then euc_jp-specific ones
+ ("\xa1\xc0\\", "strict", u"\uff3c\\"),  # 0xa1 0xc0 -> U+FF3C FULLWIDTH REVERSE SOLIDUS; the ASCII backslash is unchanged
+ (u"\xa5", "strict", "\x5c"),  # unicode input, byte-string expected (presumably exercised as an encode -- confirm): U+00A5 YEN SIGN -> 0x5c
+ (u"\u203e", "strict", "\x7e"),  # unicode input again: U+203E OVERLINE -> 0x7e
+ )
+
+shiftjis_commonenctests = (  # shared entries prepended to Test_SJIS_COMPAT.codectests; NOTE(review): name says "enc" but every input here is a byte string with unicode expected
+ ("abc\x80\x80\x82\x84", "strict", None),  # these five entries match the "invalid bytes" entries in Test_SJISX0213.codectests
+ ("abc\xf8", "strict", None),
+ ("abc\x80\x80\x82\x84", "replace", u"abc\ufffd\uff44"),  # U+FFFD REPLACEMENT CHARACTER, then U+FF44 FULLWIDTH LATIN SMALL LETTER D
+ ("abc\x80\x80\x82\x84\x88", "replace", u"abc\ufffd\uff44\ufffd"),  # trailing lone 0x88 yields a second U+FFFD
+ ("abc\x80\x80\x82\x84def", "ignore", u"abc\uff44def"),  # text after the bad bytes ("def") is kept
+)
+
+class Test_SJIS_COMPAT(test_multibytecodec_support.TestBase, unittest.TestCase):  # data-only case for the 'shift_jis' codec
+ encoding = 'shift_jis'
+ tstring = test_multibytecodec_support.load_teststring('shift_jis')
+ codectests = shiftjis_commonenctests + (  # shared entries first, then shift_jis-specific ones
+ ("\\\x7e", "strict", u"\\\x7e"),  # 0x5c and 0x7e come back unchanged
+ ("\x81\x5f\x81\x61\x81\x7c", "strict", u"\uff3c\u2016\u2212"),  # U+FF3C FULLWIDTH REVERSE SOLIDUS, U+2016 DOUBLE VERTICAL LINE, U+2212 MINUS SIGN
+ )
+
+class Test_SJISX0213(test_multibytecodec_support.TestBase, unittest.TestCase):  # data-only case for the 'shift_jisx0213' codec
+ encoding = 'shift_jisx0213'
+ tstring = test_multibytecodec_support.load_teststring('shift_jisx0213')
+ codectests = (  # each entry is (input, error-handler name, expected output or None)
+ # invalid bytes (presumably None marks input that is expected to be rejected -- confirm against TestBase)
+ ("abc\x80\x80\x82\x84", "strict", None),
+ ("abc\xf8", "strict", None),
+ ("abc\x80\x80\x82\x84", "replace", u"abc\ufffd\uff44"),  # U+FFFD REPLACEMENT CHARACTER, then U+FF44 FULLWIDTH LATIN SMALL LETTER D
+ ("abc\x80\x80\x82\x84\x88", "replace", u"abc\ufffd\uff44\ufffd"),  # trailing lone 0x88 yields a second U+FFFD
+ ("abc\x80\x80\x82\x84def", "ignore", u"abc\uff44def"),  # text after the bad bytes ("def") is kept
+ # sjis vs cp932 (same inputs as in Test_CP932 and Test_SJIS_COMPAT; expected values differ here)
+ ("\\\x7e", "replace", u"\xa5\u203e"),  # 0x5c -> U+00A5 YEN SIGN, 0x7e -> U+203E OVERLINE
+ ("\x81\x5f\x81\x61\x81\x7c", "replace", u"\x5c\u2016\u2212"),  # U+005C REVERSE SOLIDUS, U+2016 DOUBLE VERTICAL LINE, U+2212 MINUS SIGN
+ )
+ xmlcharnametest = (  # pair of (unicode text, byte string that uses XML entity names)
+ u"\xab\u211c\xbb = \u2329\u1234\u232a",
+ "\x85G&real;\x85Q = &lang;&#4660;&rang;"  # &#4660; is decimal for U+1234; presumably consumed by an entity-name error-handler test in TestBase -- confirm
+ )
+
+def test_main():  # collect the five test classes defined in this module into one suite and run it
+ suite = unittest.TestSuite()
+ suite.addTest(unittest.makeSuite(Test_CP932))
+ suite.addTest(unittest.makeSuite(Test_EUC_JISX0213))
+ suite.addTest(unittest.makeSuite(Test_EUC_JP_COMPAT))
+ suite.addTest(unittest.makeSuite(Test_SJIS_COMPAT))
+ suite.addTest(unittest.makeSuite(Test_SJISX0213))
+ test_support.run_suite(suite)  # execution is delegated to the test_support helper imported at the top of the file
+
+if __name__ == "__main__":  # run the suite only when this file is executed as a script
+ test_main()