mirror of
https://github.com/python/cpython.git
synced 2025-07-16 15:55:18 +00:00

requires them. Disable executable bits and shebang lines in test and benchmark files in order to prevent using a random system python, and in source files of modules which don't provide command line interface. Fixed shebang line to use python3 executable in the unittestgui script.
90 lines
3.4 KiB
Python
90 lines
3.4 KiB
Python
#
|
|
# test_codecencodings_cn.py
|
|
# Codec encoding tests for PRC encodings.
|
|
#
|
|
|
|
from test import support
|
|
from test import multibytecodec_support
|
|
import unittest
|
|
|
|
class Test_GB2312(multibytecodec_support.TestBase, unittest.TestCase):
|
|
encoding = 'gb2312'
|
|
tstring = multibytecodec_support.load_teststring('gb2312')
|
|
codectests = (
|
|
# invalid bytes
|
|
(b"abc\x81\x81\xc1\xc4", "strict", None),
|
|
(b"abc\xc8", "strict", None),
|
|
(b"abc\x81\x81\xc1\xc4", "replace", "abc\ufffd\ufffd\u804a"),
|
|
(b"abc\x81\x81\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\u804a\ufffd"),
|
|
(b"abc\x81\x81\xc1\xc4", "ignore", "abc\u804a"),
|
|
(b"\xc1\x64", "strict", None),
|
|
)
|
|
|
|
class Test_GBK(multibytecodec_support.TestBase, unittest.TestCase):
|
|
encoding = 'gbk'
|
|
tstring = multibytecodec_support.load_teststring('gbk')
|
|
codectests = (
|
|
# invalid bytes
|
|
(b"abc\x80\x80\xc1\xc4", "strict", None),
|
|
(b"abc\xc8", "strict", None),
|
|
(b"abc\x80\x80\xc1\xc4", "replace", "abc\ufffd\ufffd\u804a"),
|
|
(b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\u804a\ufffd"),
|
|
(b"abc\x80\x80\xc1\xc4", "ignore", "abc\u804a"),
|
|
(b"\x83\x34\x83\x31", "strict", None),
|
|
("\u30fb", "strict", None),
|
|
)
|
|
|
|
class Test_GB18030(multibytecodec_support.TestBase, unittest.TestCase):
|
|
encoding = 'gb18030'
|
|
tstring = multibytecodec_support.load_teststring('gb18030')
|
|
codectests = (
|
|
# invalid bytes
|
|
(b"abc\x80\x80\xc1\xc4", "strict", None),
|
|
(b"abc\xc8", "strict", None),
|
|
(b"abc\x80\x80\xc1\xc4", "replace", "abc\ufffd\ufffd\u804a"),
|
|
(b"abc\x80\x80\xc1\xc4\xc8", "replace", "abc\ufffd\ufffd\u804a\ufffd"),
|
|
(b"abc\x80\x80\xc1\xc4", "ignore", "abc\u804a"),
|
|
(b"abc\x84\x39\x84\x39\xc1\xc4", "replace", "abc\ufffd9\ufffd9\u804a"),
|
|
("\u30fb", "strict", b"\x819\xa79"),
|
|
(b"abc\x84\x32\x80\x80def", "replace", 'abc\ufffd2\ufffd\ufffddef'),
|
|
(b"abc\x81\x30\x81\x30def", "strict", 'abc\x80def'),
|
|
(b"abc\x86\x30\x81\x30def", "replace", 'abc\ufffd0\ufffd0def'),
|
|
)
|
|
has_iso10646 = True
|
|
|
|
class Test_HZ(multibytecodec_support.TestBase, unittest.TestCase):
|
|
encoding = 'hz'
|
|
tstring = multibytecodec_support.load_teststring('hz')
|
|
codectests = (
|
|
# test '~\n' (3 lines)
|
|
(b'This sentence is in ASCII.\n'
|
|
b'The next sentence is in GB.~{<:Ky2;S{#,~}~\n'
|
|
b'~{NpJ)l6HK!#~}Bye.\n',
|
|
'strict',
|
|
'This sentence is in ASCII.\n'
|
|
'The next sentence is in GB.'
|
|
'\u5df1\u6240\u4e0d\u6b32\uff0c\u52ff\u65bd\u65bc\u4eba\u3002'
|
|
'Bye.\n'),
|
|
# test '~\n' (4 lines)
|
|
(b'This sentence is in ASCII.\n'
|
|
b'The next sentence is in GB.~\n'
|
|
b'~{<:Ky2;S{#,NpJ)l6HK!#~}~\n'
|
|
b'Bye.\n',
|
|
'strict',
|
|
'This sentence is in ASCII.\n'
|
|
'The next sentence is in GB.'
|
|
'\u5df1\u6240\u4e0d\u6b32\uff0c\u52ff\u65bd\u65bc\u4eba\u3002'
|
|
'Bye.\n'),
|
|
# invalid bytes
|
|
(b'ab~cd', 'replace', 'ab\uFFFDcd'),
|
|
(b'ab\xffcd', 'replace', 'ab\uFFFDcd'),
|
|
(b'ab~{\x81\x81\x41\x44~}cd', 'replace', 'ab\uFFFD\uFFFD\u804Acd'),
|
|
(b'ab~{\x41\x44~}cd', 'replace', 'ab\u804Acd'),
|
|
(b"ab~{\x79\x79\x41\x44~}cd", "replace", "ab\ufffd\ufffd\u804acd"),
|
|
)
|
|
|
|
def test_main():
|
|
support.run_unittest(__name__)
|
|
|
|
if __name__ == "__main__":
|
|
test_main()
|