mirror of
https://github.com/python/cpython.git
synced 2025-07-24 19:54:21 +00:00
260 lines
9.3 KiB
Python
260 lines
9.3 KiB
Python
"""Tests for the Tools/i18n/msgfmt.py tool."""
|
|
|
|
import json
|
|
import sys
|
|
import unittest
|
|
from gettext import GNUTranslations
|
|
from pathlib import Path
|
|
|
|
from test.support.os_helper import temp_cwd
|
|
from test.support.script_helper import assert_python_failure, assert_python_ok
|
|
from test.test_tools import imports_under_tool, skip_if_missing, toolsdir
|
|
|
|
|
|
skip_if_missing('i18n')
|
|
|
|
data_dir = (Path(__file__).parent / 'msgfmt_data').resolve()
|
|
script_dir = Path(toolsdir) / 'i18n'
|
|
msgfmt_py = script_dir / 'msgfmt.py'
|
|
|
|
with imports_under_tool("i18n"):
|
|
import msgfmt
|
|
|
|
|
|
def compile_messages(po_file, mo_file):
|
|
assert_python_ok(msgfmt_py, '-o', mo_file, po_file)
|
|
|
|
|
|
class CompilationTest(unittest.TestCase):
|
|
|
|
def test_compilation(self):
|
|
self.maxDiff = None
|
|
with temp_cwd():
|
|
for po_file in data_dir.glob('*.po'):
|
|
with self.subTest(po_file=po_file):
|
|
mo_file = po_file.with_suffix('.mo')
|
|
with open(mo_file, 'rb') as f:
|
|
expected = GNUTranslations(f)
|
|
|
|
tmp_mo_file = mo_file.name
|
|
compile_messages(po_file, tmp_mo_file)
|
|
with open(tmp_mo_file, 'rb') as f:
|
|
actual = GNUTranslations(f)
|
|
|
|
self.assertDictEqual(actual._catalog, expected._catalog)
|
|
|
|
def test_translations(self):
|
|
with open(data_dir / 'general.mo', 'rb') as f:
|
|
t = GNUTranslations(f)
|
|
|
|
self.assertEqual(t.gettext('foo'), 'foo')
|
|
self.assertEqual(t.gettext('bar'), 'baz')
|
|
self.assertEqual(t.pgettext('abc', 'foo'), 'bar')
|
|
self.assertEqual(t.pgettext('xyz', 'foo'), 'bar')
|
|
self.assertEqual(t.gettext('Multilinestring'), 'Multilinetranslation')
|
|
self.assertEqual(t.gettext('"escapes"'), '"translated"')
|
|
self.assertEqual(t.gettext('\n newlines \n'), '\n translated \n')
|
|
self.assertEqual(t.ngettext('One email sent.', '%d emails sent.', 1),
|
|
'One email sent.')
|
|
self.assertEqual(t.ngettext('One email sent.', '%d emails sent.', 2),
|
|
'%d emails sent.')
|
|
self.assertEqual(t.npgettext('abc', 'One email sent.',
|
|
'%d emails sent.', 1),
|
|
'One email sent.')
|
|
self.assertEqual(t.npgettext('abc', 'One email sent.',
|
|
'%d emails sent.', 2),
|
|
'%d emails sent.')
|
|
|
|
def test_invalid_msgid_plural(self):
|
|
with temp_cwd():
|
|
Path('invalid.po').write_text('''\
|
|
msgid_plural "plural"
|
|
msgstr[0] "singular"
|
|
''')
|
|
|
|
res = assert_python_failure(msgfmt_py, 'invalid.po')
|
|
err = res.err.decode('utf-8')
|
|
self.assertIn('msgid_plural not preceded by msgid', err)
|
|
|
|
def test_plural_without_msgid_plural(self):
|
|
with temp_cwd():
|
|
Path('invalid.po').write_text('''\
|
|
msgid "foo"
|
|
msgstr[0] "bar"
|
|
''')
|
|
|
|
res = assert_python_failure(msgfmt_py, 'invalid.po')
|
|
err = res.err.decode('utf-8')
|
|
self.assertIn('plural without msgid_plural', err)
|
|
|
|
def test_indexed_msgstr_without_msgid_plural(self):
|
|
with temp_cwd():
|
|
Path('invalid.po').write_text('''\
|
|
msgid "foo"
|
|
msgid_plural "foos"
|
|
msgstr "bar"
|
|
''')
|
|
|
|
res = assert_python_failure(msgfmt_py, 'invalid.po')
|
|
err = res.err.decode('utf-8')
|
|
self.assertIn('indexed msgstr required for plural', err)
|
|
|
|
def test_generic_syntax_error(self):
|
|
with temp_cwd():
|
|
Path('invalid.po').write_text('''\
|
|
"foo"
|
|
''')
|
|
|
|
res = assert_python_failure(msgfmt_py, 'invalid.po')
|
|
err = res.err.decode('utf-8')
|
|
self.assertIn('Syntax error', err)
|
|
|
|
|
|
class POParserTest(unittest.TestCase):
|
|
@classmethod
|
|
def tearDownClass(cls):
|
|
# msgfmt uses a global variable to store messages,
|
|
# clear it after the tests.
|
|
msgfmt.MESSAGES.clear()
|
|
|
|
def test_strings(self):
|
|
# Test that the PO parser correctly handles and unescape
|
|
# strings in the PO file.
|
|
# The PO file format allows for a variety of escape sequences,
|
|
# octal and hex escapes.
|
|
valid_strings = (
|
|
# empty strings
|
|
('""', ''),
|
|
('"" "" ""', ''),
|
|
# allowed escape sequences
|
|
(r'"\\"', '\\'),
|
|
(r'"\""', '"'),
|
|
(r'"\t"', '\t'),
|
|
(r'"\n"', '\n'),
|
|
(r'"\r"', '\r'),
|
|
(r'"\f"', '\f'),
|
|
(r'"\a"', '\a'),
|
|
(r'"\b"', '\b'),
|
|
(r'"\v"', '\v'),
|
|
# non-empty strings
|
|
('"foo"', 'foo'),
|
|
('"foo" "bar"', 'foobar'),
|
|
('"foo""bar"', 'foobar'),
|
|
('"" "foo" ""', 'foo'),
|
|
# newlines and tabs
|
|
(r'"foo\nbar"', 'foo\nbar'),
|
|
(r'"foo\n" "bar"', 'foo\nbar'),
|
|
(r'"foo\tbar"', 'foo\tbar'),
|
|
(r'"foo\t" "bar"', 'foo\tbar'),
|
|
# escaped quotes
|
|
(r'"foo\"bar"', 'foo"bar'),
|
|
(r'"foo\"" "bar"', 'foo"bar'),
|
|
(r'"foo\\" "bar"', 'foo\\bar'),
|
|
# octal escapes
|
|
(r'"\120\171\164\150\157\156"', 'Python'),
|
|
(r'"\120\171\164" "\150\157\156"', 'Python'),
|
|
(r'"\"\120\171\164" "\150\157\156\""', '"Python"'),
|
|
# hex escapes
|
|
(r'"\x50\x79\x74\x68\x6f\x6e"', 'Python'),
|
|
(r'"\x50\x79\x74" "\x68\x6f\x6e"', 'Python'),
|
|
(r'"\"\x50\x79\x74" "\x68\x6f\x6e\""', '"Python"'),
|
|
)
|
|
|
|
with temp_cwd():
|
|
for po_string, expected in valid_strings:
|
|
with self.subTest(po_string=po_string):
|
|
# Construct a PO file with a single entry,
|
|
# compile it, read it into a catalog and
|
|
# check the result.
|
|
po = f'msgid {po_string}\nmsgstr "translation"'
|
|
Path('messages.po').write_text(po)
|
|
# Reset the global MESSAGES dictionary
|
|
msgfmt.MESSAGES.clear()
|
|
msgfmt.make('messages.po', 'messages.mo')
|
|
|
|
with open('messages.mo', 'rb') as f:
|
|
actual = GNUTranslations(f)
|
|
|
|
self.assertDictEqual(actual._catalog, {expected: 'translation'})
|
|
|
|
invalid_strings = (
|
|
# "''", # invalid but currently accepted
|
|
'"',
|
|
'"""',
|
|
'"" "',
|
|
'foo',
|
|
'"" "foo',
|
|
'"foo" foo',
|
|
'42',
|
|
'"" 42 ""',
|
|
# disallowed escape sequences
|
|
# r'"\'"', # invalid but currently accepted
|
|
# r'"\e"', # invalid but currently accepted
|
|
# r'"\8"', # invalid but currently accepted
|
|
# r'"\9"', # invalid but currently accepted
|
|
r'"\x"',
|
|
r'"\u1234"',
|
|
r'"\N{ROMAN NUMERAL NINE}"'
|
|
)
|
|
with temp_cwd():
|
|
for invalid_string in invalid_strings:
|
|
with self.subTest(string=invalid_string):
|
|
po = f'msgid {invalid_string}\nmsgstr "translation"'
|
|
Path('messages.po').write_text(po)
|
|
# Reset the global MESSAGES dictionary
|
|
msgfmt.MESSAGES.clear()
|
|
with self.assertRaises(Exception):
|
|
msgfmt.make('messages.po', 'messages.mo')
|
|
|
|
|
|
class CLITest(unittest.TestCase):
|
|
|
|
def test_help(self):
|
|
for option in ('--help', '-h'):
|
|
res = assert_python_ok(msgfmt_py, option)
|
|
err = res.err.decode('utf-8')
|
|
self.assertIn('Generate binary message catalog from textual translation description.', err)
|
|
|
|
def test_version(self):
|
|
for option in ('--version', '-V'):
|
|
res = assert_python_ok(msgfmt_py, option)
|
|
out = res.out.decode('utf-8').strip()
|
|
self.assertEqual('msgfmt.py 1.2', out)
|
|
|
|
def test_invalid_option(self):
|
|
res = assert_python_failure(msgfmt_py, '--invalid-option')
|
|
err = res.err.decode('utf-8')
|
|
self.assertIn('Generate binary message catalog from textual translation description.', err)
|
|
self.assertIn('option --invalid-option not recognized', err)
|
|
|
|
def test_no_input_file(self):
|
|
res = assert_python_ok(msgfmt_py)
|
|
err = res.err.decode('utf-8').replace('\r\n', '\n')
|
|
self.assertIn('No input file given\n'
|
|
"Try `msgfmt --help' for more information.", err)
|
|
|
|
def test_nonexistent_file(self):
|
|
assert_python_failure(msgfmt_py, 'nonexistent.po')
|
|
|
|
|
|
def update_catalog_snapshots():
|
|
for po_file in data_dir.glob('*.po'):
|
|
mo_file = po_file.with_suffix('.mo')
|
|
compile_messages(po_file, mo_file)
|
|
# Create a human-readable JSON file which is
|
|
# easier to review than the binary .mo file.
|
|
with open(mo_file, 'rb') as f:
|
|
translations = GNUTranslations(f)
|
|
catalog_file = po_file.with_suffix('.json')
|
|
with open(catalog_file, 'w') as f:
|
|
data = translations._catalog.items()
|
|
data = sorted(data, key=lambda x: (isinstance(x[0], tuple), x[0]))
|
|
json.dump(data, f, indent=4)
|
|
f.write('\n')
|
|
|
|
|
|
if __name__ == '__main__':
|
|
if len(sys.argv) > 1 and sys.argv[1] == '--snapshot-update':
|
|
update_catalog_snapshots()
|
|
sys.exit(0)
|
|
unittest.main()
|