mirror of
https://github.com/python/cpython.git
synced 2025-07-07 19:35:27 +00:00
gh-131020: py.exe launcher does not correctly detect a BOM when searching for the shebang (GH-131021)
This commit is contained in:
parent
5a484714c3
commit
36ef3bfe39
3 changed files with 29 additions and 5 deletions
|
@ -271,7 +271,10 @@ class RunPyMixin:
|
|||
@contextlib.contextmanager
|
||||
def script(self, content, encoding="utf-8"):
|
||||
file = Path(tempfile.mktemp(dir=os.getcwd()) + ".py")
|
||||
file.write_text(content, encoding=encoding)
|
||||
if isinstance(content, bytes):
|
||||
file.write_bytes(content)
|
||||
else:
|
||||
file.write_text(content, encoding=encoding)
|
||||
try:
|
||||
yield file
|
||||
finally:
|
||||
|
@ -624,6 +627,25 @@ class TestLauncher(unittest.TestCase, RunPyMixin):
|
|||
self.assertEqual("3.100", data["SearchInfo.tag"])
|
||||
self.assertEqual(f'X.Y.exe -prearg "{script}" -postarg', data["stdout"].strip())
|
||||
|
||||
def test_py_shebang_valid_bom(self):
|
||||
with self.py_ini(TEST_PY_DEFAULTS):
|
||||
content = "#! /usr/bin/python -prearg".encode("utf-8")
|
||||
with self.script(b"\xEF\xBB\xBF" + content) as script:
|
||||
data = self.run_py([script, "-postarg"])
|
||||
self.assertEqual("PythonTestSuite", data["SearchInfo.company"])
|
||||
self.assertEqual("3.100", data["SearchInfo.tag"])
|
||||
self.assertEqual(f"X.Y.exe -prearg {quote(script)} -postarg", data["stdout"].strip())
|
||||
|
||||
def test_py_shebang_invalid_bom(self):
|
||||
with self.py_ini(TEST_PY_DEFAULTS):
|
||||
content = "#! /usr/bin/python3 -prearg".encode("utf-8")
|
||||
with self.script(b"\xEF\xAA\xBF" + content) as script:
|
||||
data = self.run_py([script, "-postarg"])
|
||||
self.assertIn("Invalid BOM", data["stderr"])
|
||||
self.assertEqual("PythonTestSuite", data["SearchInfo.company"])
|
||||
self.assertEqual("3.100", data["SearchInfo.tag"])
|
||||
self.assertEqual(f"X.Y.exe {quote(script)} -postarg", data["stdout"].strip())
|
||||
|
||||
def test_py_handle_64_in_ini(self):
|
||||
with self.py_ini("\n".join(["[defaults]", "python=3.999-64"])):
|
||||
# Expect this to fail, but should get oldStyleTag flipped on
|
||||
|
|
|
@ -0,0 +1,2 @@
|
|||
:source:`pylauncher <PC/launcher2.c>` correctly detects a BOM when searching for the
|
||||
shebang. Fix by Chris Eibl.
|
|
@ -1062,7 +1062,7 @@ checkShebang(SearchInfo *search)
|
|||
}
|
||||
|
||||
DWORD bytesRead = 0;
|
||||
char buffer[4096];
|
||||
unsigned char buffer[4096];
|
||||
if (!ReadFile(hFile, buffer, sizeof(buffer), &bytesRead, NULL)) {
|
||||
debug(L"# Failed to read %s for shebang parsing (0x%08X)\n",
|
||||
scriptFile, GetLastError());
|
||||
|
@ -1075,7 +1075,7 @@ checkShebang(SearchInfo *search)
|
|||
free(scriptFile);
|
||||
|
||||
|
||||
char *b = buffer;
|
||||
unsigned char *b = buffer;
|
||||
bool onlyUtf8 = false;
|
||||
if (bytesRead > 3 && *b == 0xEF) {
|
||||
if (*++b == 0xBB && *++b == 0xBF) {
|
||||
|
@ -1096,13 +1096,13 @@ checkShebang(SearchInfo *search)
|
|||
++b;
|
||||
--bytesRead;
|
||||
while (--bytesRead > 0 && isspace(*++b)) { }
|
||||
char *start = b;
|
||||
const unsigned char *start = b;
|
||||
while (--bytesRead > 0 && *++b != '\r' && *b != '\n') { }
|
||||
wchar_t *shebang;
|
||||
int shebangLength;
|
||||
// We add 1 when bytesRead==0, as in that case we hit EOF and b points
|
||||
// to the last character in the file, not the newline
|
||||
int exitCode = _decodeShebang(search, start, (int)(b - start + (bytesRead == 0)), onlyUtf8, &shebang, &shebangLength);
|
||||
int exitCode = _decodeShebang(search, (const char*)start, (int)(b - start + (bytesRead == 0)), onlyUtf8, &shebang, &shebangLength);
|
||||
if (exitCode) {
|
||||
return exitCode;
|
||||
}
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue