mirror of
https://github.com/python/cpython.git
synced 2025-08-22 17:55:18 +00:00
Issue #14629: Raise SyntaxError in tokenizer.detect_encoding
if the first two lines have non-UTF-8 characters without an encoding declaration.
This commit is contained in:
parent
8e6e0fdb7f
commit
63674f4b52
3 changed files with 18 additions and 2 deletions
|
@ -292,9 +292,12 @@ def detect_encoding(readline):
|
|||
|
||||
def find_cookie(line):
|
||||
try:
|
||||
line_string = line.decode('ascii')
|
||||
# Decode as UTF-8. Either the line is an encoding declaration,
|
||||
# in which case it should be pure ASCII, or it must be UTF-8
|
||||
# per default encoding.
|
||||
line_string = line.decode('utf-8')
|
||||
except UnicodeDecodeError:
|
||||
return None
|
||||
raise SyntaxError("invalid or missing encoding declaration")
|
||||
|
||||
matches = cookie_re.findall(line_string)
|
||||
if not matches:
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue