Issue #11467: Fix urlparse behavior when handling URLs whose scheme-specific

part contains only digits. Patch by Santoso Wijaya.
This commit is contained in:
Senthil Kumaran 2011-04-15 18:07:33 +08:00
parent 1bb18cc39e
commit ddaea1c38a
3 changed files with 17 additions and 7 deletions

View file

@ -187,11 +187,15 @@ def urlsplit(url, scheme='', allow_fragments=True):
v = SplitResult(scheme, netloc, url, query, fragment)
_parse_cache[key] = v
return v
if url.endswith(':') or not url[i+1].isdigit():
for c in url[:i]:
if c not in scheme_chars:
break
else:
for c in url[:i]:
if c not in scheme_chars:
break
else:
try:
# make sure "url" is not actually a port number (in which case
# "scheme" is really part of the path)
_testportnum = int(url[i+1:])
except ValueError:
scheme, url = url[:i].lower(), url[i+1:]
if url[:2] == '//':