amk's fix attached to

[ 516299 ] urlparse can get fragments wrong
2025-09-26 18:29:57 +00:00 · 2002-03-18 13:06:00 +00:00 · 2002-03-18 13:06:00 +00:00 · bd3e771a97
commit bd3e771a97
parent 5c137c2251
3 changed files with 26 additions and 1 deletion
--- a/Lib/test/output/test_urlparse
+++ b/Lib/test/output/test_urlparse
@@ -1,4 +1,9 @@
 test_urlparse
 http://www.python.org = ('http', 'www.python.org', '', '', '', '')
 http://www.python.org#abc = ('http', 'www.python.org', '', '', '', 'abc')
 http://www.python.org/#abc = ('http', 'www.python.org', '/', '', '', 'abc')
 http://a/b/c/d;p?q#f = ('http', 'a', '/b/c/d', 'p', 'q', 'f')
 urlparse.urljoin() tests
 g:h           = 'g:h'
--- a/Lib/test/test_urlparse.py
+++ b/Lib/test/test_urlparse.py
@@ -4,6 +4,24 @@ errors = 0
 RFC1808_BASE = "http://a/b/c/d;p?q#f"
 for url, expected in [('http://www.python.org',
                       ('http', 'www.python.org', '', '', '', '')),
                      ('http://www.python.org#abc',
                       ('http', 'www.python.org', '', '', '', 'abc')),
                      ('http://www.python.org/#abc',
                       ('http', 'www.python.org', '/', '', '', 'abc')),
                      (RFC1808_BASE,
                       ('http', 'a', '/b/c/d', 'p', 'q', 'f')),
                      ]:
    result = urlparse.urlparse(url)
    print "%-13s = %r" % (url, result)
    if result != expected:
        errors += 1
        print "urlparse(%r)" % url
        print ("expected %r,\n"
               "     got %r") % (expected, result)
 print
 def checkJoin(relurl, expected):
    global errors
    result = urlparse.urljoin(RFC1808_BASE, relurl)
--- a/Lib/urlparse.py
+++ b/Lib/urlparse.py
@@ -86,6 +86,8 @@ def urlsplit(url, scheme='', allow_fragments=1):
            url = url[i+1:]
            if url[:2] == '//':
                i = url.find('/', 2)
                if i < 0:
                    i = url.find('#')
                    if i < 0:
                        i = len(url)
                netloc = url[2:i]