mirror of
				https://github.com/python/cpython.git
				synced 2025-10-25 07:48:51 +00:00 
			
		
		
		
	 579d5cd643
			
		
	
	
		579d5cd643
		
	
	
	
	
		
			
			parent: 80003:be83cbf4a789 parent: 80006:32df036e6b75 user: Georg Brandl <georg@python.org> date: Sun Oct 28 10:50:11 2012 +0100 summary: merge with 3.3
		
			
				
	
	
		
			363 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			363 lines
		
	
	
	
		
			13 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| #!/usr/bin/env python3
 | |
| 
 | |
| import unittest
 | |
| from test import support
 | |
| from test.test_urllib2 import sanepathname2url
 | |
| 
 | |
| import os
 | |
| import socket
 | |
| import urllib.error
 | |
| import urllib.request
 | |
| import sys
 | |
| try:
 | |
|     import ssl
 | |
| except ImportError:
 | |
|     ssl = None
 | |
| 
 | |
| TIMEOUT = 60  # seconds
 | |
| 
 | |
| 
 | |
| def _retry_thrice(func, exc, *args, **kwargs):
 | |
|     for i in range(3):
 | |
|         try:
 | |
|             return func(*args, **kwargs)
 | |
|         except exc as e:
 | |
|             last_exc = e
 | |
|             continue
 | |
|         except:
 | |
|             raise
 | |
|     raise last_exc
 | |
| 
 | |
| def _wrap_with_retry_thrice(func, exc):
 | |
|     def wrapped(*args, **kwargs):
 | |
|         return _retry_thrice(func, exc, *args, **kwargs)
 | |
|     return wrapped
 | |
| 
 | |
| # Connecting to remote hosts is flaky.  Make it more robust by retrying
 | |
| # the connection several times.
 | |
| _urlopen_with_retry = _wrap_with_retry_thrice(urllib.request.urlopen,
 | |
|                                               urllib.error.URLError)
 | |
| 
 | |
| 
 | |
| class AuthTests(unittest.TestCase):
 | |
|     """Tests urllib2 authentication features."""
 | |
| 
 | |
| ## Disabled at the moment since there is no page under python.org which
 | |
| ## could be used to HTTP authentication.
 | |
| #
 | |
| #    def test_basic_auth(self):
 | |
| #        import http.client
 | |
| #
 | |
| #        test_url = "http://www.python.org/test/test_urllib2/basic_auth"
 | |
| #        test_hostport = "www.python.org"
 | |
| #        test_realm = 'Test Realm'
 | |
| #        test_user = 'test.test_urllib2net'
 | |
| #        test_password = 'blah'
 | |
| #
 | |
| #        # failure
 | |
| #        try:
 | |
| #            _urlopen_with_retry(test_url)
 | |
| #        except urllib2.HTTPError, exc:
 | |
| #            self.assertEqual(exc.code, 401)
 | |
| #        else:
 | |
| #            self.fail("urlopen() should have failed with 401")
 | |
| #
 | |
| #        # success
 | |
| #        auth_handler = urllib2.HTTPBasicAuthHandler()
 | |
| #        auth_handler.add_password(test_realm, test_hostport,
 | |
| #                                  test_user, test_password)
 | |
| #        opener = urllib2.build_opener(auth_handler)
 | |
| #        f = opener.open('http://localhost/')
 | |
| #        response = _urlopen_with_retry("http://www.python.org/")
 | |
| #
 | |
| #        # The 'userinfo' URL component is deprecated by RFC 3986 for security
 | |
| #        # reasons, let's not implement it!  (it's already implemented for proxy
 | |
| #        # specification strings (that is, URLs or authorities specifying a
 | |
| #        # proxy), so we must keep that)
 | |
| #        self.assertRaises(http.client.InvalidURL,
 | |
| #                          urllib2.urlopen, "http://evil:thing@example.com")
 | |
| 
 | |
| 
 | |
| class CloseSocketTest(unittest.TestCase):
 | |
| 
 | |
|     def test_close(self):
 | |
|         # calling .close() on urllib2's response objects should close the
 | |
|         # underlying socket
 | |
| 
 | |
|         response = _urlopen_with_retry("http://www.python.org/")
 | |
|         sock = response.fp
 | |
|         self.assertTrue(not sock.closed)
 | |
|         response.close()
 | |
|         self.assertTrue(sock.closed)
 | |
| 
 | |
| class OtherNetworkTests(unittest.TestCase):
 | |
|     def setUp(self):
 | |
|         if 0:  # for debugging
 | |
|             import logging
 | |
|             logger = logging.getLogger("test_urllib2net")
 | |
|             logger.addHandler(logging.StreamHandler())
 | |
| 
 | |
|     # XXX The rest of these tests aren't very good -- they don't check much.
 | |
|     # They do sometimes catch some major disasters, though.
 | |
| 
 | |
|     def test_ftp(self):
 | |
|         urls = [
 | |
|             'ftp://ftp.kernel.org/pub/linux/kernel/README',
 | |
|             'ftp://ftp.kernel.org/pub/linux/kernel/non-existent-file',
 | |
|             #'ftp://ftp.kernel.org/pub/leenox/kernel/test',
 | |
|             'ftp://gatekeeper.research.compaq.com/pub/DEC/SRC'
 | |
|                 '/research-reports/00README-Legal-Rules-Regs',
 | |
|             ]
 | |
|         self._test_urls(urls, self._extra_handlers())
 | |
| 
 | |
|     def test_file(self):
 | |
|         TESTFN = support.TESTFN
 | |
|         f = open(TESTFN, 'w')
 | |
|         try:
 | |
|             f.write('hi there\n')
 | |
|             f.close()
 | |
|             urls = [
 | |
|                 'file:' + sanepathname2url(os.path.abspath(TESTFN)),
 | |
|                 ('file:///nonsensename/etc/passwd', None,
 | |
|                  urllib.error.URLError),
 | |
|                 ]
 | |
|             self._test_urls(urls, self._extra_handlers(), retry=True)
 | |
|         finally:
 | |
|             os.remove(TESTFN)
 | |
| 
 | |
|         self.assertRaises(ValueError, urllib.request.urlopen,'./relative_path/to/file')
 | |
| 
 | |
|     # XXX Following test depends on machine configurations that are internal
 | |
|     # to CNRI.  Need to set up a public server with the right authentication
 | |
|     # configuration for test purposes.
 | |
| 
 | |
| ##     def test_cnri(self):
 | |
| ##         if socket.gethostname() == 'bitdiddle':
 | |
| ##             localhost = 'bitdiddle.cnri.reston.va.us'
 | |
| ##         elif socket.gethostname() == 'bitdiddle.concentric.net':
 | |
| ##             localhost = 'localhost'
 | |
| ##         else:
 | |
| ##             localhost = None
 | |
| ##         if localhost is not None:
 | |
| ##             urls = [
 | |
| ##                 'file://%s/etc/passwd' % localhost,
 | |
| ##                 'http://%s/simple/' % localhost,
 | |
| ##                 'http://%s/digest/' % localhost,
 | |
| ##                 'http://%s/not/found.h' % localhost,
 | |
| ##                 ]
 | |
| 
 | |
| ##             bauth = HTTPBasicAuthHandler()
 | |
| ##             bauth.add_password('basic_test_realm', localhost, 'jhylton',
 | |
| ##                                'password')
 | |
| ##             dauth = HTTPDigestAuthHandler()
 | |
| ##             dauth.add_password('digest_test_realm', localhost, 'jhylton',
 | |
| ##                                'password')
 | |
| 
 | |
| ##             self._test_urls(urls, self._extra_handlers()+[bauth, dauth])
 | |
| 
 | |
|     def test_urlwithfrag(self):
 | |
|         urlwith_frag = "http://docs.python.org/2/glossary.html#glossary"
 | |
|         with support.transient_internet(urlwith_frag):
 | |
|             req = urllib.request.Request(urlwith_frag)
 | |
|             res = urllib.request.urlopen(req)
 | |
|             self.assertEqual(res.geturl(),
 | |
|                     "http://docs.python.org/2/glossary.html#glossary")
 | |
| 
 | |
|     def test_custom_headers(self):
 | |
|         url = "http://www.example.com"
 | |
|         with support.transient_internet(url):
 | |
|             opener = urllib.request.build_opener()
 | |
|             request = urllib.request.Request(url)
 | |
|             self.assertFalse(request.header_items())
 | |
|             opener.open(request)
 | |
|             self.assertTrue(request.header_items())
 | |
|             self.assertTrue(request.has_header('User-agent'))
 | |
|             request.add_header('User-Agent','Test-Agent')
 | |
|             opener.open(request)
 | |
|             self.assertEqual(request.get_header('User-agent'),'Test-Agent')
 | |
| 
 | |
|     def test_sites_no_connection_close(self):
 | |
|         # Some sites do not send Connection: close header.
 | |
|         # Verify that those work properly. (#issue12576)
 | |
| 
 | |
|         URL = 'http://www.imdb.com' # mangles Connection:close
 | |
| 
 | |
|         with support.transient_internet(URL):
 | |
|             try:
 | |
|                 with urllib.request.urlopen(URL) as res:
 | |
|                     pass
 | |
|             except ValueError as e:
 | |
|                 self.fail("urlopen failed for site not sending \
 | |
|                            Connection:close")
 | |
|             else:
 | |
|                 self.assertTrue(res)
 | |
| 
 | |
|             req = urllib.request.urlopen(URL)
 | |
|             res = req.read()
 | |
|             self.assertTrue(res)
 | |
| 
 | |
|     def _test_urls(self, urls, handlers, retry=True):
 | |
|         import time
 | |
|         import logging
 | |
|         debug = logging.getLogger("test_urllib2").debug
 | |
| 
 | |
|         urlopen = urllib.request.build_opener(*handlers).open
 | |
|         if retry:
 | |
|             urlopen = _wrap_with_retry_thrice(urlopen, urllib.error.URLError)
 | |
| 
 | |
|         for url in urls:
 | |
|             if isinstance(url, tuple):
 | |
|                 url, req, expected_err = url
 | |
|             else:
 | |
|                 req = expected_err = None
 | |
| 
 | |
|             with support.transient_internet(url):
 | |
|                 debug(url)
 | |
|                 try:
 | |
|                     f = urlopen(url, req, TIMEOUT)
 | |
|                 except EnvironmentError as err:
 | |
|                     debug(err)
 | |
|                     if expected_err:
 | |
|                         msg = ("Didn't get expected error(s) %s for %s %s, got %s: %s" %
 | |
|                                (expected_err, url, req, type(err), err))
 | |
|                         self.assertIsInstance(err, expected_err, msg)
 | |
|                 except urllib.error.URLError as err:
 | |
|                     if isinstance(err[0], socket.timeout):
 | |
|                         print("<timeout: %s>" % url, file=sys.stderr)
 | |
|                         continue
 | |
|                     else:
 | |
|                         raise
 | |
|                 else:
 | |
|                     try:
 | |
|                         with support.time_out, \
 | |
|                              support.socket_peer_reset, \
 | |
|                              support.ioerror_peer_reset:
 | |
|                             buf = f.read()
 | |
|                             debug("read %d bytes" % len(buf))
 | |
|                     except socket.timeout:
 | |
|                         print("<timeout: %s>" % url, file=sys.stderr)
 | |
|                     f.close()
 | |
|             debug("******** next url coming up...")
 | |
|             time.sleep(0.1)
 | |
| 
 | |
|     def _extra_handlers(self):
 | |
|         handlers = []
 | |
| 
 | |
|         cfh = urllib.request.CacheFTPHandler()
 | |
|         self.addCleanup(cfh.clear_cache)
 | |
|         cfh.setTimeout(1)
 | |
|         handlers.append(cfh)
 | |
| 
 | |
|         return handlers
 | |
| 
 | |
| 
 | |
| class TimeoutTest(unittest.TestCase):
 | |
|     def test_http_basic(self):
 | |
|         self.assertTrue(socket.getdefaulttimeout() is None)
 | |
|         url = "http://www.python.org"
 | |
|         with support.transient_internet(url, timeout=None):
 | |
|             u = _urlopen_with_retry(url)
 | |
|             self.addCleanup(u.close)
 | |
|             self.assertTrue(u.fp.raw._sock.gettimeout() is None)
 | |
| 
 | |
|     def test_http_default_timeout(self):
 | |
|         self.assertTrue(socket.getdefaulttimeout() is None)
 | |
|         url = "http://www.python.org"
 | |
|         with support.transient_internet(url):
 | |
|             socket.setdefaulttimeout(60)
 | |
|             try:
 | |
|                 u = _urlopen_with_retry(url)
 | |
|                 self.addCleanup(u.close)
 | |
|             finally:
 | |
|                 socket.setdefaulttimeout(None)
 | |
|             self.assertEqual(u.fp.raw._sock.gettimeout(), 60)
 | |
| 
 | |
|     def test_http_no_timeout(self):
 | |
|         self.assertTrue(socket.getdefaulttimeout() is None)
 | |
|         url = "http://www.python.org"
 | |
|         with support.transient_internet(url):
 | |
|             socket.setdefaulttimeout(60)
 | |
|             try:
 | |
|                 u = _urlopen_with_retry(url, timeout=None)
 | |
|                 self.addCleanup(u.close)
 | |
|             finally:
 | |
|                 socket.setdefaulttimeout(None)
 | |
|             self.assertTrue(u.fp.raw._sock.gettimeout() is None)
 | |
| 
 | |
|     def test_http_timeout(self):
 | |
|         url = "http://www.python.org"
 | |
|         with support.transient_internet(url):
 | |
|             u = _urlopen_with_retry(url, timeout=120)
 | |
|             self.addCleanup(u.close)
 | |
|             self.assertEqual(u.fp.raw._sock.gettimeout(), 120)
 | |
| 
 | |
|     FTP_HOST = "ftp://ftp.mirror.nl/pub/gnu/"
 | |
| 
 | |
|     def test_ftp_basic(self):
 | |
|         self.assertTrue(socket.getdefaulttimeout() is None)
 | |
|         with support.transient_internet(self.FTP_HOST, timeout=None):
 | |
|             u = _urlopen_with_retry(self.FTP_HOST)
 | |
|             self.addCleanup(u.close)
 | |
|             self.assertTrue(u.fp.fp.raw._sock.gettimeout() is None)
 | |
| 
 | |
|     def test_ftp_default_timeout(self):
 | |
|         self.assertTrue(socket.getdefaulttimeout() is None)
 | |
|         with support.transient_internet(self.FTP_HOST):
 | |
|             socket.setdefaulttimeout(60)
 | |
|             try:
 | |
|                 u = _urlopen_with_retry(self.FTP_HOST)
 | |
|                 self.addCleanup(u.close)
 | |
|             finally:
 | |
|                 socket.setdefaulttimeout(None)
 | |
|             self.assertEqual(u.fp.fp.raw._sock.gettimeout(), 60)
 | |
| 
 | |
|     def test_ftp_no_timeout(self):
 | |
|         self.assertTrue(socket.getdefaulttimeout() is None)
 | |
|         with support.transient_internet(self.FTP_HOST):
 | |
|             socket.setdefaulttimeout(60)
 | |
|             try:
 | |
|                 u = _urlopen_with_retry(self.FTP_HOST, timeout=None)
 | |
|                 self.addCleanup(u.close)
 | |
|             finally:
 | |
|                 socket.setdefaulttimeout(None)
 | |
|             self.assertTrue(u.fp.fp.raw._sock.gettimeout() is None)
 | |
| 
 | |
|     def test_ftp_timeout(self):
 | |
|         with support.transient_internet(self.FTP_HOST):
 | |
|             u = _urlopen_with_retry(self.FTP_HOST, timeout=60)
 | |
|             self.addCleanup(u.close)
 | |
|             self.assertEqual(u.fp.fp.raw._sock.gettimeout(), 60)
 | |
| 
 | |
| 
 | |
| @unittest.skipUnless(ssl, "requires SSL support")
 | |
| class HTTPSTests(unittest.TestCase):
 | |
| 
 | |
|     def test_sni(self):
 | |
|         self.skipTest("test disabled - test server needed")
 | |
|         # Checks that Server Name Indication works, if supported by the
 | |
|         # OpenSSL linked to.
 | |
|         # The ssl module itself doesn't have server-side support for SNI,
 | |
|         # so we rely on a third-party test site.
 | |
|         expect_sni = ssl.HAS_SNI
 | |
|         with support.transient_internet("XXX"):
 | |
|             u = urllib.request.urlopen("XXX")
 | |
|             contents = u.readall()
 | |
|             if expect_sni:
 | |
|                 self.assertIn(b"Great", contents)
 | |
|                 self.assertNotIn(b"Unfortunately", contents)
 | |
|             else:
 | |
|                 self.assertNotIn(b"Great", contents)
 | |
|                 self.assertIn(b"Unfortunately", contents)
 | |
| 
 | |
| 
 | |
| def test_main():
 | |
|     support.requires("network")
 | |
|     support.run_unittest(AuthTests,
 | |
|                          HTTPSTests,
 | |
|                          OtherNetworkTests,
 | |
|                          CloseSocketTest,
 | |
|                          TimeoutTest,
 | |
|                          )
 | |
| 
 | |
| if __name__ == "__main__":
 | |
|     test_main()
 |