/Lib/test/test_urllib2net.py
https://bitbucket.org/arigo/cpython-withatomic/ · Python · 364 lines · 240 code · 51 blank · 73 comment · 51 complexity · a6cb7830efa24ff0e2a3e3c8a9f54d10 MD5 · raw file
- #!/usr/bin/env python3
- import unittest
- from test import support
- from test.test_urllib2 import sanepathname2url
- import os
- import socket
- import urllib.error
- import urllib.request
- import sys
- try:
- import ssl
- except ImportError:
- ssl = None
- TIMEOUT = 60 # seconds
- def _retry_thrice(func, exc, *args, **kwargs):
- for i in range(3):
- try:
- return func(*args, **kwargs)
- except exc as e:
- last_exc = e
- continue
- except:
- raise
- raise last_exc
- def _wrap_with_retry_thrice(func, exc):
- def wrapped(*args, **kwargs):
- return _retry_thrice(func, exc, *args, **kwargs)
- return wrapped
- # Connecting to remote hosts is flaky. Make it more robust by retrying
- # the connection several times.
- _urlopen_with_retry = _wrap_with_retry_thrice(urllib.request.urlopen,
- urllib.error.URLError)
- class AuthTests(unittest.TestCase):
- """Tests urllib2 authentication features."""
- ## Disabled at the moment since there is no page under python.org which
- ## could be used to HTTP authentication.
- #
- # def test_basic_auth(self):
- # import http.client
- #
- # test_url = "http://www.python.org/test/test_urllib2/basic_auth"
- # test_hostport = "www.python.org"
- # test_realm = 'Test Realm'
- # test_user = 'test.test_urllib2net'
- # test_password = 'blah'
- #
- # # failure
- # try:
- # _urlopen_with_retry(test_url)
- # except urllib2.HTTPError, exc:
- # self.assertEqual(exc.code, 401)
- # else:
- # self.fail("urlopen() should have failed with 401")
- #
- # # success
- # auth_handler = urllib2.HTTPBasicAuthHandler()
- # auth_handler.add_password(test_realm, test_hostport,
- # test_user, test_password)
- # opener = urllib2.build_opener(auth_handler)
- # f = opener.open('http://localhost/')
- # response = _urlopen_with_retry("http://www.python.org/")
- #
- # # The 'userinfo' URL component is deprecated by RFC 3986 for security
- # # reasons, let's not implement it! (it's already implemented for proxy
- # # specification strings (that is, URLs or authorities specifying a
- # # proxy), so we must keep that)
- # self.assertRaises(http.client.InvalidURL,
- # urllib2.urlopen, "http://evil:thing@example.com")
- class CloseSocketTest(unittest.TestCase):
- def test_close(self):
- # calling .close() on urllib2's response objects should close the
- # underlying socket
- url = "http://www.python.org/"
- with support.transient_internet(url):
- response = _urlopen_with_retry(url)
- sock = response.fp
- self.assertTrue(not sock.closed)
- response.close()
- self.assertTrue(sock.closed)
- class OtherNetworkTests(unittest.TestCase):
- def setUp(self):
- if 0: # for debugging
- import logging
- logger = logging.getLogger("test_urllib2net")
- logger.addHandler(logging.StreamHandler())
- # XXX The rest of these tests aren't very good -- they don't check much.
- # They do sometimes catch some major disasters, though.
- def test_ftp(self):
- urls = [
- 'ftp://ftp.kernel.org/pub/linux/kernel/README',
- 'ftp://ftp.kernel.org/pub/linux/kernel/non-existent-file',
- #'ftp://ftp.kernel.org/pub/leenox/kernel/test',
- 'ftp://gatekeeper.research.compaq.com/pub/DEC/SRC'
- '/research-reports/00README-Legal-Rules-Regs',
- ]
- self._test_urls(urls, self._extra_handlers())
- def test_file(self):
- TESTFN = support.TESTFN
- f = open(TESTFN, 'w')
- try:
- f.write('hi there\n')
- f.close()
- urls = [
- 'file:' + sanepathname2url(os.path.abspath(TESTFN)),
- ('file:///nonsensename/etc/passwd', None,
- urllib.error.URLError),
- ]
- self._test_urls(urls, self._extra_handlers(), retry=True)
- finally:
- os.remove(TESTFN)
- self.assertRaises(ValueError, urllib.request.urlopen,'./relative_path/to/file')
- # XXX Following test depends on machine configurations that are internal
- # to CNRI. Need to set up a public server with the right authentication
- # configuration for test purposes.
- ## def test_cnri(self):
- ## if socket.gethostname() == 'bitdiddle':
- ## localhost = 'bitdiddle.cnri.reston.va.us'
- ## elif socket.gethostname() == 'bitdiddle.concentric.net':
- ## localhost = 'localhost'
- ## else:
- ## localhost = None
- ## if localhost is not None:
- ## urls = [
- ## 'file://%s/etc/passwd' % localhost,
- ## 'http://%s/simple/' % localhost,
- ## 'http://%s/digest/' % localhost,
- ## 'http://%s/not/found.h' % localhost,
- ## ]
- ## bauth = HTTPBasicAuthHandler()
- ## bauth.add_password('basic_test_realm', localhost, 'jhylton',
- ## 'password')
- ## dauth = HTTPDigestAuthHandler()
- ## dauth.add_password('digest_test_realm', localhost, 'jhylton',
- ## 'password')
- ## self._test_urls(urls, self._extra_handlers()+[bauth, dauth])
- def test_urlwithfrag(self):
- urlwith_frag = "http://docs.python.org/glossary.html#glossary"
- with support.transient_internet(urlwith_frag):
- req = urllib.request.Request(urlwith_frag)
- res = urllib.request.urlopen(req)
- self.assertEqual(res.geturl(),
- "http://docs.python.org/glossary.html#glossary")
- def test_custom_headers(self):
- url = "http://www.example.com"
- with support.transient_internet(url):
- opener = urllib.request.build_opener()
- request = urllib.request.Request(url)
- self.assertFalse(request.header_items())
- opener.open(request)
- self.assertTrue(request.header_items())
- self.assertTrue(request.has_header('User-agent'))
- request.add_header('User-Agent','Test-Agent')
- opener.open(request)
- self.assertEqual(request.get_header('User-agent'),'Test-Agent')
- def test_sites_no_connection_close(self):
- # Some sites do not send Connection: close header.
- # Verify that those work properly. (#issue12576)
- URL = 'http://www.imdb.com' # mangles Connection:close
- with support.transient_internet(URL):
- try:
- with urllib.request.urlopen(URL) as res:
- pass
- except ValueError as e:
- self.fail("urlopen failed for site not sending \
- Connection:close")
- else:
- self.assertTrue(res)
- req = urllib.request.urlopen(URL)
- res = req.read()
- self.assertTrue(res)
- def _test_urls(self, urls, handlers, retry=True):
- import time
- import logging
- debug = logging.getLogger("test_urllib2").debug
- urlopen = urllib.request.build_opener(*handlers).open
- if retry:
- urlopen = _wrap_with_retry_thrice(urlopen, urllib.error.URLError)
- for url in urls:
- if isinstance(url, tuple):
- url, req, expected_err = url
- else:
- req = expected_err = None
- with support.transient_internet(url):
- debug(url)
- try:
- f = urlopen(url, req, TIMEOUT)
- except EnvironmentError as err:
- debug(err)
- if expected_err:
- msg = ("Didn't get expected error(s) %s for %s %s, got %s: %s" %
- (expected_err, url, req, type(err), err))
- self.assertIsInstance(err, expected_err, msg)
- except urllib.error.URLError as err:
- if isinstance(err[0], socket.timeout):
- print("<timeout: %s>" % url, file=sys.stderr)
- continue
- else:
- raise
- else:
- try:
- with support.time_out, \
- support.socket_peer_reset, \
- support.ioerror_peer_reset:
- buf = f.read()
- debug("read %d bytes" % len(buf))
- except socket.timeout:
- print("<timeout: %s>" % url, file=sys.stderr)
- f.close()
- debug("******** next url coming up...")
- time.sleep(0.1)
- def _extra_handlers(self):
- handlers = []
- cfh = urllib.request.CacheFTPHandler()
- self.addCleanup(cfh.clear_cache)
- cfh.setTimeout(1)
- handlers.append(cfh)
- return handlers
- class TimeoutTest(unittest.TestCase):
- def test_http_basic(self):
- self.assertTrue(socket.getdefaulttimeout() is None)
- url = "http://www.python.org"
- with support.transient_internet(url, timeout=None):
- u = _urlopen_with_retry(url)
- self.addCleanup(u.close)
- self.assertTrue(u.fp.raw._sock.gettimeout() is None)
- def test_http_default_timeout(self):
- self.assertTrue(socket.getdefaulttimeout() is None)
- url = "http://www.python.org"
- with support.transient_internet(url):
- socket.setdefaulttimeout(60)
- try:
- u = _urlopen_with_retry(url)
- self.addCleanup(u.close)
- finally:
- socket.setdefaulttimeout(None)
- self.assertEqual(u.fp.raw._sock.gettimeout(), 60)
- def test_http_no_timeout(self):
- self.assertTrue(socket.getdefaulttimeout() is None)
- url = "http://www.python.org"
- with support.transient_internet(url):
- socket.setdefaulttimeout(60)
- try:
- u = _urlopen_with_retry(url, timeout=None)
- self.addCleanup(u.close)
- finally:
- socket.setdefaulttimeout(None)
- self.assertTrue(u.fp.raw._sock.gettimeout() is None)
- def test_http_timeout(self):
- url = "http://www.python.org"
- with support.transient_internet(url):
- u = _urlopen_with_retry(url, timeout=120)
- self.addCleanup(u.close)
- self.assertEqual(u.fp.raw._sock.gettimeout(), 120)
- FTP_HOST = "ftp://ftp.mirror.nl/pub/gnu/"
- def test_ftp_basic(self):
- self.assertTrue(socket.getdefaulttimeout() is None)
- with support.transient_internet(self.FTP_HOST, timeout=None):
- u = _urlopen_with_retry(self.FTP_HOST)
- self.addCleanup(u.close)
- self.assertTrue(u.fp.fp.raw._sock.gettimeout() is None)
- def test_ftp_default_timeout(self):
- self.assertTrue(socket.getdefaulttimeout() is None)
- with support.transient_internet(self.FTP_HOST):
- socket.setdefaulttimeout(60)
- try:
- u = _urlopen_with_retry(self.FTP_HOST)
- self.addCleanup(u.close)
- finally:
- socket.setdefaulttimeout(None)
- self.assertEqual(u.fp.fp.raw._sock.gettimeout(), 60)
- def test_ftp_no_timeout(self):
- self.assertTrue(socket.getdefaulttimeout() is None)
- with support.transient_internet(self.FTP_HOST):
- socket.setdefaulttimeout(60)
- try:
- u = _urlopen_with_retry(self.FTP_HOST, timeout=None)
- self.addCleanup(u.close)
- finally:
- socket.setdefaulttimeout(None)
- self.assertTrue(u.fp.fp.raw._sock.gettimeout() is None)
- def test_ftp_timeout(self):
- with support.transient_internet(self.FTP_HOST):
- u = _urlopen_with_retry(self.FTP_HOST, timeout=60)
- self.addCleanup(u.close)
- self.assertEqual(u.fp.fp.raw._sock.gettimeout(), 60)
- @unittest.skipUnless(ssl, "requires SSL support")
- class HTTPSTests(unittest.TestCase):
- def test_sni(self):
- self.skipTest("test disabled - test server needed")
- # Checks that Server Name Indication works, if supported by the
- # OpenSSL linked to.
- # The ssl module itself doesn't have server-side support for SNI,
- # so we rely on a third-party test site.
- expect_sni = ssl.HAS_SNI
- with support.transient_internet("XXX"):
- u = urllib.request.urlopen("XXX")
- contents = u.readall()
- if expect_sni:
- self.assertIn(b"Great", contents)
- self.assertNotIn(b"Unfortunately", contents)
- else:
- self.assertNotIn(b"Great", contents)
- self.assertIn(b"Unfortunately", contents)
- def test_main():
- support.requires("network")
- support.run_unittest(AuthTests,
- HTTPSTests,
- OtherNetworkTests,
- CloseSocketTest,
- TimeoutTest,
- )
- if __name__ == "__main__":
- test_main()