PageRenderTime 51ms CodeModel.GetById 19ms RepoModel.GetById 1ms app.codeStats 0ms

/Lib/test/test_urllib2net.py

https://bitbucket.org/arigo/cpython-withatomic/
Python | 364 lines | 240 code | 51 blank | 73 comment | 51 complexity | a6cb7830efa24ff0e2a3e3c8a9f54d10 MD5 | raw file
Possible License(s): 0BSD
  1. #!/usr/bin/env python3
  2. import unittest
  3. from test import support
  4. from test.test_urllib2 import sanepathname2url
  5. import os
  6. import socket
  7. import urllib.error
  8. import urllib.request
  9. import sys
  10. try:
  11. import ssl
  12. except ImportError:
  13. ssl = None
# Timeout, in seconds, handed to urlopen() by OtherNetworkTests._test_urls().
TIMEOUT = 60 # seconds
  15. def _retry_thrice(func, exc, *args, **kwargs):
  16. for i in range(3):
  17. try:
  18. return func(*args, **kwargs)
  19. except exc as e:
  20. last_exc = e
  21. continue
  22. except:
  23. raise
  24. raise last_exc
  25. def _wrap_with_retry_thrice(func, exc):
  26. def wrapped(*args, **kwargs):
  27. return _retry_thrice(func, exc, *args, **kwargs)
  28. return wrapped
# Connecting to remote hosts is flaky.  Make it more robust by retrying
# the connection several times: this is urllib.request.urlopen() wrapped so
# that a call raising urllib.error.URLError is attempted again.
_urlopen_with_retry = _wrap_with_retry_thrice(urllib.request.urlopen,
                                              urllib.error.URLError)
class AuthTests(unittest.TestCase):
    """Tests urllib2 authentication features.

    The class currently defines no test methods; its only test is kept
    below as commented-out code.
    """

## Disabled at the moment since there is no page under python.org which
## could be used to test HTTP authentication.
##
## NOTE(review): the disabled code below still uses Python 2 syntax
## ("except urllib2.HTTPError, exc") and the old "urllib2" module name, so
## it needs porting to urllib.request / urllib.error before being enabled.
#
#    def test_basic_auth(self):
#        import http.client
#
#        test_url = "http://www.python.org/test/test_urllib2/basic_auth"
#        test_hostport = "www.python.org"
#        test_realm = 'Test Realm'
#        test_user = 'test.test_urllib2net'
#        test_password = 'blah'
#
#        # failure
#        try:
#            _urlopen_with_retry(test_url)
#        except urllib2.HTTPError, exc:
#            self.assertEqual(exc.code, 401)
#        else:
#            self.fail("urlopen() should have failed with 401")
#
#        # success
#        auth_handler = urllib2.HTTPBasicAuthHandler()
#        auth_handler.add_password(test_realm, test_hostport,
#                                  test_user, test_password)
#        opener = urllib2.build_opener(auth_handler)
#        f = opener.open('http://localhost/')
#        response = _urlopen_with_retry("http://www.python.org/")
#
#        # The 'userinfo' URL component is deprecated by RFC 3986 for security
#        # reasons, let's not implement it!  (it's already implemented for proxy
#        # specification strings (that is, URLs or authorities specifying a
#        # proxy), so we must keep that)
#        self.assertRaises(http.client.InvalidURL,
#                          urllib2.urlopen, "http://evil:thing@example.com")
  69. class CloseSocketTest(unittest.TestCase):
  70. def test_close(self):
  71. # calling .close() on urllib2's response objects should close the
  72. # underlying socket
  73. url = "http://www.python.org/"
  74. with support.transient_internet(url):
  75. response = _urlopen_with_retry(url)
  76. sock = response.fp
  77. self.assertTrue(not sock.closed)
  78. response.close()
  79. self.assertTrue(sock.closed)
  80. class OtherNetworkTests(unittest.TestCase):
  81. def setUp(self):
  82. if 0: # for debugging
  83. import logging
  84. logger = logging.getLogger("test_urllib2net")
  85. logger.addHandler(logging.StreamHandler())
  86. # XXX The rest of these tests aren't very good -- they don't check much.
  87. # They do sometimes catch some major disasters, though.
  88. def test_ftp(self):
  89. urls = [
  90. 'ftp://ftp.kernel.org/pub/linux/kernel/README',
  91. 'ftp://ftp.kernel.org/pub/linux/kernel/non-existent-file',
  92. #'ftp://ftp.kernel.org/pub/leenox/kernel/test',
  93. 'ftp://gatekeeper.research.compaq.com/pub/DEC/SRC'
  94. '/research-reports/00README-Legal-Rules-Regs',
  95. ]
  96. self._test_urls(urls, self._extra_handlers())
  97. def test_file(self):
  98. TESTFN = support.TESTFN
  99. f = open(TESTFN, 'w')
  100. try:
  101. f.write('hi there\n')
  102. f.close()
  103. urls = [
  104. 'file:' + sanepathname2url(os.path.abspath(TESTFN)),
  105. ('file:///nonsensename/etc/passwd', None,
  106. urllib.error.URLError),
  107. ]
  108. self._test_urls(urls, self._extra_handlers(), retry=True)
  109. finally:
  110. os.remove(TESTFN)
  111. self.assertRaises(ValueError, urllib.request.urlopen,'./relative_path/to/file')
  112. # XXX Following test depends on machine configurations that are internal
  113. # to CNRI. Need to set up a public server with the right authentication
  114. # configuration for test purposes.
  115. ## def test_cnri(self):
  116. ## if socket.gethostname() == 'bitdiddle':
  117. ## localhost = 'bitdiddle.cnri.reston.va.us'
  118. ## elif socket.gethostname() == 'bitdiddle.concentric.net':
  119. ## localhost = 'localhost'
  120. ## else:
  121. ## localhost = None
  122. ## if localhost is not None:
  123. ## urls = [
  124. ## 'file://%s/etc/passwd' % localhost,
  125. ## 'http://%s/simple/' % localhost,
  126. ## 'http://%s/digest/' % localhost,
  127. ## 'http://%s/not/found.h' % localhost,
  128. ## ]
  129. ## bauth = HTTPBasicAuthHandler()
  130. ## bauth.add_password('basic_test_realm', localhost, 'jhylton',
  131. ## 'password')
  132. ## dauth = HTTPDigestAuthHandler()
  133. ## dauth.add_password('digest_test_realm', localhost, 'jhylton',
  134. ## 'password')
  135. ## self._test_urls(urls, self._extra_handlers()+[bauth, dauth])
  136. def test_urlwithfrag(self):
  137. urlwith_frag = "http://docs.python.org/glossary.html#glossary"
  138. with support.transient_internet(urlwith_frag):
  139. req = urllib.request.Request(urlwith_frag)
  140. res = urllib.request.urlopen(req)
  141. self.assertEqual(res.geturl(),
  142. "http://docs.python.org/glossary.html#glossary")
  143. def test_custom_headers(self):
  144. url = "http://www.example.com"
  145. with support.transient_internet(url):
  146. opener = urllib.request.build_opener()
  147. request = urllib.request.Request(url)
  148. self.assertFalse(request.header_items())
  149. opener.open(request)
  150. self.assertTrue(request.header_items())
  151. self.assertTrue(request.has_header('User-agent'))
  152. request.add_header('User-Agent','Test-Agent')
  153. opener.open(request)
  154. self.assertEqual(request.get_header('User-agent'),'Test-Agent')
  155. def test_sites_no_connection_close(self):
  156. # Some sites do not send Connection: close header.
  157. # Verify that those work properly. (#issue12576)
  158. URL = 'http://www.imdb.com' # mangles Connection:close
  159. with support.transient_internet(URL):
  160. try:
  161. with urllib.request.urlopen(URL) as res:
  162. pass
  163. except ValueError as e:
  164. self.fail("urlopen failed for site not sending \
  165. Connection:close")
  166. else:
  167. self.assertTrue(res)
  168. req = urllib.request.urlopen(URL)
  169. res = req.read()
  170. self.assertTrue(res)
  171. def _test_urls(self, urls, handlers, retry=True):
  172. import time
  173. import logging
  174. debug = logging.getLogger("test_urllib2").debug
  175. urlopen = urllib.request.build_opener(*handlers).open
  176. if retry:
  177. urlopen = _wrap_with_retry_thrice(urlopen, urllib.error.URLError)
  178. for url in urls:
  179. if isinstance(url, tuple):
  180. url, req, expected_err = url
  181. else:
  182. req = expected_err = None
  183. with support.transient_internet(url):
  184. debug(url)
  185. try:
  186. f = urlopen(url, req, TIMEOUT)
  187. except EnvironmentError as err:
  188. debug(err)
  189. if expected_err:
  190. msg = ("Didn't get expected error(s) %s for %s %s, got %s: %s" %
  191. (expected_err, url, req, type(err), err))
  192. self.assertIsInstance(err, expected_err, msg)
  193. except urllib.error.URLError as err:
  194. if isinstance(err[0], socket.timeout):
  195. print("<timeout: %s>" % url, file=sys.stderr)
  196. continue
  197. else:
  198. raise
  199. else:
  200. try:
  201. with support.time_out, \
  202. support.socket_peer_reset, \
  203. support.ioerror_peer_reset:
  204. buf = f.read()
  205. debug("read %d bytes" % len(buf))
  206. except socket.timeout:
  207. print("<timeout: %s>" % url, file=sys.stderr)
  208. f.close()
  209. debug("******** next url coming up...")
  210. time.sleep(0.1)
  211. def _extra_handlers(self):
  212. handlers = []
  213. cfh = urllib.request.CacheFTPHandler()
  214. self.addCleanup(cfh.clear_cache)
  215. cfh.setTimeout(1)
  216. handlers.append(cfh)
  217. return handlers
  218. class TimeoutTest(unittest.TestCase):
  219. def test_http_basic(self):
  220. self.assertTrue(socket.getdefaulttimeout() is None)
  221. url = "http://www.python.org"
  222. with support.transient_internet(url, timeout=None):
  223. u = _urlopen_with_retry(url)
  224. self.addCleanup(u.close)
  225. self.assertTrue(u.fp.raw._sock.gettimeout() is None)
  226. def test_http_default_timeout(self):
  227. self.assertTrue(socket.getdefaulttimeout() is None)
  228. url = "http://www.python.org"
  229. with support.transient_internet(url):
  230. socket.setdefaulttimeout(60)
  231. try:
  232. u = _urlopen_with_retry(url)
  233. self.addCleanup(u.close)
  234. finally:
  235. socket.setdefaulttimeout(None)
  236. self.assertEqual(u.fp.raw._sock.gettimeout(), 60)
  237. def test_http_no_timeout(self):
  238. self.assertTrue(socket.getdefaulttimeout() is None)
  239. url = "http://www.python.org"
  240. with support.transient_internet(url):
  241. socket.setdefaulttimeout(60)
  242. try:
  243. u = _urlopen_with_retry(url, timeout=None)
  244. self.addCleanup(u.close)
  245. finally:
  246. socket.setdefaulttimeout(None)
  247. self.assertTrue(u.fp.raw._sock.gettimeout() is None)
  248. def test_http_timeout(self):
  249. url = "http://www.python.org"
  250. with support.transient_internet(url):
  251. u = _urlopen_with_retry(url, timeout=120)
  252. self.addCleanup(u.close)
  253. self.assertEqual(u.fp.raw._sock.gettimeout(), 120)
  254. FTP_HOST = "ftp://ftp.mirror.nl/pub/gnu/"
  255. def test_ftp_basic(self):
  256. self.assertTrue(socket.getdefaulttimeout() is None)
  257. with support.transient_internet(self.FTP_HOST, timeout=None):
  258. u = _urlopen_with_retry(self.FTP_HOST)
  259. self.addCleanup(u.close)
  260. self.assertTrue(u.fp.fp.raw._sock.gettimeout() is None)
  261. def test_ftp_default_timeout(self):
  262. self.assertTrue(socket.getdefaulttimeout() is None)
  263. with support.transient_internet(self.FTP_HOST):
  264. socket.setdefaulttimeout(60)
  265. try:
  266. u = _urlopen_with_retry(self.FTP_HOST)
  267. self.addCleanup(u.close)
  268. finally:
  269. socket.setdefaulttimeout(None)
  270. self.assertEqual(u.fp.fp.raw._sock.gettimeout(), 60)
  271. def test_ftp_no_timeout(self):
  272. self.assertTrue(socket.getdefaulttimeout() is None)
  273. with support.transient_internet(self.FTP_HOST):
  274. socket.setdefaulttimeout(60)
  275. try:
  276. u = _urlopen_with_retry(self.FTP_HOST, timeout=None)
  277. self.addCleanup(u.close)
  278. finally:
  279. socket.setdefaulttimeout(None)
  280. self.assertTrue(u.fp.fp.raw._sock.gettimeout() is None)
  281. def test_ftp_timeout(self):
  282. with support.transient_internet(self.FTP_HOST):
  283. u = _urlopen_with_retry(self.FTP_HOST, timeout=60)
  284. self.addCleanup(u.close)
  285. self.assertEqual(u.fp.fp.raw._sock.gettimeout(), 60)
  286. @unittest.skipUnless(ssl, "requires SSL support")
  287. class HTTPSTests(unittest.TestCase):
  288. def test_sni(self):
  289. self.skipTest("test disabled - test server needed")
  290. # Checks that Server Name Indication works, if supported by the
  291. # OpenSSL linked to.
  292. # The ssl module itself doesn't have server-side support for SNI,
  293. # so we rely on a third-party test site.
  294. expect_sni = ssl.HAS_SNI
  295. with support.transient_internet("XXX"):
  296. u = urllib.request.urlopen("XXX")
  297. contents = u.readall()
  298. if expect_sni:
  299. self.assertIn(b"Great", contents)
  300. self.assertNotIn(b"Unfortunately", contents)
  301. else:
  302. self.assertNotIn(b"Great", contents)
  303. self.assertIn(b"Unfortunately", contents)
  304. def test_main():
  305. support.requires("network")
  306. support.run_unittest(AuthTests,
  307. HTTPSTests,
  308. OtherNetworkTests,
  309. CloseSocketTest,
  310. TimeoutTest,
  311. )
# Run the whole suite when this file is executed as a script.
if __name__ == "__main__":
    test_main()