| #!/usr/bin/env python3 |
| |
| import unittest |
| from test import support |
| |
| import socket |
| import urllib.request |
| import sys |
| import os |
| import email.message |
| import time |
| |
| |
| def _open_with_retry(func, host, *args, **kwargs): |
| # Connecting to remote hosts is flaky. Make it more robust |
| # by retrying the connection several times. |
| last_exc = None |
| for i in range(3): |
| try: |
| return func(host, *args, **kwargs) |
| except IOError as err: |
| last_exc = err |
| continue |
| except: |
| raise |
| raise last_exc |
| |
| |
| class URLTimeoutTest(unittest.TestCase): |
| |
| TIMEOUT = 10.0 |
| |
| def setUp(self): |
| socket.setdefaulttimeout(self.TIMEOUT) |
| |
| def tearDown(self): |
| socket.setdefaulttimeout(None) |
| |
| def testURLread(self): |
| f = _open_with_retry(urllib.request.urlopen, "http://www.python.org/") |
| x = f.read() |
| |
| class urlopenNetworkTests(unittest.TestCase): |
| """Tests urllib.reqest.urlopen using the network. |
| |
| These tests are not exhaustive. Assuming that testing using files does a |
| good job overall of some of the basic interface features. There are no |
| tests exercising the optional 'data' and 'proxies' arguments. No tests |
| for transparent redirection have been written. |
| |
| setUp is not used for always constructing a connection to |
| http://www.python.org/ since there a few tests that don't use that address |
| and making a connection is expensive enough to warrant minimizing unneeded |
| connections. |
| |
| """ |
| |
| def urlopen(self, *args): |
| return _open_with_retry(urllib.request.urlopen, *args) |
| |
| def test_basic(self): |
| # Simple test expected to pass. |
| open_url = self.urlopen("http://www.python.org/") |
| for attr in ("read", "readline", "readlines", "fileno", "close", |
| "info", "geturl"): |
| self.assertTrue(hasattr(open_url, attr), "object returned from " |
| "urlopen lacks the %s attribute" % attr) |
| try: |
| self.assertTrue(open_url.read(), "calling 'read' failed") |
| finally: |
| open_url.close() |
| |
| def test_readlines(self): |
| # Test both readline and readlines. |
| open_url = self.urlopen("http://www.python.org/") |
| try: |
| self.assertIsInstance(open_url.readline(), bytes, |
| "readline did not return a string") |
| self.assertIsInstance(open_url.readlines(), list, |
| "readlines did not return a list") |
| finally: |
| open_url.close() |
| |
| def test_info(self): |
| # Test 'info'. |
| open_url = self.urlopen("http://www.python.org/") |
| try: |
| info_obj = open_url.info() |
| finally: |
| open_url.close() |
| self.assertIsInstance(info_obj, email.message.Message, |
| "object returned by 'info' is not an " |
| "instance of email.message.Message") |
| self.assertEqual(info_obj.get_content_subtype(), "html") |
| |
| def test_geturl(self): |
| # Make sure same URL as opened is returned by geturl. |
| URL = "http://www.python.org/" |
| open_url = self.urlopen(URL) |
| try: |
| gotten_url = open_url.geturl() |
| finally: |
| open_url.close() |
| self.assertEqual(gotten_url, URL) |
| |
| def test_getcode(self): |
| # test getcode() with the fancy opener to get 404 error codes |
| URL = "http://www.python.org/XXXinvalidXXX" |
| open_url = urllib.request.FancyURLopener().open(URL) |
| try: |
| code = open_url.getcode() |
| finally: |
| open_url.close() |
| self.assertEqual(code, 404) |
| |
| def test_fileno(self): |
| if sys.platform in ('win32',): |
| # On Windows, socket handles are not file descriptors; this |
| # test can't pass on Windows. |
| return |
| # Make sure fd returned by fileno is valid. |
| open_url = self.urlopen("http://www.python.org/") |
| fd = open_url.fileno() |
| FILE = os.fdopen(fd, encoding='utf-8') |
| try: |
| self.assertTrue(FILE.read(), "reading from file created using fd " |
| "returned by fileno failed") |
| finally: |
| FILE.close() |
| |
| def test_bad_address(self): |
| # Make sure proper exception is raised when connecting to a bogus |
| # address. |
| self.assertRaises(IOError, |
| # SF patch 809915: In Sep 2003, VeriSign started |
| # highjacking invalid .com and .net addresses to |
| # boost traffic to their own site. This test |
| # started failing then. One hopes the .invalid |
| # domain will be spared to serve its defined |
| # purpose. |
| # urllib.urlopen, "http://www.sadflkjsasadf.com/") |
| urllib.request.urlopen, |
| "http://sadflkjsasf.i.nvali.d/") |
| |
| class urlretrieveNetworkTests(unittest.TestCase): |
| """Tests urllib.request.urlretrieve using the network.""" |
| |
| def urlretrieve(self, *args): |
| return _open_with_retry(urllib.request.urlretrieve, *args) |
| |
| def test_basic(self): |
| # Test basic functionality. |
| file_location,info = self.urlretrieve("http://www.python.org/") |
| self.assertTrue(os.path.exists(file_location), "file location returned by" |
| " urlretrieve is not a valid path") |
| FILE = open(file_location, encoding='utf-8') |
| try: |
| self.assertTrue(FILE.read(), "reading from the file location returned" |
| " by urlretrieve failed") |
| finally: |
| FILE.close() |
| os.unlink(file_location) |
| |
| def test_specified_path(self): |
| # Make sure that specifying the location of the file to write to works. |
| file_location,info = self.urlretrieve("http://www.python.org/", |
| support.TESTFN) |
| self.assertEqual(file_location, support.TESTFN) |
| self.assertTrue(os.path.exists(file_location)) |
| FILE = open(file_location, encoding='utf-8') |
| try: |
| self.assertTrue(FILE.read(), "reading from temporary file failed") |
| finally: |
| FILE.close() |
| os.unlink(file_location) |
| |
| def test_header(self): |
| # Make sure header returned as 2nd value from urlretrieve is good. |
| file_location, header = self.urlretrieve("http://www.python.org/") |
| os.unlink(file_location) |
| self.assertIsInstance(header, email.message.Message, |
| "header is not an instance of email.message.Message") |
| |
| def test_data_header(self): |
| logo = "http://www.python.org/community/logos/python-logo-master-v3-TM.png" |
| file_location, fileheaders = self.urlretrieve(logo) |
| os.unlink(file_location) |
| datevalue = fileheaders.get('Date') |
| dateformat = '%a, %d %b %Y %H:%M:%S GMT' |
| try: |
| time.strptime(datevalue, dateformat) |
| except ValueError: |
| self.fail('Date value not in %r format', dateformat) |
| |
| |
| def test_main(): |
| support.requires('network') |
| support.run_unittest(URLTimeoutTest, |
| urlopenNetworkTests, |
| urlretrieveNetworkTests) |
| |
| if __name__ == "__main__": |
| test_main() |