blob: 1d88331146aaf90f27be56937ce4ff37d743ebe9 [file] [log] [blame]
Skip Montanaro89feabc2003-03-30 04:54:24 +00001#!/usr/bin/env python
2
3import unittest
4from test import test_support
5
6import socket
Brett Cannona71319e2003-05-14 02:18:31 +00007import urllib
Skip Montanaro89feabc2003-03-30 04:54:24 +00008import sys
Brett Cannona71319e2003-05-14 02:18:31 +00009import os
Senthil Kumaran1b7f9e52010-05-01 08:01:56 +000010import time
11
Ezio Melottia2d46532010-01-30 07:22:54 +000012mimetools = test_support.import_module("mimetools", deprecated=True)
Skip Montanaro89feabc2003-03-30 04:54:24 +000013
Neal Norwitz5be30672008-01-26 05:54:48 +000014
15def _open_with_retry(func, host, *args, **kwargs):
16 # Connecting to remote hosts is flaky. Make it more robust
17 # by retrying the connection several times.
18 for i in range(3):
19 try:
20 return func(host, *args, **kwargs)
21 except IOError, last_exc:
22 continue
23 except:
24 raise
25 raise last_exc
26
27
Skip Montanaro89feabc2003-03-30 04:54:24 +000028class URLTimeoutTest(unittest.TestCase):
29
30 TIMEOUT = 10.0
31
32 def setUp(self):
33 socket.setdefaulttimeout(self.TIMEOUT)
34
35 def tearDown(self):
36 socket.setdefaulttimeout(None)
37
38 def testURLread(self):
Neal Norwitz5be30672008-01-26 05:54:48 +000039 f = _open_with_retry(urllib.urlopen, "http://www.python.org/")
Skip Montanaro89feabc2003-03-30 04:54:24 +000040 x = f.read()
41
Brett Cannona71319e2003-05-14 02:18:31 +000042class urlopenNetworkTests(unittest.TestCase):
43 """Tests urllib.urlopen using the network.
Tim Peters813cec92003-05-16 15:35:10 +000044
Brett Cannona71319e2003-05-14 02:18:31 +000045 These tests are not exhaustive. Assuming that testing using files does a
46 good job overall of some of the basic interface features. There are no
47 tests exercising the optional 'data' and 'proxies' arguments. No tests
48 for transparent redirection have been written.
Tim Peters813cec92003-05-16 15:35:10 +000049
Brett Cannona71319e2003-05-14 02:18:31 +000050 setUp is not used for always constructing a connection to
51 http://www.python.org/ since there a few tests that don't use that address
52 and making a connection is expensive enough to warrant minimizing unneeded
53 connections.
Tim Peters813cec92003-05-16 15:35:10 +000054
Brett Cannona71319e2003-05-14 02:18:31 +000055 """
56
Neal Norwitz5be30672008-01-26 05:54:48 +000057 def urlopen(self, *args):
58 return _open_with_retry(urllib.urlopen, *args)
59
Brett Cannona71319e2003-05-14 02:18:31 +000060 def test_basic(self):
61 # Simple test expected to pass.
Neal Norwitz5be30672008-01-26 05:54:48 +000062 open_url = self.urlopen("http://www.python.org/")
Brett Cannona71319e2003-05-14 02:18:31 +000063 for attr in ("read", "readline", "readlines", "fileno", "close",
64 "info", "geturl"):
Benjamin Peterson5c8da862009-06-30 22:57:08 +000065 self.assertTrue(hasattr(open_url, attr), "object returned from "
Brett Cannona71319e2003-05-14 02:18:31 +000066 "urlopen lacks the %s attribute" % attr)
67 try:
Benjamin Peterson5c8da862009-06-30 22:57:08 +000068 self.assertTrue(open_url.read(), "calling 'read' failed")
Brett Cannona71319e2003-05-14 02:18:31 +000069 finally:
70 open_url.close()
71
72 def test_readlines(self):
73 # Test both readline and readlines.
Neal Norwitz5be30672008-01-26 05:54:48 +000074 open_url = self.urlopen("http://www.python.org/")
Brett Cannona71319e2003-05-14 02:18:31 +000075 try:
Ezio Melottib0f5adc2010-01-24 16:58:36 +000076 self.assertIsInstance(open_url.readline(), basestring,
77 "readline did not return a string")
78 self.assertIsInstance(open_url.readlines(), list,
79 "readlines did not return a list")
Brett Cannona71319e2003-05-14 02:18:31 +000080 finally:
81 open_url.close()
82
83 def test_info(self):
84 # Test 'info'.
Neal Norwitz5be30672008-01-26 05:54:48 +000085 open_url = self.urlopen("http://www.python.org/")
Brett Cannona71319e2003-05-14 02:18:31 +000086 try:
87 info_obj = open_url.info()
88 finally:
89 open_url.close()
Ezio Melottib0f5adc2010-01-24 16:58:36 +000090 self.assertIsInstance(info_obj, mimetools.Message,
91 "object returned by 'info' is not an "
92 "instance of mimetools.Message")
Brett Cannona71319e2003-05-14 02:18:31 +000093 self.assertEqual(info_obj.getsubtype(), "html")
94
95 def test_geturl(self):
96 # Make sure same URL as opened is returned by geturl.
97 URL = "http://www.python.org/"
Neal Norwitz5be30672008-01-26 05:54:48 +000098 open_url = self.urlopen(URL)
Brett Cannona71319e2003-05-14 02:18:31 +000099 try:
100 gotten_url = open_url.geturl()
101 finally:
102 open_url.close()
103 self.assertEqual(gotten_url, URL)
104
Georg Brandl9b0d46d2008-01-20 11:43:03 +0000105 def test_getcode(self):
106 # test getcode() with the fancy opener to get 404 error codes
107 URL = "http://www.python.org/XXXinvalidXXX"
108 open_url = urllib.FancyURLopener().open(URL)
109 try:
110 code = open_url.getcode()
111 finally:
112 open_url.close()
113 self.assertEqual(code, 404)
114
Brett Cannona71319e2003-05-14 02:18:31 +0000115 def test_fileno(self):
Tim Petersf545baa2003-06-15 23:26:30 +0000116 if (sys.platform in ('win32',) or
Tim Peters813cec92003-05-16 15:35:10 +0000117 not hasattr(os, 'fdopen')):
118 # On Windows, socket handles are not file descriptors; this
119 # test can't pass on Windows.
120 return
Brett Cannona71319e2003-05-14 02:18:31 +0000121 # Make sure fd returned by fileno is valid.
Neal Norwitz5be30672008-01-26 05:54:48 +0000122 open_url = self.urlopen("http://www.python.org/")
Tim Peters813cec92003-05-16 15:35:10 +0000123 fd = open_url.fileno()
124 FILE = os.fdopen(fd)
125 try:
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000126 self.assertTrue(FILE.read(), "reading from file created using fd "
Tim Peters813cec92003-05-16 15:35:10 +0000127 "returned by fileno failed")
128 finally:
129 FILE.close()
Brett Cannona71319e2003-05-14 02:18:31 +0000130
131 def test_bad_address(self):
132 # Make sure proper exception is raised when connecting to a bogus
133 # address.
Antoine Pitroua4d58d22011-07-08 19:14:19 +0200134 bogus_domain = "sadflkjsasf.i.nvali.d"
135 try:
136 socket.gethostbyname(bogus_domain)
137 except socket.gaierror:
138 pass
139 else:
140 # This happens with some overzealous DNS providers such as OpenDNS
141 self.skipTest("%r should not resolve for test to work" % bogus_domain)
Brett Cannona71319e2003-05-14 02:18:31 +0000142 self.assertRaises(IOError,
Tim Peters0aab0022003-09-20 22:16:26 +0000143 # SF patch 809915: In Sep 2003, VeriSign started
144 # highjacking invalid .com and .net addresses to
145 # boost traffic to their own site. This test
146 # started failing then. One hopes the .invalid
147 # domain will be spared to serve its defined
148 # purpose.
149 # urllib.urlopen, "http://www.sadflkjsasadf.com/")
Antoine Pitroucc5b64a2008-12-15 00:39:51 +0000150 urllib.urlopen, "http://sadflkjsasf.i.nvali.d/")
Brett Cannona71319e2003-05-14 02:18:31 +0000151
152class urlretrieveNetworkTests(unittest.TestCase):
153 """Tests urllib.urlretrieve using the network."""
154
Neal Norwitz5be30672008-01-26 05:54:48 +0000155 def urlretrieve(self, *args):
156 return _open_with_retry(urllib.urlretrieve, *args)
157
Brett Cannona71319e2003-05-14 02:18:31 +0000158 def test_basic(self):
159 # Test basic functionality.
Neal Norwitz5be30672008-01-26 05:54:48 +0000160 file_location,info = self.urlretrieve("http://www.python.org/")
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000161 self.assertTrue(os.path.exists(file_location), "file location returned by"
Brett Cannona71319e2003-05-14 02:18:31 +0000162 " urlretrieve is not a valid path")
163 FILE = file(file_location)
164 try:
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000165 self.assertTrue(FILE.read(), "reading from the file location returned"
Jeremy Hyltonbd9f5202003-07-17 16:31:00 +0000166 " by urlretrieve failed")
Brett Cannona71319e2003-05-14 02:18:31 +0000167 finally:
168 FILE.close()
169 os.unlink(file_location)
170
171 def test_specified_path(self):
172 # Make sure that specifying the location of the file to write to works.
Neal Norwitz5be30672008-01-26 05:54:48 +0000173 file_location,info = self.urlretrieve("http://www.python.org/",
174 test_support.TESTFN)
Brett Cannona71319e2003-05-14 02:18:31 +0000175 self.assertEqual(file_location, test_support.TESTFN)
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000176 self.assertTrue(os.path.exists(file_location))
Brett Cannona71319e2003-05-14 02:18:31 +0000177 FILE = file(file_location)
178 try:
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000179 self.assertTrue(FILE.read(), "reading from temporary file failed")
Brett Cannona71319e2003-05-14 02:18:31 +0000180 finally:
181 FILE.close()
182 os.unlink(file_location)
183
184 def test_header(self):
185 # Make sure header returned as 2nd value from urlretrieve is good.
Neal Norwitz5be30672008-01-26 05:54:48 +0000186 file_location, header = self.urlretrieve("http://www.python.org/")
Brett Cannona71319e2003-05-14 02:18:31 +0000187 os.unlink(file_location)
Ezio Melottib0f5adc2010-01-24 16:58:36 +0000188 self.assertIsInstance(header, mimetools.Message,
189 "header is not an instance of mimetools.Message")
Tim Peters813cec92003-05-16 15:35:10 +0000190
Senthil Kumaran1b7f9e52010-05-01 08:01:56 +0000191 def test_data_header(self):
192 logo = "http://www.python.org/community/logos/python-logo-master-v3-TM.png"
193 file_location, fileheaders = self.urlretrieve(logo)
194 os.unlink(file_location)
195 datevalue = fileheaders.getheader('Date')
196 dateformat = '%a, %d %b %Y %H:%M:%S GMT'
197 try:
198 time.strptime(datevalue, dateformat)
199 except ValueError:
200 self.fail('Date value not in %r format', dateformat)
201
Brett Cannona71319e2003-05-14 02:18:31 +0000202
203
Skip Montanaro89feabc2003-03-30 04:54:24 +0000204def test_main():
205 test_support.requires('network')
Florent Xicluna6257a7b2010-03-31 22:01:03 +0000206 with test_support.check_py3k_warnings(
207 ("urllib.urlopen.. has been removed", DeprecationWarning)):
Brett Cannon8bb8fa52008-07-02 01:57:08 +0000208 test_support.run_unittest(URLTimeoutTest,
209 urlopenNetworkTests,
210 urlretrieveNetworkTests)
Skip Montanaro89feabc2003-03-30 04:54:24 +0000211
212if __name__ == "__main__":
213 test_main()