blob: 52b9292e18de8c8ec0c9ee4e909b24a7ee671439 [file] [log] [blame]
Brett Cannon74bfd702003-04-25 09:39:47 +00001"""Regression tests for urllib"""
2
Jeremy Hylton1afc1692008-06-18 20:49:58 +00003import urllib.parse
4import urllib.request
guido@google.coma119df92011-03-29 11:41:02 -07005import urllib.error
Georg Brandl24420152008-05-26 16:32:26 +00006import http.client
Barry Warsaw820c1202008-06-12 04:06:45 +00007import email.message
Jeremy Hylton66dc8c52007-08-04 03:42:26 +00008import io
Brett Cannon74bfd702003-04-25 09:39:47 +00009import unittest
Benjamin Petersonee8712c2008-05-20 21:35:26 +000010from test import support
Brett Cannon74bfd702003-04-25 09:39:47 +000011import os
Senthil Kumaran2d2ea1b2011-04-14 13:16:30 +080012import sys
Georg Brandl5a650a22005-08-26 08:51:34 +000013import tempfile
Jeremy Hylton6102e292000-08-31 15:48:10 +000014
Senthil Kumaranc5c5a142012-01-14 19:09:04 +080015from base64 import b64encode
Georg Brandl2daf6ae2012-02-20 19:54:16 +010016import collections
Senthil Kumaranc5c5a142012-01-14 19:09:04 +080017
def hexescape(char):
    """Return *char* percent-escaped the way RFC 2396 specifies.

    The result is '%' followed by the character's code point written in
    upper-case hexadecimal, zero-padded to at least two digits.
    """
    return "%%%02X" % ord(char)
Jeremy Hylton6102e292000-08-31 15:48:10 +000024
# Shortcut for testing FancyURLopener
_urlopener = None


def urlopen(url, data=None, proxies=None):
    """Open *url* with a FancyURLopener and return the file-like result.

    When *proxies* is given, a fresh opener configured with those proxies
    is used for this call only.  Otherwise a single module-level opener is
    created on first use and shared by every later call.  *data*, when not
    None, is forwarded to the opener's open() method.
    """
    global _urlopener
    if proxies is not None:
        opener = urllib.request.FancyURLopener(proxies=proxies)
    else:
        if not _urlopener:
            # Lazily build the shared opener the first time it is needed.
            _urlopener = urllib.request.FancyURLopener()
        opener = _urlopener
    open_args = (url,) if data is None else (url, data)
    return opener.open(*open_args)
41
Senthil Kumarance260142011-11-01 01:35:17 +080042
class FakeHTTPMixin(object):
    """Mixin that swaps http.client.HTTPConnection for a canned-data fake."""

    def fakehttp(self, fakedata):
        """Patch http.client.HTTPConnection so it "receives" *fakedata*.

        The real class is remembered on the instance so that unfakehttp()
        can put it back.
        """

        class FakeSocket(io.BytesIO):
            # Counts the socket itself plus every makefile() handle; the
            # underlying buffer is closed only when the count reaches zero.
            io_refs = 1

            def sendall(self, data):
                # Keep the last chunk sent so tests can inspect the request.
                FakeHTTPConnection.buf = data

            def makefile(self, *args, **kwds):
                self.io_refs += 1
                return self

            def read(self, amt=None):
                return b"" if self.closed else super().read(amt)

            def readline(self, length=None):
                return b"" if self.closed else super().readline(length)

            def close(self):
                self.io_refs -= 1
                if not self.io_refs:
                    super().close()

        class FakeHTTPConnection(http.client.HTTPConnection):

            # buffer to store data for verification in urlopen tests.
            buf = None

            def connect(self):
                self.sock = FakeSocket(fakedata)

        self._connection_class = http.client.HTTPConnection
        http.client.HTTPConnection = FakeHTTPConnection

    def unfakehttp(self):
        """Restore the HTTPConnection class saved by fakehttp()."""
        http.client.HTTPConnection = self._connection_class
83
84
class urlopen_FileTests(unittest.TestCase):
    """Exercise urlopen() against a temporary local file.

    Covering as much functionality as possible with a local file keeps the
    suite from having to reach the network.

    """

    def setUp(self):
        # Write a small known payload to the scratch file, then open that
        # file through urlopen() so each test starts with a fresh object.
        payload = "test_urllib: %s\n" % self.__class__.__name__
        self.text = payload.encode("ascii")
        with open(support.TESTFN, 'wb') as scratch:
            scratch.write(self.text)
        self.pathname = support.TESTFN
        self.returned_obj = urlopen("file:%s" % self.pathname)

    def tearDown(self):
        """Close the opened object and delete the scratch file."""
        self.returned_obj.close()
        os.remove(support.TESTFN)

    def test_interface(self):
        # The object returned by urlopen() must expose the file-like API
        # plus the urllib-specific accessors.
        required = ("read", "readline", "readlines", "fileno",
                    "close", "info", "geturl", "getcode", "__iter__")
        for attr in required:
            self.assertTrue(hasattr(self.returned_obj, attr),
                            "object returned by urlopen() lacks %s attribute" %
                            attr)

    def test_read(self):
        self.assertEqual(self.text, self.returned_obj.read())

    def test_readline(self):
        first = self.returned_obj.readline()
        self.assertEqual(self.text, first)
        second = self.returned_obj.readline()
        self.assertEqual(b'', second,
                         "calling readline() after exhausting the file did not"
                         " return an empty string")

    def test_readlines(self):
        lines_list = self.returned_obj.readlines()
        self.assertEqual(len(lines_list), 1,
                         "readlines() returned the wrong number of lines")
        self.assertEqual(lines_list[0], self.text,
                         "readlines() returned improper text")

    def test_fileno(self):
        file_num = self.returned_obj.fileno()
        self.assertIsInstance(file_num, int, "fileno() did not return an int")
        raw = os.read(file_num, len(self.text))
        self.assertEqual(raw, self.text,
                         "Reading on the file descriptor returned by fileno() "
                         "did not return the expected text")

    def test_close(self):
        # close() is called here and then again by tearDown(), so a second
        # close on the same object must be harmless.
        self.returned_obj.close()

    def test_info(self):
        self.assertIsInstance(self.returned_obj.info(), email.message.Message)

    def test_geturl(self):
        self.assertEqual(self.returned_obj.geturl(), self.pathname)

    def test_getcode(self):
        self.assertIsNone(self.returned_obj.getcode())

    def test_iter(self):
        # No need to count iterations: the comparison fails as soon as
        # anything other than the single expected line is produced.
        # The object is iterated implicitly to cover ticket #4608.
        for line in self.returned_obj:
            self.assertEqual(line, self.text)

    def test_relativelocalfile(self):
        with self.assertRaises(ValueError):
            urllib.request.urlopen('./' + self.pathname)
166
class ProxyTests(unittest.TestCase):
    """Tests for proxy discovery through environment variables."""

    def setUp(self):
        # The guard records every change so tearDown() can undo it.
        self.env = support.EnvironmentVarGuard()
        # Start from a clean slate: drop every proxy-related variable.
        proxy_vars = [name for name in os.environ if 'proxy' in name.lower()]
        for name in proxy_vars:
            self.env.unset(name)

    def tearDown(self):
        # Put the original environment back.
        self.env.__exit__()
        del self.env

    def test_getproxies_environment_keep_no_proxies(self):
        self.env.set('NO_PROXY', 'localhost')
        found = urllib.request.getproxies_environment()
        # Keys are lower-cased and have the '_proxy' suffix stripped.
        self.assertEqual('localhost', found['no'])
        # A NO_PROXY list whose entries are separated by ", ".
        self.env.set('NO_PROXY', 'localhost, anotherdomain.com, newdomain.com')
        bypassed = urllib.request.proxy_bypass_environment('anotherdomain.com')
        self.assertTrue(bypassed)
Benjamin Peterson9bc93512008-09-22 22:10:59 +0000190
class urlopen_HttpTests(unittest.TestCase, FakeHTTPMixin):
    """Exercise urlopen() over a faked HTTP connection."""

    def check_read(self, ver):
        # Serve a minimal 200 response advertising HTTP version *ver* and
        # check the body, the reported URL and the status code.
        self.fakehttp(b"HTTP/" + ver + b" 200 OK\r\n\r\nHello!")
        try:
            response = urlopen("http://python.org/")
            self.assertEqual(response.readline(), b"Hello!")
            self.assertEqual(response.readline(), b"")
            self.assertEqual(response.geturl(), 'http://python.org/')
            self.assertEqual(response.getcode(), 200)
        finally:
            self.unfakehttp()

    def test_url_fragment(self):
        # Issue #11703: geturl() omits fragments in the original URL.
        url = 'http://docs.python.org/library/urllib.html#OK'
        self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello!")
        try:
            response = urllib.request.urlopen(url)
            self.assertEqual(response.geturl(), url)
        finally:
            self.unfakehttp()

    def test_willclose(self):
        self.fakehttp(b"HTTP/1.1 200 OK\r\n\r\nHello!")
        try:
            response = urlopen("http://www.python.org")
            self.assertTrue(response.fp.will_close)
        finally:
            self.unfakehttp()

    def test_read_0_9(self):
        # A status line claiming "0.9" is accepted (unlike "simple
        # responses" that have no status line at all).
        self.check_read(b"0.9")

    def test_read_1_0(self):
        self.check_read(b"1.0")

    def test_read_1_1(self):
        self.check_read(b"1.1")

    def test_read_bogus(self):
        # urlopen() should raise IOError for many error codes.
        self.fakehttp(
            b"HTTP/1.1 401 Authentication Required\n"
            b"Date: Wed, 02 Jan 2008 03:03:54 GMT\n"
            b"Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e\n"
            b"Connection: close\n"
            b"Content-Type: text/html; charset=iso-8859-1\n")
        try:
            with self.assertRaises(IOError):
                urlopen("http://python.org/")
        finally:
            self.unfakehttp()

    def test_invalid_redirect(self):
        # A redirect whose Location uses the file: scheme must be refused
        # with an HTTPError.
        self.fakehttp(
            b"HTTP/1.1 302 Found\n"
            b"Date: Wed, 02 Jan 2008 03:03:54 GMT\n"
            b"Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e\n"
            b"Location: file://guidocomputer.athome.com:/python/license\n"
            b"Connection: close\n"
            b"Content-Type: text/html; charset=iso-8859-1\n")
        try:
            with self.assertRaises(urllib.error.HTTPError):
                urlopen("http://python.org/")
        finally:
            self.unfakehttp()

    def test_empty_socket(self):
        # urlopen() raises IOError if the underlying socket does not send
        # any data. (#1680230)
        self.fakehttp(b'')
        try:
            with self.assertRaises(IOError):
                urlopen("http://something")
        finally:
            self.unfakehttp()

    def test_missing_localfile(self):
        # Test for #10836
        with self.assertRaises(urllib.error.URLError) as caught:
            urlopen('file://localhost/a/file/which/doesnot/exists.py')
        error = caught.exception
        self.assertTrue(error.filename)
        self.assertTrue(error.reason)

    def test_file_notexists(self):
        fd, tmp_file = tempfile.mkstemp()
        tmp_fileurl = 'file://localhost/' + tmp_file.replace(os.path.sep, '/')
        try:
            # While the file exists, opening its URL must succeed.
            self.assertTrue(os.path.exists(tmp_file))
            with urlopen(tmp_fileurl) as fobj:
                self.assertTrue(fobj)
        finally:
            os.close(fd)
            os.unlink(tmp_file)
        # Once it is gone, the same URL must fail with URLError.
        self.assertFalse(os.path.exists(tmp_file))
        with self.assertRaises(urllib.error.URLError):
            urlopen(tmp_fileurl)

    def test_ftp_nohost(self):
        test_ftp_url = 'ftp:///path'
        with self.assertRaises(urllib.error.URLError) as caught:
            urlopen(test_ftp_url)
        error = caught.exception
        self.assertFalse(error.filename)
        self.assertTrue(error.reason)

    def test_ftp_nonexisting(self):
        with self.assertRaises(urllib.error.URLError) as caught:
            urlopen('ftp://localhost/a/file/which/doesnot/exists.py')
        error = caught.exception
        self.assertFalse(error.filename)
        self.assertTrue(error.reason)

    def test_userpass_inurl(self):
        self.fakehttp(b"HTTP/1.0 200 OK\r\n\r\nHello!")
        try:
            response = urlopen("http://user:pass@python.org/")
            self.assertEqual(response.readline(), b"Hello!")
            self.assertEqual(response.readline(), b"")
            self.assertEqual(response.geturl(), 'http://user:pass@python.org/')
            self.assertEqual(response.getcode(), 200)
        finally:
            self.unfakehttp()

    def test_userpass_inurl_w_spaces(self):
        self.fakehttp(b"HTTP/1.0 200 OK\r\n\r\nHello!")
        try:
            userpass = "a b:c d"
            url = "http://{}@python.org/".format(userpass)
            # After fakehttp() this names the fake class, whose ``buf``
            # attribute holds the request bytes that were sent.
            fakehttp_wrapper = http.client.HTTPConnection
            encoded = b64encode(userpass.encode("ASCII")).decode("ASCII")
            authorization = "Authorization: Basic %s\r\n" % encoded
            response = urlopen(url)
            # The authorization header must be in place
            self.assertIn(authorization, fakehttp_wrapper.buf.decode("UTF-8"))
            self.assertEqual(response.readline(), b"Hello!")
            self.assertEqual(response.readline(), b"")
            # the spaces are quoted in URL so no match
            self.assertNotEqual(response.geturl(), url)
            self.assertEqual(response.getcode(), 200)
        finally:
            self.unfakehttp()

    def test_URLopener_deprecation(self):
        with support.check_warnings(('',DeprecationWarning)):
            urllib.request.URLopener()
Senthil Kumaran38b968b92012-03-14 13:43:53 -0700339
class urlretrieve_FileTests(unittest.TestCase):
    """Test urllib.request.urlretrieve() on local files."""

    def setUp(self):
        # Names (absolute, or relative to the current working directory) of
        # every file the test creates.  tearDown() deletes them all.  This
        # only guarantees deletion; closing any file that is still open is
        # the responsibility of the code that opened it.
        self.tempFiles = []

        # Create the source file that most tests retrieve.
        self.registerFileForCleanUp(support.TESTFN)
        self.text = b'testing urllib.urlretrieve'
        with open(support.TESTFN, 'wb') as source:
            source.write(self.text)

    def tearDown(self):
        # Best-effort removal: a file that is already gone (or cannot be
        # removed) must not fail the test, but unrelated errors still
        # propagate.
        for each in self.tempFiles:
            try:
                os.remove(each)
            except OSError:
                pass

    def constructLocalFileUrl(self, filePath):
        """Return a file:// URL for *filePath*.

        Raises unittest.SkipTest when the absolute path cannot be encoded
        as UTF-8.
        """
        filePath = os.path.abspath(filePath)
        try:
            filePath.encode("utf-8")
        except UnicodeEncodeError:
            raise unittest.SkipTest("filePath is not encodable to utf8")
        return "file://%s" % urllib.request.pathname2url(filePath)

    def createNewTempFile(self, data=b""):
        """Create a temporary file holding *data* and return its path.

        The file is registered for deletion in tearDown() before anything
        is written, so it is cleaned up even if the write fails.
        """
        newFd, newFilePath = tempfile.mkstemp()
        self.registerFileForCleanUp(newFilePath)
        with os.fdopen(newFd, "wb") as newFile:
            newFile.write(data)
        return newFilePath

    def registerFileForCleanUp(self, fileName):
        """Remember *fileName* so that tearDown() deletes it."""
        self.tempFiles.append(fileName)

    def test_basic(self):
        # Retrieving a local file without a target name returns the file's
        # own location together with a headers object.
        result = urllib.request.urlretrieve("file:%s" % support.TESTFN)
        self.assertEqual(result[0], support.TESTFN)
        self.assertIsInstance(result[1], email.message.Message,
                              "did not get a email.message.Message instance "
                              "as second returned value")

    def test_copy(self):
        # Test that setting the filename argument works.
        second_temp = "%s.2" % support.TESTFN
        self.registerFileForCleanUp(second_temp)
        result = urllib.request.urlretrieve(
            self.constructLocalFileUrl(support.TESTFN), second_temp)
        self.assertEqual(second_temp, result[0])
        self.assertTrue(os.path.exists(second_temp), "copy of the file was not "
                                                     "made")
        with open(second_temp, 'rb') as copied:
            text = copied.read()
        self.assertEqual(self.text, text)

    def test_reporthook(self):
        # Make sure that the reporthook works.
        # One-element list so the nested hook can update the counter.
        expected_count = [0]

        def hooktester(block_count, block_read_size, file_size):
            self.assertIsInstance(block_count, int)
            self.assertIsInstance(block_read_size, int)
            self.assertIsInstance(file_size, int)
            self.assertEqual(block_count, expected_count[0])
            expected_count[0] += 1

        second_temp = "%s.2" % support.TESTFN
        self.registerFileForCleanUp(second_temp)
        urllib.request.urlretrieve(
            self.constructLocalFileUrl(support.TESTFN),
            second_temp, hooktester)

    def test_reporthook_0_bytes(self):
        # Test on zero length file. Should call reporthook only 1 time.
        report = []

        def hooktester(block_count, block_read_size, file_size):
            report.append((block_count, block_read_size, file_size))

        srcFileName = self.createNewTempFile()
        urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName),
                                   support.TESTFN, hooktester)
        self.assertEqual(len(report), 1)
        self.assertEqual(report[0][2], 0)

    def test_reporthook_5_bytes(self):
        # Test on 5 byte file. Should call reporthook only 2 times (once
        # when the "network connection" is established and once when the
        # block is read).
        report = []

        def hooktester(block_count, block_read_size, file_size):
            report.append((block_count, block_read_size, file_size))

        srcFileName = self.createNewTempFile(b"x" * 5)
        urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName),
                                   support.TESTFN, hooktester)
        self.assertEqual(len(report), 2)
        self.assertEqual(report[0][2], 5)
        self.assertEqual(report[1][2], 5)

    def test_reporthook_8193_bytes(self):
        # Test on 8193 byte file. Should call reporthook only 3 times (once
        # when the "network connection" is established, once for the next
        # 8192 bytes, and once for the last byte).
        report = []

        def hooktester(block_count, block_read_size, file_size):
            report.append((block_count, block_read_size, file_size))

        srcFileName = self.createNewTempFile(b"x" * 8193)
        urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName),
                                   support.TESTFN, hooktester)
        self.assertEqual(len(report), 3)
        self.assertEqual(report[0][2], 8193)
        self.assertEqual(report[0][1], 8192)
        self.assertEqual(report[1][1], 8192)
        self.assertEqual(report[2][1], 8192)
Skip Montanaro080c9972001-01-28 21:12:22 +0000478
Senthil Kumarance260142011-11-01 01:35:17 +0800479
class urlretrieve_HttpTests(unittest.TestCase, FakeHTTPMixin):
    """Test urllib.request.urlretrieve() using fake http connections"""

    # A response that announces 100 bytes of content but carries only a
    # three-byte body.
    _SHORT_RESPONSE = (
        b"HTTP/1.1 200 OK\n"
        b"Date: Wed, 02 Jan 2008 03:03:54 GMT\n"
        b"Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e\n"
        b"Connection: close\n"
        b"Content-Length: 100\n"
        b"Content-Type: text/html; charset=iso-8859-1\n"
        b"\n"
        b"FF\n")

    def test_short_content_raises_ContentTooShortError(self):
        self.fakehttp(self._SHORT_RESPONSE)

        def _reporthook(par1, par2, par3):
            pass

        try:
            with self.assertRaises(urllib.error.ContentTooShortError):
                urllib.request.urlretrieve('http://example.com/',
                                           reporthook=_reporthook)
        finally:
            self.unfakehttp()

    def test_short_content_raises_ContentTooShortError_without_reporthook(self):
        self.fakehttp(self._SHORT_RESPONSE)
        try:
            with self.assertRaises(urllib.error.ContentTooShortError):
                urllib.request.urlretrieve('http://example.com/')
        finally:
            self.unfakehttp()
519
520
Brett Cannon74bfd702003-04-25 09:39:47 +0000521class QuotingTests(unittest.TestCase):
522 """Tests for urllib.quote() and urllib.quote_plus()
Tim Petersc2659cf2003-05-12 20:19:37 +0000523
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000524 According to RFC 2396 (Uniform Resource Identifiers), to escape a
525 character you write it as '%' + <2 character US-ASCII hex value>.
526 The Python code of ``'%' + hex(ord(<character>))[2:]`` escapes a
527 character properly. Case does not matter on the hex letters.
Brett Cannon74bfd702003-04-25 09:39:47 +0000528
529 The various character sets specified are:
Tim Petersc2659cf2003-05-12 20:19:37 +0000530
Brett Cannon74bfd702003-04-25 09:39:47 +0000531 Reserved characters : ";/?:@&=+$,"
532 Have special meaning in URIs and must be escaped if not being used for
533 their special meaning
534 Data characters : letters, digits, and "-_.!~*'()"
535 Unreserved and do not need to be escaped; can be, though, if desired
536 Control characters : 0x00 - 0x1F, 0x7F
537 Have no use in URIs so must be escaped
538 space : 0x20
539 Must be escaped
540 Delimiters : '<>#%"'
541 Must be escaped
542 Unwise : "{}|\^[]`"
543 Must be escaped
Tim Petersc2659cf2003-05-12 20:19:37 +0000544
Brett Cannon74bfd702003-04-25 09:39:47 +0000545 """
546
547 def test_never_quote(self):
548 # Make sure quote() does not quote letters, digits, and "_,.-"
549 do_not_quote = '' .join(["ABCDEFGHIJKLMNOPQRSTUVWXYZ",
550 "abcdefghijklmnopqrstuvwxyz",
551 "0123456789",
552 "_.-"])
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000553 result = urllib.parse.quote(do_not_quote)
Brett Cannon74bfd702003-04-25 09:39:47 +0000554 self.assertEqual(do_not_quote, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000555 "using quote(): %r != %r" % (do_not_quote, result))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000556 result = urllib.parse.quote_plus(do_not_quote)
Brett Cannon74bfd702003-04-25 09:39:47 +0000557 self.assertEqual(do_not_quote, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000558 "using quote_plus(): %r != %r" % (do_not_quote, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000559
560 def test_default_safe(self):
561 # Test '/' is default value for 'safe' parameter
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000562 self.assertEqual(urllib.parse.quote.__defaults__[0], '/')
Brett Cannon74bfd702003-04-25 09:39:47 +0000563
564 def test_safe(self):
565 # Test setting 'safe' parameter does what it should do
566 quote_by_default = "<>"
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000567 result = urllib.parse.quote(quote_by_default, safe=quote_by_default)
Brett Cannon74bfd702003-04-25 09:39:47 +0000568 self.assertEqual(quote_by_default, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000569 "using quote(): %r != %r" % (quote_by_default, result))
Jeremy Hylton1ef7c6b2009-03-26 16:57:30 +0000570 result = urllib.parse.quote_plus(quote_by_default,
571 safe=quote_by_default)
Brett Cannon74bfd702003-04-25 09:39:47 +0000572 self.assertEqual(quote_by_default, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000573 "using quote_plus(): %r != %r" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000574 (quote_by_default, result))
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000575 # Safe expressed as bytes rather than str
576 result = urllib.parse.quote(quote_by_default, safe=b"<>")
577 self.assertEqual(quote_by_default, result,
578 "using quote(): %r != %r" % (quote_by_default, result))
579 # "Safe" non-ASCII characters should have no effect
580 # (Since URIs are not allowed to have non-ASCII characters)
581 result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="\xfc")
582 expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="")
583 self.assertEqual(expect, result,
584 "using quote(): %r != %r" %
585 (expect, result))
586 # Same as above, but using a bytes rather than str
587 result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe=b"\xfc")
588 expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="")
589 self.assertEqual(expect, result,
590 "using quote(): %r != %r" %
591 (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000592
593 def test_default_quoting(self):
594 # Make sure all characters that should be quoted are by default sans
595 # space (separate test for that).
596 should_quote = [chr(num) for num in range(32)] # For 0x00 - 0x1F
597 should_quote.append('<>#%"{}|\^[]`')
598 should_quote.append(chr(127)) # For 0x7F
599 should_quote = ''.join(should_quote)
600 for char in should_quote:
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000601 result = urllib.parse.quote(char)
Brett Cannon74bfd702003-04-25 09:39:47 +0000602 self.assertEqual(hexescape(char), result,
Jeremy Hylton1ef7c6b2009-03-26 16:57:30 +0000603 "using quote(): "
604 "%s should be escaped to %s, not %s" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000605 (char, hexescape(char), result))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000606 result = urllib.parse.quote_plus(char)
Brett Cannon74bfd702003-04-25 09:39:47 +0000607 self.assertEqual(hexescape(char), result,
608 "using quote_plus(): "
Tim Petersc2659cf2003-05-12 20:19:37 +0000609 "%s should be escapes to %s, not %s" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000610 (char, hexescape(char), result))
611 del should_quote
612 partial_quote = "ab[]cd"
613 expected = "ab%5B%5Dcd"
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000614 result = urllib.parse.quote(partial_quote)
Brett Cannon74bfd702003-04-25 09:39:47 +0000615 self.assertEqual(expected, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000616 "using quote(): %r != %r" % (expected, result))
Senthil Kumaran305a68e2011-09-13 06:40:27 +0800617 result = urllib.parse.quote_plus(partial_quote)
Brett Cannon74bfd702003-04-25 09:39:47 +0000618 self.assertEqual(expected, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000619 "using quote_plus(): %r != %r" % (expected, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000620
621 def test_quoting_space(self):
622 # Make sure quote() and quote_plus() handle spaces as specified in
623 # their unique way
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000624 result = urllib.parse.quote(' ')
Brett Cannon74bfd702003-04-25 09:39:47 +0000625 self.assertEqual(result, hexescape(' '),
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000626 "using quote(): %r != %r" % (result, hexescape(' ')))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000627 result = urllib.parse.quote_plus(' ')
Brett Cannon74bfd702003-04-25 09:39:47 +0000628 self.assertEqual(result, '+',
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000629 "using quote_plus(): %r != +" % result)
Brett Cannon74bfd702003-04-25 09:39:47 +0000630 given = "a b cd e f"
631 expect = given.replace(' ', hexescape(' '))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000632 result = urllib.parse.quote(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000633 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000634 "using quote(): %r != %r" % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000635 expect = given.replace(' ', '+')
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000636 result = urllib.parse.quote_plus(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000637 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000638 "using quote_plus(): %r != %r" % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000639
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000640 def test_quoting_plus(self):
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000641 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma'),
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000642 'alpha%2Bbeta+gamma')
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000643 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', '+'),
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000644 'alpha+beta+gamma')
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000645 # Test with bytes
646 self.assertEqual(urllib.parse.quote_plus(b'alpha+beta gamma'),
647 'alpha%2Bbeta+gamma')
648 # Test with safe bytes
649 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', b'+'),
650 'alpha+beta+gamma')
651
652 def test_quote_bytes(self):
653 # Bytes should quote directly to percent-encoded values
654 given = b"\xa2\xd8ab\xff"
655 expect = "%A2%D8ab%FF"
656 result = urllib.parse.quote(given)
657 self.assertEqual(expect, result,
658 "using quote(): %r != %r" % (expect, result))
659 # Encoding argument should raise type error on bytes input
660 self.assertRaises(TypeError, urllib.parse.quote, given,
661 encoding="latin-1")
662 # quote_from_bytes should work the same
663 result = urllib.parse.quote_from_bytes(given)
664 self.assertEqual(expect, result,
665 "using quote_from_bytes(): %r != %r"
666 % (expect, result))
667
668 def test_quote_with_unicode(self):
669 # Characters in Latin-1 range, encoded by default in UTF-8
670 given = "\xa2\xd8ab\xff"
671 expect = "%C2%A2%C3%98ab%C3%BF"
672 result = urllib.parse.quote(given)
673 self.assertEqual(expect, result,
674 "using quote(): %r != %r" % (expect, result))
675 # Characters in Latin-1 range, encoded by with None (default)
676 result = urllib.parse.quote(given, encoding=None, errors=None)
677 self.assertEqual(expect, result,
678 "using quote(): %r != %r" % (expect, result))
679 # Characters in Latin-1 range, encoded with Latin-1
680 given = "\xa2\xd8ab\xff"
681 expect = "%A2%D8ab%FF"
682 result = urllib.parse.quote(given, encoding="latin-1")
683 self.assertEqual(expect, result,
684 "using quote(): %r != %r" % (expect, result))
685 # Characters in BMP, encoded by default in UTF-8
686 given = "\u6f22\u5b57" # "Kanji"
687 expect = "%E6%BC%A2%E5%AD%97"
688 result = urllib.parse.quote(given)
689 self.assertEqual(expect, result,
690 "using quote(): %r != %r" % (expect, result))
691 # Characters in BMP, encoded with Latin-1
692 given = "\u6f22\u5b57"
693 self.assertRaises(UnicodeEncodeError, urllib.parse.quote, given,
694 encoding="latin-1")
695 # Characters in BMP, encoded with Latin-1, with replace error handling
696 given = "\u6f22\u5b57"
697 expect = "%3F%3F" # "??"
698 result = urllib.parse.quote(given, encoding="latin-1",
699 errors="replace")
700 self.assertEqual(expect, result,
701 "using quote(): %r != %r" % (expect, result))
702 # Characters in BMP, Latin-1, with xmlcharref error handling
703 given = "\u6f22\u5b57"
704 expect = "%26%2328450%3B%26%2323383%3B" # "&#28450;&#23383;"
705 result = urllib.parse.quote(given, encoding="latin-1",
706 errors="xmlcharrefreplace")
707 self.assertEqual(expect, result,
708 "using quote(): %r != %r" % (expect, result))
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000709
Georg Brandlfaf41492009-05-26 18:31:11 +0000710 def test_quote_plus_with_unicode(self):
711 # Encoding (latin-1) test for quote_plus
712 given = "\xa2\xd8 \xff"
713 expect = "%A2%D8+%FF"
714 result = urllib.parse.quote_plus(given, encoding="latin-1")
715 self.assertEqual(expect, result,
716 "using quote_plus(): %r != %r" % (expect, result))
717 # Errors test for quote_plus
718 given = "ab\u6f22\u5b57 cd"
719 expect = "ab%3F%3F+cd"
720 result = urllib.parse.quote_plus(given, encoding="latin-1",
721 errors="replace")
722 self.assertEqual(expect, result,
723 "using quote_plus(): %r != %r" % (expect, result))
724
Senthil Kumarand496c4c2010-07-30 19:34:36 +0000725
class UnquotingTests(unittest.TestCase):
    """Tests for unquote(), unquote_plus() and unquote_to_bytes()

    See the doc string for QuotingTests for details on quoting and such.

    """

    def test_unquoting(self):
        # Make sure unquoting of all ASCII values works
        escape_list = []
        for num in range(128):
            given = hexescape(chr(num))
            expect = chr(num)
            result = urllib.parse.unquote(given)
            self.assertEqual(expect, result,
                             "using unquote(): %r != %r" % (expect, result))
            result = urllib.parse.unquote_plus(given)
            self.assertEqual(expect, result,
                             "using unquote_plus(): %r != %r" %
                             (expect, result))
            escape_list.append(given)
        escape_string = ''.join(escape_list)
        del escape_list
        result = urllib.parse.unquote(escape_string)
        # The only '%' left must be the one decoded from its own escape.
        self.assertEqual(result.count('%'), 1,
                         "using unquote(): not all characters escaped: "
                         "%s" % result)
        # Non-string arguments must be rejected.
        self.assertRaises((TypeError, AttributeError),
                          urllib.parse.unquote, None)
        self.assertRaises((TypeError, AttributeError),
                          urllib.parse.unquote, ())
        # bytes input must be rejected too; the call is wrapped in
        # check_warnings() with a BytesWarning filter and quiet=True.
        with support.check_warnings(('', BytesWarning), quiet=True):
            self.assertRaises((TypeError, AttributeError),
                              urllib.parse.unquote, b'')

    def test_unquoting_badpercent(self):
        # Test unquoting on bad percent-escapes: they must pass through
        # unchanged.
        bad_escapes = ('%xab', '%x', '%')
        for given in bad_escapes:
            expect = given
            result = urllib.parse.unquote(given)
            self.assertEqual(expect, result, "using unquote(): %r != %r"
                             % (expect, result))
        # unquote_to_bytes
        for given in bad_escapes:
            expect = bytes(given, 'ascii')
            result = urllib.parse.unquote_to_bytes(given)
            self.assertEqual(expect, result,
                             "using unquote_to_bytes(): %r != %r"
                             % (expect, result))
        self.assertRaises((TypeError, AttributeError),
                          urllib.parse.unquote_to_bytes, None)
        self.assertRaises((TypeError, AttributeError),
                          urllib.parse.unquote_to_bytes, ())

    def test_unquoting_mixed_case(self):
        # Test unquoting on mixed-case hex digits in the percent-escapes
        given = '%Ab%eA'
        expect = b'\xab\xea'
        result = urllib.parse.unquote_to_bytes(given)
        self.assertEqual(expect, result,
                         "using unquote_to_bytes(): %r != %r"
                         % (expect, result))

    def test_unquoting_parts(self):
        # Make sure unquoting works when have non-quoted characters
        # interspersed
        given = 'ab%sd' % hexescape('c')
        expect = "abcd"
        result = urllib.parse.unquote(given)
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))
        result = urllib.parse.unquote_plus(given)
        self.assertEqual(expect, result,
                         "using unquote_plus(): %r != %r" % (expect, result))

    def test_unquoting_plus(self):
        # Test difference between unquote() and unquote_plus()
        given = "are+there+spaces..."
        # unquote() leaves '+' alone ...
        expect = given
        result = urllib.parse.unquote(given)
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))
        # ... while unquote_plus() turns each '+' into a space.
        expect = given.replace('+', ' ')
        result = urllib.parse.unquote_plus(given)
        self.assertEqual(expect, result,
                         "using unquote_plus(): %r != %r" % (expect, result))

    def test_unquote_to_bytes(self):
        given = 'br%C3%BCckner_sapporo_20050930.doc'
        expect = b'br\xc3\xbcckner_sapporo_20050930.doc'
        result = urllib.parse.unquote_to_bytes(given)
        self.assertEqual(expect, result,
                         "using unquote_to_bytes(): %r != %r"
                         % (expect, result))
        # Test on a string with unescaped non-ASCII characters
        # (Technically an invalid URI; expect those characters to be UTF-8
        # encoded).
        result = urllib.parse.unquote_to_bytes("\u6f22%C3%BC")
        expect = b'\xe6\xbc\xa2\xc3\xbc'  # UTF-8 for "\u6f22\u00fc"
        self.assertEqual(expect, result,
                         "using unquote_to_bytes(): %r != %r"
                         % (expect, result))
        # Test with a bytes as input
        given = b'%A2%D8ab%FF'
        expect = b'\xa2\xd8ab\xff'
        result = urllib.parse.unquote_to_bytes(given)
        self.assertEqual(expect, result,
                         "using unquote_to_bytes(): %r != %r"
                         % (expect, result))
        # Test with a bytes as input, with unescaped non-ASCII bytes
        # (Technically an invalid URI; expect those bytes to be preserved)
        given = b'%A2\xd8ab%FF'
        expect = b'\xa2\xd8ab\xff'
        result = urllib.parse.unquote_to_bytes(given)
        self.assertEqual(expect, result,
                         "using unquote_to_bytes(): %r != %r"
                         % (expect, result))

    def test_unquote_with_unicode(self):
        # Characters in the Latin-1 range, encoded with UTF-8
        given = 'br%C3%BCckner_sapporo_20050930.doc'
        expect = 'br\u00fcckner_sapporo_20050930.doc'
        result = urllib.parse.unquote(given)
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))
        # Same input, with encoding and errors explicitly None (default)
        result = urllib.parse.unquote(given, encoding=None, errors=None)
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))

        # Characters in the Latin-1 range, encoded with Latin-1
        result = urllib.parse.unquote('br%FCckner_sapporo_20050930.doc',
                                      encoding="latin-1")
        expect = 'br\u00fcckner_sapporo_20050930.doc'
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))

        # Characters in BMP, encoded with UTF-8
        given = "%E6%BC%A2%E5%AD%97"
        expect = "\u6f22\u5b57"  # "Kanji"
        result = urllib.parse.unquote(given)
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))

        # Decode with UTF-8, invalid sequence
        given = "%F3%B1"
        expect = "\ufffd"  # Replacement character
        result = urllib.parse.unquote(given)
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))

        # Decode with UTF-8, invalid sequence, replace errors
        result = urllib.parse.unquote(given, errors="replace")
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))

        # Decode with UTF-8, invalid sequence, ignoring errors
        given = "%F3%B1"
        expect = ""
        result = urllib.parse.unquote(given, errors="ignore")
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))

        # A mix of non-ASCII and percent-encoded characters, UTF-8
        result = urllib.parse.unquote("\u6f22%C3%BC")
        expect = '\u6f22\u00fc'
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))

        # A mix of non-ASCII and percent-encoded characters, Latin-1
        # (Note, the string contains non-Latin-1-representable characters)
        result = urllib.parse.unquote("\u6f22%FC", encoding="latin-1")
        expect = '\u6f22\u00fc'
        self.assertEqual(expect, result,
                         "using unquote(): %r != %r" % (expect, result))
Raymond Hettinger4b0f20d2005-10-15 16:41:53 +0000915
class urlencode_Tests(unittest.TestCase):
    """Tests for urlencode()"""

    def help_inputtype(self, given, test_type):
        """Helper method for testing different input types.

        'given' must lead to only the pairs:
            * 1st, 1
            * 2nd, 2
            * 3rd, 3

        Test cannot assume anything about order.  Docs make no guarantee and
        have possible dictionary input.

        'test_type' is a short description used in failure messages.

        """
        expect_somewhere = ["1st=1", "2nd=2", "3rd=3"]
        result = urllib.parse.urlencode(given)
        for expected in expect_somewhere:
            self.assertIn(expected, result,
                          "testing %s: %s not found in %s" %
                          (test_type, expected, result))
        self.assertEqual(result.count('&'), 2,
                         "testing %s: expected 2 '&'s; got %s" %
                         (test_type, result.count('&')))
        # Each pair ends and starts with a digit-bearing token ("1st=1"),
        # so the first '&' must sit between two digits.
        amp_location = result.index('&')
        on_amp_left = result[amp_location - 1]
        on_amp_right = result[amp_location + 1]
        self.assertTrue(on_amp_left.isdigit() and on_amp_right.isdigit(),
                        "testing %s: '&' not located in proper place in %s" %
                        (test_type, result))
        self.assertEqual(len(result), (5 * 3) + 2,  # 5 chars per thing and amps
                         "testing %s: "
                         "unexpected number of characters: %s != %s" %
                         (test_type, len(result), (5 * 3) + 2))

    def test_using_mapping(self):
        # Test passing in a mapping object as an argument.
        self.help_inputtype({"1st": '1', "2nd": '2', "3rd": '3'},
                            "using dict as input type")

    def test_using_sequence(self):
        # Test passing in a sequence of two-item sequences as an argument.
        self.help_inputtype([('1st', '1'), ('2nd', '2'), ('3rd', '3')],
                            "using sequence of two-item tuples as input")

    def test_quoting(self):
        # Make sure keys and values are quoted using quote_plus()
        given = {"&": "="}
        expect = "%s=%s" % (hexescape('&'), hexescape('='))
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)
        given = {"key name": "A bunch of pluses"}
        expect = "key+name=A+bunch+of+pluses"
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)

    def test_doseq(self):
        # Test that passing True for 'doseq' parameter works correctly
        given = {'sequence': ['1', '2', '3']}
        # Without doseq the list is quoted via its str() form ...
        expect = "sequence=%s" % urllib.parse.quote_plus(str(['1', '2', '3']))
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)
        # ... with doseq each element gets its own key=value pair.
        result = urllib.parse.urlencode(given, True)
        for value in given["sequence"]:
            expect = "sequence=%s" % value
            self.assertIn(expect, result)
        self.assertEqual(result.count('&'), 2,
                         "Expected 2 '&'s, got %s" % result.count('&'))

    def test_empty_sequence(self):
        self.assertEqual("", urllib.parse.urlencode({}))
        self.assertEqual("", urllib.parse.urlencode([]))

    def test_nonstring_values(self):
        self.assertEqual("a=1", urllib.parse.urlencode({"a": 1}))
        self.assertEqual("a=None", urllib.parse.urlencode({"a": None}))

    def test_nonstring_seq_values(self):
        self.assertEqual("a=1&a=2",
                         urllib.parse.urlencode({"a": [1, 2]}, True))
        self.assertEqual("a=None&a=a",
                         urllib.parse.urlencode({"a": [None, "a"]}, True))
        # A mapping used as a value is iterated, i.e. its keys are emitted.
        data = collections.OrderedDict([("a", 1), ("b", 1)])
        self.assertEqual("a=a&a=b",
                         urllib.parse.urlencode({"a": data}, True))

    def test_urlencode_encoding(self):
        # ASCII encoding. Expect %3F with errors="replace"
        given = (('\u00a0', '\u00c1'),)
        expect = '%3F=%3F'
        result = urllib.parse.urlencode(given, encoding="ASCII",
                                        errors="replace")
        self.assertEqual(expect, result)

        # Default is UTF-8 encoding.
        given = (('\u00a0', '\u00c1'),)
        expect = '%C2%A0=%C3%81'
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)

        # Latin-1 encoding.
        given = (('\u00a0', '\u00c1'),)
        expect = '%A0=%C1'
        result = urllib.parse.urlencode(given, encoding="latin-1")
        self.assertEqual(expect, result)

    def test_urlencode_encoding_doseq(self):
        # ASCII Encoding. Expect %3F with errors="replace"
        given = (('\u00a0', '\u00c1'),)
        expect = '%3F=%3F'
        result = urllib.parse.urlencode(given, doseq=True,
                                        encoding="ASCII", errors="replace")
        self.assertEqual(expect, result)

        # ASCII Encoding. On a sequence of values.
        given = (("\u00a0", (1, "\u00c1")),)
        expect = '%3F=1&%3F=%3F'
        result = urllib.parse.urlencode(given, True,
                                        encoding="ASCII", errors="replace")
        self.assertEqual(expect, result)

        # Utf-8
        given = (("\u00a0", "\u00c1"),)
        expect = '%C2%A0=%C3%81'
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

        given = (("\u00a0", (42, "\u00c1")),)
        expect = '%C2%A0=42&%C2%A0=%C3%81'
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

        # latin-1
        given = (("\u00a0", "\u00c1"),)
        expect = '%A0=%C1'
        result = urllib.parse.urlencode(given, True, encoding="latin-1")
        self.assertEqual(expect, result)

        given = (("\u00a0", (42, "\u00c1")),)
        expect = '%A0=42&%A0=%C1'
        result = urllib.parse.urlencode(given, True, encoding="latin-1")
        self.assertEqual(expect, result)

    def test_urlencode_bytes(self):
        # bytes keys and values are percent-encoded byte by byte.
        given = ((b'\xa0\x24', b'\xc1\x24'),)
        expect = '%A0%24=%C1%24'
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

        # Sequence of values
        given = ((b'\xa0\x24', (42, b'\xc1\x24')),)
        expect = '%A0%24=42&%A0%24=%C1%24'
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

    def test_urlencode_encoding_safe_parameter(self):

        # Send '$' (\x24) as safe character
        # Default utf-8 encoding

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        result = urllib.parse.urlencode(given, safe=":$")
        expect = '%A0$=%C1$'
        self.assertEqual(expect, result)

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        result = urllib.parse.urlencode(given, doseq=True, safe=":$")
        expect = '%A0$=%C1$'
        self.assertEqual(expect, result)

        # Safe parameter in sequence
        given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),)
        expect = '%A0$=%C1$&%A0$=13&%A0$=42'
        result = urllib.parse.urlencode(given, True, safe=":$")
        self.assertEqual(expect, result)

        # Test all above in latin-1 encoding

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        result = urllib.parse.urlencode(given, safe=":$",
                                        encoding="latin-1")
        expect = '%A0$=%C1$'
        self.assertEqual(expect, result)

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        expect = '%A0$=%C1$'
        result = urllib.parse.urlencode(given, doseq=True, safe=":$",
                                        encoding="latin-1")
        # This result used to be computed but never checked.
        self.assertEqual(expect, result)

        given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),)
        expect = '%A0$=%C1$&%A0$=13&%A0$=42'
        result = urllib.parse.urlencode(given, True, safe=":$",
                                        encoding="latin-1")
        self.assertEqual(expect, result)
1110
class Pathname_Tests(unittest.TestCase):
    """Test pathname2url() and url2pathname()"""

    def test_basic(self):
        # Make sure simple tests pass
        expected_path = os.path.join("parts", "of", "a", "path")
        expected_url = "parts/of/a/path"
        result = urllib.request.pathname2url(expected_path)
        self.assertEqual(expected_url, result,
                         "pathname2url() failed; %s != %s" %
                         (result, expected_url))
        result = urllib.request.url2pathname(expected_url)
        self.assertEqual(expected_path, result,
                         "url2pathname() failed; %s != %s" %
                         (result, expected_path))

    def test_quoting(self):
        # Test automatic quoting and unquoting works for pathname2url() and
        # url2pathname() respectively
        given = os.path.join("needs", "quot=ing", "here")
        expect = "needs/%s/here" % urllib.parse.quote("quot=ing")
        result = urllib.request.pathname2url(given)
        self.assertEqual(expect, result,
                         "pathname2url() failed; %s != %s" %
                         (expect, result))
        # Round trip: the URL just produced must map back to the path.
        expect = given
        result = urllib.request.url2pathname(result)
        self.assertEqual(expect, result,
                         "url2pathname() failed; %s != %s" %
                         (expect, result))
        given = os.path.join("make sure", "using_quote")
        expect = "%s/using_quote" % urllib.parse.quote("make sure")
        result = urllib.request.pathname2url(given)
        self.assertEqual(expect, result,
                         "pathname2url() failed; %s != %s" %
                         (expect, result))
        # A '+' in the URL must be kept as-is, not turned into a space.
        given = "make+sure/using_unquote"
        expect = os.path.join("make+sure", "using_unquote")
        result = urllib.request.url2pathname(given)
        self.assertEqual(expect, result,
                         "url2pathname() failed; %s != %s" %
                         (expect, result))

    @unittest.skipUnless(sys.platform == 'win32',
                         'test specific to the urllib.url2path function.')
    def test_ntpath(self):
        # Several spellings of a drive-root URL must all map to 'C:\'.
        given = ('/C:/', '///C:/', '/C|//')
        expect = 'C:\\'
        for url in given:
            result = urllib.request.url2pathname(url)
            self.assertEqual(expect, result,
                             'urllib.request.url2pathname() failed; %s != %s' %
                             (expect, result))
        given = '///C|/path'
        expect = 'C:\\path'
        result = urllib.request.url2pathname(given)
        self.assertEqual(expect, result,
                         'urllib.request.url2pathname() failed; %s != %s' %
                         (expect, result))
1170
class Utility_Tests(unittest.TestCase):
    """Test case covering assorted urllib utility functions."""

    def test_splitpasswd(self):
        """Check splitpasswd() on a range of passwords.

        Some of the passwords are not sensible, but they are included to
        conform to RFC2617 and to address issue4675.
        """
        # (input, expected (user, password) pair)
        samples = (
            ('user:ab', ('user', 'ab')),
            ('user:a\nb', ('user', 'a\nb')),
            ('user:a\tb', ('user', 'a\tb')),
            ('user:a\rb', ('user', 'a\rb')),
            ('user:a\fb', ('user', 'a\fb')),
            ('user:a\vb', ('user', 'a\vb')),
            ('user:a:b', ('user', 'a:b')),
            ('user:a b', ('user', 'a b')),
            ('user 2:ab', ('user 2', 'ab')),
            ('user+1:a+b', ('user+1', 'a+b')),
        )
        for userinfo, wanted in samples:
            self.assertEqual(wanted, urllib.parse.splitpasswd(userinfo))

    def test_thishost(self):
        """Check that urllib.request.thishost() returns a tuple."""
        host_info = urllib.request.thishost()
        self.assertIsInstance(host_info, tuple)
1192
Senthil Kumaran690ce9b2009-05-05 18:41:13 +00001193
class URLopener_Tests(unittest.TestCase):
    """Test case for the open() method of the URLopener class."""

    def test_quoted_open(self):
        class EchoOpener(urllib.request.URLopener):
            # Handler for the made-up "spam" scheme: hand back whatever
            # open() passed in so the test can inspect it.
            def open_spam(self, url):
                return url

        # A space in the URL must reach the handler percent-encoded.
        seen = EchoOpener().open('spam://example/ /')
        self.assertEqual(seen, '//example/%20/')

        # test the safe characters are not quoted by urlopen
        seen = EchoOpener().open(
            "spam://c:|windows%/:=&?~#+!$,;'@()*[]|/path/")
        self.assertEqual(seen, "//c:|windows%/:=&?~#+!$,;'@()*[]|/path/")
1209
# The FTP wrapper tests below are just commented out.
# I can't really tell why they keep failing on Windows and SPARC.
# Everywhere else they work OK, but on those machines they sometimes
# fail in one of the tests, sometimes in another.  I have a Linux box, and
# the tests pass there.
# If anybody has one of the problematic environments, please help!
# . Facundo
1217#
1218# def server(evt):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001219# import socket, time
Guido van Rossume7ba4952007-06-06 23:52:48 +00001220# serv = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
1221# serv.settimeout(3)
1222# serv.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
1223# serv.bind(("", 9093))
1224# serv.listen(5)
1225# try:
1226# conn, addr = serv.accept()
1227# conn.send("1 Hola mundo\n")
1228# cantdata = 0
1229# while cantdata < 13:
1230# data = conn.recv(13-cantdata)
1231# cantdata += len(data)
1232# time.sleep(.3)
1233# conn.send("2 No more lines\n")
1234# conn.close()
1235# except socket.timeout:
1236# pass
1237# finally:
1238# serv.close()
1239# evt.set()
1240#
1241# class FTPWrapperTests(unittest.TestCase):
1242#
1243# def setUp(self):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001244# import ftplib, time, threading
Guido van Rossume7ba4952007-06-06 23:52:48 +00001245# ftplib.FTP.port = 9093
1246# self.evt = threading.Event()
1247# threading.Thread(target=server, args=(self.evt,)).start()
1248# time.sleep(.1)
1249#
1250# def tearDown(self):
1251# self.evt.wait()
1252#
1253# def testBasic(self):
1254# # connects
1255# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
Georg Brandlf78e02b2008-06-10 17:40:04 +00001256# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001257#
1258# def testTimeoutNone(self):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001259# # global default timeout is ignored
1260# import socket
Benjamin Petersonc9c0f202009-06-30 23:06:06 +00001261# self.assertTrue(socket.getdefaulttimeout() is None)
Guido van Rossume7ba4952007-06-06 23:52:48 +00001262# socket.setdefaulttimeout(30)
1263# try:
1264# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1265# finally:
Georg Brandlf78e02b2008-06-10 17:40:04 +00001266# socket.setdefaulttimeout(None)
Guido van Rossume7ba4952007-06-06 23:52:48 +00001267# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
Georg Brandlf78e02b2008-06-10 17:40:04 +00001268# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001269#
Georg Brandlf78e02b2008-06-10 17:40:04 +00001270# def testTimeoutDefault(self):
1271# # global default timeout is used
1272# import socket
Benjamin Petersonc9c0f202009-06-30 23:06:06 +00001273# self.assertTrue(socket.getdefaulttimeout() is None)
Georg Brandlf78e02b2008-06-10 17:40:04 +00001274# socket.setdefaulttimeout(30)
1275# try:
1276# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1277# finally:
1278# socket.setdefaulttimeout(None)
1279# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1280# ftp.close()
1281#
1282# def testTimeoutValue(self):
1283# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [],
1284# timeout=30)
1285# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1286# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001287
class RequestTests(unittest.TestCase):
    """Unit tests for urllib.request.Request."""

    def test_default_values(self):
        # Without data the method defaults to GET, with data to POST.
        url = "http://www.python.org"
        without_data = urllib.request.Request(url)
        self.assertEqual(without_data.get_method(), 'GET')
        with_data = urllib.request.Request(url, {})
        self.assertEqual(with_data.get_method(), 'POST')

    def test_with_method_arg(self):
        # An explicit 'method' wins whether or not data is supplied.
        make_request = urllib.request.Request
        url = "http://www.python.org"
        for positional in ((url,), (url, {})):
            req = make_request(*positional, method='HEAD')
            self.assertEqual(req.method, 'HEAD')
            self.assertEqual(req.get_method(), 'HEAD')
        # Reassigning the attribute afterwards is honoured by get_method().
        req = make_request(url, method='GET')
        self.assertEqual(req.get_method(), 'GET')
        req.method = 'HEAD'
        self.assertEqual(req.get_method(), 'HEAD')
Skip Montanaro080c9972001-01-28 21:12:22 +00001310
1311
def test_main():
    """Hand the listed test case classes to support.run_unittest()."""
    test_classes = (
        urlopen_FileTests,
        urlopen_HttpTests,
        urlretrieve_FileTests,
        urlretrieve_HttpTests,
        ProxyTests,
        QuotingTests,
        UnquotingTests,
        urlencode_Tests,
        Pathname_Tests,
        Utility_Tests,
        URLopener_Tests,
        #FTPWrapperTests,
        RequestTests,
    )
    support.run_unittest(*test_classes)
Brett Cannon74bfd702003-04-25 09:39:47 +00001328
1329
1330
# Run the suite when this file is executed directly as a script.
if __name__ == '__main__':
    test_main()