blob: 98308b6af1c5c15bb707b10a33a39ca7b730108d [file] [log] [blame]
"""Regression tests for urllib"""
2
Jeremy Hylton1afc1692008-06-18 20:49:58 +00003import urllib.parse
4import urllib.request
Georg Brandl24420152008-05-26 16:32:26 +00005import http.client
Barry Warsaw820c1202008-06-12 04:06:45 +00006import email.message
Jeremy Hylton66dc8c52007-08-04 03:42:26 +00007import io
Brett Cannon74bfd702003-04-25 09:39:47 +00008import unittest
Benjamin Petersonee8712c2008-05-20 21:35:26 +00009from test import support
Brett Cannon74bfd702003-04-25 09:39:47 +000010import os
Georg Brandl5a650a22005-08-26 08:51:34 +000011import tempfile
Jeremy Hylton6102e292000-08-31 15:48:10 +000012
def hexescape(char):
    """Return the RFC 2396 percent-escape of a single character.

    The result is '%' followed by the character's code point written in
    upper-case hexadecimal, zero-padded to at least two digits.
    """
    return "%%%02X" % ord(char)
Jeremy Hylton6102e292000-08-31 15:48:10 +000019
# Shortcut for testing FancyURLopener
_urlopener = None


def urlopen(url, data=None, proxies=None):
    """urlopen(url [, data]) -> open file-like object

    Open *url* through a FancyURLopener.  When *proxies* is given, a fresh
    opener configured with those proxies is used for this call only.
    Otherwise a single module-wide opener is created on first use and
    shared by later calls.  *data* is forwarded to the opener only when it
    is not None.
    """
    global _urlopener
    if proxies is not None:
        opener = urllib.request.FancyURLopener(proxies=proxies)
    else:
        if not _urlopener:
            # Lazily build the shared opener the first time it is needed.
            _urlopener = urllib.request.FancyURLopener()
        opener = _urlopener
    if data is None:
        return opener.open(url)
    return opener.open(url, data)
36
class urlopen_FileTests(unittest.TestCase):
    """Test urlopen() opening a temporary file.

    Try to test as much functionality as possible so as to cut down on reliance
    on connecting to the Net for testing.

    """

    def setUp(self):
        # Create a temp file to use for testing
        self.text = bytes("test_urllib: %s\n" % self.__class__.__name__,
                          "ascii")
        with open(support.TESTFN, 'wb') as f:
            f.write(self.text)
        # Register the removal before calling urlopen(): tearDown() is not
        # run when setUp() fails, but registered cleanups are, so the temp
        # file no longer leaks if opening the URL raises.  Cleanups run
        # after tearDown(), so the object is still closed before the file
        # is removed.
        self.addCleanup(os.remove, support.TESTFN)
        self.pathname = support.TESTFN
        self.returned_obj = urlopen("file:%s" % self.pathname)

    def tearDown(self):
        """Shut down the open object"""
        self.returned_obj.close()

    def test_interface(self):
        # Make sure object returned by urlopen() has the specified methods
        for attr in ("read", "readline", "readlines", "fileno",
                     "close", "info", "geturl", "getcode", "__iter__"):
            self.assertTrue(hasattr(self.returned_obj, attr),
                            "object returned by urlopen() lacks %s attribute" %
                            attr)

    def test_read(self):
        self.assertEqual(self.text, self.returned_obj.read())

    def test_readline(self):
        self.assertEqual(self.text, self.returned_obj.readline())
        self.assertEqual(b'', self.returned_obj.readline(),
                         "calling readline() after exhausting the file did not"
                         " return an empty string")

    def test_readlines(self):
        lines_list = self.returned_obj.readlines()
        self.assertEqual(len(lines_list), 1,
                         "readlines() returned the wrong number of lines")
        self.assertEqual(lines_list[0], self.text,
                         "readlines() returned improper text")

    def test_fileno(self):
        file_num = self.returned_obj.fileno()
        self.assertIsInstance(file_num, int, "fileno() did not return an int")
        self.assertEqual(os.read(file_num, len(self.text)), self.text,
                         "Reading on the file descriptor returned by fileno() "
                         "did not return the expected text")

    def test_close(self):
        # Test close() by calling it here and then having it be called again
        # by the tearDown() method for the test
        self.returned_obj.close()

    def test_info(self):
        self.assertIsInstance(self.returned_obj.info(), email.message.Message)

    def test_geturl(self):
        self.assertEqual(self.returned_obj.geturl(), self.pathname)

    def test_getcode(self):
        self.assertIsNone(self.returned_obj.getcode())

    def test_iter(self):
        # Test iterator
        # Don't need to count number of iterations since test would fail the
        # instant it returned anything beyond the first line from the
        # comparison
        for line in self.returned_obj:
            self.assertEqual(line, self.text)
Skip Montanaro080c9972001-01-28 21:12:22 +0000114
class ProxyTests(unittest.TestCase):
    """Test proxy discovery from environment variables."""

    def setUp(self):
        # Records changes to env vars
        self.env = support.EnvironmentVarGuard()
        # Delete all proxy related env vars.  Iterate over a snapshot of the
        # names: unsetting a variable while walking the live key view
        # changes the mapping's size during iteration.
        for k in list(os.environ):
            if 'proxy' in k.lower():
                self.env.unset(k)

    def tearDown(self):
        # Restore all proxy related env vars
        self.env.__exit__()
        del self.env

    def test_getproxies_environment_keep_no_proxies(self):
        self.env.set('NO_PROXY', 'localhost')
        proxies = urllib.request.getproxies_environment()
        # getproxies_environment use lowered case truncated (no '_proxy') keys
        self.assertEqual('localhost', proxies['no'])
Benjamin Peterson9bc93512008-09-22 22:10:59 +0000135
136
class urlopen_HttpTests(unittest.TestCase):
    """Test urlopen() opening a fake http connection."""

    def fakehttp(self, fakedata):
        """Replace http.client.HTTPConnection with one that serves *fakedata*.

        The real class is stashed on the test instance so that unfakehttp()
        can put it back.
        """
        class FakeSocket(io.BytesIO):
            # In-memory stand-in for a socket: outgoing data is discarded
            # and the canned bytes are what gets read back.
            def sendall(self, data):
                pass

            def makefile(self, *args, **kwds):
                return self

            def read(self, amt=None):
                # Reading after close yields empty bytes instead of raising.
                return b"" if self.closed else io.BytesIO.read(self, amt)

            def readline(self, length=None):
                return b"" if self.closed else io.BytesIO.readline(self, length)

        class FakeHTTPConnection(http.client.HTTPConnection):
            def connect(self):
                self.sock = FakeSocket(fakedata)

        self._connection_class = http.client.HTTPConnection
        http.client.HTTPConnection = FakeHTTPConnection

    def unfakehttp(self):
        """Restore the HTTPConnection class saved by fakehttp()."""
        http.client.HTTPConnection = self._connection_class

    def _check_hello_response(self, url):
        # Shared scenario: the fake server answers b"Hello!" and the
        # returned object must report *url* and status code 200.
        self.fakehttp(b"Hello!")
        try:
            fp = urlopen(url)
            self.assertEqual(fp.readline(), b"Hello!")
            self.assertEqual(fp.readline(), b"")
            self.assertEqual(fp.geturl(), url)
            self.assertEqual(fp.getcode(), 200)
        finally:
            self.unfakehttp()

    def test_read(self):
        self._check_hello_response("http://python.org/")

    def test_read_bogus(self):
        # urlopen() should raise IOError for many error codes.
        self.fakehttp(b'''HTTP/1.1 401 Authentication Required
Date: Wed, 02 Jan 2008 03:03:54 GMT
Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e
Connection: close
Content-Type: text/html; charset=iso-8859-1
''')
        try:
            self.assertRaises(IOError, urlopen, "http://python.org/")
        finally:
            self.unfakehttp()

    def test_empty_socket(self):
        # urlopen() raises IOError if the underlying socket does not send any
        # data. (#1680230)
        self.fakehttp(b'')
        try:
            self.assertRaises(IOError, urlopen, "http://something")
        finally:
            self.unfakehttp()

    def test_userpass_inurl(self):
        self._check_hello_response("http://user:pass@python.org/")
203
class urlretrieve_FileTests(unittest.TestCase):
    """Test urllib.request.urlretrieve() on local files"""

    def setUp(self):
        # Create a list of temporary files. Each item in the list is a file
        # name (absolute path or relative to the current working directory).
        # All files in this list will be deleted in the tearDown method. Note,
        # this only helps to makes sure temporary files get deleted, but it
        # does nothing about trying to close files that may still be open. It
        # is the responsibility of the developer to properly close files even
        # when exceptional conditions occur.
        self.tempFiles = []

        # Create a temporary file.
        self.registerFileForCleanUp(support.TESTFN)
        self.text = b'testing urllib.urlretrieve'
        with open(support.TESTFN, 'wb') as FILE:
            FILE.write(self.text)

    def tearDown(self):
        # Delete the temporary files.
        for each in self.tempFiles:
            try:
                os.remove(each)
            except OSError:
                # Best effort: a registered file may never have been created
                # or may already be gone.  Other errors are not hidden.
                pass

    def constructLocalFileUrl(self, filePath):
        """Return a file:// URL for the absolute form of *filePath*."""
        return "file://%s" % urllib.request.pathname2url(
            os.path.abspath(filePath))

    def createNewTempFile(self, data=b""):
        """Creates a new temporary file containing the specified data,
        registers the file for deletion during the test fixture tear down, and
        returns the absolute path of the file."""

        newFd, newFilePath = tempfile.mkstemp()
        self.registerFileForCleanUp(newFilePath)
        with os.fdopen(newFd, "wb") as newFile:
            newFile.write(data)
        return newFilePath

    def registerFileForCleanUp(self, fileName):
        """Remember *fileName* so that tearDown() removes it."""
        self.tempFiles.append(fileName)

    def _retrieve_with_report(self, data):
        # Retrieve a fresh temp file holding *data* into TESTFN and return
        # the list of (count, block_size, total_size) reporthook calls.
        report = []

        def hooktester(count, block_size, total_size):
            report.append((count, block_size, total_size))

        srcFileName = self.createNewTempFile(data)
        urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName),
                                   support.TESTFN, hooktester)
        return report

    def test_basic(self):
        # Make sure that a local file just gets its own location returned and
        # a headers value is returned.
        result = urllib.request.urlretrieve("file:%s" % support.TESTFN)
        self.assertEqual(result[0], support.TESTFN)
        self.assertIsInstance(result[1], email.message.Message,
                              "did not get a email.message.Message instance "
                              "as second returned value")

    def test_copy(self):
        # Test that setting the filename argument works.
        second_temp = "%s.2" % support.TESTFN
        self.registerFileForCleanUp(second_temp)
        result = urllib.request.urlretrieve(self.constructLocalFileUrl(
            support.TESTFN), second_temp)
        self.assertEqual(second_temp, result[0])
        self.assertTrue(os.path.exists(second_temp), "copy of the file was not "
                                                     "made")
        with open(second_temp, 'rb') as FILE:
            text = FILE.read()
        self.assertEqual(self.text, text)

    def test_reporthook(self):
        # Make sure that the reporthook works.
        # One-element list so the nested hook can update the running count.
        expected_count = [0]

        def hooktester(count, block_size, total_size):
            self.assertIsInstance(count, int)
            self.assertIsInstance(block_size, int)
            self.assertIsInstance(total_size, int)
            self.assertEqual(count, expected_count[0])
            expected_count[0] += 1

        second_temp = "%s.2" % support.TESTFN
        self.registerFileForCleanUp(second_temp)
        urllib.request.urlretrieve(
            self.constructLocalFileUrl(support.TESTFN),
            second_temp, hooktester)

    def test_reporthook_0_bytes(self):
        # Test on zero length file. Should call reporthook only 1 time.
        report = self._retrieve_with_report(b"")
        self.assertEqual(len(report), 1)
        self.assertEqual(report[0][2], 0)

    def test_reporthook_5_bytes(self):
        # Test on 5 byte file. Should call reporthook only 2 times (once when
        # the "network connection" is established and once when the block is
        # read). Since the block size is 8192 bytes, only one block read is
        # required to read the entire file.
        report = self._retrieve_with_report(b"x" * 5)
        self.assertEqual(len(report), 2)
        self.assertEqual(report[0][1], 8192)
        self.assertEqual(report[0][2], 5)

    def test_reporthook_8193_bytes(self):
        # Test on 8193 byte file. Should call reporthook only 3 times (once
        # when the "network connection" is established, once for the next 8192
        # bytes, and once for the last byte).
        report = self._retrieve_with_report(b"x" * 8193)
        self.assertEqual(len(report), 3)
        self.assertEqual(report[0][1], 8192)
        self.assertEqual(report[0][2], 8193)
Skip Montanaro080c9972001-01-28 21:12:22 +0000337
class QuotingTests(unittest.TestCase):
    r"""Tests for urllib.parse.quote() and urllib.parse.quote_plus()

    According to RFC 2396 (Uniform Resource Identifiers), to escape a
    character you write it as '%' + <2 character US-ASCII hex value>.
    The Python code of ``'%' + hex(ord(<character>))[2:]`` escapes a
    character properly. Case does not matter on the hex letters.

    The various character sets specified are:

    Reserved characters : ";/?:@&=+$,"
        Have special meaning in URIs and must be escaped if not being used for
        their special meaning
    Data characters : letters, digits, and "-_.!~*'()"
        Unreserved and do not need to be escaped; can be, though, if desired
    Control characters : 0x00 - 0x1F, 0x7F
        Have no use in URIs so must be escaped
    space : 0x20
        Must be escaped
    Delimiters : '<>#%"'
        Must be escaped
    Unwise : "{}|\^[]`"
        Must be escaped

    """

    def test_never_quote(self):
        # Make sure quote() does not quote letters, digits, and "_.-"
        do_not_quote = ''.join(["ABCDEFGHIJKLMNOPQRSTUVWXYZ",
                                "abcdefghijklmnopqrstuvwxyz",
                                "0123456789",
                                "_.-"])
        result = urllib.parse.quote(do_not_quote)
        self.assertEqual(do_not_quote, result,
                         "using quote(): %r != %r" % (do_not_quote, result))
        result = urllib.parse.quote_plus(do_not_quote)
        self.assertEqual(do_not_quote, result,
                         "using quote_plus(): %r != %r" % (do_not_quote, result))

    def test_default_safe(self):
        # Test '/' is default value for 'safe' parameter
        self.assertEqual(urllib.parse.quote.__defaults__[0], '/')

    def test_safe(self):
        # Test setting 'safe' parameter does what it should do
        quote_by_default = "<>"
        result = urllib.parse.quote(quote_by_default, safe=quote_by_default)
        self.assertEqual(quote_by_default, result,
                         "using quote(): %r != %r" % (quote_by_default, result))
        result = urllib.parse.quote_plus(quote_by_default,
                                         safe=quote_by_default)
        self.assertEqual(quote_by_default, result,
                         "using quote_plus(): %r != %r" %
                         (quote_by_default, result))
        # Safe expressed as bytes rather than str
        result = urllib.parse.quote(quote_by_default, safe=b"<>")
        self.assertEqual(quote_by_default, result,
                         "using quote(): %r != %r" % (quote_by_default, result))
        # "Safe" non-ASCII characters should have no effect
        # (Since URIs are not allowed to have non-ASCII characters)
        result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="\xfc")
        expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="")
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" %
                         (expect, result))
        # Same as above, but using a bytes rather than str
        result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe=b"\xfc")
        expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="")
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" %
                         (expect, result))

    def test_default_quoting(self):
        # Make sure all characters that should be quoted are by default sans
        # space (separate test for that).
        should_quote = [chr(num) for num in range(32)]  # For 0x00 - 0x1F
        # The backslash is written as an explicit escape; the character set
        # is unchanged.
        should_quote.append('<>#%"{}|\\^[]`')
        should_quote.append(chr(127))  # For 0x7F
        should_quote = ''.join(should_quote)
        for char in should_quote:
            result = urllib.parse.quote(char)
            self.assertEqual(hexescape(char), result,
                             "using quote(): "
                             "%s should be escaped to %s, not %s" %
                             (char, hexescape(char), result))
            result = urllib.parse.quote_plus(char)
            self.assertEqual(hexescape(char), result,
                             "using quote_plus(): "
                             "%s should be escapes to %s, not %s" %
                             (char, hexescape(char), result))
        del should_quote
        partial_quote = "ab[]cd"
        expected = "ab%5B%5Dcd"
        result = urllib.parse.quote(partial_quote)
        self.assertEqual(expected, result,
                         "using quote(): %r != %r" % (expected, result))
        # Actually exercise quote_plus() here instead of re-checking the
        # quote() result a second time.
        result = urllib.parse.quote_plus(partial_quote)
        self.assertEqual(expected, result,
                         "using quote_plus(): %r != %r" % (expected, result))

    def test_quoting_space(self):
        # Make sure quote() and quote_plus() handle spaces as specified in
        # their unique way
        result = urllib.parse.quote(' ')
        self.assertEqual(result, hexescape(' '),
                         "using quote(): %r != %r" % (result, hexescape(' ')))
        result = urllib.parse.quote_plus(' ')
        self.assertEqual(result, '+',
                         "using quote_plus(): %r != +" % result)
        given = "a b cd e f"
        expect = given.replace(' ', hexescape(' '))
        result = urllib.parse.quote(given)
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))
        expect = given.replace(' ', '+')
        result = urllib.parse.quote_plus(given)
        self.assertEqual(expect, result,
                         "using quote_plus(): %r != %r" % (expect, result))

    def test_quoting_plus(self):
        self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma'),
                         'alpha%2Bbeta+gamma')
        self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', '+'),
                         'alpha+beta+gamma')
        # Test with bytes
        self.assertEqual(urllib.parse.quote_plus(b'alpha+beta gamma'),
                         'alpha%2Bbeta+gamma')
        # Test with safe bytes
        self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', b'+'),
                         'alpha+beta+gamma')

    def test_quote_bytes(self):
        # Bytes should quote directly to percent-encoded values
        given = b"\xa2\xd8ab\xff"
        expect = "%A2%D8ab%FF"
        result = urllib.parse.quote(given)
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))
        # Encoding argument should raise type error on bytes input
        self.assertRaises(TypeError, urllib.parse.quote, given,
                          encoding="latin-1")
        # quote_from_bytes should work the same
        result = urllib.parse.quote_from_bytes(given)
        self.assertEqual(expect, result,
                         "using quote_from_bytes(): %r != %r"
                         % (expect, result))

    def test_quote_with_unicode(self):
        # Characters in Latin-1 range, encoded by default in UTF-8
        given = "\xa2\xd8ab\xff"
        expect = "%C2%A2%C3%98ab%C3%BF"
        result = urllib.parse.quote(given)
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))
        # Characters in Latin-1 range, encoded by with None (default)
        result = urllib.parse.quote(given, encoding=None, errors=None)
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))
        # Characters in Latin-1 range, encoded with Latin-1
        given = "\xa2\xd8ab\xff"
        expect = "%A2%D8ab%FF"
        result = urllib.parse.quote(given, encoding="latin-1")
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))
        # Characters in BMP, encoded by default in UTF-8
        given = "\u6f22\u5b57"              # "Kanji"
        expect = "%E6%BC%A2%E5%AD%97"
        result = urllib.parse.quote(given)
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))
        # Characters in BMP, encoded with Latin-1
        given = "\u6f22\u5b57"
        self.assertRaises(UnicodeEncodeError, urllib.parse.quote, given,
                          encoding="latin-1")
        # Characters in BMP, encoded with Latin-1, with replace error handling
        given = "\u6f22\u5b57"
        expect = "%3F%3F"                   # "??"
        result = urllib.parse.quote(given, encoding="latin-1",
                                    errors="replace")
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))
        # Characters in BMP, Latin-1, with xmlcharref error handling
        given = "\u6f22\u5b57"
        expect = "%26%2328450%3B%26%2323383%3B"     # "&#28450;&#23383;"
        result = urllib.parse.quote(given, encoding="latin-1",
                                    errors="xmlcharrefreplace")
        self.assertEqual(expect, result,
                         "using quote(): %r != %r" % (expect, result))

    def test_quote_plus_with_unicode(self):
        # Encoding (latin-1) test for quote_plus
        given = "\xa2\xd8 \xff"
        expect = "%A2%D8+%FF"
        result = urllib.parse.quote_plus(given, encoding="latin-1")
        self.assertEqual(expect, result,
                         "using quote_plus(): %r != %r" % (expect, result))
        # Errors test for quote_plus
        given = "ab\u6f22\u5b57 cd"
        expect = "ab%3F%3F+cd"
        result = urllib.parse.quote_plus(given, encoding="latin-1",
                                         errors="replace")
        self.assertEqual(expect, result,
                         "using quote_plus(): %r != %r" % (expect, result))
540
Senthil Kumarand496c4c2010-07-30 19:34:36 +0000541
Brett Cannon74bfd702003-04-25 09:39:47 +0000542class UnquotingTests(unittest.TestCase):
543 """Tests for unquote() and unquote_plus()
Tim Petersc2659cf2003-05-12 20:19:37 +0000544
Brett Cannon74bfd702003-04-25 09:39:47 +0000545 See the doc string for quoting_Tests for details on quoting and such.
546
547 """
548
549 def test_unquoting(self):
550 # Make sure unquoting of all ASCII values works
551 escape_list = []
552 for num in range(128):
553 given = hexescape(chr(num))
554 expect = chr(num)
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000555 result = urllib.parse.unquote(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000556 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000557 "using unquote(): %r != %r" % (expect, result))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000558 result = urllib.parse.unquote_plus(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000559 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000560 "using unquote_plus(): %r != %r" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000561 (expect, result))
562 escape_list.append(given)
563 escape_string = ''.join(escape_list)
564 del escape_list
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000565 result = urllib.parse.unquote(escape_string)
Brett Cannon74bfd702003-04-25 09:39:47 +0000566 self.assertEqual(result.count('%'), 1,
Brett Cannon74bfd702003-04-25 09:39:47 +0000567 "using unquote(): not all characters escaped: "
568 "%s" % result)
Georg Brandl604ef372010-07-31 08:20:02 +0000569 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, None)
570 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, ())
Florent Xiclunac049fca2010-07-31 08:56:55 +0000571 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, b'')
Brett Cannon74bfd702003-04-25 09:39:47 +0000572
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000573 def test_unquoting_badpercent(self):
574 # Test unquoting on bad percent-escapes
575 given = '%xab'
576 expect = given
577 result = urllib.parse.unquote(given)
578 self.assertEqual(expect, result, "using unquote(): %r != %r"
579 % (expect, result))
580 given = '%x'
581 expect = given
582 result = urllib.parse.unquote(given)
583 self.assertEqual(expect, result, "using unquote(): %r != %r"
584 % (expect, result))
585 given = '%'
586 expect = given
587 result = urllib.parse.unquote(given)
588 self.assertEqual(expect, result, "using unquote(): %r != %r"
589 % (expect, result))
590 # unquote_to_bytes
591 given = '%xab'
592 expect = bytes(given, 'ascii')
593 result = urllib.parse.unquote_to_bytes(given)
594 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r"
595 % (expect, result))
596 given = '%x'
597 expect = bytes(given, 'ascii')
598 result = urllib.parse.unquote_to_bytes(given)
599 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r"
600 % (expect, result))
601 given = '%'
602 expect = bytes(given, 'ascii')
603 result = urllib.parse.unquote_to_bytes(given)
604 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r"
605 % (expect, result))
Georg Brandl604ef372010-07-31 08:20:02 +0000606 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote_to_bytes, None)
607 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote_to_bytes, ())
Senthil Kumaran79e17f62010-07-19 18:17:19 +0000608
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000609 def test_unquoting_mixed_case(self):
610 # Test unquoting on mixed-case hex digits in the percent-escapes
611 given = '%Ab%eA'
612 expect = b'\xab\xea'
613 result = urllib.parse.unquote_to_bytes(given)
614 self.assertEqual(expect, result,
615 "using unquote_to_bytes(): %r != %r"
616 % (expect, result))
617
def test_unquoting_parts(self):
    # Make sure unquoting works when quoted and non-quoted characters are
    # interspersed: only the escaped 'c' in the middle needs decoding.
    given = 'ab%sd' % hexescape('c')
    expect = "abcd"
    result = urllib.parse.unquote(given)
    # The message names unquote(), which is the function exercised here.
    self.assertEqual(expect, result,
                     "using unquote(): %r != %r" % (expect, result))
    result = urllib.parse.unquote_plus(given)
    self.assertEqual(expect, result,
                     "using unquote_plus(): %r != %r" % (expect, result))
Tim Petersc2659cf2003-05-12 20:19:37 +0000629
Brett Cannon74bfd702003-04-25 09:39:47 +0000630 def test_unquoting_plus(self):
631 # Test difference between unquote() and unquote_plus()
632 given = "are+there+spaces..."
633 expect = given
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000634 result = urllib.parse.unquote(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000635 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000636 "using unquote(): %r != %r" % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000637 expect = given.replace('+', ' ')
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000638 result = urllib.parse.unquote_plus(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000639 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000640 "using unquote_plus(): %r != %r" % (expect, result))
641
642 def test_unquote_to_bytes(self):
643 given = 'br%C3%BCckner_sapporo_20050930.doc'
644 expect = b'br\xc3\xbcckner_sapporo_20050930.doc'
645 result = urllib.parse.unquote_to_bytes(given)
646 self.assertEqual(expect, result,
647 "using unquote_to_bytes(): %r != %r"
648 % (expect, result))
649 # Test on a string with unescaped non-ASCII characters
650 # (Technically an invalid URI; expect those characters to be UTF-8
651 # encoded).
652 result = urllib.parse.unquote_to_bytes("\u6f22%C3%BC")
653 expect = b'\xe6\xbc\xa2\xc3\xbc' # UTF-8 for "\u6f22\u00fc"
654 self.assertEqual(expect, result,
655 "using unquote_to_bytes(): %r != %r"
656 % (expect, result))
657 # Test with a bytes as input
658 given = b'%A2%D8ab%FF'
659 expect = b'\xa2\xd8ab\xff'
660 result = urllib.parse.unquote_to_bytes(given)
661 self.assertEqual(expect, result,
662 "using unquote_to_bytes(): %r != %r"
663 % (expect, result))
664 # Test with a bytes as input, with unescaped non-ASCII bytes
665 # (Technically an invalid URI; expect those bytes to be preserved)
666 given = b'%A2\xd8ab%FF'
667 expect = b'\xa2\xd8ab\xff'
668 result = urllib.parse.unquote_to_bytes(given)
669 self.assertEqual(expect, result,
670 "using unquote_to_bytes(): %r != %r"
671 % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000672
Raymond Hettinger4b0f20d2005-10-15 16:41:53 +0000673 def test_unquote_with_unicode(self):
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000674 # Characters in the Latin-1 range, encoded with UTF-8
675 given = 'br%C3%BCckner_sapporo_20050930.doc'
676 expect = 'br\u00fcckner_sapporo_20050930.doc'
677 result = urllib.parse.unquote(given)
678 self.assertEqual(expect, result,
679 "using unquote(): %r != %r" % (expect, result))
680 # Characters in the Latin-1 range, encoded with None (default)
681 result = urllib.parse.unquote(given, encoding=None, errors=None)
682 self.assertEqual(expect, result,
683 "using unquote(): %r != %r" % (expect, result))
684
685 # Characters in the Latin-1 range, encoded with Latin-1
686 result = urllib.parse.unquote('br%FCckner_sapporo_20050930.doc',
687 encoding="latin-1")
688 expect = 'br\u00fcckner_sapporo_20050930.doc'
689 self.assertEqual(expect, result,
690 "using unquote(): %r != %r" % (expect, result))
691
692 # Characters in BMP, encoded with UTF-8
693 given = "%E6%BC%A2%E5%AD%97"
694 expect = "\u6f22\u5b57" # "Kanji"
695 result = urllib.parse.unquote(given)
696 self.assertEqual(expect, result,
697 "using unquote(): %r != %r" % (expect, result))
698
699 # Decode with UTF-8, invalid sequence
700 given = "%F3%B1"
701 expect = "\ufffd" # Replacement character
702 result = urllib.parse.unquote(given)
703 self.assertEqual(expect, result,
704 "using unquote(): %r != %r" % (expect, result))
705
706 # Decode with UTF-8, invalid sequence, replace errors
707 result = urllib.parse.unquote(given, errors="replace")
708 self.assertEqual(expect, result,
709 "using unquote(): %r != %r" % (expect, result))
710
711 # Decode with UTF-8, invalid sequence, ignoring errors
712 given = "%F3%B1"
713 expect = ""
714 result = urllib.parse.unquote(given, errors="ignore")
715 self.assertEqual(expect, result,
716 "using unquote(): %r != %r" % (expect, result))
717
718 # A mix of non-ASCII and percent-encoded characters, UTF-8
719 result = urllib.parse.unquote("\u6f22%C3%BC")
720 expect = '\u6f22\u00fc'
721 self.assertEqual(expect, result,
722 "using unquote(): %r != %r" % (expect, result))
723
724 # A mix of non-ASCII and percent-encoded characters, Latin-1
725 # (Note, the string contains non-Latin-1-representable characters)
726 result = urllib.parse.unquote("\u6f22%FC", encoding="latin-1")
727 expect = '\u6f22\u00fc'
728 self.assertEqual(expect, result,
729 "using unquote(): %r != %r" % (expect, result))
Raymond Hettinger4b0f20d2005-10-15 16:41:53 +0000730
Brett Cannon74bfd702003-04-25 09:39:47 +0000731class urlencode_Tests(unittest.TestCase):
732 """Tests for urlencode()"""
733
734 def help_inputtype(self, given, test_type):
735 """Helper method for testing different input types.
Tim Petersc2659cf2003-05-12 20:19:37 +0000736
Brett Cannon74bfd702003-04-25 09:39:47 +0000737 'given' must lead to only the pairs:
738 * 1st, 1
739 * 2nd, 2
740 * 3rd, 3
Tim Petersc2659cf2003-05-12 20:19:37 +0000741
Brett Cannon74bfd702003-04-25 09:39:47 +0000742 Test cannot assume anything about order. Docs make no guarantee and
743 have possible dictionary input.
Tim Petersc2659cf2003-05-12 20:19:37 +0000744
Brett Cannon74bfd702003-04-25 09:39:47 +0000745 """
746 expect_somewhere = ["1st=1", "2nd=2", "3rd=3"]
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000747 result = urllib.parse.urlencode(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000748 for expected in expect_somewhere:
Ezio Melottib58e0bd2010-01-23 15:40:09 +0000749 self.assertIn(expected, result,
Brett Cannon74bfd702003-04-25 09:39:47 +0000750 "testing %s: %s not found in %s" %
751 (test_type, expected, result))
752 self.assertEqual(result.count('&'), 2,
753 "testing %s: expected 2 '&'s; got %s" %
754 (test_type, result.count('&')))
755 amp_location = result.index('&')
756 on_amp_left = result[amp_location - 1]
757 on_amp_right = result[amp_location + 1]
Benjamin Petersonc9c0f202009-06-30 23:06:06 +0000758 self.assertTrue(on_amp_left.isdigit() and on_amp_right.isdigit(),
Brett Cannon74bfd702003-04-25 09:39:47 +0000759 "testing %s: '&' not located in proper place in %s" %
760 (test_type, result))
761 self.assertEqual(len(result), (5 * 3) + 2, #5 chars per thing and amps
762 "testing %s: "
763 "unexpected number of characters: %s != %s" %
764 (test_type, len(result), (5 * 3) + 2))
765
766 def test_using_mapping(self):
767 # Test passing in a mapping object as an argument.
768 self.help_inputtype({"1st":'1', "2nd":'2', "3rd":'3'},
769 "using dict as input type")
770
771 def test_using_sequence(self):
772 # Test passing in a sequence of two-item sequences as an argument.
773 self.help_inputtype([('1st', '1'), ('2nd', '2'), ('3rd', '3')],
774 "using sequence of two-item tuples as input")
775
776 def test_quoting(self):
777 # Make sure keys and values are quoted using quote_plus()
778 given = {"&":"="}
779 expect = "%s=%s" % (hexescape('&'), hexescape('='))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000780 result = urllib.parse.urlencode(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000781 self.assertEqual(expect, result)
782 given = {"key name":"A bunch of pluses"}
783 expect = "key+name=A+bunch+of+pluses"
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000784 result = urllib.parse.urlencode(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000785 self.assertEqual(expect, result)
786
787 def test_doseq(self):
788 # Test that passing True for 'doseq' parameter works correctly
789 given = {'sequence':['1', '2', '3']}
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000790 expect = "sequence=%s" % urllib.parse.quote_plus(str(['1', '2', '3']))
791 result = urllib.parse.urlencode(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000792 self.assertEqual(expect, result)
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000793 result = urllib.parse.urlencode(given, True)
Brett Cannon74bfd702003-04-25 09:39:47 +0000794 for value in given["sequence"]:
795 expect = "sequence=%s" % value
Ezio Melottib58e0bd2010-01-23 15:40:09 +0000796 self.assertIn(expect, result)
Brett Cannon74bfd702003-04-25 09:39:47 +0000797 self.assertEqual(result.count('&'), 2,
798 "Expected 2 '&'s, got %s" % result.count('&'))
799
Jeremy Hylton1ef7c6b2009-03-26 16:57:30 +0000800 def test_empty_sequence(self):
801 self.assertEqual("", urllib.parse.urlencode({}))
802 self.assertEqual("", urllib.parse.urlencode([]))
803
804 def test_nonstring_values(self):
805 self.assertEqual("a=1", urllib.parse.urlencode({"a": 1}))
806 self.assertEqual("a=None", urllib.parse.urlencode({"a": None}))
807
808 def test_nonstring_seq_values(self):
809 self.assertEqual("a=1&a=2", urllib.parse.urlencode({"a": [1, 2]}, True))
810 self.assertEqual("a=None&a=a",
811 urllib.parse.urlencode({"a": [None, "a"]}, True))
812 self.assertEqual("a=a&a=b",
813 urllib.parse.urlencode({"a": {"a": 1, "b": 1}}, True))
814
Senthil Kumarandf022da2010-07-03 17:48:22 +0000815 def test_urlencode_encoding(self):
816 # ASCII encoding. Expect %3F with errors="replace'
817 given = (('\u00a0', '\u00c1'),)
818 expect = '%3F=%3F'
819 result = urllib.parse.urlencode(given, encoding="ASCII", errors="replace")
820 self.assertEqual(expect, result)
821
822 # Default is UTF-8 encoding.
823 given = (('\u00a0', '\u00c1'),)
824 expect = '%C2%A0=%C3%81'
825 result = urllib.parse.urlencode(given)
826 self.assertEqual(expect, result)
827
828 # Latin-1 encoding.
829 given = (('\u00a0', '\u00c1'),)
830 expect = '%A0=%C1'
831 result = urllib.parse.urlencode(given, encoding="latin-1")
832 self.assertEqual(expect, result)
833
834 def test_urlencode_encoding_doseq(self):
835 # ASCII Encoding. Expect %3F with errors="replace'
836 given = (('\u00a0', '\u00c1'),)
837 expect = '%3F=%3F'
838 result = urllib.parse.urlencode(given, doseq=True,
839 encoding="ASCII", errors="replace")
840 self.assertEqual(expect, result)
841
842 # ASCII Encoding. On a sequence of values.
843 given = (("\u00a0", (1, "\u00c1")),)
844 expect = '%3F=1&%3F=%3F'
845 result = urllib.parse.urlencode(given, True,
846 encoding="ASCII", errors="replace")
847 self.assertEqual(expect, result)
848
849 # Utf-8
850 given = (("\u00a0", "\u00c1"),)
851 expect = '%C2%A0=%C3%81'
852 result = urllib.parse.urlencode(given, True)
853 self.assertEqual(expect, result)
854
855 given = (("\u00a0", (42, "\u00c1")),)
856 expect = '%C2%A0=42&%C2%A0=%C3%81'
857 result = urllib.parse.urlencode(given, True)
858 self.assertEqual(expect, result)
859
860 # latin-1
861 given = (("\u00a0", "\u00c1"),)
862 expect = '%A0=%C1'
863 result = urllib.parse.urlencode(given, True, encoding="latin-1")
864 self.assertEqual(expect, result)
865
866 given = (("\u00a0", (42, "\u00c1")),)
867 expect = '%A0=42&%A0=%C1'
868 result = urllib.parse.urlencode(given, True, encoding="latin-1")
869 self.assertEqual(expect, result)
870
871 def test_urlencode_bytes(self):
872 given = ((b'\xa0\x24', b'\xc1\x24'),)
873 expect = '%A0%24=%C1%24'
874 result = urllib.parse.urlencode(given)
875 self.assertEqual(expect, result)
876 result = urllib.parse.urlencode(given, True)
877 self.assertEqual(expect, result)
878
879 # Sequence of values
880 given = ((b'\xa0\x24', (42, b'\xc1\x24')),)
881 expect = '%A0%24=42&%A0%24=%C1%24'
882 result = urllib.parse.urlencode(given, True)
883 self.assertEqual(expect, result)
884
885 def test_urlencode_encoding_safe_parameter(self):
886
887 # Send '$' (\x24) as safe character
888 # Default utf-8 encoding
889
890 given = ((b'\xa0\x24', b'\xc1\x24'),)
891 result = urllib.parse.urlencode(given, safe=":$")
892 expect = '%A0$=%C1$'
893 self.assertEqual(expect, result)
894
895 given = ((b'\xa0\x24', b'\xc1\x24'),)
896 result = urllib.parse.urlencode(given, doseq=True, safe=":$")
897 expect = '%A0$=%C1$'
898 self.assertEqual(expect, result)
899
900 # Safe parameter in sequence
901 given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),)
902 expect = '%A0$=%C1$&%A0$=13&%A0$=42'
903 result = urllib.parse.urlencode(given, True, safe=":$")
904 self.assertEqual(expect, result)
905
906 # Test all above in latin-1 encoding
907
908 given = ((b'\xa0\x24', b'\xc1\x24'),)
909 result = urllib.parse.urlencode(given, safe=":$",
910 encoding="latin-1")
911 expect = '%A0$=%C1$'
912 self.assertEqual(expect, result)
913
914 given = ((b'\xa0\x24', b'\xc1\x24'),)
915 expect = '%A0$=%C1$'
916 result = urllib.parse.urlencode(given, doseq=True, safe=":$",
917 encoding="latin-1")
918
919 given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),)
920 expect = '%A0$=%C1$&%A0$=13&%A0$=42'
921 result = urllib.parse.urlencode(given, True, safe=":$",
922 encoding="latin-1")
923 self.assertEqual(expect, result)
924
class Pathname_Tests(unittest.TestCase):
    """Test pathname2url() and url2pathname()"""

    def test_basic(self):
        # Make sure simple tests pass: a path built with the platform's
        # separator maps to a '/'-separated URL path and back again.
        expected_path = os.path.join("parts", "of", "a", "path")
        expected_url = "parts/of/a/path"
        result = urllib.request.pathname2url(expected_path)
        self.assertEqual(expected_url, result,
                         "pathname2url() failed; %s != %s" %
                         (result, expected_url))
        result = urllib.request.url2pathname(expected_url)
        self.assertEqual(expected_path, result,
                         "url2pathname() failed; %s != %s" %
                         (result, expected_path))

    def test_quoting(self):
        # Test automatic quoting and unquoting works for pathname2url() and
        # url2pathname() respectively
        given = os.path.join("needs", "quot=ing", "here")
        expect = "needs/%s/here" % urllib.parse.quote("quot=ing")
        result = urllib.request.pathname2url(given)
        self.assertEqual(expect, result,
                         "pathname2url() failed; %s != %s" %
                         (expect, result))
        # Round trip: converting the URL back must give the original path.
        expect = given
        result = urllib.request.url2pathname(result)
        self.assertEqual(expect, result,
                         "url2pathname() failed; %s != %s" %
                         (expect, result))
        given = os.path.join("make sure", "using_quote")
        expect = "%s/using_quote" % urllib.parse.quote("make sure")
        result = urllib.request.pathname2url(given)
        self.assertEqual(expect, result,
                         "pathname2url() failed; %s != %s" %
                         (expect, result))
        # A '+' in the URL must survive as a literal '+' in the path.
        given = "make+sure/using_unquote"
        expect = os.path.join("make+sure", "using_unquote")
        result = urllib.request.url2pathname(given)
        self.assertEqual(expect, result,
                         "url2pathname() failed; %s != %s" %
                         (expect, result))
Tim Petersc2659cf2003-05-12 20:19:37 +0000967
class Utility_Tests(unittest.TestCase):
    """Testcase to test the various utility functions in the urllib."""

    def test_splitpasswd(self):
        """Some of the password examples are not sensible, but they are
        included to conform to RFC2617 and to address issue4675.
        """
        # Everything after the first ':' is the password, including
        # whitespace characters and further colons.
        passwords = ('ab', 'a\nb', 'a\tb', 'a\rb', 'a\fb', 'a\vb', 'a:b')
        for password in passwords:
            self.assertEqual(('user', password),
                             urllib.parse.splitpasswd('user:' + password))
982
Senthil Kumaran690ce9b2009-05-05 18:41:13 +0000983
class URLopener_Tests(unittest.TestCase):
    """Testcase to test the open method of URLopener class."""

    def test_quoted_open(self):
        class EchoURLopener(urllib.request.URLopener):
            # Handler for the made-up 'spam' scheme: hand back the URL it
            # was given, so the test can see what open() passed along.
            def open_spam(self, url):
                return url

        cases = (
            # A space in the URL gets quoted.
            ('spam://example/ /', '//example/%20/'),
            # test the safe characters are not quoted by urlopen
            ("spam://c:|windows%/:=&?~#+!$,;'@()*[]|/path/",
             "//c:|windows%/:=&?~#+!$,;'@()*[]|/path/"),
        )
        for url, expected in cases:
            opened = EchoURLopener().open(url)
            self.assertEqual(opened, expected)
999
# Just commented them out.
# Can't really tell why they keep failing on Windows and SPARC.
# Everywhere else they work OK, but on those machines they sometimes
# fail in one of the tests, sometimes in another. I have a Linux box, and
# the tests go OK.
# If anybody has one of the problematic environments, please help!
# . Facundo
1007#
1008# def server(evt):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001009# import socket, time
Guido van Rossume7ba4952007-06-06 23:52:48 +00001010# serv = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
1011# serv.settimeout(3)
1012# serv.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
1013# serv.bind(("", 9093))
1014# serv.listen(5)
1015# try:
1016# conn, addr = serv.accept()
1017# conn.send("1 Hola mundo\n")
1018# cantdata = 0
1019# while cantdata < 13:
1020# data = conn.recv(13-cantdata)
1021# cantdata += len(data)
1022# time.sleep(.3)
1023# conn.send("2 No more lines\n")
1024# conn.close()
1025# except socket.timeout:
1026# pass
1027# finally:
1028# serv.close()
1029# evt.set()
1030#
1031# class FTPWrapperTests(unittest.TestCase):
1032#
1033# def setUp(self):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001034# import ftplib, time, threading
Guido van Rossume7ba4952007-06-06 23:52:48 +00001035# ftplib.FTP.port = 9093
1036# self.evt = threading.Event()
1037# threading.Thread(target=server, args=(self.evt,)).start()
1038# time.sleep(.1)
1039#
1040# def tearDown(self):
1041# self.evt.wait()
1042#
1043# def testBasic(self):
1044# # connects
1045# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
Georg Brandlf78e02b2008-06-10 17:40:04 +00001046# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001047#
1048# def testTimeoutNone(self):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001049# # global default timeout is ignored
1050# import socket
Benjamin Petersonc9c0f202009-06-30 23:06:06 +00001051# self.assertTrue(socket.getdefaulttimeout() is None)
Guido van Rossume7ba4952007-06-06 23:52:48 +00001052# socket.setdefaulttimeout(30)
1053# try:
1054# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1055# finally:
Georg Brandlf78e02b2008-06-10 17:40:04 +00001056# socket.setdefaulttimeout(None)
Guido van Rossume7ba4952007-06-06 23:52:48 +00001057# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
Georg Brandlf78e02b2008-06-10 17:40:04 +00001058# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001059#
Georg Brandlf78e02b2008-06-10 17:40:04 +00001060# def testTimeoutDefault(self):
1061# # global default timeout is used
1062# import socket
Benjamin Petersonc9c0f202009-06-30 23:06:06 +00001063# self.assertTrue(socket.getdefaulttimeout() is None)
Georg Brandlf78e02b2008-06-10 17:40:04 +00001064# socket.setdefaulttimeout(30)
1065# try:
1066# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1067# finally:
1068# socket.setdefaulttimeout(None)
1069# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1070# ftp.close()
1071#
1072# def testTimeoutValue(self):
1073# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [],
1074# timeout=30)
1075# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1076# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001077
Skip Montanaro080c9972001-01-28 21:12:22 +00001078
1079
def test_main():
    # Collect the enabled test case classes of this module and pass them,
    # in this order, to support.run_unittest().
    enabled = (
        urlopen_FileTests,
        urlopen_HttpTests,
        urlretrieve_FileTests,
        ProxyTests,
        QuotingTests,
        UnquotingTests,
        urlencode_Tests,
        Pathname_Tests,
        Utility_Tests,
        URLopener_Tests,
        #FTPWrapperTests,
    )
    support.run_unittest(*enabled)
Brett Cannon74bfd702003-04-25 09:39:47 +00001094
1095
1096
# Run the whole suite when this file is executed as a script.
if __name__ == '__main__':
    test_main()