blob: cea153e907a6330afa0e7d30d326605ceb95979e [file] [log] [blame]
"""Regression tests for urllib"""
2
Jeremy Hylton1afc1692008-06-18 20:49:58 +00003import urllib.parse
4import urllib.request
Georg Brandl24420152008-05-26 16:32:26 +00005import http.client
Barry Warsaw820c1202008-06-12 04:06:45 +00006import email.message
Jeremy Hylton66dc8c52007-08-04 03:42:26 +00007import io
Brett Cannon74bfd702003-04-25 09:39:47 +00008import unittest
Benjamin Petersonee8712c2008-05-20 21:35:26 +00009from test import support
Brett Cannon74bfd702003-04-25 09:39:47 +000010import os
Georg Brandl5a650a22005-08-26 08:51:34 +000011import tempfile
Jeremy Hylton6102e292000-08-31 15:48:10 +000012
def hexescape(char):
    """Return the RFC 2396 percent-escape of a single character.

    The result is '%' followed by the character's code point written in
    upper-case hexadecimal and zero-padded to at least two digits.
    """
    return "%{:02X}".format(ord(char))
Jeremy Hylton6102e292000-08-31 15:48:10 +000019
# Shortcut for testing FancyURLopener: the opener used for proxy-less calls
# is created on first use and then shared by every later call.
_urlopener = None


def urlopen(url, data=None, proxies=None):
    """urlopen(url [, data]) -> open file-like object

    When *proxies* is given, a fresh FancyURLopener configured with those
    proxies is used for this call only.  Otherwise the module-level opener
    is used (and created the first time it is needed).  *data* is passed on
    to the opener's open() only when it is not None.
    """
    global _urlopener
    if proxies is not None:
        opener = urllib.request.FancyURLopener(proxies=proxies)
    else:
        if not _urlopener:
            _urlopener = urllib.request.FancyURLopener()
        opener = _urlopener
    if data is None:
        return opener.open(url)
    return opener.open(url, data)
36
class urlopen_FileTests(unittest.TestCase):
    """Test urlopen() opening a temporary file.

    Try to test as much functionality as possible so as to cut down on reliance
    on connecting to the Net for testing.

    """

    def setUp(self):
        """Write a one-line temp file and open it through a file: URL."""
        # Create a temp file to use for testing
        self.text = bytes("test_urllib: %s\n" % self.__class__.__name__,
                          "ascii")
        with open(support.TESTFN, 'wb') as f:
            f.write(self.text)
        self.pathname = support.TESTFN
        try:
            self.returned_obj = urlopen("file:%s" % self.pathname)
        except Exception:
            # unittest does not call tearDown() when setUp() raises, so
            # remove the temp file here instead of leaving it behind.
            os.remove(self.pathname)
            raise

    def tearDown(self):
        """Shut down the open object"""
        self.returned_obj.close()
        os.remove(support.TESTFN)

    def test_interface(self):
        # Make sure object returned by urlopen() has the specified methods
        for attr in ("read", "readline", "readlines", "fileno",
                     "close", "info", "geturl", "getcode", "__iter__"):
            self.assertTrue(hasattr(self.returned_obj, attr),
                            "object returned by urlopen() lacks %s attribute" %
                            attr)

    def test_read(self):
        self.assertEqual(self.text, self.returned_obj.read())

    def test_readline(self):
        self.assertEqual(self.text, self.returned_obj.readline())
        self.assertEqual(b'', self.returned_obj.readline(),
                         "calling readline() after exhausting the file did not"
                         " return an empty string")

    def test_readlines(self):
        lines_list = self.returned_obj.readlines()
        self.assertEqual(len(lines_list), 1,
                         "readlines() returned the wrong number of lines")
        self.assertEqual(lines_list[0], self.text,
                         "readlines() returned improper text")

    def test_fileno(self):
        file_num = self.returned_obj.fileno()
        self.assertIsInstance(file_num, int, "fileno() did not return an int")
        self.assertEqual(os.read(file_num, len(self.text)), self.text,
                         "Reading on the file descriptor returned by fileno() "
                         "did not return the expected text")

    def test_close(self):
        # Test close() by calling it here and then having it be called again
        # by the tearDown() method for the test
        self.returned_obj.close()

    def test_info(self):
        self.assertIsInstance(self.returned_obj.info(), email.message.Message)

    def test_geturl(self):
        self.assertEqual(self.returned_obj.geturl(), self.pathname)

    def test_getcode(self):
        # No status code is expected for an object opened from a file: URL.
        self.assertIsNone(self.returned_obj.getcode())

    def test_iter(self):
        # Test iterator
        # Don't need to count number of iterations since test would fail the
        # instant it returned anything beyond the first line from the
        # comparison
        for line in self.returned_obj.__iter__():
            self.assertEqual(line, self.text)
class ProxyTests(unittest.TestCase):
    """Test urllib.request.getproxies_environment() with a clean environment."""

    def setUp(self):
        # Records changes to env vars
        self.env = support.EnvironmentVarGuard()
        # Delete all proxy related env vars.  Iterate over a snapshot of the
        # names: unset() presumably removes the variable from os.environ, and
        # a mapping must not change size while it is being iterated.
        for k in list(os.environ):
            if 'proxy' in k.lower():
                self.env.unset(k)

    def tearDown(self):
        # Restore all proxy related env vars
        self.env.__exit__()
        del self.env

    def test_getproxies_environment_keep_no_proxies(self):
        self.env.set('NO_PROXY', 'localhost')
        proxies = urllib.request.getproxies_environment()
        # getproxies_environment use lowered case truncated (no '_proxy') keys
        self.assertEqual('localhost', proxies['no'])
Benjamin Peterson9bc93512008-09-22 22:10:59 +0000135
136
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000137class urlopen_HttpTests(unittest.TestCase):
138 """Test urlopen() opening a fake http connection."""
139
140 def fakehttp(self, fakedata):
Jeremy Hylton66dc8c52007-08-04 03:42:26 +0000141 class FakeSocket(io.BytesIO):
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000142 def sendall(self, str): pass
Nick Coghlan598c3a82009-02-08 04:01:00 +0000143 def makefile(self, *args, **kwds):
144 return self
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000145 def read(self, amt=None):
Jeremy Hylton66dc8c52007-08-04 03:42:26 +0000146 if self.closed: return b""
147 return io.BytesIO.read(self, amt)
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000148 def readline(self, length=None):
Jeremy Hylton66dc8c52007-08-04 03:42:26 +0000149 if self.closed: return b""
150 return io.BytesIO.readline(self, length)
Georg Brandl24420152008-05-26 16:32:26 +0000151 class FakeHTTPConnection(http.client.HTTPConnection):
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000152 def connect(self):
153 self.sock = FakeSocket(fakedata)
Georg Brandl24420152008-05-26 16:32:26 +0000154 self._connection_class = http.client.HTTPConnection
155 http.client.HTTPConnection = FakeHTTPConnection
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000156
157 def unfakehttp(self):
Georg Brandl24420152008-05-26 16:32:26 +0000158 http.client.HTTPConnection = self._connection_class
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000159
160 def test_read(self):
Jeremy Hylton66dc8c52007-08-04 03:42:26 +0000161 self.fakehttp(b"Hello!")
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000162 try:
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000163 fp = urlopen("http://python.org/")
Jeremy Hylton66dc8c52007-08-04 03:42:26 +0000164 self.assertEqual(fp.readline(), b"Hello!")
165 self.assertEqual(fp.readline(), b"")
Christian Heimes9bd667a2008-01-20 15:14:11 +0000166 self.assertEqual(fp.geturl(), 'http://python.org/')
167 self.assertEqual(fp.getcode(), 200)
Hye-Shik Chang39aef792004-06-05 13:30:56 +0000168 finally:
169 self.unfakehttp()
170
Christian Heimes57dddfb2008-01-02 18:30:52 +0000171 def test_read_bogus(self):
172 # urlopen() should raise IOError for many error codes.
173 self.fakehttp(b'''HTTP/1.1 401 Authentication Required
174Date: Wed, 02 Jan 2008 03:03:54 GMT
175Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e
176Connection: close
177Content-Type: text/html; charset=iso-8859-1
178''')
179 try:
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000180 self.assertRaises(IOError, urlopen, "http://python.org/")
Christian Heimes57dddfb2008-01-02 18:30:52 +0000181 finally:
182 self.unfakehttp()
183
Guido van Rossumd8faa362007-04-27 19:54:29 +0000184 def test_empty_socket(self):
Jeremy Hylton66dc8c52007-08-04 03:42:26 +0000185 # urlopen() raises IOError if the underlying socket does not send any
186 # data. (#1680230)
Christian Heimes57dddfb2008-01-02 18:30:52 +0000187 self.fakehttp(b'')
Guido van Rossumd8faa362007-04-27 19:54:29 +0000188 try:
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000189 self.assertRaises(IOError, urlopen, "http://something")
Guido van Rossumd8faa362007-04-27 19:54:29 +0000190 finally:
191 self.unfakehttp()
192
Brett Cannon19691362003-04-29 05:08:06 +0000193class urlretrieve_FileTests(unittest.TestCase):
Brett Cannon74bfd702003-04-25 09:39:47 +0000194 """Test urllib.urlretrieve() on local files"""
Skip Montanaro080c9972001-01-28 21:12:22 +0000195
Brett Cannon19691362003-04-29 05:08:06 +0000196 def setUp(self):
Georg Brandl5a650a22005-08-26 08:51:34 +0000197 # Create a list of temporary files. Each item in the list is a file
198 # name (absolute path or relative to the current working directory).
199 # All files in this list will be deleted in the tearDown method. Note,
200 # this only helps to makes sure temporary files get deleted, but it
201 # does nothing about trying to close files that may still be open. It
202 # is the responsibility of the developer to properly close files even
203 # when exceptional conditions occur.
204 self.tempFiles = []
205
Brett Cannon19691362003-04-29 05:08:06 +0000206 # Create a temporary file.
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000207 self.registerFileForCleanUp(support.TESTFN)
Guido van Rossuma0982942007-07-10 08:30:03 +0000208 self.text = b'testing urllib.urlretrieve'
Georg Brandl5a650a22005-08-26 08:51:34 +0000209 try:
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000210 FILE = open(support.TESTFN, 'wb')
Georg Brandl5a650a22005-08-26 08:51:34 +0000211 FILE.write(self.text)
212 FILE.close()
213 finally:
214 try: FILE.close()
215 except: pass
Brett Cannon19691362003-04-29 05:08:06 +0000216
217 def tearDown(self):
Georg Brandl5a650a22005-08-26 08:51:34 +0000218 # Delete the temporary files.
219 for each in self.tempFiles:
220 try: os.remove(each)
221 except: pass
222
223 def constructLocalFileUrl(self, filePath):
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000224 return "file://%s" % urllib.request.pathname2url(
225 os.path.abspath(filePath))
Georg Brandl5a650a22005-08-26 08:51:34 +0000226
Guido van Rossum70d0dda2007-08-29 01:53:26 +0000227 def createNewTempFile(self, data=b""):
Georg Brandl5a650a22005-08-26 08:51:34 +0000228 """Creates a new temporary file containing the specified data,
229 registers the file for deletion during the test fixture tear down, and
230 returns the absolute path of the file."""
231
232 newFd, newFilePath = tempfile.mkstemp()
233 try:
234 self.registerFileForCleanUp(newFilePath)
235 newFile = os.fdopen(newFd, "wb")
236 newFile.write(data)
237 newFile.close()
238 finally:
239 try: newFile.close()
240 except: pass
241 return newFilePath
242
243 def registerFileForCleanUp(self, fileName):
244 self.tempFiles.append(fileName)
Brett Cannon19691362003-04-29 05:08:06 +0000245
246 def test_basic(self):
247 # Make sure that a local file just gets its own location returned and
248 # a headers value is returned.
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000249 result = urllib.request.urlretrieve("file:%s" % support.TESTFN)
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000250 self.assertEqual(result[0], support.TESTFN)
Ezio Melottie9615932010-01-24 19:26:24 +0000251 self.assertIsInstance(result[1], email.message.Message,
252 "did not get a email.message.Message instance "
253 "as second returned value")
Brett Cannon19691362003-04-29 05:08:06 +0000254
255 def test_copy(self):
256 # Test that setting the filename argument works.
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000257 second_temp = "%s.2" % support.TESTFN
Georg Brandl5a650a22005-08-26 08:51:34 +0000258 self.registerFileForCleanUp(second_temp)
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000259 result = urllib.request.urlretrieve(self.constructLocalFileUrl(
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000260 support.TESTFN), second_temp)
Brett Cannon19691362003-04-29 05:08:06 +0000261 self.assertEqual(second_temp, result[0])
Benjamin Petersonc9c0f202009-06-30 23:06:06 +0000262 self.assertTrue(os.path.exists(second_temp), "copy of the file was not "
Brett Cannon19691362003-04-29 05:08:06 +0000263 "made")
Alex Martelli01c77c62006-08-24 02:58:11 +0000264 FILE = open(second_temp, 'rb')
Brett Cannon19691362003-04-29 05:08:06 +0000265 try:
266 text = FILE.read()
Brett Cannon19691362003-04-29 05:08:06 +0000267 FILE.close()
Georg Brandl5a650a22005-08-26 08:51:34 +0000268 finally:
269 try: FILE.close()
270 except: pass
Brett Cannon19691362003-04-29 05:08:06 +0000271 self.assertEqual(self.text, text)
272
273 def test_reporthook(self):
274 # Make sure that the reporthook works.
275 def hooktester(count, block_size, total_size, count_holder=[0]):
Ezio Melottie9615932010-01-24 19:26:24 +0000276 self.assertIsInstance(count, int)
277 self.assertIsInstance(block_size, int)
278 self.assertIsInstance(total_size, int)
Brett Cannon19691362003-04-29 05:08:06 +0000279 self.assertEqual(count, count_holder[0])
280 count_holder[0] = count_holder[0] + 1
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000281 second_temp = "%s.2" % support.TESTFN
Georg Brandl5a650a22005-08-26 08:51:34 +0000282 self.registerFileForCleanUp(second_temp)
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000283 urllib.request.urlretrieve(
284 self.constructLocalFileUrl(support.TESTFN),
Georg Brandl5a650a22005-08-26 08:51:34 +0000285 second_temp, hooktester)
286
287 def test_reporthook_0_bytes(self):
288 # Test on zero length file. Should call reporthook only 1 time.
289 report = []
290 def hooktester(count, block_size, total_size, _report=report):
291 _report.append((count, block_size, total_size))
292 srcFileName = self.createNewTempFile()
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000293 urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName),
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000294 support.TESTFN, hooktester)
Georg Brandl5a650a22005-08-26 08:51:34 +0000295 self.assertEqual(len(report), 1)
296 self.assertEqual(report[0][2], 0)
297
298 def test_reporthook_5_bytes(self):
299 # Test on 5 byte file. Should call reporthook only 2 times (once when
300 # the "network connection" is established and once when the block is
301 # read). Since the block size is 8192 bytes, only one block read is
302 # required to read the entire file.
303 report = []
304 def hooktester(count, block_size, total_size, _report=report):
305 _report.append((count, block_size, total_size))
Guido van Rossum70d0dda2007-08-29 01:53:26 +0000306 srcFileName = self.createNewTempFile(b"x" * 5)
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000307 urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName),
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000308 support.TESTFN, hooktester)
Georg Brandl5a650a22005-08-26 08:51:34 +0000309 self.assertEqual(len(report), 2)
310 self.assertEqual(report[0][1], 8192)
311 self.assertEqual(report[0][2], 5)
312
313 def test_reporthook_8193_bytes(self):
314 # Test on 8193 byte file. Should call reporthook only 3 times (once
315 # when the "network connection" is established, once for the next 8192
316 # bytes, and once for the last byte).
317 report = []
318 def hooktester(count, block_size, total_size, _report=report):
319 _report.append((count, block_size, total_size))
Guido van Rossum70d0dda2007-08-29 01:53:26 +0000320 srcFileName = self.createNewTempFile(b"x" * 8193)
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000321 urllib.request.urlretrieve(self.constructLocalFileUrl(srcFileName),
Benjamin Petersonee8712c2008-05-20 21:35:26 +0000322 support.TESTFN, hooktester)
Georg Brandl5a650a22005-08-26 08:51:34 +0000323 self.assertEqual(len(report), 3)
324 self.assertEqual(report[0][1], 8192)
325 self.assertEqual(report[0][2], 8193)
Skip Montanaro080c9972001-01-28 21:12:22 +0000326
Brett Cannon74bfd702003-04-25 09:39:47 +0000327class QuotingTests(unittest.TestCase):
328 """Tests for urllib.quote() and urllib.quote_plus()
Tim Petersc2659cf2003-05-12 20:19:37 +0000329
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000330 According to RFC 2396 (Uniform Resource Identifiers), to escape a
331 character you write it as '%' + <2 character US-ASCII hex value>.
332 The Python code of ``'%' + hex(ord(<character>))[2:]`` escapes a
333 character properly. Case does not matter on the hex letters.
Brett Cannon74bfd702003-04-25 09:39:47 +0000334
335 The various character sets specified are:
Tim Petersc2659cf2003-05-12 20:19:37 +0000336
Brett Cannon74bfd702003-04-25 09:39:47 +0000337 Reserved characters : ";/?:@&=+$,"
338 Have special meaning in URIs and must be escaped if not being used for
339 their special meaning
340 Data characters : letters, digits, and "-_.!~*'()"
341 Unreserved and do not need to be escaped; can be, though, if desired
342 Control characters : 0x00 - 0x1F, 0x7F
343 Have no use in URIs so must be escaped
344 space : 0x20
345 Must be escaped
346 Delimiters : '<>#%"'
347 Must be escaped
348 Unwise : "{}|\^[]`"
349 Must be escaped
Tim Petersc2659cf2003-05-12 20:19:37 +0000350
Brett Cannon74bfd702003-04-25 09:39:47 +0000351 """
352
353 def test_never_quote(self):
354 # Make sure quote() does not quote letters, digits, and "_,.-"
355 do_not_quote = '' .join(["ABCDEFGHIJKLMNOPQRSTUVWXYZ",
356 "abcdefghijklmnopqrstuvwxyz",
357 "0123456789",
358 "_.-"])
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000359 result = urllib.parse.quote(do_not_quote)
Brett Cannon74bfd702003-04-25 09:39:47 +0000360 self.assertEqual(do_not_quote, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000361 "using quote(): %r != %r" % (do_not_quote, result))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000362 result = urllib.parse.quote_plus(do_not_quote)
Brett Cannon74bfd702003-04-25 09:39:47 +0000363 self.assertEqual(do_not_quote, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000364 "using quote_plus(): %r != %r" % (do_not_quote, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000365
366 def test_default_safe(self):
367 # Test '/' is default value for 'safe' parameter
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000368 self.assertEqual(urllib.parse.quote.__defaults__[0], '/')
Brett Cannon74bfd702003-04-25 09:39:47 +0000369
370 def test_safe(self):
371 # Test setting 'safe' parameter does what it should do
372 quote_by_default = "<>"
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000373 result = urllib.parse.quote(quote_by_default, safe=quote_by_default)
Brett Cannon74bfd702003-04-25 09:39:47 +0000374 self.assertEqual(quote_by_default, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000375 "using quote(): %r != %r" % (quote_by_default, result))
Jeremy Hylton1ef7c6b2009-03-26 16:57:30 +0000376 result = urllib.parse.quote_plus(quote_by_default,
377 safe=quote_by_default)
Brett Cannon74bfd702003-04-25 09:39:47 +0000378 self.assertEqual(quote_by_default, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000379 "using quote_plus(): %r != %r" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000380 (quote_by_default, result))
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000381 # Safe expressed as bytes rather than str
382 result = urllib.parse.quote(quote_by_default, safe=b"<>")
383 self.assertEqual(quote_by_default, result,
384 "using quote(): %r != %r" % (quote_by_default, result))
385 # "Safe" non-ASCII characters should have no effect
386 # (Since URIs are not allowed to have non-ASCII characters)
387 result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="\xfc")
388 expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="")
389 self.assertEqual(expect, result,
390 "using quote(): %r != %r" %
391 (expect, result))
392 # Same as above, but using a bytes rather than str
393 result = urllib.parse.quote("a\xfcb", encoding="latin-1", safe=b"\xfc")
394 expect = urllib.parse.quote("a\xfcb", encoding="latin-1", safe="")
395 self.assertEqual(expect, result,
396 "using quote(): %r != %r" %
397 (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000398
399 def test_default_quoting(self):
400 # Make sure all characters that should be quoted are by default sans
401 # space (separate test for that).
402 should_quote = [chr(num) for num in range(32)] # For 0x00 - 0x1F
403 should_quote.append('<>#%"{}|\^[]`')
404 should_quote.append(chr(127)) # For 0x7F
405 should_quote = ''.join(should_quote)
406 for char in should_quote:
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000407 result = urllib.parse.quote(char)
Brett Cannon74bfd702003-04-25 09:39:47 +0000408 self.assertEqual(hexescape(char), result,
Jeremy Hylton1ef7c6b2009-03-26 16:57:30 +0000409 "using quote(): "
410 "%s should be escaped to %s, not %s" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000411 (char, hexescape(char), result))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000412 result = urllib.parse.quote_plus(char)
Brett Cannon74bfd702003-04-25 09:39:47 +0000413 self.assertEqual(hexescape(char), result,
414 "using quote_plus(): "
Tim Petersc2659cf2003-05-12 20:19:37 +0000415 "%s should be escapes to %s, not %s" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000416 (char, hexescape(char), result))
417 del should_quote
418 partial_quote = "ab[]cd"
419 expected = "ab%5B%5Dcd"
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000420 result = urllib.parse.quote(partial_quote)
Brett Cannon74bfd702003-04-25 09:39:47 +0000421 self.assertEqual(expected, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000422 "using quote(): %r != %r" % (expected, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000423 self.assertEqual(expected, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000424 "using quote_plus(): %r != %r" % (expected, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000425
426 def test_quoting_space(self):
427 # Make sure quote() and quote_plus() handle spaces as specified in
428 # their unique way
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000429 result = urllib.parse.quote(' ')
Brett Cannon74bfd702003-04-25 09:39:47 +0000430 self.assertEqual(result, hexescape(' '),
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000431 "using quote(): %r != %r" % (result, hexescape(' ')))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000432 result = urllib.parse.quote_plus(' ')
Brett Cannon74bfd702003-04-25 09:39:47 +0000433 self.assertEqual(result, '+',
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000434 "using quote_plus(): %r != +" % result)
Brett Cannon74bfd702003-04-25 09:39:47 +0000435 given = "a b cd e f"
436 expect = given.replace(' ', hexescape(' '))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000437 result = urllib.parse.quote(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000438 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000439 "using quote(): %r != %r" % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000440 expect = given.replace(' ', '+')
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000441 result = urllib.parse.quote_plus(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000442 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000443 "using quote_plus(): %r != %r" % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000444
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000445 def test_quoting_plus(self):
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000446 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma'),
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000447 'alpha%2Bbeta+gamma')
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000448 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', '+'),
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000449 'alpha+beta+gamma')
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000450 # Test with bytes
451 self.assertEqual(urllib.parse.quote_plus(b'alpha+beta gamma'),
452 'alpha%2Bbeta+gamma')
453 # Test with safe bytes
454 self.assertEqual(urllib.parse.quote_plus('alpha+beta gamma', b'+'),
455 'alpha+beta+gamma')
456
457 def test_quote_bytes(self):
458 # Bytes should quote directly to percent-encoded values
459 given = b"\xa2\xd8ab\xff"
460 expect = "%A2%D8ab%FF"
461 result = urllib.parse.quote(given)
462 self.assertEqual(expect, result,
463 "using quote(): %r != %r" % (expect, result))
464 # Encoding argument should raise type error on bytes input
465 self.assertRaises(TypeError, urllib.parse.quote, given,
466 encoding="latin-1")
467 # quote_from_bytes should work the same
468 result = urllib.parse.quote_from_bytes(given)
469 self.assertEqual(expect, result,
470 "using quote_from_bytes(): %r != %r"
471 % (expect, result))
472
473 def test_quote_with_unicode(self):
474 # Characters in Latin-1 range, encoded by default in UTF-8
475 given = "\xa2\xd8ab\xff"
476 expect = "%C2%A2%C3%98ab%C3%BF"
477 result = urllib.parse.quote(given)
478 self.assertEqual(expect, result,
479 "using quote(): %r != %r" % (expect, result))
480 # Characters in Latin-1 range, encoded by with None (default)
481 result = urllib.parse.quote(given, encoding=None, errors=None)
482 self.assertEqual(expect, result,
483 "using quote(): %r != %r" % (expect, result))
484 # Characters in Latin-1 range, encoded with Latin-1
485 given = "\xa2\xd8ab\xff"
486 expect = "%A2%D8ab%FF"
487 result = urllib.parse.quote(given, encoding="latin-1")
488 self.assertEqual(expect, result,
489 "using quote(): %r != %r" % (expect, result))
490 # Characters in BMP, encoded by default in UTF-8
491 given = "\u6f22\u5b57" # "Kanji"
492 expect = "%E6%BC%A2%E5%AD%97"
493 result = urllib.parse.quote(given)
494 self.assertEqual(expect, result,
495 "using quote(): %r != %r" % (expect, result))
496 # Characters in BMP, encoded with Latin-1
497 given = "\u6f22\u5b57"
498 self.assertRaises(UnicodeEncodeError, urllib.parse.quote, given,
499 encoding="latin-1")
500 # Characters in BMP, encoded with Latin-1, with replace error handling
501 given = "\u6f22\u5b57"
502 expect = "%3F%3F" # "??"
503 result = urllib.parse.quote(given, encoding="latin-1",
504 errors="replace")
505 self.assertEqual(expect, result,
506 "using quote(): %r != %r" % (expect, result))
507 # Characters in BMP, Latin-1, with xmlcharref error handling
508 given = "\u6f22\u5b57"
509 expect = "%26%2328450%3B%26%2323383%3B" # "&#28450;&#23383;"
510 result = urllib.parse.quote(given, encoding="latin-1",
511 errors="xmlcharrefreplace")
512 self.assertEqual(expect, result,
513 "using quote(): %r != %r" % (expect, result))
Raymond Hettinger2bdec7b2005-09-10 14:30:09 +0000514
Georg Brandlfaf41492009-05-26 18:31:11 +0000515 def test_quote_plus_with_unicode(self):
516 # Encoding (latin-1) test for quote_plus
517 given = "\xa2\xd8 \xff"
518 expect = "%A2%D8+%FF"
519 result = urllib.parse.quote_plus(given, encoding="latin-1")
520 self.assertEqual(expect, result,
521 "using quote_plus(): %r != %r" % (expect, result))
522 # Errors test for quote_plus
523 given = "ab\u6f22\u5b57 cd"
524 expect = "ab%3F%3F+cd"
525 result = urllib.parse.quote_plus(given, encoding="latin-1",
526 errors="replace")
527 self.assertEqual(expect, result,
528 "using quote_plus(): %r != %r" % (expect, result))
529
Senthil Kumarand496c4c2010-07-30 19:34:36 +0000530
Brett Cannon74bfd702003-04-25 09:39:47 +0000531class UnquotingTests(unittest.TestCase):
532 """Tests for unquote() and unquote_plus()
Tim Petersc2659cf2003-05-12 20:19:37 +0000533
Brett Cannon74bfd702003-04-25 09:39:47 +0000534 See the doc string for quoting_Tests for details on quoting and such.
535
536 """
537
538 def test_unquoting(self):
539 # Make sure unquoting of all ASCII values works
540 escape_list = []
541 for num in range(128):
542 given = hexescape(chr(num))
543 expect = chr(num)
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000544 result = urllib.parse.unquote(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000545 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000546 "using unquote(): %r != %r" % (expect, result))
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000547 result = urllib.parse.unquote_plus(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000548 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000549 "using unquote_plus(): %r != %r" %
Brett Cannon74bfd702003-04-25 09:39:47 +0000550 (expect, result))
551 escape_list.append(given)
552 escape_string = ''.join(escape_list)
553 del escape_list
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000554 result = urllib.parse.unquote(escape_string)
Brett Cannon74bfd702003-04-25 09:39:47 +0000555 self.assertEqual(result.count('%'), 1,
Brett Cannon74bfd702003-04-25 09:39:47 +0000556 "using unquote(): not all characters escaped: "
557 "%s" % result)
Georg Brandl604ef372010-07-31 08:20:02 +0000558 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, None)
559 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, ())
Florent Xiclunac049fca2010-07-31 08:56:55 +0000560 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote, b'')
Brett Cannon74bfd702003-04-25 09:39:47 +0000561
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000562 def test_unquoting_badpercent(self):
563 # Test unquoting on bad percent-escapes
564 given = '%xab'
565 expect = given
566 result = urllib.parse.unquote(given)
567 self.assertEqual(expect, result, "using unquote(): %r != %r"
568 % (expect, result))
569 given = '%x'
570 expect = given
571 result = urllib.parse.unquote(given)
572 self.assertEqual(expect, result, "using unquote(): %r != %r"
573 % (expect, result))
574 given = '%'
575 expect = given
576 result = urllib.parse.unquote(given)
577 self.assertEqual(expect, result, "using unquote(): %r != %r"
578 % (expect, result))
579 # unquote_to_bytes
580 given = '%xab'
581 expect = bytes(given, 'ascii')
582 result = urllib.parse.unquote_to_bytes(given)
583 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r"
584 % (expect, result))
585 given = '%x'
586 expect = bytes(given, 'ascii')
587 result = urllib.parse.unquote_to_bytes(given)
588 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r"
589 % (expect, result))
590 given = '%'
591 expect = bytes(given, 'ascii')
592 result = urllib.parse.unquote_to_bytes(given)
593 self.assertEqual(expect, result, "using unquote_to_bytes(): %r != %r"
594 % (expect, result))
Georg Brandl604ef372010-07-31 08:20:02 +0000595 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote_to_bytes, None)
596 self.assertRaises((TypeError, AttributeError), urllib.parse.unquote_to_bytes, ())
Senthil Kumaran79e17f62010-07-19 18:17:19 +0000597
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000598 def test_unquoting_mixed_case(self):
599 # Test unquoting on mixed-case hex digits in the percent-escapes
600 given = '%Ab%eA'
601 expect = b'\xab\xea'
602 result = urllib.parse.unquote_to_bytes(given)
603 self.assertEqual(expect, result,
604 "using unquote_to_bytes(): %r != %r"
605 % (expect, result))
606
def test_unquoting_parts(self):
    # Make sure unquoting works when non-quoted characters are interspersed
    # with a percent-escape: only the escape is decoded, the surrounding
    # text is left alone.
    given = 'ab%sd' % hexescape('c')
    expect = "abcd"
    result = urllib.parse.unquote(given)
    # The message names unquote(), the function actually under test here.
    self.assertEqual(expect, result,
                     "using unquote(): %r != %r" % (expect, result))
    result = urllib.parse.unquote_plus(given)
    self.assertEqual(expect, result,
                     "using unquote_plus(): %r != %r" % (expect, result))
Tim Petersc2659cf2003-05-12 20:19:37 +0000618
Brett Cannon74bfd702003-04-25 09:39:47 +0000619 def test_unquoting_plus(self):
620 # Test difference between unquote() and unquote_plus()
621 given = "are+there+spaces..."
622 expect = given
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000623 result = urllib.parse.unquote(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000624 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000625 "using unquote(): %r != %r" % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000626 expect = given.replace('+', ' ')
Jeremy Hylton1afc1692008-06-18 20:49:58 +0000627 result = urllib.parse.unquote_plus(given)
Brett Cannon74bfd702003-04-25 09:39:47 +0000628 self.assertEqual(expect, result,
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000629 "using unquote_plus(): %r != %r" % (expect, result))
630
631 def test_unquote_to_bytes(self):
632 given = 'br%C3%BCckner_sapporo_20050930.doc'
633 expect = b'br\xc3\xbcckner_sapporo_20050930.doc'
634 result = urllib.parse.unquote_to_bytes(given)
635 self.assertEqual(expect, result,
636 "using unquote_to_bytes(): %r != %r"
637 % (expect, result))
638 # Test on a string with unescaped non-ASCII characters
639 # (Technically an invalid URI; expect those characters to be UTF-8
640 # encoded).
641 result = urllib.parse.unquote_to_bytes("\u6f22%C3%BC")
642 expect = b'\xe6\xbc\xa2\xc3\xbc' # UTF-8 for "\u6f22\u00fc"
643 self.assertEqual(expect, result,
644 "using unquote_to_bytes(): %r != %r"
645 % (expect, result))
646 # Test with a bytes as input
647 given = b'%A2%D8ab%FF'
648 expect = b'\xa2\xd8ab\xff'
649 result = urllib.parse.unquote_to_bytes(given)
650 self.assertEqual(expect, result,
651 "using unquote_to_bytes(): %r != %r"
652 % (expect, result))
653 # Test with a bytes as input, with unescaped non-ASCII bytes
654 # (Technically an invalid URI; expect those bytes to be preserved)
655 given = b'%A2\xd8ab%FF'
656 expect = b'\xa2\xd8ab\xff'
657 result = urllib.parse.unquote_to_bytes(given)
658 self.assertEqual(expect, result,
659 "using unquote_to_bytes(): %r != %r"
660 % (expect, result))
Brett Cannon74bfd702003-04-25 09:39:47 +0000661
Raymond Hettinger4b0f20d2005-10-15 16:41:53 +0000662 def test_unquote_with_unicode(self):
Guido van Rossum52dbbb92008-08-18 21:44:30 +0000663 # Characters in the Latin-1 range, encoded with UTF-8
664 given = 'br%C3%BCckner_sapporo_20050930.doc'
665 expect = 'br\u00fcckner_sapporo_20050930.doc'
666 result = urllib.parse.unquote(given)
667 self.assertEqual(expect, result,
668 "using unquote(): %r != %r" % (expect, result))
669 # Characters in the Latin-1 range, encoded with None (default)
670 result = urllib.parse.unquote(given, encoding=None, errors=None)
671 self.assertEqual(expect, result,
672 "using unquote(): %r != %r" % (expect, result))
673
674 # Characters in the Latin-1 range, encoded with Latin-1
675 result = urllib.parse.unquote('br%FCckner_sapporo_20050930.doc',
676 encoding="latin-1")
677 expect = 'br\u00fcckner_sapporo_20050930.doc'
678 self.assertEqual(expect, result,
679 "using unquote(): %r != %r" % (expect, result))
680
681 # Characters in BMP, encoded with UTF-8
682 given = "%E6%BC%A2%E5%AD%97"
683 expect = "\u6f22\u5b57" # "Kanji"
684 result = urllib.parse.unquote(given)
685 self.assertEqual(expect, result,
686 "using unquote(): %r != %r" % (expect, result))
687
688 # Decode with UTF-8, invalid sequence
689 given = "%F3%B1"
690 expect = "\ufffd" # Replacement character
691 result = urllib.parse.unquote(given)
692 self.assertEqual(expect, result,
693 "using unquote(): %r != %r" % (expect, result))
694
695 # Decode with UTF-8, invalid sequence, replace errors
696 result = urllib.parse.unquote(given, errors="replace")
697 self.assertEqual(expect, result,
698 "using unquote(): %r != %r" % (expect, result))
699
700 # Decode with UTF-8, invalid sequence, ignoring errors
701 given = "%F3%B1"
702 expect = ""
703 result = urllib.parse.unquote(given, errors="ignore")
704 self.assertEqual(expect, result,
705 "using unquote(): %r != %r" % (expect, result))
706
707 # A mix of non-ASCII and percent-encoded characters, UTF-8
708 result = urllib.parse.unquote("\u6f22%C3%BC")
709 expect = '\u6f22\u00fc'
710 self.assertEqual(expect, result,
711 "using unquote(): %r != %r" % (expect, result))
712
713 # A mix of non-ASCII and percent-encoded characters, Latin-1
714 # (Note, the string contains non-Latin-1-representable characters)
715 result = urllib.parse.unquote("\u6f22%FC", encoding="latin-1")
716 expect = '\u6f22\u00fc'
717 self.assertEqual(expect, result,
718 "using unquote(): %r != %r" % (expect, result))
Raymond Hettinger4b0f20d2005-10-15 16:41:53 +0000719
class urlencode_Tests(unittest.TestCase):
    """Tests for urlencode()"""

    def help_inputtype(self, given, test_type):
        """Helper method for testing different input types.

        'given' must lead to only the pairs:
            * 1st, 1
            * 2nd, 2
            * 3rd, 3

        'test_type' is a short description of the input kind; it is only
        used to label failure messages.

        Test cannot assume anything about order.  Docs make no guarantee and
        have possible dictionary input.

        """
        expect_somewhere = ["1st=1", "2nd=2", "3rd=3"]
        result = urllib.parse.urlencode(given)
        for expected in expect_somewhere:
            self.assertIn(expected, result,
                          "testing %s: %s not found in %s" %
                          (test_type, expected, result))
        self.assertEqual(result.count('&'), 2,
                         "testing %s: expected 2 '&'s; got %s" %
                         (test_type, result.count('&')))
        # The first '&' must sit between a value digit and a key digit
        # (e.g. "...=1&2nd=...").
        amp_location = result.index('&')
        on_amp_left = result[amp_location - 1]
        on_amp_right = result[amp_location + 1]
        self.assertTrue(on_amp_left.isdigit() and on_amp_right.isdigit(),
                        "testing %s: '&' not located in proper place in %s" %
                        (test_type, result))
        self.assertEqual(len(result), (5 * 3) + 2,  # 5 chars per thing and amps
                         "testing %s: "
                         "unexpected number of characters: %s != %s" %
                         (test_type, len(result), (5 * 3) + 2))

    def test_using_mapping(self):
        # Test passing in a mapping object as an argument.
        self.help_inputtype({"1st": '1', "2nd": '2', "3rd": '3'},
                            "using dict as input type")

    def test_using_sequence(self):
        # Test passing in a sequence of two-item sequences as an argument.
        self.help_inputtype([('1st', '1'), ('2nd', '2'), ('3rd', '3')],
                            "using sequence of two-item tuples as input")

    def test_quoting(self):
        # Make sure keys and values are quoted using quote_plus()
        given = {"&": "="}
        expect = "%s=%s" % (hexescape('&'), hexescape('='))
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)
        given = {"key name": "A bunch of pluses"}
        expect = "key+name=A+bunch+of+pluses"
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)

    def test_doseq(self):
        # Test that passing True for 'doseq' parameter works correctly
        given = {'sequence': ['1', '2', '3']}
        # Without doseq the list is stringified and quoted as a single value.
        expect = "sequence=%s" % urllib.parse.quote_plus(str(['1', '2', '3']))
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)
        # With doseq each element becomes its own key=value pair.
        result = urllib.parse.urlencode(given, True)
        for value in given["sequence"]:
            expect = "sequence=%s" % value
            self.assertIn(expect, result)
        self.assertEqual(result.count('&'), 2,
                         "Expected 2 '&'s, got %s" % result.count('&'))

    def test_empty_sequence(self):
        # Empty mappings and sequences both encode to the empty string.
        self.assertEqual("", urllib.parse.urlencode({}))
        self.assertEqual("", urllib.parse.urlencode([]))

    def test_nonstring_values(self):
        # Non-string values are encoded via their str() form.
        self.assertEqual("a=1", urllib.parse.urlencode({"a": 1}))
        self.assertEqual("a=None", urllib.parse.urlencode({"a": None}))

    def test_nonstring_seq_values(self):
        # With doseq, each element of an iterable value is encoded in turn.
        self.assertEqual("a=1&a=2", urllib.parse.urlencode({"a": [1, 2]}, True))
        self.assertEqual("a=None&a=a",
                         urllib.parse.urlencode({"a": [None, "a"]}, True))
        self.assertEqual("a=a&a=b",
                         urllib.parse.urlencode({"a": {"a": 1, "b": 1}}, True))

    def test_urlencode_encoding(self):
        # ASCII encoding. Expect %3F with errors="replace"
        given = (('\u00a0', '\u00c1'),)
        expect = '%3F=%3F'
        result = urllib.parse.urlencode(given, encoding="ASCII", errors="replace")
        self.assertEqual(expect, result)

        # Default is UTF-8 encoding.
        given = (('\u00a0', '\u00c1'),)
        expect = '%C2%A0=%C3%81'
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)

        # Latin-1 encoding.
        given = (('\u00a0', '\u00c1'),)
        expect = '%A0=%C1'
        result = urllib.parse.urlencode(given, encoding="latin-1")
        self.assertEqual(expect, result)

    def test_urlencode_encoding_doseq(self):
        # ASCII Encoding. Expect %3F with errors="replace"
        given = (('\u00a0', '\u00c1'),)
        expect = '%3F=%3F'
        result = urllib.parse.urlencode(given, doseq=True,
                                        encoding="ASCII", errors="replace")
        self.assertEqual(expect, result)

        # ASCII Encoding. On a sequence of values.
        given = (("\u00a0", (1, "\u00c1")),)
        expect = '%3F=1&%3F=%3F'
        result = urllib.parse.urlencode(given, True,
                                        encoding="ASCII", errors="replace")
        self.assertEqual(expect, result)

        # Utf-8
        given = (("\u00a0", "\u00c1"),)
        expect = '%C2%A0=%C3%81'
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

        given = (("\u00a0", (42, "\u00c1")),)
        expect = '%C2%A0=42&%C2%A0=%C3%81'
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

        # latin-1
        given = (("\u00a0", "\u00c1"),)
        expect = '%A0=%C1'
        result = urllib.parse.urlencode(given, True, encoding="latin-1")
        self.assertEqual(expect, result)

        given = (("\u00a0", (42, "\u00c1")),)
        expect = '%A0=42&%A0=%C1'
        result = urllib.parse.urlencode(given, True, encoding="latin-1")
        self.assertEqual(expect, result)

    def test_urlencode_bytes(self):
        # bytes keys and values are percent-encoded byte by byte.
        given = ((b'\xa0\x24', b'\xc1\x24'),)
        expect = '%A0%24=%C1%24'
        result = urllib.parse.urlencode(given)
        self.assertEqual(expect, result)
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

        # Sequence of values
        given = ((b'\xa0\x24', (42, b'\xc1\x24')),)
        expect = '%A0%24=42&%A0%24=%C1%24'
        result = urllib.parse.urlencode(given, True)
        self.assertEqual(expect, result)

    def test_urlencode_encoding_safe_parameter(self):

        # Send '$' (\x24) as safe character
        # Default utf-8 encoding

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        result = urllib.parse.urlencode(given, safe=":$")
        expect = '%A0$=%C1$'
        self.assertEqual(expect, result)

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        result = urllib.parse.urlencode(given, doseq=True, safe=":$")
        expect = '%A0$=%C1$'
        self.assertEqual(expect, result)

        # Safe parameter in sequence
        given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),)
        expect = '%A0$=%C1$&%A0$=13&%A0$=42'
        result = urllib.parse.urlencode(given, True, safe=":$")
        self.assertEqual(expect, result)

        # Test all above in latin-1 encoding

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        result = urllib.parse.urlencode(given, safe=":$",
                                        encoding="latin-1")
        expect = '%A0$=%C1$'
        self.assertEqual(expect, result)

        given = ((b'\xa0\x24', b'\xc1\x24'),)
        expect = '%A0$=%C1$'
        result = urllib.parse.urlencode(given, doseq=True, safe=":$",
                                        encoding="latin-1")
        # This case previously computed the result without checking it.
        self.assertEqual(expect, result)

        given = ((b'\xa0\x24', (b'\xc1\x24', 0xd, 42)),)
        expect = '%A0$=%C1$&%A0$=13&%A0$=42'
        result = urllib.parse.urlencode(given, True, safe=":$",
                                        encoding="latin-1")
        self.assertEqual(expect, result)
913
class Pathname_Tests(unittest.TestCase):
    """Test pathname2url() and url2pathname()"""

    def test_basic(self):
        # Make sure simple tests pass: a relative path built with the
        # platform separator maps to a '/'-separated URL path and back.
        expected_path = os.path.join("parts", "of", "a", "path")
        expected_url = "parts/of/a/path"
        result = urllib.request.pathname2url(expected_path)
        self.assertEqual(expected_url, result,
                         "pathname2url() failed; %s != %s" %
                         (result, expected_url))
        result = urllib.request.url2pathname(expected_url)
        self.assertEqual(expected_path, result,
                         "url2pathname() failed; %s != %s" %
                         (result, expected_path))

    def test_quoting(self):
        # Test automatic quoting and unquoting works for pathname2url() and
        # url2pathname() respectively
        given = os.path.join("needs", "quot=ing", "here")
        expect = "needs/%s/here" % urllib.parse.quote("quot=ing")
        result = urllib.request.pathname2url(given)
        self.assertEqual(expect, result,
                         "pathname2url() failed; %s != %s" %
                         (expect, result))
        # Round trip: the quoted URL must convert back to the original path.
        expect = given
        result = urllib.request.url2pathname(result)
        self.assertEqual(expect, result,
                         "url2pathname() failed; %s != %s" %
                         (expect, result))
        given = os.path.join("make sure", "using_quote")
        expect = "%s/using_quote" % urllib.parse.quote("make sure")
        result = urllib.request.pathname2url(given)
        self.assertEqual(expect, result,
                         "pathname2url() failed; %s != %s" %
                         (expect, result))
        # A '+' in the URL is expected to be kept as a literal '+' in the
        # resulting path.
        given = "make+sure/using_unquote"
        expect = os.path.join("make+sure", "using_unquote")
        result = urllib.request.url2pathname(given)
        self.assertEqual(expect, result,
                         "url2pathname() failed; %s != %s" %
                         (expect, result))
Tim Petersc2659cf2003-05-12 20:19:37 +0000956
class Utility_Tests(unittest.TestCase):
    """Test case for the assorted utility functions of urllib."""

    def test_splitpasswd(self):
        """Check splitpasswd() with passwords containing unusual characters.

        Some of these passwords are not sensible, but they are included to
        conform to RFC2617 and to address issue4675.
        """
        passwords = ('ab', 'a\nb', 'a\tb', 'a\rb', 'a\fb', 'a\vb', 'a:b')
        for password in passwords:
            # Everything after the first ':' must be returned as the password.
            self.assertEqual(('user', password),
                             urllib.parse.splitpasswd('user:' + password))
971
Senthil Kumaran690ce9b2009-05-05 18:41:13 +0000972
class URLopener_Tests(unittest.TestCase):
    """Test case for the open() method of the URLopener class."""

    def test_quoted_open(self):
        class EchoOpener(urllib.request.URLopener):
            # Handler for the made-up 'spam' scheme: hand back whatever URL
            # remainder open() passes in, so the quoting can be inspected.
            def open_spam(self, url):
                return url

        expectations = (
            # A space in the URL must arrive percent-quoted.
            ('spam://example/ /', '//example/%20/'),
            # test the safe characters are not quoted by urlopen
            ("spam://c:|windows%/:=&?~#+!$,;'@()*[]|/path/",
             "//c:|windows%/:=&?~#+!$,;'@()*[]|/path/"),
        )
        for requested, delivered in expectations:
            # A fresh opener is used for every URL.
            self.assertEqual(EchoOpener().open(requested), delivered)
988
# Just commented them out.
# Can't really tell why they keep failing on Windows and SPARC.
# Everywhere else they work OK, but on those machines they sometimes
# fail in one of the tests, sometimes in another.  I have a Linux box,
# and the tests pass there.
# If anybody has one of the problematic environments, please help!
# . Facundo
996#
997# def server(evt):
Georg Brandlf78e02b2008-06-10 17:40:04 +0000998# import socket, time
Guido van Rossume7ba4952007-06-06 23:52:48 +0000999# serv = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
1000# serv.settimeout(3)
1001# serv.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
1002# serv.bind(("", 9093))
1003# serv.listen(5)
1004# try:
1005# conn, addr = serv.accept()
1006# conn.send("1 Hola mundo\n")
1007# cantdata = 0
1008# while cantdata < 13:
1009# data = conn.recv(13-cantdata)
1010# cantdata += len(data)
1011# time.sleep(.3)
1012# conn.send("2 No more lines\n")
1013# conn.close()
1014# except socket.timeout:
1015# pass
1016# finally:
1017# serv.close()
1018# evt.set()
1019#
1020# class FTPWrapperTests(unittest.TestCase):
1021#
1022# def setUp(self):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001023# import ftplib, time, threading
Guido van Rossume7ba4952007-06-06 23:52:48 +00001024# ftplib.FTP.port = 9093
1025# self.evt = threading.Event()
1026# threading.Thread(target=server, args=(self.evt,)).start()
1027# time.sleep(.1)
1028#
1029# def tearDown(self):
1030# self.evt.wait()
1031#
1032# def testBasic(self):
1033# # connects
1034# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
Georg Brandlf78e02b2008-06-10 17:40:04 +00001035# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001036#
1037# def testTimeoutNone(self):
Georg Brandlf78e02b2008-06-10 17:40:04 +00001038# # global default timeout is ignored
1039# import socket
Benjamin Petersonc9c0f202009-06-30 23:06:06 +00001040# self.assertTrue(socket.getdefaulttimeout() is None)
Guido van Rossume7ba4952007-06-06 23:52:48 +00001041# socket.setdefaulttimeout(30)
1042# try:
1043# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1044# finally:
Georg Brandlf78e02b2008-06-10 17:40:04 +00001045# socket.setdefaulttimeout(None)
Guido van Rossume7ba4952007-06-06 23:52:48 +00001046# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
Georg Brandlf78e02b2008-06-10 17:40:04 +00001047# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001048#
Georg Brandlf78e02b2008-06-10 17:40:04 +00001049# def testTimeoutDefault(self):
1050# # global default timeout is used
1051# import socket
Benjamin Petersonc9c0f202009-06-30 23:06:06 +00001052# self.assertTrue(socket.getdefaulttimeout() is None)
Georg Brandlf78e02b2008-06-10 17:40:04 +00001053# socket.setdefaulttimeout(30)
1054# try:
1055# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1056# finally:
1057# socket.setdefaulttimeout(None)
1058# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1059# ftp.close()
1060#
1061# def testTimeoutValue(self):
1062# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [],
1063# timeout=30)
1064# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1065# ftp.close()
Guido van Rossume7ba4952007-06-06 23:52:48 +00001066
Skip Montanaro080c9972001-01-28 21:12:22 +00001067
1068
def test_main():
    """Run the enabled test case classes of this module via test.support."""
    enabled_cases = (
        urlopen_FileTests,
        urlopen_HttpTests,
        urlretrieve_FileTests,
        ProxyTests,
        QuotingTests,
        UnquotingTests,
        urlencode_Tests,
        Pathname_Tests,
        Utility_Tests,
        URLopener_Tests,
        # FTPWrapperTests stays disabled; its code is commented out above.
    )
    support.run_unittest(*enabled_cases)
Brett Cannon74bfd702003-04-25 09:39:47 +00001083
1084
1085
# Run the whole suite when this file is executed directly as a script.
if __name__ == '__main__':
    test_main()