"""Regression tests for urllib"""
Brett Cannon74bfd702003-04-25 09:39:47 +00002
Senthil Kumaranb31c87b2016-04-25 09:17:54 -07003import collections
Jeremy Hylton6102e292000-08-31 15:48:10 +00004import urllib
Hye-Shik Chang39aef792004-06-05 13:30:56 +00005import httplib
Serhiy Storchakaa898abd2014-09-06 21:41:39 +03006import io
Brett Cannon74bfd702003-04-25 09:39:47 +00007import unittest
Brett Cannon74bfd702003-04-25 09:39:47 +00008import os
Senthil Kumarana99b7612011-04-14 12:54:35 +08009import sys
Brett Cannon74bfd702003-04-25 09:39:47 +000010import mimetools
Georg Brandl5a650a22005-08-26 08:51:34 +000011import tempfile
Jeremy Hylton6102e292000-08-31 15:48:10 +000012
Senthil Kumaranbcd833f2012-01-11 00:09:24 +080013from test import test_support
14from base64 import b64encode
15
16
def hexescape(char):
    """Return *char* percent-escaped the way RFC 2396 specifies.

    The result is '%' followed by the upper-case hexadecimal value of
    ord(char), zero-padded to at least two digits.
    """
    return "%%%02X" % ord(char)
Jeremy Hylton6102e292000-08-31 15:48:10 +000023
Senthil Kumaran87e58552011-11-01 02:44:45 +080024
def fakehttp(fakedata):
    """Return an HTTPConnection subclass that serves *fakedata* from memory.

    connect() on the returned class installs an in-memory socket holding
    *fakedata* instead of opening a network connection.  The socket is also
    published on the class as ``fakesock``, and whatever is passed to its
    sendall() is stored in the class attribute ``buf`` so that tests can
    inspect the request that was sent.
    """
    class FakeSocket(io.BytesIO):
        """BytesIO posing as a socket; reads on a closed socket give b""."""

        def sendall(self, data):
            # Remember the outgoing request for later verification.
            FakeHTTPConnection.buf = data

        def makefile(self, *args, **kwds):
            # The socket doubles as its own file object.
            return self

        def read(self, amt=None):
            if not self.closed:
                return io.BytesIO.read(self, amt)
            return b""

        def readline(self, length=None):
            if not self.closed:
                return io.BytesIO.readline(self, length)
            return b""

    class FakeHTTPConnection(httplib.HTTPConnection):

        # buffer to store data for verification in urlopen tests.
        buf = ""

        def connect(self):
            fake_socket = FakeSocket(self.fakedata)
            self.sock = fake_socket
            self.__class__.fakesock = fake_socket

    # Bound after the class statement: a class body cannot read the
    # enclosing function's ``fakedata`` while also assigning that name.
    FakeHTTPConnection.fakedata = fakedata

    return FakeHTTPConnection
55
56
class FakeHTTPMixin(object):
    """Mixin that swaps httplib.HTTP's connection class for a fake one."""

    def fakehttp(self, fakedata):
        """Make httplib.HTTP use a fake connection class serving *fakedata*.

        The real connection class must currently be installed; pair every
        call with unfakehttp().
        """
        real_class = httplib.HTTPConnection
        assert httplib.HTTP._connection_class == real_class

        # The bare name resolves to the module-level fakehttp() factory,
        # not to this method.
        httplib.HTTP._connection_class = fakehttp(fakedata)

    def unfakehttp(self):
        """Put the real HTTPConnection class back."""
        httplib.HTTP._connection_class = httplib.HTTPConnection
65
66
class urlopen_FileTests(unittest.TestCase):
    """Test urlopen() opening a temporary file.

    Try to test as much functionality as possible so as to cut down on reliance
    on connecting to the Net for testing.

    """

    def setUp(self):
        """Create a temporary file and open it through urlopen()."""
        self.text = "test_urllib: %s\n" % self.__class__.__name__
        with open(test_support.TESTFN, 'wb') as temp_file:
            temp_file.write(self.text)
        # Register the removal before calling urlopen(): cleanups run even
        # when setUp() fails, whereas tearDown() does not.
        self.addCleanup(os.remove, test_support.TESTFN)
        self.pathname = test_support.TESTFN
        self.returned_obj = urllib.urlopen("file:%s" % self.pathname)

    def tearDown(self):
        """Shut down the open object"""
        # Runs before the cleanup registered in setUp(), so the object is
        # closed by the time the file is removed.
        self.returned_obj.close()

    def test_interface(self):
        # Make sure object returned by urlopen() has the specified methods
        for attr in ("read", "readline", "readlines", "fileno",
                     "close", "info", "geturl", "getcode", "__iter__"):
            self.assertTrue(hasattr(self.returned_obj, attr),
                            "object returned by urlopen() lacks %s attribute" %
                            attr)

    def test_read(self):
        self.assertEqual(self.text, self.returned_obj.read())

    def test_readline(self):
        self.assertEqual(self.text, self.returned_obj.readline())
        self.assertEqual('', self.returned_obj.readline(),
                         "calling readline() after exhausting the file did not"
                         " return an empty string")

    def test_readlines(self):
        lines_list = self.returned_obj.readlines()
        self.assertEqual(len(lines_list), 1,
                         "readlines() returned the wrong number of lines")
        self.assertEqual(lines_list[0], self.text,
                         "readlines() returned improper text")

    def test_fileno(self):
        file_num = self.returned_obj.fileno()
        self.assertIsInstance(file_num, int, "fileno() did not return an int")
        self.assertEqual(os.read(file_num, len(self.text)), self.text,
                         "Reading on the file descriptor returned by fileno() "
                         "did not return the expected text")

    def test_close(self):
        # Test close() by calling it here and then having it be called again
        # by the tearDown() method for the test
        self.returned_obj.close()

    def test_info(self):
        self.assertIsInstance(self.returned_obj.info(), mimetools.Message)

    def test_geturl(self):
        self.assertEqual(self.returned_obj.geturl(), self.pathname)

    def test_getcode(self):
        self.assertIsNone(self.returned_obj.getcode())

    def test_iter(self):
        # Test iterator
        # Don't need to count number of iterations since test would fail the
        # instant it returned anything beyond the first line from the
        # comparison
        for line in self.returned_obj.__iter__():
            self.assertEqual(line, self.text)

    def test_relativelocalfile(self):
        self.assertRaises(ValueError, urllib.urlopen, './' + self.pathname)
146
class ProxyTests(unittest.TestCase):
    """Tests for the proxy helpers that read the process environment."""

    def setUp(self):
        # Records changes to env vars
        self.env = test_support.EnvironmentVarGuard()
        # Delete all proxy related env vars
        proxy_names = [name for name in os.environ.keys()
                       if 'proxy' in name.lower()]
        for name in proxy_names:
            self.env.unset(name)

    def tearDown(self):
        # Restore all proxy related env vars
        self.env.__exit__()
        del self.env

    def test_getproxies_environment_keep_no_proxies(self):
        self.env.set('NO_PROXY', 'localhost')
        proxies = urllib.getproxies_environment()
        # getproxies_environment use lowered case truncated (no '_proxy') keys
        self.assertEqual('localhost', proxies['no'])
        # List of no_proxies with space.
        self.env.set('NO_PROXY',
                     'localhost, anotherdomain.com, newdomain.com:1234')
        for host in ('anotherdomain.com',
                     'anotherdomain.com:8888',
                     'newdomain.com:1234'):
            self.assertTrue(urllib.proxy_bypass_environment(host))

    def test_proxy_cgi_ignore(self):
        try:
            self.env.set('HTTP_PROXY', 'http://somewhere:3128')
            proxies = urllib.getproxies_environment()
            self.assertEqual('http://somewhere:3128', proxies['http'])
            # With REQUEST_METHOD set the upper-case HTTP_PROXY entry must
            # no longer show up in the result.
            self.env.set('REQUEST_METHOD', 'GET')
            proxies = urllib.getproxies_environment()
            self.assertNotIn('http', proxies)
        finally:
            self.env.unset('REQUEST_METHOD')
            self.env.unset('HTTP_PROXY')

    def test_proxy_bypass_environment_host_match(self):
        bypass = urllib.proxy_bypass_environment
        self.env.set('NO_PROXY',
                     'localhost, anotherdomain.com, newdomain.com:1234, .d.o.t')
        bypassed_hosts = (
            'localhost',
            'LocalHost',                # MixedCase
            'LOCALHOST',                # UPPERCASE
            'newdomain.com:1234',
            'foo.d.o.t',                # issue 29142
            'anotherdomain.com:8888',
            'www.newdomain.com:1234',
        )
        proxied_hosts = (
            'prelocalhost',
            'newdomain.com',            # no port
            'newdomain.com:1235',       # wrong port
        )
        for host in bypassed_hosts:
            self.assertTrue(bypass(host))
        for host in proxied_hosts:
            self.assertFalse(bypass(host))
Senthil Kumaranb31c87b2016-04-25 09:17:54 -0700199
class ProxyTests_withOrderedEnv(unittest.TestCase):
    """Proxy tests run against an ordered stand-in for os.environ."""

    def setUp(self):
        # We need to test conditions, where variable order _is_ significant
        self._saved_env = os.environ
        # Monkey patch os.environ, start with empty fake environment
        os.environ = collections.OrderedDict()

    def tearDown(self):
        os.environ = self._saved_env

    def test_getproxies_environment_prefer_lowercase(self):
        bypass = urllib.proxy_bypass_environment
        fake_env = os.environ   # the OrderedDict installed by setUp()

        # Test lowercase preference with removal
        fake_env['no_proxy'] = ''
        fake_env['No_Proxy'] = 'localhost'
        for host in ('localhost', 'arbitrary'):
            self.assertFalse(bypass(host))
        fake_env['http_proxy'] = ''
        fake_env['HTTP_PROXY'] = 'http://somewhere:3128'
        self.assertEqual({}, urllib.getproxies_environment())

        # Test lowercase preference of proxy bypass and correct matching
        # including ports
        fake_env['no_proxy'] = 'localhost, noproxy.com, my.proxy:1234'
        fake_env['No_Proxy'] = 'xyz.com'
        for host in ('localhost', 'noproxy.com:5678', 'my.proxy:1234'):
            self.assertTrue(bypass(host))
        for host in ('my.proxy', 'arbitrary'):
            self.assertFalse(bypass(host))

        # Test lowercase preference with replacement
        fake_env['http_proxy'] = 'http://somewhere:3128'
        fake_env['Http_Proxy'] = 'http://somewhereelse:3128'
        found = urllib.getproxies_environment()
        self.assertEqual('http://somewhere:3128', found['http'])
Benjamin Peterson2c7470d2008-09-21 21:27:51 +0000234
235
class urlopen_HttpTests(unittest.TestCase, FakeHTTPMixin):
    """Test urlopen() opening a fake http connection."""

    def test_read(self):
        self.fakehttp('Hello!')
        try:
            fp = urllib.urlopen("http://python.org/")
            self.assertEqual(fp.readline(), 'Hello!')
            self.assertEqual(fp.readline(), '')
            self.assertEqual(fp.geturl(), 'http://python.org/')
            self.assertEqual(fp.getcode(), 200)
        finally:
            self.unfakehttp()

    def test_url_fragment(self):
        # Issue #11703: geturl() omits fragments in the original URL.
        url = 'http://docs.python.org/library/urllib.html#OK'
        self.fakehttp('Hello!')
        try:
            fp = urllib.urlopen(url)
            self.assertEqual(fp.geturl(), url)
        finally:
            self.unfakehttp()

    def test_read_bogus(self):
        # urlopen() should raise IOError for many error codes.
        self.fakehttp('''HTTP/1.1 401 Authentication Required
Date: Wed, 02 Jan 2008 03:03:54 GMT
Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e
Connection: close
Content-Type: text/html; charset=iso-8859-1
''')
        try:
            self.assertRaises(IOError, urllib.urlopen, "http://python.org/")
        finally:
            self.unfakehttp()

    def test_invalid_redirect(self):
        # urlopen() should raise IOError when a response redirects to a
        # file: URL.
        self.fakehttp("""HTTP/1.1 302 Found
Date: Wed, 02 Jan 2008 03:03:54 GMT
Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e
Location: file:README
Connection: close
Content-Type: text/html; charset=iso-8859-1
""")
        try:
            msg = "Redirection to url 'file:"
            with self.assertRaisesRegexp(IOError, msg):
                urllib.urlopen("http://python.org/")
        finally:
            self.unfakehttp()

    def test_redirect_limit_independent(self):
        # Ticket #12923: make sure independent requests each use their
        # own retry limit.
        for i in range(urllib.FancyURLopener().maxtries):
            self.fakehttp(b'''HTTP/1.1 302 Found
Location: file://guidocomputer.athome.com:/python/license
Connection: close
''')
            try:
                self.assertRaises(IOError, urllib.urlopen,
                                  "http://something")
            finally:
                self.unfakehttp()

    def test_empty_socket(self):
        # urlopen() raises IOError if the underlying socket does not send any
        # data. (#1680230)
        self.fakehttp('')
        try:
            self.assertRaises(IOError, urllib.urlopen, 'http://something')
        finally:
            self.unfakehttp()

    def test_missing_localfile(self):
        self.assertRaises(IOError, urllib.urlopen,
                          'file://localhost/a/missing/file.py')
        fd, tmp_file = tempfile.mkstemp()
        tmp_fileurl = 'file://localhost/' + tmp_file.replace(os.path.sep, '/')
        try:
            # Asserted inside the try block so that a failure here still
            # closes the descriptor and removes the file.
            self.assertTrue(os.path.exists(tmp_file))
            fp = urllib.urlopen(tmp_fileurl)
            fp.close()
        finally:
            os.close(fd)
            os.unlink(tmp_file)

        # Once the file is gone the very same URL must fail.
        self.assertFalse(os.path.exists(tmp_file))
        self.assertRaises(IOError, urllib.urlopen, tmp_fileurl)

    def test_ftp_nonexisting(self):
        self.assertRaises(IOError, urllib.urlopen,
                          'ftp://localhost/not/existing/file.py')

    def test_userpass_inurl(self):
        self.fakehttp('Hello!')
        try:
            fakehttp_wrapper = httplib.HTTP._connection_class
            fp = urllib.urlopen("http://user:pass@python.org/")
            authorization = ("Authorization: Basic %s\r\n" %
                             b64encode('user:pass'))
            # The authorization header must be in place
            self.assertIn(authorization, fakehttp_wrapper.buf)
            self.assertEqual(fp.readline(), "Hello!")
            self.assertEqual(fp.readline(), "")
            self.assertEqual(fp.geturl(), 'http://user:pass@python.org/')
            self.assertEqual(fp.getcode(), 200)
        finally:
            self.unfakehttp()

    def test_userpass_with_spaces_inurl(self):
        self.fakehttp('Hello!')
        try:
            url = "http://a b:c d@python.org/"
            fakehttp_wrapper = httplib.HTTP._connection_class
            authorization = ("Authorization: Basic %s\r\n" %
                             b64encode('a b:c d'))
            fp = urllib.urlopen(url)
            # The authorization header must be in place
            self.assertIn(authorization, fakehttp_wrapper.buf)
            self.assertEqual(fp.readline(), "Hello!")
            self.assertEqual(fp.readline(), "")
            # the spaces are quoted in URL so no match
            self.assertNotEqual(fp.geturl(), url)
            self.assertEqual(fp.getcode(), 200)
        finally:
            self.unfakehttp()
366
367
Brett Cannon19691362003-04-29 05:08:06 +0000368class urlretrieve_FileTests(unittest.TestCase):
Brett Cannon74bfd702003-04-25 09:39:47 +0000369 """Test urllib.urlretrieve() on local files"""
Skip Montanaro080c9972001-01-28 21:12:22 +0000370
Brett Cannon19691362003-04-29 05:08:06 +0000371 def setUp(self):
Georg Brandl5a650a22005-08-26 08:51:34 +0000372 # Create a list of temporary files. Each item in the list is a file
373 # name (absolute path or relative to the current working directory).
374 # All files in this list will be deleted in the tearDown method. Note,
375 # this only helps to makes sure temporary files get deleted, but it
376 # does nothing about trying to close files that may still be open. It
377 # is the responsibility of the developer to properly close files even
378 # when exceptional conditions occur.
379 self.tempFiles = []
380
Brett Cannon19691362003-04-29 05:08:06 +0000381 # Create a temporary file.
Georg Brandl5a650a22005-08-26 08:51:34 +0000382 self.registerFileForCleanUp(test_support.TESTFN)
Brett Cannon19691362003-04-29 05:08:06 +0000383 self.text = 'testing urllib.urlretrieve'
Georg Brandl5a650a22005-08-26 08:51:34 +0000384 try:
385 FILE = file(test_support.TESTFN, 'wb')
386 FILE.write(self.text)
387 FILE.close()
388 finally:
389 try: FILE.close()
390 except: pass
Brett Cannon19691362003-04-29 05:08:06 +0000391
392 def tearDown(self):
Georg Brandl5a650a22005-08-26 08:51:34 +0000393 # Delete the temporary files.
394 for each in self.tempFiles:
395 try: os.remove(each)
396 except: pass
397
398 def constructLocalFileUrl(self, filePath):
399 return "file://%s" % urllib.pathname2url(os.path.abspath(filePath))
400
401 def createNewTempFile(self, data=""):
402 """Creates a new temporary file containing the specified data,
403 registers the file for deletion during the test fixture tear down, and
404 returns the absolute path of the file."""
405
406 newFd, newFilePath = tempfile.mkstemp()
407 try:
408 self.registerFileForCleanUp(newFilePath)
409 newFile = os.fdopen(newFd, "wb")
410 newFile.write(data)
411 newFile.close()
412 finally:
413 try: newFile.close()
414 except: pass
415 return newFilePath
416
417 def registerFileForCleanUp(self, fileName):
418 self.tempFiles.append(fileName)
Brett Cannon19691362003-04-29 05:08:06 +0000419
420 def test_basic(self):
421 # Make sure that a local file just gets its own location returned and
422 # a headers value is returned.
423 result = urllib.urlretrieve("file:%s" % test_support.TESTFN)
424 self.assertEqual(result[0], test_support.TESTFN)
Ezio Melottib0f5adc2010-01-24 16:58:36 +0000425 self.assertIsInstance(result[1], mimetools.Message,
426 "did not get a mimetools.Message instance as "
427 "second returned value")
Brett Cannon19691362003-04-29 05:08:06 +0000428
429 def test_copy(self):
430 # Test that setting the filename argument works.
431 second_temp = "%s.2" % test_support.TESTFN
Georg Brandl5a650a22005-08-26 08:51:34 +0000432 self.registerFileForCleanUp(second_temp)
433 result = urllib.urlretrieve(self.constructLocalFileUrl(
434 test_support.TESTFN), second_temp)
Brett Cannon19691362003-04-29 05:08:06 +0000435 self.assertEqual(second_temp, result[0])
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000436 self.assertTrue(os.path.exists(second_temp), "copy of the file was not "
Brett Cannon19691362003-04-29 05:08:06 +0000437 "made")
438 FILE = file(second_temp, 'rb')
439 try:
440 text = FILE.read()
Brett Cannon19691362003-04-29 05:08:06 +0000441 FILE.close()
Georg Brandl5a650a22005-08-26 08:51:34 +0000442 finally:
443 try: FILE.close()
444 except: pass
Brett Cannon19691362003-04-29 05:08:06 +0000445 self.assertEqual(self.text, text)
446
447 def test_reporthook(self):
448 # Make sure that the reporthook works.
449 def hooktester(count, block_size, total_size, count_holder=[0]):
Ezio Melottib0f5adc2010-01-24 16:58:36 +0000450 self.assertIsInstance(count, int)
451 self.assertIsInstance(block_size, int)
452 self.assertIsInstance(total_size, int)
Brett Cannon19691362003-04-29 05:08:06 +0000453 self.assertEqual(count, count_holder[0])
454 count_holder[0] = count_holder[0] + 1
455 second_temp = "%s.2" % test_support.TESTFN
Georg Brandl5a650a22005-08-26 08:51:34 +0000456 self.registerFileForCleanUp(second_temp)
457 urllib.urlretrieve(self.constructLocalFileUrl(test_support.TESTFN),
458 second_temp, hooktester)
459
460 def test_reporthook_0_bytes(self):
461 # Test on zero length file. Should call reporthook only 1 time.
462 report = []
463 def hooktester(count, block_size, total_size, _report=report):
464 _report.append((count, block_size, total_size))
465 srcFileName = self.createNewTempFile()
466 urllib.urlretrieve(self.constructLocalFileUrl(srcFileName),
467 test_support.TESTFN, hooktester)
468 self.assertEqual(len(report), 1)
469 self.assertEqual(report[0][2], 0)
470
471 def test_reporthook_5_bytes(self):
472 # Test on 5 byte file. Should call reporthook only 2 times (once when
473 # the "network connection" is established and once when the block is
474 # read). Since the block size is 8192 bytes, only one block read is
475 # required to read the entire file.
476 report = []
477 def hooktester(count, block_size, total_size, _report=report):
478 _report.append((count, block_size, total_size))
479 srcFileName = self.createNewTempFile("x" * 5)
480 urllib.urlretrieve(self.constructLocalFileUrl(srcFileName),
481 test_support.TESTFN, hooktester)
482 self.assertEqual(len(report), 2)
483 self.assertEqual(report[0][1], 8192)
484 self.assertEqual(report[0][2], 5)
485
486 def test_reporthook_8193_bytes(self):
487 # Test on 8193 byte file. Should call reporthook only 3 times (once
488 # when the "network connection" is established, once for the next 8192
489 # bytes, and once for the last byte).
490 report = []
491 def hooktester(count, block_size, total_size, _report=report):
492 _report.append((count, block_size, total_size))
493 srcFileName = self.createNewTempFile("x" * 8193)
494 urllib.urlretrieve(self.constructLocalFileUrl(srcFileName),
495 test_support.TESTFN, hooktester)
496 self.assertEqual(len(report), 3)
497 self.assertEqual(report[0][1], 8192)
498 self.assertEqual(report[0][2], 8193)
Skip Montanaro080c9972001-01-28 21:12:22 +0000499
Senthil Kumaran87e58552011-11-01 02:44:45 +0800500
class urlretrieve_HttpTests(unittest.TestCase, FakeHTTPMixin):
    """Test urllib.urlretrieve() using fake http connections"""

    # Canned response shared by both tests: the headers announce 100 bytes
    # of content but the body that follows is far shorter.
    _TRUNCATED_RESPONSE = '''HTTP/1.1 200 OK
Date: Wed, 02 Jan 2008 03:03:54 GMT
Server: Apache/1.3.33 (Debian GNU/Linux) mod_ssl/2.8.22 OpenSSL/0.9.7e
Connection: close
Content-Length: 100
Content-Type: text/html; charset=iso-8859-1

FF
'''

    def test_short_content_raises_ContentTooShortError(self):
        def ignore_progress(block_count, block_size, total_size):
            # Report hook that deliberately does nothing.
            pass

        self.fakehttp(self._TRUNCATED_RESPONSE)
        try:
            self.assertRaises(urllib.ContentTooShortError, urllib.urlretrieve,
                              'http://example.com',
                              reporthook=ignore_progress)
        finally:
            self.unfakehttp()

    def test_short_content_raises_ContentTooShortError_without_reporthook(self):
        self.fakehttp(self._TRUNCATED_RESPONSE)
        try:
            self.assertRaises(urllib.ContentTooShortError,
                              urllib.urlretrieve, 'http://example.com/')
        finally:
            self.unfakehttp()
538
class QuotingTests(unittest.TestCase):
    r"""Tests for urllib.quote() and urllib.quote_plus()

    According to RFC 2396 ("Uniform Resource Identifiers"), to escape a
    character you write it as '%' + <2 character US-ASCII hex value>.  The
    Python code of ``'%' + hex(ord(<character>))[2:]`` escapes a character
    properly.  Case does not matter on the hex letters.

    The various character sets specified are:

    Reserved characters : ";/?:@&=+$,"
        Have special meaning in URIs and must be escaped if not being used for
        their special meaning
    Data characters : letters, digits, and "-_.!~*'()"
        Unreserved and do not need to be escaped; can be, though, if desired
    Control characters : 0x00 - 0x1F, 0x7F
        Have no use in URIs so must be escaped
    space : 0x20
        Must be escaped
    Delimiters : '<>#%"'
        Must be escaped
    Unwise : "{}|\^[]`"
        Must be escaped

    """

    def test_never_quote(self):
        # Make sure quote() does not quote letters, digits, and "_.-"
        do_not_quote = ("ABCDEFGHIJKLMNOPQRSTUVWXYZ"
                        "abcdefghijklmnopqrstuvwxyz"
                        "0123456789"
                        "_.-")
        result = urllib.quote(do_not_quote)
        self.assertEqual(do_not_quote, result,
                         "using quote(): %s != %s" % (do_not_quote, result))
        result = urllib.quote_plus(do_not_quote)
        self.assertEqual(do_not_quote, result,
                         "using quote_plus(): %s != %s" %
                         (do_not_quote, result))

    def test_default_safe(self):
        # Test '/' is default value for 'safe' parameter
        self.assertEqual(urllib.quote.__defaults__[0], '/')

    def test_safe(self):
        # Test setting 'safe' parameter does what it should do
        quote_by_default = "<>"
        result = urllib.quote(quote_by_default, safe=quote_by_default)
        self.assertEqual(quote_by_default, result,
                         "using quote(): %s != %s" % (quote_by_default, result))
        result = urllib.quote_plus(quote_by_default, safe=quote_by_default)
        self.assertEqual(quote_by_default, result,
                         "using quote_plus(): %s != %s" %
                         (quote_by_default, result))

    def test_default_quoting(self):
        # Make sure all characters that should be quoted are by default sans
        # space (separate test for that).
        should_quote = ''.join(
            [chr(num) for num in range(32)]     # For 0x00 - 0x1F
            + ['<>#%"{}|\\^[]`']                # backslash spelled explicitly
            + [chr(127)])                       # For 0x7F
        for char in should_quote:
            result = urllib.quote(char)
            self.assertEqual(hexescape(char), result,
                             "using quote(): %s should be escaped to %s, not %s" %
                             (char, hexescape(char), result))
            result = urllib.quote_plus(char)
            self.assertEqual(hexescape(char), result,
                             "using quote_plus(): "
                             "%s should be escaped to %s, not %s" %
                             (char, hexescape(char), result))
        partial_quote = "ab[]cd"
        expected = "ab%5B%5Dcd"
        result = urllib.quote(partial_quote)
        self.assertEqual(expected, result,
                         "using quote(): %s != %s" % (expected, result))
        result = urllib.quote_plus(partial_quote)
        self.assertEqual(expected, result,
                         "using quote_plus(): %s != %s" % (expected, result))
        self.assertRaises(TypeError, urllib.quote, None)

    def test_quoting_space(self):
        # Make sure quote() and quote_plus() handle spaces as specified in
        # their unique way
        result = urllib.quote(' ')
        self.assertEqual(result, hexescape(' '),
                         "using quote(): %s != %s" % (result, hexescape(' ')))
        result = urllib.quote_plus(' ')
        self.assertEqual(result, '+',
                         "using quote_plus(): %s != +" % result)
        given = "a b cd e f"
        expect = given.replace(' ', hexescape(' '))
        result = urllib.quote(given)
        self.assertEqual(expect, result,
                         "using quote(): %s != %s" % (expect, result))
        expect = given.replace(' ', '+')
        result = urllib.quote_plus(given)
        self.assertEqual(expect, result,
                         "using quote_plus(): %s != %s" % (expect, result))

    def test_quoting_plus(self):
        self.assertEqual(urllib.quote_plus('alpha+beta gamma'),
                         'alpha%2Bbeta+gamma')
        self.assertEqual(urllib.quote_plus('alpha+beta gamma', '+'),
                         'alpha+beta+gamma')
645
class UnquotingTests(unittest.TestCase):
    """Tests for unquote() and unquote_plus()

    See the doc string for QuotingTests for details on quoting and such.

    """

    def test_unquoting(self):
        # Make sure unquoting of all ASCII values works
        escape_list = []
        for num in range(128):
            given = hexescape(chr(num))
            expect = chr(num)
            result = urllib.unquote(given)
            self.assertEqual(expect, result,
                             "using unquote(): %s != %s" % (expect, result))
            result = urllib.unquote_plus(given)
            self.assertEqual(expect, result,
                             "using unquote_plus(): %s != %s" %
                             (expect, result))
            escape_list.append(given)
        escape_string = ''.join(escape_list)
        # After unquoting the whole string the only '%' left must be the one
        # decoded from '%25'.  Check both functions; the joined string holds
        # no literal '+', so unquote_plus() has to agree with unquote().
        result = urllib.unquote(escape_string)
        self.assertEqual(result.count('%'), 1,
                         "using unquote(): not all characters escaped: "
                         "%s" % result)
        result = urllib.unquote_plus(escape_string)
        self.assertEqual(result.count('%'), 1,
                         "using unquote_plus(): not all characters escaped: "
                         "%s" % result)

    def test_unquoting_badpercent(self):
        # Test unquoting on bad percent-escapes: they must come back
        # unchanged.
        for given in ('%xab', '%x', '%'):
            expect = given
            result = urllib.unquote(given)
            self.assertEqual(expect, result, "using unquote(): %r != %r"
                             % (expect, result))

    def test_unquoting_mixed_case(self):
        # Test unquoting on mixed-case hex digits in the percent-escapes
        given = '%Ab%eA'
        expect = '\xab\xea'
        result = urllib.unquote(given)
        self.assertEqual(expect, result, "using unquote(): %r != %r"
                         % (expect, result))

    def test_unquoting_parts(self):
        # Make sure unquoting works when have non-quoted characters
        # interspersed
        given = 'ab%sd' % hexescape('c')
        expect = "abcd"
        result = urllib.unquote(given)
        self.assertEqual(expect, result,
                         "using unquote(): %s != %s" % (expect, result))
        result = urllib.unquote_plus(given)
        self.assertEqual(expect, result,
                         "using unquote_plus(): %s != %s" % (expect, result))

    def test_unquoting_plus(self):
        # Test difference between unquote() and unquote_plus()
        given = "are+there+spaces..."
        expect = given
        result = urllib.unquote(given)
        self.assertEqual(expect, result,
                         "using unquote(): %s != %s" % (expect, result))
        expect = given.replace('+', ' ')
        result = urllib.unquote_plus(given)
        self.assertEqual(expect, result,
                         "using unquote_plus(): %s != %s" % (expect, result))

    def test_unquote_with_unicode(self):
        r = urllib.unquote(u'br%C3%BCckner_sapporo_20050930.doc')
        self.assertEqual(r, u'br\xc3\xbcckner_sapporo_20050930.doc')
731
Brett Cannon74bfd702003-04-25 09:39:47 +0000732class urlencode_Tests(unittest.TestCase):
733 """Tests for urlencode()"""
734
735 def help_inputtype(self, given, test_type):
736 """Helper method for testing different input types.
Tim Petersc2659cf2003-05-12 20:19:37 +0000737
Brett Cannon74bfd702003-04-25 09:39:47 +0000738 'given' must lead to only the pairs:
739 * 1st, 1
740 * 2nd, 2
741 * 3rd, 3
Tim Petersc2659cf2003-05-12 20:19:37 +0000742
Brett Cannon74bfd702003-04-25 09:39:47 +0000743 Test cannot assume anything about order. Docs make no guarantee and
744 have possible dictionary input.
Tim Petersc2659cf2003-05-12 20:19:37 +0000745
Brett Cannon74bfd702003-04-25 09:39:47 +0000746 """
747 expect_somewhere = ["1st=1", "2nd=2", "3rd=3"]
748 result = urllib.urlencode(given)
749 for expected in expect_somewhere:
Ezio Melottiaa980582010-01-23 23:04:36 +0000750 self.assertIn(expected, result,
Brett Cannon74bfd702003-04-25 09:39:47 +0000751 "testing %s: %s not found in %s" %
752 (test_type, expected, result))
753 self.assertEqual(result.count('&'), 2,
754 "testing %s: expected 2 '&'s; got %s" %
755 (test_type, result.count('&')))
756 amp_location = result.index('&')
757 on_amp_left = result[amp_location - 1]
758 on_amp_right = result[amp_location + 1]
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000759 self.assertTrue(on_amp_left.isdigit() and on_amp_right.isdigit(),
Brett Cannon74bfd702003-04-25 09:39:47 +0000760 "testing %s: '&' not located in proper place in %s" %
761 (test_type, result))
762 self.assertEqual(len(result), (5 * 3) + 2, #5 chars per thing and amps
763 "testing %s: "
764 "unexpected number of characters: %s != %s" %
765 (test_type, len(result), (5 * 3) + 2))
766
767 def test_using_mapping(self):
768 # Test passing in a mapping object as an argument.
769 self.help_inputtype({"1st":'1', "2nd":'2', "3rd":'3'},
770 "using dict as input type")
771
772 def test_using_sequence(self):
773 # Test passing in a sequence of two-item sequences as an argument.
774 self.help_inputtype([('1st', '1'), ('2nd', '2'), ('3rd', '3')],
775 "using sequence of two-item tuples as input")
776
777 def test_quoting(self):
778 # Make sure keys and values are quoted using quote_plus()
779 given = {"&":"="}
780 expect = "%s=%s" % (hexescape('&'), hexescape('='))
781 result = urllib.urlencode(given)
782 self.assertEqual(expect, result)
783 given = {"key name":"A bunch of pluses"}
784 expect = "key+name=A+bunch+of+pluses"
785 result = urllib.urlencode(given)
786 self.assertEqual(expect, result)
787
788 def test_doseq(self):
789 # Test that passing True for 'doseq' parameter works correctly
790 given = {'sequence':['1', '2', '3']}
791 expect = "sequence=%s" % urllib.quote_plus(str(['1', '2', '3']))
792 result = urllib.urlencode(given)
793 self.assertEqual(expect, result)
794 result = urllib.urlencode(given, True)
795 for value in given["sequence"]:
796 expect = "sequence=%s" % value
Ezio Melottiaa980582010-01-23 23:04:36 +0000797 self.assertIn(expect, result)
Brett Cannon74bfd702003-04-25 09:39:47 +0000798 self.assertEqual(result.count('&'), 2,
799 "Expected 2 '&'s, got %s" % result.count('&'))
800
801class Pathname_Tests(unittest.TestCase):
802 """Test pathname2url() and url2pathname()"""
803
804 def test_basic(self):
805 # Make sure simple tests pass
806 expected_path = os.path.join("parts", "of", "a", "path")
807 expected_url = "parts/of/a/path"
808 result = urllib.pathname2url(expected_path)
809 self.assertEqual(expected_url, result,
810 "pathname2url() failed; %s != %s" %
811 (result, expected_url))
812 result = urllib.url2pathname(expected_url)
813 self.assertEqual(expected_path, result,
814 "url2pathame() failed; %s != %s" %
815 (result, expected_path))
816
817 def test_quoting(self):
818 # Test automatic quoting and unquoting works for pathnam2url() and
819 # url2pathname() respectively
820 given = os.path.join("needs", "quot=ing", "here")
821 expect = "needs/%s/here" % urllib.quote("quot=ing")
822 result = urllib.pathname2url(given)
823 self.assertEqual(expect, result,
824 "pathname2url() failed; %s != %s" %
825 (expect, result))
826 expect = given
827 result = urllib.url2pathname(result)
828 self.assertEqual(expect, result,
829 "url2pathname() failed; %s != %s" %
830 (expect, result))
831 given = os.path.join("make sure", "using_quote")
832 expect = "%s/using_quote" % urllib.quote("make sure")
833 result = urllib.pathname2url(given)
834 self.assertEqual(expect, result,
835 "pathname2url() failed; %s != %s" %
836 (expect, result))
837 given = "make+sure/using_unquote"
838 expect = os.path.join("make+sure", "using_unquote")
839 result = urllib.url2pathname(given)
840 self.assertEqual(expect, result,
841 "url2pathname() failed; %s != %s" %
842 (expect, result))
Tim Petersc2659cf2003-05-12 20:19:37 +0000843
Senthil Kumarana99b7612011-04-14 12:54:35 +0800844 @unittest.skipUnless(sys.platform == 'win32',
845 'test specific to the nturl2path library')
846 def test_ntpath(self):
847 given = ('/C:/', '///C:/', '/C|//')
848 expect = 'C:\\'
849 for url in given:
850 result = urllib.url2pathname(url)
851 self.assertEqual(expect, result,
852 'nturl2path.url2pathname() failed; %s != %s' %
853 (expect, result))
854 given = '///C|/path'
855 expect = 'C:\\path'
856 result = urllib.url2pathname(given)
857 self.assertEqual(expect, result,
858 'nturl2path.url2pathname() failed; %s != %s' %
859 (expect, result))
860
Senthil Kumaran5e95e762009-03-30 21:51:50 +0000861class Utility_Tests(unittest.TestCase):
862 """Testcase to test the various utility functions in the urllib."""
Serhiy Storchakaf0b630b2015-03-02 16:31:57 +0200863 # In Python 3 this test class is moved to test_urlparse.
864
865 def test_splittype(self):
866 splittype = urllib.splittype
867 self.assertEqual(splittype('type:opaquestring'), ('type', 'opaquestring'))
868 self.assertEqual(splittype('opaquestring'), (None, 'opaquestring'))
869 self.assertEqual(splittype(':opaquestring'), (None, ':opaquestring'))
870 self.assertEqual(splittype('type:'), ('type', ''))
871 self.assertEqual(splittype('type:opaque:string'), ('type', 'opaque:string'))
872
873 def test_splithost(self):
874 splithost = urllib.splithost
875 self.assertEqual(splithost('//www.example.org:80/foo/bar/baz.html'),
876 ('www.example.org:80', '/foo/bar/baz.html'))
877 self.assertEqual(splithost('//www.example.org:80'),
878 ('www.example.org:80', ''))
879 self.assertEqual(splithost('/foo/bar/baz.html'),
880 (None, '/foo/bar/baz.html'))
881
882 def test_splituser(self):
883 splituser = urllib.splituser
884 self.assertEqual(splituser('User:Pass@www.python.org:080'),
885 ('User:Pass', 'www.python.org:080'))
886 self.assertEqual(splituser('@www.python.org:080'),
887 ('', 'www.python.org:080'))
888 self.assertEqual(splituser('www.python.org:080'),
889 (None, 'www.python.org:080'))
890 self.assertEqual(splituser('User:Pass@'),
891 ('User:Pass', ''))
892 self.assertEqual(splituser('User@example.com:Pass@www.python.org:080'),
893 ('User@example.com:Pass', 'www.python.org:080'))
Senthil Kumaran5e95e762009-03-30 21:51:50 +0000894
895 def test_splitpasswd(self):
Serhiy Storchakaf0b630b2015-03-02 16:31:57 +0200896 # Some of the password examples are not sensible, but it is added to
897 # confirming to RFC2617 and addressing issue4675.
898 splitpasswd = urllib.splitpasswd
899 self.assertEqual(splitpasswd('user:ab'), ('user', 'ab'))
900 self.assertEqual(splitpasswd('user:a\nb'), ('user', 'a\nb'))
901 self.assertEqual(splitpasswd('user:a\tb'), ('user', 'a\tb'))
902 self.assertEqual(splitpasswd('user:a\rb'), ('user', 'a\rb'))
903 self.assertEqual(splitpasswd('user:a\fb'), ('user', 'a\fb'))
904 self.assertEqual(splitpasswd('user:a\vb'), ('user', 'a\vb'))
905 self.assertEqual(splitpasswd('user:a:b'), ('user', 'a:b'))
906 self.assertEqual(splitpasswd('user:a b'), ('user', 'a b'))
907 self.assertEqual(splitpasswd('user 2:ab'), ('user 2', 'ab'))
908 self.assertEqual(splitpasswd('user+1:a+b'), ('user+1', 'a+b'))
909 self.assertEqual(splitpasswd('user:'), ('user', ''))
910 self.assertEqual(splitpasswd('user'), ('user', None))
911 self.assertEqual(splitpasswd(':ab'), ('', 'ab'))
Senthil Kumaran5e95e762009-03-30 21:51:50 +0000912
Serhiy Storchaka326b5ab2014-01-18 18:30:09 +0200913 def test_splitport(self):
914 splitport = urllib.splitport
915 self.assertEqual(splitport('parrot:88'), ('parrot', '88'))
916 self.assertEqual(splitport('parrot'), ('parrot', None))
917 self.assertEqual(splitport('parrot:'), ('parrot', None))
918 self.assertEqual(splitport('127.0.0.1'), ('127.0.0.1', None))
919 self.assertEqual(splitport('parrot:cheese'), ('parrot:cheese', None))
Serhiy Storchakaf0b630b2015-03-02 16:31:57 +0200920 self.assertEqual(splitport('[::1]:88'), ('[::1]', '88'))
921 self.assertEqual(splitport('[::1]'), ('[::1]', None))
922 self.assertEqual(splitport(':88'), ('', '88'))
Serhiy Storchaka326b5ab2014-01-18 18:30:09 +0200923
924 def test_splitnport(self):
925 splitnport = urllib.splitnport
926 self.assertEqual(splitnport('parrot:88'), ('parrot', 88))
927 self.assertEqual(splitnport('parrot'), ('parrot', -1))
928 self.assertEqual(splitnport('parrot', 55), ('parrot', 55))
929 self.assertEqual(splitnport('parrot:'), ('parrot', -1))
930 self.assertEqual(splitnport('parrot:', 55), ('parrot', 55))
931 self.assertEqual(splitnport('127.0.0.1'), ('127.0.0.1', -1))
932 self.assertEqual(splitnport('127.0.0.1', 55), ('127.0.0.1', 55))
933 self.assertEqual(splitnport('parrot:cheese'), ('parrot', None))
934 self.assertEqual(splitnport('parrot:cheese', 55), ('parrot', None))
935
Serhiy Storchakaf0b630b2015-03-02 16:31:57 +0200936 def test_splitquery(self):
937 # Normal cases are exercised by other tests; ensure that we also
938 # catch cases with no port specified (testcase ensuring coverage)
939 splitquery = urllib.splitquery
940 self.assertEqual(splitquery('http://python.org/fake?foo=bar'),
941 ('http://python.org/fake', 'foo=bar'))
942 self.assertEqual(splitquery('http://python.org/fake?foo=bar?'),
943 ('http://python.org/fake?foo=bar', ''))
944 self.assertEqual(splitquery('http://python.org/fake'),
945 ('http://python.org/fake', None))
946 self.assertEqual(splitquery('?foo=bar'), ('', 'foo=bar'))
947
948 def test_splittag(self):
949 splittag = urllib.splittag
950 self.assertEqual(splittag('http://example.com?foo=bar#baz'),
951 ('http://example.com?foo=bar', 'baz'))
952 self.assertEqual(splittag('http://example.com?foo=bar#'),
953 ('http://example.com?foo=bar', ''))
954 self.assertEqual(splittag('#baz'), ('', 'baz'))
955 self.assertEqual(splittag('http://example.com?foo=bar'),
956 ('http://example.com?foo=bar', None))
957 self.assertEqual(splittag('http://example.com?foo=bar#baz#boo'),
958 ('http://example.com?foo=bar#baz', 'boo'))
959
960 def test_splitattr(self):
961 splitattr = urllib.splitattr
962 self.assertEqual(splitattr('/path;attr1=value1;attr2=value2'),
963 ('/path', ['attr1=value1', 'attr2=value2']))
964 self.assertEqual(splitattr('/path;'), ('/path', ['']))
965 self.assertEqual(splitattr(';attr1=value1;attr2=value2'),
966 ('', ['attr1=value1', 'attr2=value2']))
967 self.assertEqual(splitattr('/path'), ('/path', []))
968
969 def test_splitvalue(self):
970 # Normal cases are exercised by other tests; test pathological cases
971 # with no key/value pairs. (testcase ensuring coverage)
972 splitvalue = urllib.splitvalue
973 self.assertEqual(splitvalue('foo=bar'), ('foo', 'bar'))
974 self.assertEqual(splitvalue('foo='), ('foo', ''))
975 self.assertEqual(splitvalue('=bar'), ('', 'bar'))
976 self.assertEqual(splitvalue('foobar'), ('foobar', None))
977 self.assertEqual(splitvalue('foo=bar=baz'), ('foo', 'bar=baz'))
978
979 def test_toBytes(self):
980 result = urllib.toBytes(u'http://www.python.org')
981 self.assertEqual(result, 'http://www.python.org')
982 self.assertRaises(UnicodeError, urllib.toBytes,
983 test_support.u(r'http://www.python.org/medi\u00e6val'))
984
985 def test_unwrap(self):
986 url = urllib.unwrap('<URL:type://host/path>')
987 self.assertEqual(url, 'type://host/path')
988
Senthil Kumaran5e95e762009-03-30 21:51:50 +0000989
Senthil Kumaran7c2867f2009-04-21 03:24:19 +0000990class URLopener_Tests(unittest.TestCase):
991 """Testcase to test the open method of URLopener class."""
992
993 def test_quoted_open(self):
994 class DummyURLopener(urllib.URLopener):
995 def open_spam(self, url):
996 return url
997
998 self.assertEqual(DummyURLopener().open(
999 'spam://example/ /'),'//example/%20/')
1000
Senthil Kumaran18d5a692010-02-20 22:05:34 +00001001 # test the safe characters are not quoted by urlopen
1002 self.assertEqual(DummyURLopener().open(
1003 "spam://c:|windows%/:=&?~#+!$,;'@()*[]|/path/"),
1004 "//c:|windows%/:=&?~#+!$,;'@()*[]|/path/")
1005
Senthil Kumaran7c2867f2009-04-21 03:24:19 +00001006
# The tests below are just commented out.
# I can't really tell why they keep failing on Windows and SPARC.
# Everywhere else they work fine, but on those machines they sometimes
# fail in one of the tests and sometimes in another.  I have a Linux
# machine, and there the tests pass.
# If anybody has one of the problematic environments, please help!
# . Facundo
1014#
1015# def server(evt):
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001016# import socket, time
Facundo Batistad9880d02007-05-25 04:20:22 +00001017# serv = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
1018# serv.settimeout(3)
1019# serv.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
1020# serv.bind(("", 9093))
1021# serv.listen(5)
1022# try:
1023# conn, addr = serv.accept()
1024# conn.send("1 Hola mundo\n")
1025# cantdata = 0
1026# while cantdata < 13:
1027# data = conn.recv(13-cantdata)
1028# cantdata += len(data)
1029# time.sleep(.3)
1030# conn.send("2 No more lines\n")
1031# conn.close()
1032# except socket.timeout:
1033# pass
1034# finally:
1035# serv.close()
1036# evt.set()
1037#
1038# class FTPWrapperTests(unittest.TestCase):
1039#
1040# def setUp(self):
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001041# import ftplib, time, threading
Facundo Batistad9880d02007-05-25 04:20:22 +00001042# ftplib.FTP.port = 9093
1043# self.evt = threading.Event()
1044# threading.Thread(target=server, args=(self.evt,)).start()
1045# time.sleep(.1)
1046#
1047# def tearDown(self):
1048# self.evt.wait()
1049#
1050# def testBasic(self):
1051# # connects
1052# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001053# ftp.close()
Facundo Batistad9880d02007-05-25 04:20:22 +00001054#
1055# def testTimeoutNone(self):
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001056# # global default timeout is ignored
1057# import socket
Serhiy Storchaka528bed82014-02-08 14:49:55 +02001058# self.assertIsNone(socket.getdefaulttimeout())
Facundo Batistad9880d02007-05-25 04:20:22 +00001059# socket.setdefaulttimeout(30)
1060# try:
1061# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1062# finally:
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001063# socket.setdefaulttimeout(None)
Facundo Batistad9880d02007-05-25 04:20:22 +00001064# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001065# ftp.close()
Facundo Batistad9880d02007-05-25 04:20:22 +00001066#
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001067# def testTimeoutDefault(self):
1068# # global default timeout is used
1069# import socket
Serhiy Storchaka528bed82014-02-08 14:49:55 +02001070# self.assertIsNone(socket.getdefaulttimeout())
Facundo Batista4f1b1ed2008-05-29 16:39:26 +00001071# socket.setdefaulttimeout(30)
1072# try:
1073# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [])
1074# finally:
1075# socket.setdefaulttimeout(None)
1076# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1077# ftp.close()
1078#
1079# def testTimeoutValue(self):
1080# ftp = urllib.ftpwrapper("myuser", "mypass", "localhost", 9093, [],
1081# timeout=30)
1082# self.assertEqual(ftp.ftp.sock.gettimeout(), 30)
1083# ftp.close()
Facundo Batista711a54e2007-05-24 17:50:54 +00001084
Skip Montanaro080c9972001-01-28 21:12:22 +00001085
1086
def test_main():
    # Run the test case classes of this module through
    # test_support.run_unittest().
    import warnings
    with warnings.catch_warnings():
        # Ignore the DeprecationWarning whose message mentions
        # urllib.urlopen and Python 3.0.  The pattern is a raw string so
        # that the regex escape '\.' is not read as a string escape.
        warnings.filterwarnings('ignore', r".*urllib\.urlopen.*Python 3.0",
                                DeprecationWarning)
        # ProxyTests used to be listed twice, which ran that suite twice.
        test_support.run_unittest(
            urlopen_FileTests,
            urlopen_HttpTests,
            urlretrieve_FileTests,
            urlretrieve_HttpTests,
            ProxyTests,
            QuotingTests,
            UnquotingTests,
            urlencode_Tests,
            Pathname_Tests,
            Utility_Tests,
            URLopener_Tests,
            ProxyTests_withOrderedEnv,
            #FTPWrapperTests,
        )



if __name__ == '__main__':
    test_main()