blob: cb28aa8712bdb886bcbf7a5934299d905114ff00 [file] [log] [blame]
Florent Xicluna8fbddf12010-03-17 20:29:51 +00001from test.support import run_unittest, check_warnings
Jeremy Hyltond9827c42000-08-03 22:11:43 +00002import cgi
3import os
4import sys
Thomas Wouters00ee7ba2006-08-21 19:07:27 +00005import tempfile
Thomas Wouters89f507f2006-12-13 04:49:30 +00006import unittest
Brett Cannon8f79dd52012-04-25 20:49:19 -04007import warnings
Senthil Kumaran6b102f22013-01-23 02:50:15 -08008from collections import namedtuple
Victor Stinner5c23b8e2011-01-14 13:05:21 +00009from io import StringIO, BytesIO
Jeremy Hyltond9827c42000-08-03 22:11:43 +000010
11class HackedSysModule:
12 # The regression test will have real values in sys.argv, which
Fred Drake004d5e62000-10-23 17:22:08 +000013 # will completely confuse the test of the cgi module
Jeremy Hyltond9827c42000-08-03 22:11:43 +000014 argv = []
15 stdin = sys.stdin
16
17cgi.sys = HackedSysModule()
18
Jeremy Hyltond9827c42000-08-03 22:11:43 +000019class ComparableException:
20 def __init__(self, err):
21 self.err = err
22
23 def __str__(self):
24 return str(self.err)
25
Guido van Rossum47b9ff62006-08-24 00:41:19 +000026 def __eq__(self, anExc):
Jeremy Hyltond9827c42000-08-03 22:11:43 +000027 if not isinstance(anExc, Exception):
Guido van Rossum47b9ff62006-08-24 00:41:19 +000028 return NotImplemented
29 return (self.err.__class__ == anExc.__class__ and
30 self.err.args == anExc.args)
Jeremy Hyltond9827c42000-08-03 22:11:43 +000031
32 def __getattr__(self, attr):
Guido van Rossum846d6db2001-01-17 15:08:37 +000033 return getattr(self.err, attr)
Jeremy Hyltond9827c42000-08-03 22:11:43 +000034
35def do_test(buf, method):
36 env = {}
37 if method == "GET":
38 fp = None
39 env['REQUEST_METHOD'] = 'GET'
40 env['QUERY_STRING'] = buf
41 elif method == "POST":
Victor Stinner5c23b8e2011-01-14 13:05:21 +000042 fp = BytesIO(buf.encode('latin-1')) # FieldStorage expects bytes
Jeremy Hyltond9827c42000-08-03 22:11:43 +000043 env['REQUEST_METHOD'] = 'POST'
44 env['CONTENT_TYPE'] = 'application/x-www-form-urlencoded'
45 env['CONTENT_LENGTH'] = str(len(buf))
46 else:
Collin Winter3add4d72007-08-29 23:37:32 +000047 raise ValueError("unknown method: %s" % method)
Jeremy Hyltond9827c42000-08-03 22:11:43 +000048 try:
49 return cgi.parse(fp, env, strict_parsing=1)
Guido van Rossumcd16bf62007-06-13 18:07:49 +000050 except Exception as err:
Jeremy Hyltond9827c42000-08-03 22:11:43 +000051 return ComparableException(err)
52
Neil Schemenauer66edb622004-07-19 15:38:11 +000053parse_strict_test_cases = [
Jeremy Hyltond9827c42000-08-03 22:11:43 +000054 ("", ValueError("bad query field: ''")),
55 ("&", ValueError("bad query field: ''")),
56 ("&&", ValueError("bad query field: ''")),
Jeremy Hyltonafde7e22000-09-15 20:06:57 +000057 (";", ValueError("bad query field: ''")),
58 (";&;", ValueError("bad query field: ''")),
Jeremy Hyltond9827c42000-08-03 22:11:43 +000059 # Should the next few really be valid?
60 ("=", {}),
61 ("=&=", {}),
Jeremy Hyltonafde7e22000-09-15 20:06:57 +000062 ("=;=", {}),
Jeremy Hyltond9827c42000-08-03 22:11:43 +000063 # This rest seem to make sense
64 ("=a", {'': ['a']}),
65 ("&=a", ValueError("bad query field: ''")),
66 ("=a&", ValueError("bad query field: ''")),
67 ("=&a", ValueError("bad query field: 'a'")),
68 ("b=a", {'b': ['a']}),
69 ("b+=a", {'b ': ['a']}),
70 ("a=b=a", {'a': ['b=a']}),
71 ("a=+b=a", {'a': [' b=a']}),
72 ("&b=a", ValueError("bad query field: ''")),
73 ("b&=a", ValueError("bad query field: 'b'")),
74 ("a=a+b&b=b+c", {'a': ['a b'], 'b': ['b c']}),
75 ("a=a+b&a=b+a", {'a': ['a b', 'b a']}),
76 ("x=1&y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
Jeremy Hyltonafde7e22000-09-15 20:06:57 +000077 ("x=1;y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
78 ("x=1;y=2.0;z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
Jeremy Hyltond9827c42000-08-03 22:11:43 +000079 ("Hbc5161168c542333633315dee1182227:key_store_seqid=400006&cuyer=r&view=bustomer&order_id=0bb2e248638833d48cb7fed300000f1b&expire=964546263&lobale=en-US&kid=130003.300038&ss=env",
80 {'Hbc5161168c542333633315dee1182227:key_store_seqid': ['400006'],
81 'cuyer': ['r'],
82 'expire': ['964546263'],
83 'kid': ['130003.300038'],
84 'lobale': ['en-US'],
85 'order_id': ['0bb2e248638833d48cb7fed300000f1b'],
86 'ss': ['env'],
87 'view': ['bustomer'],
88 }),
Fred Drake004d5e62000-10-23 17:22:08 +000089
Jeremy Hyltond9827c42000-08-03 22:11:43 +000090 ("group_id=5470&set=custom&_assigned_to=31392&_status=1&_category=100&SUBMIT=Browse",
91 {'SUBMIT': ['Browse'],
92 '_assigned_to': ['31392'],
93 '_category': ['100'],
94 '_status': ['1'],
95 'group_id': ['5470'],
96 'set': ['custom'],
97 })
98 ]
99
Guido van Rossum47b9ff62006-08-24 00:41:19 +0000100def norm(seq):
Guido van Rossumcc2b0162007-02-11 06:12:03 +0000101 return sorted(seq, key=repr)
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000102
103def first_elts(list):
Guido van Rossumc1f779c2007-07-03 08:25:58 +0000104 return [p[0] for p in list]
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000105
106def first_second_elts(list):
Guido van Rossumc1f779c2007-07-03 08:25:58 +0000107 return [(p[0], p[1][0]) for p in list]
108
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000109def gen_result(data, environ):
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000110 encoding = 'latin-1'
111 fake_stdin = BytesIO(data.encode(encoding))
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000112 fake_stdin.seek(0)
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000113 form = cgi.FieldStorage(fp=fake_stdin, environ=environ, encoding=encoding)
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000114
115 result = {}
116 for k, v in dict(form).items():
Florent Xicluna8fbddf12010-03-17 20:29:51 +0000117 result[k] = isinstance(v, list) and form.getlist(k) or v.value
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000118
119 return result
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000120
Thomas Wouters89f507f2006-12-13 04:49:30 +0000121class CgiTests(unittest.TestCase):
Neil Schemenauer66edb622004-07-19 15:38:11 +0000122
Senthil Kumaran6b102f22013-01-23 02:50:15 -0800123 def test_parse_multipart(self):
124 fp = BytesIO(POSTDATA.encode('latin1'))
125 env = {'boundary': BOUNDARY.encode('latin1'),
126 'CONTENT-LENGTH': '558'}
127 result = cgi.parse_multipart(fp, env)
128 expected = {'submit': [b' Add '], 'id': [b'1234'],
129 'file': [b'Testing 123.\n'], 'title': [b'']}
130 self.assertEqual(result, expected)
131
132 def test_fieldstorage_properties(self):
133 fs = cgi.FieldStorage()
134 self.assertFalse(fs)
135 self.assertIn("FieldStorage", repr(fs))
136 self.assertEqual(list(fs), list(fs.keys()))
137 fs.list.append(namedtuple('MockFieldStorage', 'name')('fieldvalue'))
138 self.assertTrue(fs)
139
Senthil Kumaran47b5ddb2012-03-13 01:50:27 -0700140 def test_escape(self):
Brett Cannon8f79dd52012-04-25 20:49:19 -0400141 # cgi.escape() is deprecated.
142 with warnings.catch_warnings():
143 warnings.filterwarnings('ignore', 'cgi\.escape',
144 DeprecationWarning)
145 self.assertEqual("test & string", cgi.escape("test & string"))
146 self.assertEqual("&lt;test string&gt;", cgi.escape("<test string>"))
147 self.assertEqual("&quot;test string&quot;", cgi.escape('"test string"', True))
Senthil Kumaran47b5ddb2012-03-13 01:50:27 -0700148
Thomas Wouters89f507f2006-12-13 04:49:30 +0000149 def test_strict(self):
150 for orig, expect in parse_strict_test_cases:
151 # Test basic parsing
152 d = do_test(orig, "GET")
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000153 self.assertEqual(d, expect, "Error parsing %s method GET" % repr(orig))
Thomas Wouters89f507f2006-12-13 04:49:30 +0000154 d = do_test(orig, "POST")
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000155 self.assertEqual(d, expect, "Error parsing %s method POST" % repr(orig))
Thomas Wouters89f507f2006-12-13 04:49:30 +0000156
157 env = {'QUERY_STRING': orig}
Thomas Wouters89f507f2006-12-13 04:49:30 +0000158 fs = cgi.FieldStorage(environ=env)
Florent Xicluna8fbddf12010-03-17 20:29:51 +0000159 if isinstance(expect, dict):
Thomas Wouters89f507f2006-12-13 04:49:30 +0000160 # test dict interface
Georg Brandl49d1b4f2008-05-11 21:42:51 +0000161 self.assertEqual(len(expect), len(fs))
Ezio Melotti263cbdf2010-11-29 02:02:10 +0000162 self.assertCountEqual(expect.keys(), fs.keys())
Georg Brandl49d1b4f2008-05-11 21:42:51 +0000163 ##self.assertEqual(norm(expect.values()), norm(fs.values()))
164 ##self.assertEqual(norm(expect.items()), norm(fs.items()))
Thomas Wouters89f507f2006-12-13 04:49:30 +0000165 self.assertEqual(fs.getvalue("nonexistent field", "default"), "default")
166 # test individual fields
167 for key in expect.keys():
168 expect_val = expect[key]
Benjamin Peterson577473f2010-01-19 00:09:57 +0000169 self.assertIn(key, fs)
Thomas Wouters89f507f2006-12-13 04:49:30 +0000170 if len(expect_val) > 1:
Thomas Wouters89f507f2006-12-13 04:49:30 +0000171 self.assertEqual(fs.getvalue(key), expect_val)
172 else:
Thomas Wouters89f507f2006-12-13 04:49:30 +0000173 self.assertEqual(fs.getvalue(key), expect_val[0])
Thomas Wouters89f507f2006-12-13 04:49:30 +0000174
175 def test_log(self):
176 cgi.log("Testing")
177
178 cgi.logfp = StringIO()
179 cgi.initlog("%s", "Testing initlog 1")
180 cgi.log("%s", "Testing log 2")
181 self.assertEqual(cgi.logfp.getvalue(), "Testing initlog 1\nTesting log 2\n")
182 if os.path.exists("/dev/null"):
183 cgi.logfp = None
184 cgi.logfile = "/dev/null"
185 cgi.initlog("%s", "Testing log 3")
Victor Stinnerd33344a2011-07-14 22:28:36 +0200186 self.addCleanup(cgi.closelog)
Thomas Wouters89f507f2006-12-13 04:49:30 +0000187 cgi.log("Testing log 4")
188
189 def test_fieldstorage_readline(self):
190 # FieldStorage uses readline, which has the capacity to read all
191 # contents of the input file into memory; we use readline's size argument
192 # to prevent that for files that do not contain any newlines in
193 # non-GET/HEAD requests
194 class TestReadlineFile:
195 def __init__(self, file):
196 self.file = file
197 self.numcalls = 0
198
199 def readline(self, size=None):
200 self.numcalls += 1
201 if size:
202 return self.file.readline(size)
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000203 else:
Thomas Wouters89f507f2006-12-13 04:49:30 +0000204 return self.file.readline()
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000205
Thomas Wouters89f507f2006-12-13 04:49:30 +0000206 def __getattr__(self, name):
207 file = self.__dict__['file']
208 a = getattr(file, name)
209 if not isinstance(a, int):
210 setattr(self, name, a)
211 return a
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000212
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000213 f = TestReadlineFile(tempfile.TemporaryFile("wb+"))
Benjamin Peterson807a5a12010-10-30 22:59:37 +0000214 self.addCleanup(f.close)
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000215 f.write(b'x' * 256 * 1024)
Thomas Wouters89f507f2006-12-13 04:49:30 +0000216 f.seek(0)
217 env = {'REQUEST_METHOD':'PUT'}
218 fs = cgi.FieldStorage(fp=f, environ=env)
Benjamin Peterson807a5a12010-10-30 22:59:37 +0000219 self.addCleanup(fs.file.close)
Thomas Wouters89f507f2006-12-13 04:49:30 +0000220 # if we're not chunking properly, readline is only called twice
221 # (by read_binary); if we are chunking properly, it will be called 5 times
222 # as long as the chunksize is 1 << 16.
Benjamin Petersonc9c0f202009-06-30 23:06:06 +0000223 self.assertTrue(f.numcalls > 2)
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000224 f.close()
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000225
Thomas Wouters89f507f2006-12-13 04:49:30 +0000226 def test_fieldstorage_multipart(self):
227 #Test basic FieldStorage multipart parsing
Victor Stinnerf0e293c2011-03-01 23:09:57 +0000228 env = {
229 'REQUEST_METHOD': 'POST',
230 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY),
231 'CONTENT_LENGTH': '558'}
232 fp = BytesIO(POSTDATA.encode('latin-1'))
233 fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1")
Ezio Melottib3aedd42010-11-20 19:04:17 +0000234 self.assertEqual(len(fs.list), 4)
Thomas Wouters89f507f2006-12-13 04:49:30 +0000235 expect = [{'name':'id', 'filename':None, 'value':'1234'},
236 {'name':'title', 'filename':None, 'value':''},
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000237 {'name':'file', 'filename':'test.txt', 'value':b'Testing 123.\n'},
Thomas Wouters89f507f2006-12-13 04:49:30 +0000238 {'name':'submit', 'filename':None, 'value':' Add '}]
239 for x in range(len(fs.list)):
240 for k, exp in expect[x].items():
241 got = getattr(fs.list[x], k)
Ezio Melottib3aedd42010-11-20 19:04:17 +0000242 self.assertEqual(got, exp)
Thomas Wouters00ee7ba2006-08-21 19:07:27 +0000243
Victor Stinnerf0e293c2011-03-01 23:09:57 +0000244 def test_fieldstorage_multipart_non_ascii(self):
245 #Test basic FieldStorage multipart parsing
246 env = {'REQUEST_METHOD':'POST',
247 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY),
248 'CONTENT_LENGTH':'558'}
249 for encoding in ['iso-8859-1','utf-8']:
250 fp = BytesIO(POSTDATA_NON_ASCII.encode(encoding))
251 fs = cgi.FieldStorage(fp, environ=env,encoding=encoding)
252 self.assertEqual(len(fs.list), 1)
253 expect = [{'name':'id', 'filename':None, 'value':'\xe7\xf1\x80'}]
254 for x in range(len(fs.list)):
255 for k, exp in expect[x].items():
256 got = getattr(fs.list[x], k)
257 self.assertEqual(got, exp)
258
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000259 _qs_result = {
260 'key1': 'value1',
261 'key2': ['value2x', 'value2y'],
262 'key3': 'value3',
263 'key4': 'value4'
264 }
265 def testQSAndUrlEncode(self):
266 data = "key2=value2x&key3=value3&key4=value4"
267 environ = {
268 'CONTENT_LENGTH': str(len(data)),
269 'CONTENT_TYPE': 'application/x-www-form-urlencoded',
270 'QUERY_STRING': 'key1=value1&key2=value2y',
271 'REQUEST_METHOD': 'POST',
272 }
273 v = gen_result(data, environ)
274 self.assertEqual(self._qs_result, v)
275
276 def testQSAndFormData(self):
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000277 data = """---123
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000278Content-Disposition: form-data; name="key2"
279
280value2y
281---123
282Content-Disposition: form-data; name="key3"
283
284value3
285---123
286Content-Disposition: form-data; name="key4"
287
288value4
289---123--
290"""
291 environ = {
292 'CONTENT_LENGTH': str(len(data)),
293 'CONTENT_TYPE': 'multipart/form-data; boundary=-123',
294 'QUERY_STRING': 'key1=value1&key2=value2x',
295 'REQUEST_METHOD': 'POST',
296 }
297 v = gen_result(data, environ)
298 self.assertEqual(self._qs_result, v)
299
300 def testQSAndFormDataFile(self):
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000301 data = """---123
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000302Content-Disposition: form-data; name="key2"
303
304value2y
305---123
306Content-Disposition: form-data; name="key3"
307
308value3
309---123
310Content-Disposition: form-data; name="key4"
311
312value4
313---123
314Content-Disposition: form-data; name="upload"; filename="fake.txt"
315Content-Type: text/plain
316
317this is the content of the fake file
318
319---123--
320"""
321 environ = {
322 'CONTENT_LENGTH': str(len(data)),
323 'CONTENT_TYPE': 'multipart/form-data; boundary=-123',
324 'QUERY_STRING': 'key1=value1&key2=value2x',
325 'REQUEST_METHOD': 'POST',
326 }
327 result = self._qs_result.copy()
328 result.update({
Victor Stinner5c23b8e2011-01-14 13:05:21 +0000329 'upload': b'this is the content of the fake file\n'
Benjamin Petersondcf97b92008-07-02 17:30:14 +0000330 })
331 v = gen_result(data, environ)
332 self.assertEqual(result, v)
333
Facundo Batistabd18fd62008-09-08 00:23:29 +0000334 def test_deprecated_parse_qs(self):
Florent Xicluna8fbddf12010-03-17 20:29:51 +0000335 # this func is moved to urllib.parse, this is just a sanity check
336 with check_warnings(('cgi.parse_qs is deprecated, use urllib.parse.'
337 'parse_qs instead', DeprecationWarning)):
Facundo Batistaa27244b2008-09-09 02:43:19 +0000338 self.assertEqual({'a': ['A1'], 'B': ['B3'], 'b': ['B2']},
339 cgi.parse_qs('a=A1&b=B2&B=B3'))
Facundo Batistabd18fd62008-09-08 00:23:29 +0000340
341 def test_deprecated_parse_qsl(self):
Florent Xicluna8fbddf12010-03-17 20:29:51 +0000342 # this func is moved to urllib.parse, this is just a sanity check
343 with check_warnings(('cgi.parse_qsl is deprecated, use urllib.parse.'
344 'parse_qsl instead', DeprecationWarning)):
Facundo Batistaa27244b2008-09-09 02:43:19 +0000345 self.assertEqual([('a', 'A1'), ('b', 'B2'), ('B', 'B3')],
346 cgi.parse_qsl('a=A1&b=B2&B=B3'))
Facundo Batistabd18fd62008-09-08 00:23:29 +0000347
Fred Drake9a0a65b2008-12-04 19:24:50 +0000348 def test_parse_header(self):
349 self.assertEqual(
350 cgi.parse_header("text/plain"),
351 ("text/plain", {}))
352 self.assertEqual(
353 cgi.parse_header("text/vnd.just.made.this.up ; "),
354 ("text/vnd.just.made.this.up", {}))
355 self.assertEqual(
356 cgi.parse_header("text/plain;charset=us-ascii"),
357 ("text/plain", {"charset": "us-ascii"}))
358 self.assertEqual(
359 cgi.parse_header('text/plain ; charset="us-ascii"'),
360 ("text/plain", {"charset": "us-ascii"}))
361 self.assertEqual(
362 cgi.parse_header('text/plain ; charset="us-ascii"; another=opt'),
363 ("text/plain", {"charset": "us-ascii", "another": "opt"}))
364 self.assertEqual(
365 cgi.parse_header('attachment; filename="silly.txt"'),
366 ("attachment", {"filename": "silly.txt"}))
367 self.assertEqual(
368 cgi.parse_header('attachment; filename="strange;name"'),
369 ("attachment", {"filename": "strange;name"}))
370 self.assertEqual(
371 cgi.parse_header('attachment; filename="strange;name";size=123;'),
372 ("attachment", {"filename": "strange;name", "size": "123"}))
Senthil Kumaran1ef0c032011-10-20 01:05:44 +0800373 self.assertEqual(
374 cgi.parse_header('form-data; name="files"; filename="fo\\"o;bar"'),
375 ("form-data", {"name": "files", "filename": 'fo"o;bar'}))
376
Fred Drake9a0a65b2008-12-04 19:24:50 +0000377
Victor Stinnerf0e293c2011-03-01 23:09:57 +0000378BOUNDARY = "---------------------------721837373350705526688164684"
379
380POSTDATA = """-----------------------------721837373350705526688164684
381Content-Disposition: form-data; name="id"
382
3831234
384-----------------------------721837373350705526688164684
385Content-Disposition: form-data; name="title"
386
387
388-----------------------------721837373350705526688164684
389Content-Disposition: form-data; name="file"; filename="test.txt"
390Content-Type: text/plain
391
392Testing 123.
393
394-----------------------------721837373350705526688164684
395Content-Disposition: form-data; name="submit"
396
397 Add\x20
398-----------------------------721837373350705526688164684--
399"""
400
401POSTDATA_NON_ASCII = """-----------------------------721837373350705526688164684
402Content-Disposition: form-data; name="id"
403
404\xe7\xf1\x80
405-----------------------------721837373350705526688164684
406"""
407
Fred Drake9a0a65b2008-12-04 19:24:50 +0000408
Thomas Wouters89f507f2006-12-13 04:49:30 +0000409def test_main():
410 run_unittest(CgiTests)
411
412if __name__ == '__main__':
413 test_main()