blob: 5510a0dccd32c88a346b5024388406568d76ca94 [file] [log] [blame]
Florent Xicluna8fbddf12010-03-17 20:29:51 +00001from test.support import run_unittest, check_warnings
Jeremy Hyltond9827c42000-08-03 22:11:43 +00002import cgi
3import os
4import sys
Thomas Wouters00ee7ba2006-08-21 19:07:27 +00005import tempfile
Thomas Wouters89f507f2006-12-13 04:49:30 +00006import unittest
Brett Cannon8f79dd52012-04-25 20:49:19 -04007import warnings
Victor Stinner5c23b8e2011-01-14 13:05:21 +00008from io import StringIO, BytesIO
Jeremy Hyltond9827c42000-08-03 22:11:43 +00009
class HackedSysModule:
    """Stand-in for the ``sys`` module that gets installed into ``cgi``.

    The regression test run leaves real values in ``sys.argv``, which would
    completely confuse the tests of the cgi module, so ``cgi`` is handed this
    object, whose ``argv`` is empty, instead of the real module.
    """
    stdin = sys.stdin
    argv = []


# From here on, every ``sys.<attr>`` lookup made inside cgi hits the stub.
cgi.sys = HackedSysModule()
17
class ComparableException:
    """Wrap an exception so that it can be compared with ``==``.

    Two exceptions are considered equal when they have the same class and
    the same ``args``.  ``str()`` and every attribute that is not found on
    the wrapper itself are forwarded to the wrapped exception.
    """

    def __init__(self, err):
        self.err = err

    def __repr__(self):
        # Shows up in assertEqual() failure messages instead of the default
        # "<... object at 0x...>".
        return "%s(%r)" % (type(self).__name__, self.err)

    def __str__(self):
        return str(self.err)

    def __eq__(self, anExc):
        if not isinstance(anExc, Exception):
            return NotImplemented
        return (self.err.__class__ == anExc.__class__ and
                self.err.args == anExc.args)

    # Defining __eq__ already makes instances unhashable; state it explicitly.
    __hash__ = None

    def __getattr__(self, attr):
        # __getattr__ only runs when normal lookup fails.  If 'err' itself is
        # missing (instance created without __init__), forwarding through
        # self.err would recurse without bound, so fail with AttributeError.
        if attr == 'err':
            raise AttributeError(attr)
        return getattr(self.err, attr)
Jeremy Hyltond9827c42000-08-03 22:11:43 +000033
def do_test(buf, method):
    """Run ``cgi.parse`` in strict mode on *buf*, sent as a GET or POST.

    For "GET" *buf* is passed as the query string; for "POST" it is passed
    as a latin-1 encoded, form-urlencoded request body.  Any other *method*
    raises ValueError.

    Returns whatever ``cgi.parse`` returns; if parsing raises, the exception
    is returned wrapped in a ComparableException instead of propagating.
    """
    if method == "GET":
        stream = None
        environ = {
            'REQUEST_METHOD': 'GET',
            'QUERY_STRING': buf,
        }
    elif method == "POST":
        stream = BytesIO(buf.encode('latin-1'))  # FieldStorage expects bytes
        environ = {
            'REQUEST_METHOD': 'POST',
            'CONTENT_TYPE': 'application/x-www-form-urlencoded',
            'CONTENT_LENGTH': str(len(buf)),
        }
    else:
        raise ValueError("unknown method: %s" % method)

    try:
        return cgi.parse(stream, environ, strict_parsing=1)
    except Exception as err:
        # Hand the failure back as a value so callers can compare it.
        return ComparableException(err)
51
# (input, expected) pairs for strict parsing.  The expectation is either the
# parsed dict or the exception that strict parsing raises for that input.
parse_strict_test_cases = [
    ("", ValueError("bad query field: ''")),
    ("&", ValueError("bad query field: ''")),
    ("&&", ValueError("bad query field: ''")),
    (";", ValueError("bad query field: ''")),
    (";&;", ValueError("bad query field: ''")),

    # Should the next few really be valid?
    ("=", {}),
    ("=&=", {}),
    ("=;=", {}),

    # The rest seem to make sense
    ("=a", {'': ['a']}),
    ("&=a", ValueError("bad query field: ''")),
    ("=a&", ValueError("bad query field: ''")),
    ("=&a", ValueError("bad query field: 'a'")),
    ("b=a", {'b': ['a']}),
    ("b+=a", {'b ': ['a']}),
    ("a=b=a", {'a': ['b=a']}),
    ("a=+b=a", {'a': [' b=a']}),
    ("&b=a", ValueError("bad query field: ''")),
    ("b&=a", ValueError("bad query field: 'b'")),
    ("a=a+b&b=b+c", {'a': ['a b'], 'b': ['b c']}),
    ("a=a+b&a=b+a", {'a': ['a b', 'b a']}),
    ("x=1&y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
    ("x=1;y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
    ("x=1;y=2.0;z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),

    # Two longer query strings (adjacent literals are concatenated).
    ("Hbc5161168c542333633315dee1182227:key_store_seqid=400006"
     "&cuyer=r&view=bustomer"
     "&order_id=0bb2e248638833d48cb7fed300000f1b"
     "&expire=964546263&lobale=en-US&kid=130003.300038&ss=env",
     {
         'Hbc5161168c542333633315dee1182227:key_store_seqid': ['400006'],
         'cuyer': ['r'],
         'expire': ['964546263'],
         'kid': ['130003.300038'],
         'lobale': ['en-US'],
         'order_id': ['0bb2e248638833d48cb7fed300000f1b'],
         'ss': ['env'],
         'view': ['bustomer'],
     }),

    ("group_id=5470&set=custom&_assigned_to=31392"
     "&_status=1&_category=100&SUBMIT=Browse",
     {
         'SUBMIT': ['Browse'],
         '_assigned_to': ['31392'],
         '_category': ['100'],
         '_status': ['1'],
         'group_id': ['5470'],
         'set': ['custom'],
     }),
]
98
def norm(seq):
    """Return the items of *seq* as a new list ordered by their ``repr()``."""
    ordered = list(seq)
    ordered.sort(key=repr)
    return ordered
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000101
def first_elts(list):
    """Return a new list holding item ``[0]`` of every element of *list*."""
    heads = []
    for pair in list:
        heads.append(pair[0])
    return heads
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000104
def first_second_elts(list):
    """Return ``(p[0], p[1][0])`` for every element ``p`` of *list*."""
    pairs = []
    for entry in list:
        head = entry[0]
        inner_head = entry[1][0]
        pairs.append((head, inner_head))
    return pairs
107
def gen_result(data, environ):
    """Parse *data* as a request body and return its fields as a plain dict.

    *data* is encoded as latin-1 and given to ``cgi.FieldStorage`` as the
    input stream, together with *environ*.  In the returned dict each field
    name maps to ``form.getlist(name)`` when the form holds a list of entries
    for that name, and to the single entry's ``value`` otherwise.
    """
    encoding = 'latin-1'
    # A freshly created BytesIO already sits at offset 0; no seek() needed.
    fake_stdin = BytesIO(data.encode(encoding))
    form = cgi.FieldStorage(fp=fake_stdin, environ=environ, encoding=encoding)

    result = {}
    for k, v in dict(form).items():
        # Conditional expression rather than "cond and a or b": the latter
        # falls through to v.value whenever the first arm is falsy.
        result[k] = form.getlist(k) if isinstance(v, list) else v.value

    return result
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000119
class CgiTests(unittest.TestCase):
    # Tests for the cgi module: escaping, strict query parsing, the logging
    # helpers, FieldStorage with urlencoded and multipart bodies, the
    # deprecated parse_qs/parse_qsl aliases and parse_header().
    #
    # Test methods carry comments rather than docstrings so that unittest's
    # verbose output keeps showing the method names.

    def test_escape(self):
        # cgi.escape() is deprecated.
        with warnings.catch_warnings():
            # The message argument is a regular expression; a raw string keeps
            # "\." from being read as an (invalid) string escape.
            warnings.filterwarnings('ignore', r'cgi\.escape',
                                    DeprecationWarning)
            # '&' must come back escaped as '&amp;'.
            self.assertEqual("test &amp; string", cgi.escape("test & string"))
            self.assertEqual("&lt;test string&gt;", cgi.escape("<test string>"))
            self.assertEqual("&quot;test string&quot;", cgi.escape('"test string"', True))

    def test_strict(self):
        for orig, expect in parse_strict_test_cases:
            # Test basic parsing
            d = do_test(orig, "GET")
            self.assertEqual(d, expect, "Error parsing %s method GET" % repr(orig))
            d = do_test(orig, "POST")
            self.assertEqual(d, expect, "Error parsing %s method POST" % repr(orig))

            env = {'QUERY_STRING': orig}
            fs = cgi.FieldStorage(environ=env)
            if isinstance(expect, dict):
                # test dict interface
                self.assertEqual(len(expect), len(fs))
                self.assertCountEqual(expect.keys(), fs.keys())
                ##self.assertEqual(norm(expect.values()), norm(fs.values()))
                ##self.assertEqual(norm(expect.items()), norm(fs.items()))
                self.assertEqual(fs.getvalue("nonexistent field", "default"), "default")
                # test individual fields
                for key, expect_val in expect.items():
                    self.assertIn(key, fs)
                    if len(expect_val) > 1:
                        # several values: getvalue() gives the whole list
                        self.assertEqual(fs.getvalue(key), expect_val)
                    else:
                        # single value: getvalue() gives the bare string
                        self.assertEqual(fs.getvalue(key), expect_val[0])

    def test_log(self):
        cgi.log("Testing")

        cgi.logfp = StringIO()
        cgi.initlog("%s", "Testing initlog 1")
        cgi.log("%s", "Testing log 2")
        self.assertEqual(cgi.logfp.getvalue(), "Testing initlog 1\nTesting log 2\n")
        if os.path.exists("/dev/null"):
            cgi.logfp = None
            cgi.logfile = "/dev/null"
            cgi.initlog("%s", "Testing log 3")
            self.addCleanup(cgi.closelog)
            cgi.log("Testing log 4")

    def test_fieldstorage_readline(self):
        # FieldStorage uses readline, which has the capacity to read all
        # contents of the input file into memory; we use readline's size argument
        # to prevent that for files that do not contain any newlines in
        # non-GET/HEAD requests
        class TestReadlineFile:
            # File wrapper that counts how often readline() is called and
            # forwards everything else to the wrapped file.
            def __init__(self, file):
                self.file = file
                self.numcalls = 0

            def readline(self, size=None):
                self.numcalls += 1
                if size:
                    return self.file.readline(size)
                else:
                    return self.file.readline()

            def __getattr__(self, name):
                file = self.__dict__['file']
                a = getattr(file, name)
                # Cache forwarded attributes on the wrapper, except ints.
                if not isinstance(a, int):
                    setattr(self, name, a)
                return a

        f = TestReadlineFile(tempfile.TemporaryFile("wb+"))
        self.addCleanup(f.close)
        f.write(b'x' * 256 * 1024)
        f.seek(0)
        env = {'REQUEST_METHOD': 'PUT'}
        fs = cgi.FieldStorage(fp=f, environ=env)
        self.addCleanup(fs.file.close)
        # if we're not chunking properly, readline is only called twice
        # (by read_binary); if we are chunking properly, it will be called 5 times
        # as long as the chunksize is 1 << 16.
        # assertGreater reports the actual call count when it fails.
        self.assertGreater(f.numcalls, 2)
        f.close()

    def test_fieldstorage_multipart(self):
        # Test basic FieldStorage multipart parsing
        env = {
            'REQUEST_METHOD': 'POST',
            'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY),
            'CONTENT_LENGTH': '558'}
        fp = BytesIO(POSTDATA.encode('latin-1'))
        fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1")
        self.assertEqual(len(fs.list), 4)
        expect = [{'name': 'id', 'filename': None, 'value': '1234'},
                  {'name': 'title', 'filename': None, 'value': ''},
                  {'name': 'file', 'filename': 'test.txt', 'value': b'Testing 123.\n'},
                  {'name': 'submit', 'filename': None, 'value': ' Add '}]
        # The length assertion above guarantees zip() pairs every field.
        for field, expected in zip(fs.list, expect):
            for k, exp in expected.items():
                got = getattr(field, k)
                self.assertEqual(got, exp)

    def test_fieldstorage_multipart_non_ascii(self):
        # Test FieldStorage multipart parsing of a non-ASCII field value,
        # once per body encoding.
        # NOTE(review): CONTENT_LENGTH is the same '558' literal used for
        # POSTDATA in test_fieldstorage_multipart although this body is
        # shorter -- confirm the value is intentionally loose.
        env = {'REQUEST_METHOD': 'POST',
               'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY),
               'CONTENT_LENGTH': '558'}
        for encoding in ['iso-8859-1', 'utf-8']:
            fp = BytesIO(POSTDATA_NON_ASCII.encode(encoding))
            fs = cgi.FieldStorage(fp, environ=env, encoding=encoding)
            self.assertEqual(len(fs.list), 1)
            expect = [{'name': 'id', 'filename': None, 'value': '\xe7\xf1\x80'}]
            for field, expected in zip(fs.list, expect):
                for k, exp in expected.items():
                    got = getattr(field, k)
                    self.assertEqual(got, exp)

    # Expected result shared by the testQSAnd* tests: the query-string fields
    # merged with the fields sent in the request body.
    _qs_result = {
        'key1': 'value1',
        'key2': ['value2x', 'value2y'],
        'key3': 'value3',
        'key4': 'value4'
    }

    def testQSAndUrlEncode(self):
        data = "key2=value2x&key3=value3&key4=value4"
        environ = {
            'CONTENT_LENGTH': str(len(data)),
            'CONTENT_TYPE': 'application/x-www-form-urlencoded',
            'QUERY_STRING': 'key1=value1&key2=value2y',
            'REQUEST_METHOD': 'POST',
        }
        v = gen_result(data, environ)
        self.assertEqual(self._qs_result, v)

    def testQSAndFormData(self):
        data = """---123
Content-Disposition: form-data; name="key2"

value2y
---123
Content-Disposition: form-data; name="key3"

value3
---123
Content-Disposition: form-data; name="key4"

value4
---123--
"""
        environ = {
            'CONTENT_LENGTH': str(len(data)),
            'CONTENT_TYPE': 'multipart/form-data; boundary=-123',
            'QUERY_STRING': 'key1=value1&key2=value2x',
            'REQUEST_METHOD': 'POST',
        }
        v = gen_result(data, environ)
        self.assertEqual(self._qs_result, v)

    def testQSAndFormDataFile(self):
        data = """---123
Content-Disposition: form-data; name="key2"

value2y
---123
Content-Disposition: form-data; name="key3"

value3
---123
Content-Disposition: form-data; name="key4"

value4
---123
Content-Disposition: form-data; name="upload"; filename="fake.txt"
Content-Type: text/plain

this is the content of the fake file

---123--
"""
        environ = {
            'CONTENT_LENGTH': str(len(data)),
            'CONTENT_TYPE': 'multipart/form-data; boundary=-123',
            'QUERY_STRING': 'key1=value1&key2=value2x',
            'REQUEST_METHOD': 'POST',
        }
        # Work on a copy so the shared class attribute is not modified.
        result = self._qs_result.copy()
        result.update({
            'upload': b'this is the content of the fake file\n'
        })
        v = gen_result(data, environ)
        self.assertEqual(result, v)

    def test_deprecated_parse_qs(self):
        # this func is moved to urllib.parse, this is just a sanity check
        with check_warnings(('cgi.parse_qs is deprecated, use urllib.parse.'
                             'parse_qs instead', DeprecationWarning)):
            self.assertEqual({'a': ['A1'], 'B': ['B3'], 'b': ['B2']},
                             cgi.parse_qs('a=A1&b=B2&B=B3'))

    def test_deprecated_parse_qsl(self):
        # this func is moved to urllib.parse, this is just a sanity check
        with check_warnings(('cgi.parse_qsl is deprecated, use urllib.parse.'
                             'parse_qsl instead', DeprecationWarning)):
            self.assertEqual([('a', 'A1'), ('b', 'B2'), ('B', 'B3')],
                             cgi.parse_qsl('a=A1&b=B2&B=B3'))

    def test_parse_header(self):
        # Each case is (raw header value, expected (value, parameters) pair).
        cases = [
            ("text/plain",
             ("text/plain", {})),
            ("text/vnd.just.made.this.up ; ",
             ("text/vnd.just.made.this.up", {})),
            ("text/plain;charset=us-ascii",
             ("text/plain", {"charset": "us-ascii"})),
            ('text/plain ; charset="us-ascii"',
             ("text/plain", {"charset": "us-ascii"})),
            ('text/plain ; charset="us-ascii"; another=opt',
             ("text/plain", {"charset": "us-ascii", "another": "opt"})),
            ('attachment; filename="silly.txt"',
             ("attachment", {"filename": "silly.txt"})),
            ('attachment; filename="strange;name"',
             ("attachment", {"filename": "strange;name"})),
            ('attachment; filename="strange;name";size=123;',
             ("attachment", {"filename": "strange;name", "size": "123"})),
            ('form-data; name="files"; filename="fo\\"o;bar"',
             ("form-data", {"name": "files", "filename": 'fo"o;bar'})),
        ]
        for header, expected in cases:
            self.assertEqual(cgi.parse_header(header), expected)
358
Fred Drake9a0a65b2008-12-04 19:24:50 +0000359
# Boundary announced in the multipart Content-Type header of the tests.
BOUNDARY = "---------------------------721837373350705526688164684"

# Multipart body with four parts: "id", an empty "title", an uploaded "file"
# and "submit".  Each delimiter line is "--" followed by BOUNDARY; the
# closing delimiter has a trailing "--".
POSTDATA = """--{boundary}
Content-Disposition: form-data; name="id"

1234
--{boundary}
Content-Disposition: form-data; name="title"


--{boundary}
Content-Disposition: form-data; name="file"; filename="test.txt"
Content-Type: text/plain

Testing 123.

--{boundary}
Content-Disposition: form-data; name="submit"

 Add\x20
--{boundary}--
""".format(boundary=BOUNDARY)

# Multipart body with a single "id" part whose value is non-ASCII.
POSTDATA_NON_ASCII = """--{boundary}
Content-Disposition: form-data; name="id"

\xe7\xf1\x80
--{boundary}
""".format(boundary=BOUNDARY)
389
Fred Drake9a0a65b2008-12-04 19:24:50 +0000390
def test_main():
    """Run every test in ``CgiTests`` through ``run_unittest``."""
    run_unittest(CgiTests)


# Allow running this file directly as a script.
if __name__ == '__main__':
    test_main()