blob: 3031fb38262bacc56ede3af789b5df4fbcea1d68 [file] [log] [blame]
Florent Xicluna8fbddf12010-03-17 20:29:51 +00001from test.support import run_unittest, check_warnings
Jeremy Hyltond9827c42000-08-03 22:11:43 +00002import cgi
3import os
4import sys
Thomas Wouters00ee7ba2006-08-21 19:07:27 +00005import tempfile
Thomas Wouters89f507f2006-12-13 04:49:30 +00006import unittest
Victor Stinner5c23b8e2011-01-14 13:05:21 +00007from io import StringIO, BytesIO
Jeremy Hyltond9827c42000-08-03 22:11:43 +00008
class HackedSysModule:
    """Minimal stand-in for the ``sys`` module as seen by ``cgi``.

    The regression test run will have real values in ``sys.argv``, which
    would completely confuse the test of the cgi module, so an empty
    argument list is exposed instead.
    """

    # Empty on purpose: hides the test runner's own command line.
    argv = []
    # Pass the real standard input through unchanged.
    stdin = sys.stdin
14
# Make the cgi module see the sanitized sys replacement instead of the real one.
cgi.sys = HackedSysModule()
16
class ComparableException:
    """Wrap an exception so it can be compared by type and arguments.

    Exception instances compare by identity, which makes it impossible to
    write ``expected == actual`` for two separately created exceptions.
    This wrapper compares equal to any exception whose class and ``args``
    match the wrapped one.  Every other attribute is delegated to the
    wrapped exception.
    """

    def __init__(self, err):
        self.err = err

    def __str__(self):
        return str(self.err)

    def __repr__(self):
        # Shown by unittest when an assertEqual() on the wrapper fails.
        return "%s(%r)" % (type(self).__name__, self.err)

    def __eq__(self, anExc):
        if not isinstance(anExc, Exception):
            return NotImplemented
        return (type(self.err) is type(anExc) and
                self.err.args == anExc.args)

    # Defining __eq__ already makes instances unhashable; say so explicitly.
    __hash__ = None

    def __getattr__(self, attr):
        # Only called when normal lookup fails.  If 'err' itself is missing
        # (instance created without __init__), delegating would recurse
        # forever, so fail with a regular AttributeError instead.
        if attr == "err":
            raise AttributeError(attr)
        return getattr(self.err, attr)
Jeremy Hyltond9827c42000-08-03 22:11:43 +000032
def do_test(buf, method):
    """Parse *buf* with ``cgi.parse`` in strict mode as a GET or POST request.

    For "GET" the data is passed through ``QUERY_STRING``; for "POST" it is
    supplied as a latin-1 encoded, urlencoded request body.

    Returns the value returned by ``cgi.parse``.  If parsing raises, the
    exception is returned wrapped in a ComparableException so that callers
    can compare it against an expected exception.

    Raises ValueError if *method* is neither "GET" nor "POST".
    """
    env = {}
    if method == "GET":
        fp = None
        env['REQUEST_METHOD'] = 'GET'
        env['QUERY_STRING'] = buf
    elif method == "POST":
        fp = BytesIO(buf.encode('latin-1'))  # FieldStorage expects bytes
        env['REQUEST_METHOD'] = 'POST'
        env['CONTENT_TYPE'] = 'application/x-www-form-urlencoded'
        env['CONTENT_LENGTH'] = str(len(buf))
    else:
        raise ValueError("unknown method: %s" % method)
    try:
        return cgi.parse(fp, env, strict_parsing=True)
    except Exception as err:
        # Deliberately broad: the error itself is the result under test.
        return ComparableException(err)
50
# (query string, expected result) pairs for strict parsing.  The expected
# result is either the parsed dict or the exception strict parsing raises.
parse_strict_test_cases = [
    ("", ValueError("bad query field: ''")),
    ("&", ValueError("bad query field: ''")),
    ("&&", ValueError("bad query field: ''")),
    (";", ValueError("bad query field: ''")),
    (";&;", ValueError("bad query field: ''")),
    # Should the next few really be valid?
    ("=", {}),
    ("=&=", {}),
    ("=;=", {}),
    # The rest seem to make sense
    ("=a", {'': ['a']}),
    ("&=a", ValueError("bad query field: ''")),
    ("=a&", ValueError("bad query field: ''")),
    ("=&a", ValueError("bad query field: 'a'")),
    ("b=a", {'b': ['a']}),
    ("b+=a", {'b ': ['a']}),
    ("a=b=a", {'a': ['b=a']}),
    ("a=+b=a", {'a': [' b=a']}),
    ("&b=a", ValueError("bad query field: ''")),
    ("b&=a", ValueError("bad query field: 'b'")),
    ("a=a+b&b=b+c", {'a': ['a b'], 'b': ['b c']}),
    ("a=a+b&a=b+a", {'a': ['a b', 'b a']}),
    ("x=1&y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
    ("x=1;y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
    ("x=1;y=2.0;z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
    ("Hbc5161168c542333633315dee1182227:key_store_seqid=400006&cuyer=r&view=bustomer&order_id=0bb2e248638833d48cb7fed300000f1b&expire=964546263&lobale=en-US&kid=130003.300038&ss=env",
     {'Hbc5161168c542333633315dee1182227:key_store_seqid': ['400006'],
      'cuyer': ['r'],
      'expire': ['964546263'],
      'kid': ['130003.300038'],
      'lobale': ['en-US'],
      'order_id': ['0bb2e248638833d48cb7fed300000f1b'],
      'ss': ['env'],
      'view': ['bustomer'],
      }),

    ("group_id=5470&set=custom&_assigned_to=31392&_status=1&_category=100&SUBMIT=Browse",
     {'SUBMIT': ['Browse'],
      '_assigned_to': ['31392'],
      '_category': ['100'],
      '_status': ['1'],
      'group_id': ['5470'],
      'set': ['custom'],
      })
    ]
97
def norm(seq):
    """Return the items of *seq* as a list sorted by their ``repr()``.

    Sorting on the repr gives a deterministic order even when the items
    themselves cannot be compared with each other.
    """
    return sorted(seq, key=repr)
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000100
def first_elts(list):
    """Return the first element of every item in *list*.

    The parameter name shadows the builtin; it is kept unchanged so that
    existing callers keep working.
    """
    return [p[0] for p in list]
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000103
def first_second_elts(list):
    """Return ``(item[0], item[1][0])`` for every item in *list*.

    The parameter name shadows the builtin; it is kept unchanged so that
    existing callers keep working.
    """
    return [(p[0], p[1][0]) for p in list]
106
def gen_result(data, environ):
    """Parse *data* as a request body and return the fields as a plain dict.

    *data* is encoded as latin-1 and handed to ``cgi.FieldStorage`` together
    with *environ*.  In the returned dict a field that occurs once maps to
    its value, and a field that occurs several times maps to the list of
    its values.
    """
    encoding = 'latin-1'
    fake_stdin = BytesIO(data.encode(encoding))
    form = cgi.FieldStorage(fp=fake_stdin, environ=environ, encoding=encoding)

    result = {}
    for key in form.keys():
        field = form[key]
        # Indexing yields a list of fields when the name occurs repeatedly.
        # A conditional expression avoids the "cond and a or b" trap, where
        # a falsy first operand silently selects the wrong branch.
        result[key] = form.getlist(key) if isinstance(field, list) else field.value

    return result
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000118
class CgiTests(unittest.TestCase):
    # Regression tests for the cgi module: escaping, strict query parsing,
    # logging, FieldStorage (urlencoded and multipart), the deprecated
    # parse_qs/parse_qsl wrappers and header parsing.
    #
    # Comments are used instead of docstrings in the test methods so that
    # unittest keeps reporting the method names.

    def test_escape(self):
        # '&', '<' and '>' are escaped; '"' is escaped here because the
        # quote flag is passed as True.
        self.assertEqual("test &amp; string", cgi.escape("test & string"))
        self.assertEqual("&lt;test string&gt;", cgi.escape("<test string>"))
        self.assertEqual("&quot;test string&quot;", cgi.escape('"test string"', True))

    def test_strict(self):
        for orig, expect in parse_strict_test_cases:
            # Test basic parsing
            d = do_test(orig, "GET")
            self.assertEqual(d, expect, "Error parsing %s method GET" % repr(orig))
            d = do_test(orig, "POST")
            self.assertEqual(d, expect, "Error parsing %s method POST" % repr(orig))

            env = {'QUERY_STRING': orig}
            fs = cgi.FieldStorage(environ=env)
            if isinstance(expect, dict):
                # test dict interface
                self.assertEqual(len(expect), len(fs))
                self.assertCountEqual(expect.keys(), fs.keys())
                ##self.assertEqual(norm(expect.values()), norm(fs.values()))
                ##self.assertEqual(norm(expect.items()), norm(fs.items()))
                self.assertEqual(fs.getvalue("nonexistent field", "default"), "default")
                # test individual fields
                for key, expect_val in expect.items():
                    self.assertIn(key, fs)
                    if len(expect_val) > 1:
                        self.assertEqual(fs.getvalue(key), expect_val)
                    else:
                        self.assertEqual(fs.getvalue(key), expect_val[0])

    def test_log(self):
        def log_cleanup():
            # Restore the global state of the log vars.
            cgi.logfile = ''
            if cgi.logfp is not None:
                cgi.logfp.close()
            cgi.logfp = None
            cgi.log = cgi.initlog
        # Registered up front so the module-level log state is restored even
        # when the /dev/null branch below is skipped or an assertion fails.
        self.addCleanup(log_cleanup)

        cgi.log("Testing")

        cgi.logfp = StringIO()
        cgi.initlog("%s", "Testing initlog 1")
        cgi.log("%s", "Testing log 2")
        self.assertEqual(cgi.logfp.getvalue(), "Testing initlog 1\nTesting log 2\n")
        if os.path.exists("/dev/null"):
            cgi.logfp = None
            cgi.logfile = "/dev/null"
            cgi.initlog("%s", "Testing log 3")
            cgi.log("Testing log 4")

    def test_fieldstorage_readline(self):
        # FieldStorage uses readline, which has the capacity to read all
        # contents of the input file into memory; we use readline's size argument
        # to prevent that for files that do not contain any newlines in
        # non-GET/HEAD requests
        class TestReadlineFile:
            # File wrapper that counts how often readline() is called.
            def __init__(self, file):
                self.file = file
                self.numcalls = 0

            def readline(self, size=None):
                self.numcalls += 1
                if size:
                    return self.file.readline(size)
                else:
                    return self.file.readline()

            def __getattr__(self, name):
                # Delegate everything else to the wrapped file, caching
                # non-int attributes on the wrapper.
                file = self.__dict__['file']
                a = getattr(file, name)
                if not isinstance(a, int):
                    setattr(self, name, a)
                return a

        f = TestReadlineFile(tempfile.TemporaryFile("wb+"))
        self.addCleanup(f.close)
        f.write(b'x' * 256 * 1024)
        f.seek(0)
        env = {'REQUEST_METHOD':'PUT'}
        fs = cgi.FieldStorage(fp=f, environ=env)
        self.addCleanup(fs.file.close)
        # if we're not chunking properly, readline is only called twice
        # (by read_binary); if we are chunking properly, it will be called 5 times
        # as long as the chunksize is 1 << 16.
        self.assertGreater(f.numcalls, 2)
        f.close()

    def test_fieldstorage_multipart(self):
        #Test basic FieldStorage multipart parsing
        env = {
            'REQUEST_METHOD': 'POST',
            'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY),
            'CONTENT_LENGTH': '558'}
        fp = BytesIO(POSTDATA.encode('latin-1'))
        fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1")
        self.assertEqual(len(fs.list), 4)
        expect = [{'name':'id', 'filename':None, 'value':'1234'},
                  {'name':'title', 'filename':None, 'value':''},
                  {'name':'file', 'filename':'test.txt', 'value':b'Testing 123.\n'},
                  {'name':'submit', 'filename':None, 'value':' Add '}]
        # The lengths were checked above, so zip() pairs every field.
        for field, expected in zip(fs.list, expect):
            for k, exp in expected.items():
                got = getattr(field, k)
                self.assertEqual(got, exp)

    def test_fieldstorage_multipart_non_ascii(self):
        #Test FieldStorage multipart parsing of non-ASCII field values
        env = {'REQUEST_METHOD':'POST',
            'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY),
            'CONTENT_LENGTH':'558'}
        for encoding in ['iso-8859-1','utf-8']:
            fp = BytesIO(POSTDATA_NON_ASCII.encode(encoding))
            fs = cgi.FieldStorage(fp, environ=env,encoding=encoding)
            self.assertEqual(len(fs.list), 1)
            expect = [{'name':'id', 'filename':None, 'value':'\xe7\xf1\x80'}]
            # The lengths were checked above, so zip() pairs every field.
            for field, expected in zip(fs.list, expect):
                for k, exp in expected.items():
                    got = getattr(field, k)
                    self.assertEqual(got, exp)

    # Fields expected by the testQS* tests, where part of the data comes
    # from QUERY_STRING and part from the request body.
    _qs_result = {
        'key1': 'value1',
        'key2': ['value2x', 'value2y'],
        'key3': 'value3',
        'key4': 'value4'
    }
    def testQSAndUrlEncode(self):
        data = "key2=value2x&key3=value3&key4=value4"
        environ = {
            'CONTENT_LENGTH':   str(len(data)),
            'CONTENT_TYPE':     'application/x-www-form-urlencoded',
            'QUERY_STRING':     'key1=value1&key2=value2y',
            'REQUEST_METHOD':   'POST',
        }
        v = gen_result(data, environ)
        self.assertEqual(self._qs_result, v)

    def testQSAndFormData(self):
        # The payload must start at column 0: it is sent verbatim.
        data = """---123
Content-Disposition: form-data; name="key2"

value2y
---123
Content-Disposition: form-data; name="key3"

value3
---123
Content-Disposition: form-data; name="key4"

value4
---123--
"""
        environ = {
            'CONTENT_LENGTH':   str(len(data)),
            'CONTENT_TYPE':     'multipart/form-data; boundary=-123',
            'QUERY_STRING':     'key1=value1&key2=value2x',
            'REQUEST_METHOD':   'POST',
        }
        v = gen_result(data, environ)
        self.assertEqual(self._qs_result, v)

    def testQSAndFormDataFile(self):
        # The payload must start at column 0: it is sent verbatim.
        data = """---123
Content-Disposition: form-data; name="key2"

value2y
---123
Content-Disposition: form-data; name="key3"

value3
---123
Content-Disposition: form-data; name="key4"

value4
---123
Content-Disposition: form-data; name="upload"; filename="fake.txt"
Content-Type: text/plain

this is the content of the fake file

---123--
"""
        environ = {
            'CONTENT_LENGTH':   str(len(data)),
            'CONTENT_TYPE':     'multipart/form-data; boundary=-123',
            'QUERY_STRING':     'key1=value1&key2=value2x',
            'REQUEST_METHOD':   'POST',
        }
        result = self._qs_result.copy()
        result.update({
            'upload': b'this is the content of the fake file\n'
        })
        v = gen_result(data, environ)
        self.assertEqual(result, v)

    def test_deprecated_parse_qs(self):
        # this func is moved to urllib.parse, this is just a sanity check
        with check_warnings(('cgi.parse_qs is deprecated, use urllib.parse.'
                             'parse_qs instead', DeprecationWarning)):
            self.assertEqual({'a': ['A1'], 'B': ['B3'], 'b': ['B2']},
                             cgi.parse_qs('a=A1&b=B2&B=B3'))

    def test_deprecated_parse_qsl(self):
        # this func is moved to urllib.parse, this is just a sanity check
        with check_warnings(('cgi.parse_qsl is deprecated, use urllib.parse.'
                             'parse_qsl instead', DeprecationWarning)):
            self.assertEqual([('a', 'A1'), ('b', 'B2'), ('B', 'B3')],
                             cgi.parse_qsl('a=A1&b=B2&B=B3'))

    def test_parse_header(self):
        self.assertEqual(
            cgi.parse_header("text/plain"),
            ("text/plain", {}))
        self.assertEqual(
            cgi.parse_header("text/vnd.just.made.this.up ; "),
            ("text/vnd.just.made.this.up", {}))
        self.assertEqual(
            cgi.parse_header("text/plain;charset=us-ascii"),
            ("text/plain", {"charset": "us-ascii"}))
        self.assertEqual(
            cgi.parse_header('text/plain ; charset="us-ascii"'),
            ("text/plain", {"charset": "us-ascii"}))
        self.assertEqual(
            cgi.parse_header('text/plain ; charset="us-ascii"; another=opt'),
            ("text/plain", {"charset": "us-ascii", "another": "opt"}))
        self.assertEqual(
            cgi.parse_header('attachment; filename="silly.txt"'),
            ("attachment", {"filename": "silly.txt"}))
        self.assertEqual(
            cgi.parse_header('attachment; filename="strange;name"'),
            ("attachment", {"filename": "strange;name"}))
        self.assertEqual(
            cgi.parse_header('attachment; filename="strange;name";size=123;'),
            ("attachment", {"filename": "strange;name", "size": "123"}))
        self.assertEqual(
            cgi.parse_header('form-data; name="files"; filename="fo\\"o;bar"'),
            ("form-data", {"name": "files", "filename": 'fo"o;bar'}))
359
Fred Drake9a0a65b2008-12-04 19:24:50 +0000360
# Multipart boundary used by the FieldStorage multipart tests.
BOUNDARY = "---------------------------721837373350705526688164684"

# multipart/form-data request body with four fields, one of them a file
# upload.  The payload is sent verbatim, so it must start at column 0.
POSTDATA = """-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="id"

1234
-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="title"


-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="file"; filename="test.txt"
Content-Type: text/plain

Testing 123.

-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="submit"

 Add\x20
-----------------------------721837373350705526688164684--
"""

# multipart/form-data request body whose single field has a non-ASCII value.
POSTDATA_NON_ASCII = """-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="id"

\xe7\xf1\x80
-----------------------------721837373350705526688164684
"""
390
Fred Drake9a0a65b2008-12-04 19:24:50 +0000391
def test_main():
    """Run the CgiTests test case through ``run_unittest``."""
    run_unittest(CgiTests)
394
# Allow running this test file directly as a script.
if __name__ == '__main__':
    test_main()