blob: f6abe976cf7bf3cba7a8184409078e2798f68525 [file] [log] [blame]
Ezio Melottief490962010-01-31 11:46:54 +00001from test.test_support import run_unittest, check_warnings
Jeremy Hyltond9827c42000-08-03 22:11:43 +00002import cgi
3import os
4import sys
Guido van Rossum9568b732006-08-10 17:41:07 +00005import tempfile
Georg Brandle1844332006-10-29 20:09:12 +00006import unittest
Jeremy Hyltond9827c42000-08-03 22:11:43 +00007
8class HackedSysModule:
9 # The regression test will have real values in sys.argv, which
Fred Drake004d5e62000-10-23 17:22:08 +000010 # will completely confuse the test of the cgi module
Jeremy Hyltond9827c42000-08-03 22:11:43 +000011 argv = []
12 stdin = sys.stdin
13
14cgi.sys = HackedSysModule()
15
16try:
17 from cStringIO import StringIO
18except ImportError:
19 from StringIO import StringIO
20
21class ComparableException:
22 def __init__(self, err):
23 self.err = err
24
25 def __str__(self):
26 return str(self.err)
27
28 def __cmp__(self, anExc):
29 if not isinstance(anExc, Exception):
30 return -1
31 x = cmp(self.err.__class__, anExc.__class__)
32 if x != 0:
33 return x
34 return cmp(self.err.args, anExc.args)
35
36 def __getattr__(self, attr):
Guido van Rossum846d6db2001-01-17 15:08:37 +000037 return getattr(self.err, attr)
Jeremy Hyltond9827c42000-08-03 22:11:43 +000038
39def do_test(buf, method):
40 env = {}
41 if method == "GET":
42 fp = None
43 env['REQUEST_METHOD'] = 'GET'
44 env['QUERY_STRING'] = buf
45 elif method == "POST":
46 fp = StringIO(buf)
47 env['REQUEST_METHOD'] = 'POST'
48 env['CONTENT_TYPE'] = 'application/x-www-form-urlencoded'
49 env['CONTENT_LENGTH'] = str(len(buf))
50 else:
51 raise ValueError, "unknown method: %s" % method
52 try:
53 return cgi.parse(fp, env, strict_parsing=1)
54 except StandardError, err:
55 return ComparableException(err)
56
Neil Schemenauer66edb622004-07-19 15:38:11 +000057parse_strict_test_cases = [
Jeremy Hyltond9827c42000-08-03 22:11:43 +000058 ("", ValueError("bad query field: ''")),
59 ("&", ValueError("bad query field: ''")),
60 ("&&", ValueError("bad query field: ''")),
Jeremy Hyltonafde7e22000-09-15 20:06:57 +000061 (";", ValueError("bad query field: ''")),
62 (";&;", ValueError("bad query field: ''")),
Jeremy Hyltond9827c42000-08-03 22:11:43 +000063 # Should the next few really be valid?
64 ("=", {}),
65 ("=&=", {}),
Jeremy Hyltonafde7e22000-09-15 20:06:57 +000066 ("=;=", {}),
Jeremy Hyltond9827c42000-08-03 22:11:43 +000067 # This rest seem to make sense
68 ("=a", {'': ['a']}),
69 ("&=a", ValueError("bad query field: ''")),
70 ("=a&", ValueError("bad query field: ''")),
71 ("=&a", ValueError("bad query field: 'a'")),
72 ("b=a", {'b': ['a']}),
73 ("b+=a", {'b ': ['a']}),
74 ("a=b=a", {'a': ['b=a']}),
75 ("a=+b=a", {'a': [' b=a']}),
76 ("&b=a", ValueError("bad query field: ''")),
77 ("b&=a", ValueError("bad query field: 'b'")),
78 ("a=a+b&b=b+c", {'a': ['a b'], 'b': ['b c']}),
79 ("a=a+b&a=b+a", {'a': ['a b', 'b a']}),
80 ("x=1&y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
Jeremy Hyltonafde7e22000-09-15 20:06:57 +000081 ("x=1;y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
82 ("x=1;y=2.0;z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
Jeremy Hyltond9827c42000-08-03 22:11:43 +000083 ("Hbc5161168c542333633315dee1182227:key_store_seqid=400006&cuyer=r&view=bustomer&order_id=0bb2e248638833d48cb7fed300000f1b&expire=964546263&lobale=en-US&kid=130003.300038&ss=env",
84 {'Hbc5161168c542333633315dee1182227:key_store_seqid': ['400006'],
85 'cuyer': ['r'],
86 'expire': ['964546263'],
87 'kid': ['130003.300038'],
88 'lobale': ['en-US'],
89 'order_id': ['0bb2e248638833d48cb7fed300000f1b'],
90 'ss': ['env'],
91 'view': ['bustomer'],
92 }),
Fred Drake004d5e62000-10-23 17:22:08 +000093
Jeremy Hyltond9827c42000-08-03 22:11:43 +000094 ("group_id=5470&set=custom&_assigned_to=31392&_status=1&_category=100&SUBMIT=Browse",
95 {'SUBMIT': ['Browse'],
96 '_assigned_to': ['31392'],
97 '_category': ['100'],
98 '_status': ['1'],
99 'group_id': ['5470'],
100 'set': ['custom'],
101 })
102 ]
103
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000104def first_elts(list):
105 return map(lambda x:x[0], list)
106
107def first_second_elts(list):
108 return map(lambda p:(p[0], p[1][0]), list)
109
Facundo Batistaa6a4d502008-06-21 18:58:04 +0000110def gen_result(data, environ):
111 fake_stdin = StringIO(data)
112 fake_stdin.seek(0)
113 form = cgi.FieldStorage(fp=fake_stdin, environ=environ)
114
115 result = {}
116 for k, v in dict(form).items():
Florent Xicluna945a8ba2010-03-17 19:15:56 +0000117 result[k] = isinstance(v, list) and form.getlist(k) or v.value
Facundo Batistaa6a4d502008-06-21 18:58:04 +0000118
119 return result
120
Georg Brandle1844332006-10-29 20:09:12 +0000121class CgiTests(unittest.TestCase):
Neil Schemenauer66edb622004-07-19 15:38:11 +0000122
Senthil Kumarand17a8982012-03-13 01:48:41 -0700123 def test_escape(self):
124 self.assertEqual("test & string", cgi.escape("test & string"))
125 self.assertEqual("&lt;test string&gt;", cgi.escape("<test string>"))
126 self.assertEqual("&quot;test string&quot;", cgi.escape('"test string"', True))
127
Georg Brandle1844332006-10-29 20:09:12 +0000128 def test_strict(self):
129 for orig, expect in parse_strict_test_cases:
130 # Test basic parsing
131 d = do_test(orig, "GET")
132 self.assertEqual(d, expect, "Error parsing %s" % repr(orig))
133 d = do_test(orig, "POST")
134 self.assertEqual(d, expect, "Error parsing %s" % repr(orig))
135
136 env = {'QUERY_STRING': orig}
137 fcd = cgi.FormContentDict(env)
138 sd = cgi.SvFormContentDict(env)
139 fs = cgi.FieldStorage(environ=env)
Florent Xicluna945a8ba2010-03-17 19:15:56 +0000140 if isinstance(expect, dict):
Georg Brandle1844332006-10-29 20:09:12 +0000141 # test dict interface
142 self.assertEqual(len(expect), len(fcd))
Michael Foord98e7b762010-03-20 03:00:34 +0000143 self.assertItemsEqual(expect.keys(), fcd.keys())
144 self.assertItemsEqual(expect.values(), fcd.values())
145 self.assertItemsEqual(expect.items(), fcd.items())
Georg Brandle1844332006-10-29 20:09:12 +0000146 self.assertEqual(fcd.get("nonexistent field", "default"), "default")
147 self.assertEqual(len(sd), len(fs))
Michael Foord98e7b762010-03-20 03:00:34 +0000148 self.assertItemsEqual(sd.keys(), fs.keys())
Georg Brandle1844332006-10-29 20:09:12 +0000149 self.assertEqual(fs.getvalue("nonexistent field", "default"), "default")
150 # test individual fields
151 for key in expect.keys():
152 expect_val = expect[key]
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000153 self.assertTrue(fcd.has_key(key))
Michael Foord98e7b762010-03-20 03:00:34 +0000154 self.assertItemsEqual(fcd[key], expect[key])
Georg Brandle1844332006-10-29 20:09:12 +0000155 self.assertEqual(fcd.get(key, "default"), fcd[key])
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000156 self.assertTrue(fs.has_key(key))
Georg Brandle1844332006-10-29 20:09:12 +0000157 if len(expect_val) > 1:
158 single_value = 0
159 else:
160 single_value = 1
161 try:
162 val = sd[key]
163 except IndexError:
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000164 self.assertFalse(single_value)
Georg Brandle1844332006-10-29 20:09:12 +0000165 self.assertEqual(fs.getvalue(key), expect_val)
166 else:
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000167 self.assertTrue(single_value)
Georg Brandle1844332006-10-29 20:09:12 +0000168 self.assertEqual(val, expect_val[0])
169 self.assertEqual(fs.getvalue(key), expect_val[0])
Michael Foord98e7b762010-03-20 03:00:34 +0000170 self.assertItemsEqual(sd.getlist(key), expect_val)
Georg Brandle1844332006-10-29 20:09:12 +0000171 if single_value:
Michael Foord98e7b762010-03-20 03:00:34 +0000172 self.assertItemsEqual(sd.values(),
Ezio Melottief490962010-01-31 11:46:54 +0000173 first_elts(expect.values()))
Michael Foord98e7b762010-03-20 03:00:34 +0000174 self.assertItemsEqual(sd.items(),
Ezio Melottief490962010-01-31 11:46:54 +0000175 first_second_elts(expect.items()))
Georg Brandle1844332006-10-29 20:09:12 +0000176
177 def test_weird_formcontentdict(self):
178 # Test the weird FormContentDict classes
179 env = {'QUERY_STRING': "x=1&y=2.0&z=2-3.%2b0&1=1abc"}
180 expect = {'x': 1, 'y': 2.0, 'z': '2-3.+0', '1': '1abc'}
181 d = cgi.InterpFormContentDict(env)
182 for k, v in expect.items():
183 self.assertEqual(d[k], v)
184 for k, v in d.items():
185 self.assertEqual(expect[k], v)
Michael Foord98e7b762010-03-20 03:00:34 +0000186 self.assertItemsEqual(expect.values(), d.values())
Georg Brandle1844332006-10-29 20:09:12 +0000187
188 def test_log(self):
189 cgi.log("Testing")
190
191 cgi.logfp = StringIO()
192 cgi.initlog("%s", "Testing initlog 1")
193 cgi.log("%s", "Testing log 2")
194 self.assertEqual(cgi.logfp.getvalue(), "Testing initlog 1\nTesting log 2\n")
195 if os.path.exists("/dev/null"):
196 cgi.logfp = None
197 cgi.logfile = "/dev/null"
198 cgi.initlog("%s", "Testing log 3")
199 cgi.log("Testing log 4")
200
201 def test_fieldstorage_readline(self):
202 # FieldStorage uses readline, which has the capacity to read all
203 # contents of the input file into memory; we use readline's size argument
204 # to prevent that for files that do not contain any newlines in
205 # non-GET/HEAD requests
206 class TestReadlineFile:
207 def __init__(self, file):
208 self.file = file
209 self.numcalls = 0
210
211 def readline(self, size=None):
212 self.numcalls += 1
213 if size:
214 return self.file.readline(size)
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000215 else:
Georg Brandle1844332006-10-29 20:09:12 +0000216 return self.file.readline()
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000217
Georg Brandle1844332006-10-29 20:09:12 +0000218 def __getattr__(self, name):
219 file = self.__dict__['file']
220 a = getattr(file, name)
221 if not isinstance(a, int):
222 setattr(self, name, a)
223 return a
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000224
Georg Brandle1844332006-10-29 20:09:12 +0000225 f = TestReadlineFile(tempfile.TemporaryFile())
226 f.write('x' * 256 * 1024)
227 f.seek(0)
228 env = {'REQUEST_METHOD':'PUT'}
229 fs = cgi.FieldStorage(fp=f, environ=env)
230 # if we're not chunking properly, readline is only called twice
231 # (by read_binary); if we are chunking properly, it will be called 5 times
232 # as long as the chunksize is 1 << 16.
Benjamin Peterson5c8da862009-06-30 22:57:08 +0000233 self.assertTrue(f.numcalls > 2)
Jeremy Hyltond9827c42000-08-03 22:11:43 +0000234
Georg Brandle1844332006-10-29 20:09:12 +0000235 def test_fieldstorage_multipart(self):
236 #Test basic FieldStorage multipart parsing
237 env = {'REQUEST_METHOD':'POST', 'CONTENT_TYPE':'multipart/form-data; boundary=---------------------------721837373350705526688164684', 'CONTENT_LENGTH':'558'}
238 postdata = """-----------------------------721837373350705526688164684
Guido van Rossum9568b732006-08-10 17:41:07 +0000239Content-Disposition: form-data; name="id"
240
2411234
242-----------------------------721837373350705526688164684
243Content-Disposition: form-data; name="title"
244
245
246-----------------------------721837373350705526688164684
247Content-Disposition: form-data; name="file"; filename="test.txt"
248Content-Type: text/plain
249
250Testing 123.
251
252-----------------------------721837373350705526688164684
253Content-Disposition: form-data; name="submit"
254
Tim Petersb7ad1eb2006-08-10 23:22:13 +0000255 Add\x20
Guido van Rossum9568b732006-08-10 17:41:07 +0000256-----------------------------721837373350705526688164684--
257"""
Georg Brandle1844332006-10-29 20:09:12 +0000258 fs = cgi.FieldStorage(fp=StringIO(postdata), environ=env)
Ezio Melotti2623a372010-11-21 13:34:58 +0000259 self.assertEqual(len(fs.list), 4)
Georg Brandle1844332006-10-29 20:09:12 +0000260 expect = [{'name':'id', 'filename':None, 'value':'1234'},
261 {'name':'title', 'filename':None, 'value':''},
262 {'name':'file', 'filename':'test.txt','value':'Testing 123.\n'},
263 {'name':'submit', 'filename':None, 'value':' Add '}]
264 for x in range(len(fs.list)):
265 for k, exp in expect[x].items():
266 got = getattr(fs.list[x], k)
Ezio Melotti2623a372010-11-21 13:34:58 +0000267 self.assertEqual(got, exp)
Guido van Rossum9568b732006-08-10 17:41:07 +0000268
Facundo Batistaa6a4d502008-06-21 18:58:04 +0000269 _qs_result = {
270 'key1': 'value1',
271 'key2': ['value2x', 'value2y'],
272 'key3': 'value3',
273 'key4': 'value4'
274 }
275 def testQSAndUrlEncode(self):
276 data = "key2=value2x&key3=value3&key4=value4"
277 environ = {
278 'CONTENT_LENGTH': str(len(data)),
279 'CONTENT_TYPE': 'application/x-www-form-urlencoded',
280 'QUERY_STRING': 'key1=value1&key2=value2y',
281 'REQUEST_METHOD': 'POST',
282 }
283 v = gen_result(data, environ)
284 self.assertEqual(self._qs_result, v)
285
286 def testQSAndFormData(self):
287 data = """
288---123
289Content-Disposition: form-data; name="key2"
290
291value2y
292---123
293Content-Disposition: form-data; name="key3"
294
295value3
296---123
297Content-Disposition: form-data; name="key4"
298
299value4
300---123--
301"""
302 environ = {
303 'CONTENT_LENGTH': str(len(data)),
304 'CONTENT_TYPE': 'multipart/form-data; boundary=-123',
305 'QUERY_STRING': 'key1=value1&key2=value2x',
306 'REQUEST_METHOD': 'POST',
307 }
308 v = gen_result(data, environ)
309 self.assertEqual(self._qs_result, v)
310
311 def testQSAndFormDataFile(self):
312 data = """
313---123
314Content-Disposition: form-data; name="key2"
315
316value2y
317---123
318Content-Disposition: form-data; name="key3"
319
320value3
321---123
322Content-Disposition: form-data; name="key4"
323
324value4
325---123
326Content-Disposition: form-data; name="upload"; filename="fake.txt"
327Content-Type: text/plain
328
329this is the content of the fake file
330
331---123--
332"""
333 environ = {
334 'CONTENT_LENGTH': str(len(data)),
335 'CONTENT_TYPE': 'multipart/form-data; boundary=-123',
336 'QUERY_STRING': 'key1=value1&key2=value2x',
337 'REQUEST_METHOD': 'POST',
338 }
339 result = self._qs_result.copy()
340 result.update({
341 'upload': 'this is the content of the fake file\n'
342 })
343 v = gen_result(data, environ)
344 self.assertEqual(result, v)
345
Facundo Batistaace0bcf2008-09-08 00:20:28 +0000346 def test_deprecated_parse_qs(self):
Florent Xicluna78c18712010-03-17 20:05:11 +0000347 # this func is moved to urlparse, this is just a sanity check
348 with check_warnings(('cgi.parse_qs is deprecated, use urlparse.'
349 'parse_qs instead', PendingDeprecationWarning)):
Ezio Melottief490962010-01-31 11:46:54 +0000350 self.assertEqual({'a': ['A1'], 'B': ['B3'], 'b': ['B2']},
351 cgi.parse_qs('a=A1&b=B2&B=B3'))
Facundo Batistaace0bcf2008-09-08 00:20:28 +0000352
353 def test_deprecated_parse_qsl(self):
Florent Xicluna78c18712010-03-17 20:05:11 +0000354 # this func is moved to urlparse, this is just a sanity check
355 with check_warnings(('cgi.parse_qsl is deprecated, use urlparse.'
356 'parse_qsl instead', PendingDeprecationWarning)):
Ezio Melottief490962010-01-31 11:46:54 +0000357 self.assertEqual([('a', 'A1'), ('b', 'B2'), ('B', 'B3')],
358 cgi.parse_qsl('a=A1&b=B2&B=B3'))
Facundo Batistaace0bcf2008-09-08 00:20:28 +0000359
Fred Drake52481032008-12-04 18:25:17 +0000360 def test_parse_header(self):
361 self.assertEqual(
362 cgi.parse_header("text/plain"),
363 ("text/plain", {}))
364 self.assertEqual(
365 cgi.parse_header("text/vnd.just.made.this.up ; "),
366 ("text/vnd.just.made.this.up", {}))
367 self.assertEqual(
368 cgi.parse_header("text/plain;charset=us-ascii"),
369 ("text/plain", {"charset": "us-ascii"}))
370 self.assertEqual(
371 cgi.parse_header('text/plain ; charset="us-ascii"'),
372 ("text/plain", {"charset": "us-ascii"}))
373 self.assertEqual(
374 cgi.parse_header('text/plain ; charset="us-ascii"; another=opt'),
375 ("text/plain", {"charset": "us-ascii", "another": "opt"}))
376 self.assertEqual(
377 cgi.parse_header('attachment; filename="silly.txt"'),
378 ("attachment", {"filename": "silly.txt"}))
379 self.assertEqual(
380 cgi.parse_header('attachment; filename="strange;name"'),
381 ("attachment", {"filename": "strange;name"}))
382 self.assertEqual(
383 cgi.parse_header('attachment; filename="strange;name";size=123;'),
384 ("attachment", {"filename": "strange;name", "size": "123"}))
Senthil Kumaran59a06d42011-10-20 00:52:24 +0800385 self.assertEqual(
386 cgi.parse_header('form-data; name="files"; filename="fo\\"o;bar"'),
387 ("form-data", {"name": "files", "filename": 'fo"o;bar'}))
Fred Drake52481032008-12-04 18:25:17 +0000388
Facundo Batistaace0bcf2008-09-08 00:20:28 +0000389
Georg Brandle1844332006-10-29 20:09:12 +0000390def test_main():
391 run_unittest(CgiTests)
392
393if __name__ == '__main__':
394 test_main()