blob: 5b5329170fb66904681db95153bb692c89293c19 [file] [log] [blame]
Ezio Melottief490962010-01-31 11:46:54 +00001from test.test_support import run_unittest, check_warnings
Jeremy Hyltond9827c42000-08-03 22:11:43 +00002import cgi
3import os
4import sys
Guido van Rossum9568b732006-08-10 17:41:07 +00005import tempfile
Georg Brandle1844332006-10-29 20:09:12 +00006import unittest
Guido van Rossum9568b732006-08-10 17:41:07 +00007from StringIO import StringIO
Jeremy Hyltond9827c42000-08-03 22:11:43 +00008
class HackedSysModule:
    """Stand-in for the ``sys`` module as seen by the cgi module under test.

    The regression test run has real values in sys.argv, which would
    completely confuse the test of the cgi module, so this stub exposes an
    empty ``argv`` and passes the real ``stdin`` through unchanged.
    """
    stdin = sys.stdin
    argv = []
14
# Replace the ``sys`` name inside the cgi module with the stub, so the code
# under test sees an empty argv instead of this process's real sys.argv.
cgi.sys = HackedSysModule()
16
17try:
18 from cStringIO import StringIO
19except ImportError:
20 from StringIO import StringIO
21
class ComparableException:
    """Wrapper that lets a caught exception be compared with an expected one.

    The wrapper compares equal to another exception when the wrapped error
    has the same class and the same ``args``.  Attributes that are not
    defined on the wrapper itself are looked up on the wrapped error.
    """

    def __init__(self, err):
        self.err = err

    def __str__(self):
        return str(self.err)

    def __cmp__(self, anExc):
        # A non-exception operand never matches: always report "less than".
        if not isinstance(anExc, Exception):
            return -1
        # Compare the classes first; args only decide when the classes tie
        # (``or`` yields the second comparison exactly when the first is 0).
        return (cmp(self.err.__class__, anExc.__class__)
                or cmp(self.err.args, anExc.args))

    def __getattr__(self, attr):
        # Only reached for names not found on the wrapper: defer to the error.
        return getattr(self.err, attr)
Jeremy Hyltond9827c42000-08-03 22:11:43 +000039
def do_test(buf, method):
    """Parse *buf* with cgi.parse() as if it arrived via *method*.

    For "GET" the buffer is supplied as the QUERY_STRING; for "POST" it is
    supplied as a url-encoded request body read from a file-like object.
    Any other method raises ValueError.

    Returns whatever cgi.parse() returns in strict mode, or, when parsing
    raises a StandardError, that error wrapped in a ComparableException so
    the caller can compare it with an expected exception.
    """
    if method not in ("GET", "POST"):
        raise ValueError("unknown method: %s" % method)

    if method == "GET":
        fp = None
        env = {
            'REQUEST_METHOD': 'GET',
            'QUERY_STRING': buf,
        }
    else:
        fp = StringIO(buf)
        env = {
            'REQUEST_METHOD': 'POST',
            'CONTENT_TYPE': 'application/x-www-form-urlencoded',
            'CONTENT_LENGTH': str(len(buf)),
        }

    try:
        parsed = cgi.parse(fp, env, strict_parsing=1)
    except StandardError as err:
        return ComparableException(err)
    return parsed
57
# Table of (query string, expected outcome) pairs for strict parsing.  The
# expected outcome is either the parsed dict of value lists or the ValueError
# that strict parsing is expected to raise.
parse_strict_test_cases = [
    # Empty fields are rejected in strict mode.
    ("", ValueError("bad query field: ''")),
    ("&", ValueError("bad query field: ''")),
    ("&&", ValueError("bad query field: ''")),
    (";", ValueError("bad query field: ''")),
    (";&;", ValueError("bad query field: ''")),

    # Should the next few really be valid?
    ("=", {}),
    ("=&=", {}),
    ("=;=", {}),

    # The rest seem to make sense
    ("=a", {'': ['a']}),
    ("&=a", ValueError("bad query field: ''")),
    ("=a&", ValueError("bad query field: ''")),
    ("=&a", ValueError("bad query field: 'a'")),
    ("b=a", {'b': ['a']}),
    ("b+=a", {'b ': ['a']}),
    ("a=b=a", {'a': ['b=a']}),
    ("a=+b=a", {'a': [' b=a']}),
    ("&b=a", ValueError("bad query field: ''")),
    ("b&=a", ValueError("bad query field: 'b'")),
    ("a=a+b&b=b+c", {'a': ['a b'], 'b': ['b c']}),
    ("a=a+b&a=b+a", {'a': ['a b', 'b a']}),

    # '&' and ';' are both accepted as field separators.
    ("x=1&y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
    ("x=1;y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),
    ("x=1;y=2.0;z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}),

    # Two longer query strings with many fields.
    (
        "Hbc5161168c542333633315dee1182227:key_store_seqid=400006"
        "&cuyer=r&view=bustomer"
        "&order_id=0bb2e248638833d48cb7fed300000f1b"
        "&expire=964546263&lobale=en-US&kid=130003.300038&ss=env",
        {
            'Hbc5161168c542333633315dee1182227:key_store_seqid': ['400006'],
            'cuyer': ['r'],
            'expire': ['964546263'],
            'kid': ['130003.300038'],
            'lobale': ['en-US'],
            'order_id': ['0bb2e248638833d48cb7fed300000f1b'],
            'ss': ['env'],
            'view': ['bustomer'],
        },
    ),
    (
        "group_id=5470&set=custom&_assigned_to=31392"
        "&_status=1&_category=100&SUBMIT=Browse",
        {
            'SUBMIT': ['Browse'],
            '_assigned_to': ['31392'],
            '_category': ['100'],
            '_status': ['1'],
            'group_id': ['5470'],
            'set': ['custom'],
        },
    ),
]
104
def first_elts(list):
    """Return a list holding element 0 of every item in *list*."""
    return [item[0] for item in list]
107
def first_second_elts(list):
    """Map each ``(key, values)`` pair in *list* to ``(key, values[0])``."""
    return [(pair[0], pair[1][0]) for pair in list]
110
def gen_result(data, environ):
    """Parse a request with cgi.FieldStorage and flatten it to a plain dict.

    *data* is the request body, fed to FieldStorage through a file-like
    object; *environ* is the CGI environment mapping passed alongside it.

    Returns a dict keyed by field name.  A name whose FieldStorage entry is a
    list maps to ``form.getlist(name)``; any other entry maps to its
    ``.value`` attribute.
    """
    form = cgi.FieldStorage(fp=StringIO(data), environ=environ)

    result = {}
    for key in form.keys():
        field = form[key]
        # A real conditional expression: the old ``cond and a or b`` form
        # would fall through to ``field.value`` whenever the list branch
        # happened to be falsy.
        if isinstance(field, list):
            result[key] = form.getlist(key)
        else:
            result[key] = field.value
    return result
121
class CgiTests(unittest.TestCase):
    # Tests for the cgi module: strict query parsing, the FormContentDict
    # family, logging helpers, FieldStorage (readline chunking, multipart,
    # query-string merging), the deprecated parse_qs/parse_qsl wrappers and
    # parse_header.
    #
    # Test methods are documented with comments rather than docstrings so
    # that verbose unittest output keeps showing the method names.

    def test_strict(self):
        # Run every entry of parse_strict_test_cases through cgi.parse() and
        # through the dict-like form classes.
        for orig, expect in parse_strict_test_cases:
            # Test basic parsing
            d = do_test(orig, "GET")
            self.assertEqual(d, expect, "Error parsing %s" % repr(orig))
            d = do_test(orig, "POST")
            self.assertEqual(d, expect, "Error parsing %s" % repr(orig))

            env = {'QUERY_STRING': orig}
            fcd = cgi.FormContentDict(env)
            sd = cgi.SvFormContentDict(env)
            fs = cgi.FieldStorage(environ=env)
            if not isinstance(expect, dict):
                # An exception was expected; the dict checks do not apply.
                continue

            # test dict interface
            self.assertEqual(len(expect), len(fcd))
            self.assertSameElements(expect.keys(), fcd.keys())
            self.assertSameElements(expect.values(), fcd.values())
            self.assertSameElements(expect.items(), fcd.items())
            self.assertEqual(fcd.get("nonexistent field", "default"), "default")
            self.assertEqual(len(sd), len(fs))
            self.assertSameElements(sd.keys(), fs.keys())
            self.assertEqual(fs.getvalue("nonexistent field", "default"), "default")

            # test individual fields
            for key, expect_val in expect.items():
                self.assertTrue(fcd.has_key(key))
                self.assertSameElements(fcd[key], expect_val)
                self.assertEqual(fcd.get(key, "default"), fcd[key])
                self.assertTrue(fs.has_key(key))
                single_value = len(expect_val) <= 1
                try:
                    val = sd[key]
                except IndexError:
                    # Indexing the single-value dict is only expected to
                    # fail for multi-valued fields.
                    self.assertFalse(single_value)
                    self.assertEqual(fs.getvalue(key), expect_val)
                else:
                    self.assertTrue(single_value)
                    self.assertEqual(val, expect_val[0])
                    self.assertEqual(fs.getvalue(key), expect_val[0])
                self.assertSameElements(sd.getlist(key), expect_val)
                if single_value:
                    self.assertSameElements(sd.values(),
                                            first_elts(expect.values()))
                    self.assertSameElements(sd.items(),
                                            first_second_elts(expect.items()))

    def test_weird_formcontentdict(self):
        # Test the weird FormContentDict classes
        env = {'QUERY_STRING': "x=1&y=2.0&z=2-3.%2b0&1=1abc"}
        expect = {'x': 1, 'y': 2.0, 'z': '2-3.+0', '1': '1abc'}
        d = cgi.InterpFormContentDict(env)
        for k, v in expect.items():
            self.assertEqual(d[k], v)
        for k, v in d.items():
            self.assertEqual(expect[k], v)
        self.assertSameElements(expect.values(), d.values())

    def test_log(self):
        # Exercise cgi.log()/cgi.initlog() with no log, an in-memory log and
        # (where available) /dev/null as the log file.
        #
        # This test rebinds cgi.logfp and cgi.logfile, and cgi.initlog() is
        # expected to rebind cgi.log as well (see the cgi module), so snapshot
        # all three and put them back afterwards instead of leaking the
        # configuration -- and an open file -- into later tests.
        saved_logfp, saved_logfile, saved_log = cgi.logfp, cgi.logfile, cgi.log
        try:
            cgi.log("Testing")

            cgi.logfp = StringIO()
            cgi.initlog("%s", "Testing initlog 1")
            cgi.log("%s", "Testing log 2")
            self.assertEqual(cgi.logfp.getvalue(), "Testing initlog 1\nTesting log 2\n")
            if os.path.exists("/dev/null"):
                cgi.logfp = None
                cgi.logfile = "/dev/null"
                cgi.initlog("%s", "Testing log 3")
                cgi.log("Testing log 4")
        finally:
            opened = cgi.logfp
            cgi.logfp, cgi.logfile, cgi.log = saved_logfp, saved_logfile, saved_log
            # Close whatever log object the test left installed, but never
            # one that was already there before the test started.
            if opened is not None and opened is not saved_logfp:
                opened.close()

    def test_fieldstorage_readline(self):
        # FieldStorage uses readline, which has the capacity to read all
        # contents of the input file into memory; we use readline's size argument
        # to prevent that for files that do not contain any newlines in
        # non-GET/HEAD requests
        class TestReadlineFile:
            # File proxy that counts readline() calls and forwards everything
            # else to the wrapped file object.
            def __init__(self, file):
                self.file = file
                self.numcalls = 0

            def readline(self, size=None):
                self.numcalls += 1
                if size:
                    return self.file.readline(size)
                else:
                    return self.file.readline()

            def __getattr__(self, name):
                file = self.__dict__['file']
                a = getattr(file, name)
                # Cache forwarded attributes on the proxy, except ints.
                if not isinstance(a, int):
                    setattr(self, name, a)
                return a

        f = TestReadlineFile(tempfile.TemporaryFile())
        try:
            f.write('x' * 256 * 1024)
            f.seek(0)
            env = {'REQUEST_METHOD':'PUT'}
            cgi.FieldStorage(fp=f, environ=env)
            # if we're not chunking properly, readline is only called twice
            # (by read_binary); if we are chunking properly, it will be called 5 times
            # as long as the chunksize is 1 << 16.
            self.assertTrue(f.numcalls > 2)
        finally:
            # Release the temporary file deterministically rather than
            # waiting for garbage collection.
            f.close()

    def test_fieldstorage_multipart(self):
        #Test basic FieldStorage multipart parsing
        env = {
            'REQUEST_METHOD': 'POST',
            'CONTENT_TYPE': 'multipart/form-data; boundary=---------------------------721837373350705526688164684',
            'CONTENT_LENGTH': '558',
        }
        # The trailing space of the "submit" value is spelled \x20 so that it
        # is not written as invisible trailing whitespace in this file.
        postdata = """-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="id"

1234
-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="title"


-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="file"; filename="test.txt"
Content-Type: text/plain

Testing 123.

-----------------------------721837373350705526688164684
Content-Disposition: form-data; name="submit"

 Add\x20
-----------------------------721837373350705526688164684--
"""
        fs = cgi.FieldStorage(fp=StringIO(postdata), environ=env)
        self.assertEqual(len(fs.list), 4)
        expect = [{'name':'id', 'filename':None, 'value':'1234'},
                  {'name':'title', 'filename':None, 'value':''},
                  {'name':'file', 'filename':'test.txt','value':'Testing 123.\n'},
                  {'name':'submit', 'filename':None, 'value':' Add '}]
        # The length check above guarantees the two sequences pair up fully.
        for field, wanted in zip(fs.list, expect):
            for k, exp in wanted.items():
                self.assertEqual(getattr(field, k), exp)

    # Expected merge of query-string fields and body fields, shared by the
    # testQSAnd* tests below ('key2' appears in both sources).
    _qs_result = {
        'key1': 'value1',
        'key2': ['value2x', 'value2y'],
        'key3': 'value3',
        'key4': 'value4'
    }

    def testQSAndUrlEncode(self):
        # Query string combined with a url-encoded POST body.
        data = "key2=value2x&key3=value3&key4=value4"
        environ = {
            'CONTENT_LENGTH':   str(len(data)),
            'CONTENT_TYPE':     'application/x-www-form-urlencoded',
            'QUERY_STRING':     'key1=value1&key2=value2y',
            'REQUEST_METHOD':   'POST',
        }
        v = gen_result(data, environ)
        self.assertEqual(self._qs_result, v)

    def testQSAndFormData(self):
        # Query string combined with a multipart/form-data POST body.
        data = """
---123
Content-Disposition: form-data; name="key2"

value2y
---123
Content-Disposition: form-data; name="key3"

value3
---123
Content-Disposition: form-data; name="key4"

value4
---123--
"""
        environ = {
            'CONTENT_LENGTH':   str(len(data)),
            'CONTENT_TYPE':     'multipart/form-data; boundary=-123',
            'QUERY_STRING':     'key1=value1&key2=value2x',
            'REQUEST_METHOD':   'POST',
        }
        v = gen_result(data, environ)
        self.assertEqual(self._qs_result, v)

    def testQSAndFormDataFile(self):
        # As testQSAndFormData, plus a file-upload part in the body.
        data = """
---123
Content-Disposition: form-data; name="key2"

value2y
---123
Content-Disposition: form-data; name="key3"

value3
---123
Content-Disposition: form-data; name="key4"

value4
---123
Content-Disposition: form-data; name="upload"; filename="fake.txt"
Content-Type: text/plain

this is the content of the fake file

---123--
"""
        environ = {
            'CONTENT_LENGTH':   str(len(data)),
            'CONTENT_TYPE':     'multipart/form-data; boundary=-123',
            'QUERY_STRING':     'key1=value1&key2=value2x',
            'REQUEST_METHOD':   'POST',
        }
        # Copy first: _qs_result is shared class state.
        result = self._qs_result.copy()
        result.update({
            'upload': 'this is the content of the fake file\n'
        })
        v = gen_result(data, environ)
        self.assertEqual(result, v)

    def test_deprecated_parse_qs(self):
        with check_warnings():
            # this func is moved to urlparse, this is just a sanity check
            self.assertEqual({'a': ['A1'], 'B': ['B3'], 'b': ['B2']},
                             cgi.parse_qs('a=A1&b=B2&B=B3'))

    def test_deprecated_parse_qsl(self):
        with check_warnings():
            # this func is moved to urlparse, this is just a sanity check
            self.assertEqual([('a', 'A1'), ('b', 'B2'), ('B', 'B3')],
                             cgi.parse_qsl('a=A1&b=B2&B=B3'))

    def test_parse_header(self):
        # cgi.parse_header() splits a header value into (main value, params).
        self.assertEqual(
            cgi.parse_header("text/plain"),
            ("text/plain", {}))
        self.assertEqual(
            cgi.parse_header("text/vnd.just.made.this.up ; "),
            ("text/vnd.just.made.this.up", {}))
        self.assertEqual(
            cgi.parse_header("text/plain;charset=us-ascii"),
            ("text/plain", {"charset": "us-ascii"}))
        self.assertEqual(
            cgi.parse_header('text/plain ; charset="us-ascii"'),
            ("text/plain", {"charset": "us-ascii"}))
        self.assertEqual(
            cgi.parse_header('text/plain ; charset="us-ascii"; another=opt'),
            ("text/plain", {"charset": "us-ascii", "another": "opt"}))
        self.assertEqual(
            cgi.parse_header('attachment; filename="silly.txt"'),
            ("attachment", {"filename": "silly.txt"}))
        # A ';' inside a quoted parameter value must not split the parameter.
        self.assertEqual(
            cgi.parse_header('attachment; filename="strange;name"'),
            ("attachment", {"filename": "strange;name"}))
        self.assertEqual(
            cgi.parse_header('attachment; filename="strange;name";size=123;'),
            ("attachment", {"filename": "strange;name", "size": "123"}))
379
Facundo Batistaace0bcf2008-09-08 00:20:28 +0000380
def test_main():
    """Hand the CgiTests case to the regression-test runner."""
    run_unittest(CgiTests)


if __name__ == '__main__':
    test_main()