Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 1 | import cgi |
| 2 | import os |
| 3 | import sys |
Thomas Wouters | 00ee7ba | 2006-08-21 19:07:27 +0000 | [diff] [blame] | 4 | import tempfile |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 5 | import unittest |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 6 | from collections import namedtuple |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 7 | from io import StringIO, BytesIO |
Martin Panter | 1cd2772 | 2016-06-06 01:53:28 +0000 | [diff] [blame] | 8 | from test import support |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 9 | |
| 10 | class HackedSysModule: |
| 11 | # The regression test will have real values in sys.argv, which |
Fred Drake | 004d5e6 | 2000-10-23 17:22:08 +0000 | [diff] [blame] | 12 | # will completely confuse the test of the cgi module |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 13 | argv = [] |
| 14 | stdin = sys.stdin |
| 15 | |
| 16 | cgi.sys = HackedSysModule() |
| 17 | |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 18 | class ComparableException: |
| 19 | def __init__(self, err): |
| 20 | self.err = err |
| 21 | |
| 22 | def __str__(self): |
| 23 | return str(self.err) |
| 24 | |
Guido van Rossum | 47b9ff6 | 2006-08-24 00:41:19 +0000 | [diff] [blame] | 25 | def __eq__(self, anExc): |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 26 | if not isinstance(anExc, Exception): |
Guido van Rossum | 47b9ff6 | 2006-08-24 00:41:19 +0000 | [diff] [blame] | 27 | return NotImplemented |
| 28 | return (self.err.__class__ == anExc.__class__ and |
| 29 | self.err.args == anExc.args) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 30 | |
| 31 | def __getattr__(self, attr): |
Guido van Rossum | 846d6db | 2001-01-17 15:08:37 +0000 | [diff] [blame] | 32 | return getattr(self.err, attr) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 33 | |
| 34 | def do_test(buf, method): |
| 35 | env = {} |
| 36 | if method == "GET": |
| 37 | fp = None |
| 38 | env['REQUEST_METHOD'] = 'GET' |
| 39 | env['QUERY_STRING'] = buf |
| 40 | elif method == "POST": |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 41 | fp = BytesIO(buf.encode('latin-1')) # FieldStorage expects bytes |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 42 | env['REQUEST_METHOD'] = 'POST' |
| 43 | env['CONTENT_TYPE'] = 'application/x-www-form-urlencoded' |
| 44 | env['CONTENT_LENGTH'] = str(len(buf)) |
| 45 | else: |
Collin Winter | 3add4d7 | 2007-08-29 23:37:32 +0000 | [diff] [blame] | 46 | raise ValueError("unknown method: %s" % method) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 47 | try: |
| 48 | return cgi.parse(fp, env, strict_parsing=1) |
Guido van Rossum | cd16bf6 | 2007-06-13 18:07:49 +0000 | [diff] [blame] | 49 | except Exception as err: |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 50 | return ComparableException(err) |
| 51 | |
Neil Schemenauer | 66edb62 | 2004-07-19 15:38:11 +0000 | [diff] [blame] | 52 | parse_strict_test_cases = [ |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 53 | ("", ValueError("bad query field: ''")), |
| 54 | ("&", ValueError("bad query field: ''")), |
| 55 | ("&&", ValueError("bad query field: ''")), |
Jeremy Hylton | afde7e2 | 2000-09-15 20:06:57 +0000 | [diff] [blame] | 56 | (";", ValueError("bad query field: ''")), |
| 57 | (";&;", ValueError("bad query field: ''")), |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 58 | # Should the next few really be valid? |
| 59 | ("=", {}), |
| 60 | ("=&=", {}), |
Jeremy Hylton | afde7e2 | 2000-09-15 20:06:57 +0000 | [diff] [blame] | 61 | ("=;=", {}), |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 62 | # This rest seem to make sense |
| 63 | ("=a", {'': ['a']}), |
| 64 | ("&=a", ValueError("bad query field: ''")), |
| 65 | ("=a&", ValueError("bad query field: ''")), |
| 66 | ("=&a", ValueError("bad query field: 'a'")), |
| 67 | ("b=a", {'b': ['a']}), |
| 68 | ("b+=a", {'b ': ['a']}), |
| 69 | ("a=b=a", {'a': ['b=a']}), |
| 70 | ("a=+b=a", {'a': [' b=a']}), |
| 71 | ("&b=a", ValueError("bad query field: ''")), |
| 72 | ("b&=a", ValueError("bad query field: 'b'")), |
| 73 | ("a=a+b&b=b+c", {'a': ['a b'], 'b': ['b c']}), |
| 74 | ("a=a+b&a=b+a", {'a': ['a b', 'b a']}), |
| 75 | ("x=1&y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}), |
Jeremy Hylton | afde7e2 | 2000-09-15 20:06:57 +0000 | [diff] [blame] | 76 | ("x=1;y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}), |
| 77 | ("x=1;y=2.0;z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}), |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 78 | ("Hbc5161168c542333633315dee1182227:key_store_seqid=400006&cuyer=r&view=bustomer&order_id=0bb2e248638833d48cb7fed300000f1b&expire=964546263&lobale=en-US&kid=130003.300038&ss=env", |
| 79 | {'Hbc5161168c542333633315dee1182227:key_store_seqid': ['400006'], |
| 80 | 'cuyer': ['r'], |
| 81 | 'expire': ['964546263'], |
| 82 | 'kid': ['130003.300038'], |
| 83 | 'lobale': ['en-US'], |
| 84 | 'order_id': ['0bb2e248638833d48cb7fed300000f1b'], |
| 85 | 'ss': ['env'], |
| 86 | 'view': ['bustomer'], |
| 87 | }), |
Fred Drake | 004d5e6 | 2000-10-23 17:22:08 +0000 | [diff] [blame] | 88 | |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 89 | ("group_id=5470&set=custom&_assigned_to=31392&_status=1&_category=100&SUBMIT=Browse", |
| 90 | {'SUBMIT': ['Browse'], |
| 91 | '_assigned_to': ['31392'], |
| 92 | '_category': ['100'], |
| 93 | '_status': ['1'], |
| 94 | 'group_id': ['5470'], |
| 95 | 'set': ['custom'], |
| 96 | }) |
| 97 | ] |
| 98 | |
Guido van Rossum | 47b9ff6 | 2006-08-24 00:41:19 +0000 | [diff] [blame] | 99 | def norm(seq): |
Guido van Rossum | cc2b016 | 2007-02-11 06:12:03 +0000 | [diff] [blame] | 100 | return sorted(seq, key=repr) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 101 | |
| 102 | def first_elts(list): |
Guido van Rossum | c1f779c | 2007-07-03 08:25:58 +0000 | [diff] [blame] | 103 | return [p[0] for p in list] |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 104 | |
| 105 | def first_second_elts(list): |
Guido van Rossum | c1f779c | 2007-07-03 08:25:58 +0000 | [diff] [blame] | 106 | return [(p[0], p[1][0]) for p in list] |
| 107 | |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 108 | def gen_result(data, environ): |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 109 | encoding = 'latin-1' |
| 110 | fake_stdin = BytesIO(data.encode(encoding)) |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 111 | fake_stdin.seek(0) |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 112 | form = cgi.FieldStorage(fp=fake_stdin, environ=environ, encoding=encoding) |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 113 | |
| 114 | result = {} |
| 115 | for k, v in dict(form).items(): |
Florent Xicluna | 8fbddf1 | 2010-03-17 20:29:51 +0000 | [diff] [blame] | 116 | result[k] = isinstance(v, list) and form.getlist(k) or v.value |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 117 | |
| 118 | return result |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 119 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 120 | class CgiTests(unittest.TestCase): |
Neil Schemenauer | 66edb62 | 2004-07-19 15:38:11 +0000 | [diff] [blame] | 121 | |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 122 | def test_parse_multipart(self): |
| 123 | fp = BytesIO(POSTDATA.encode('latin1')) |
| 124 | env = {'boundary': BOUNDARY.encode('latin1'), |
| 125 | 'CONTENT-LENGTH': '558'} |
| 126 | result = cgi.parse_multipart(fp, env) |
Pierre Quentel | cc3fa20 | 2017-05-08 14:08:34 +0200 | [diff] [blame] | 127 | expected = {'submit': [' Add '], 'id': ['1234'], |
| 128 | 'file': [b'Testing 123.\n'], 'title': ['']} |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 129 | self.assertEqual(result, expected) |
| 130 | |
roger | d8cf351 | 2020-06-15 16:58:54 +0200 | [diff] [blame] | 131 | def test_parse_multipart_without_content_length(self): |
| 132 | POSTDATA = '''--JfISa01 |
| 133 | Content-Disposition: form-data; name="submit-name" |
| 134 | |
| 135 | just a string |
| 136 | |
| 137 | --JfISa01-- |
| 138 | ''' |
| 139 | fp = BytesIO(POSTDATA.encode('latin1')) |
| 140 | env = {'boundary': 'JfISa01'.encode('latin1')} |
| 141 | result = cgi.parse_multipart(fp, env) |
| 142 | expected = {'submit-name': ['just a string\n']} |
| 143 | self.assertEqual(result, expected) |
| 144 | |
Amber Brown | 545c955 | 2018-05-14 18:11:55 -0400 | [diff] [blame] | 145 | def test_parse_multipart_invalid_encoding(self): |
| 146 | BOUNDARY = "JfISa01" |
| 147 | POSTDATA = """--JfISa01 |
| 148 | Content-Disposition: form-data; name="submit-name" |
| 149 | Content-Length: 3 |
| 150 | |
| 151 | \u2603 |
| 152 | --JfISa01""" |
| 153 | fp = BytesIO(POSTDATA.encode('utf8')) |
| 154 | env = {'boundary': BOUNDARY.encode('latin1'), |
| 155 | 'CONTENT-LENGTH': str(len(POSTDATA.encode('utf8')))} |
| 156 | result = cgi.parse_multipart(fp, env, encoding="ascii", |
| 157 | errors="surrogateescape") |
| 158 | expected = {'submit-name': ["\udce2\udc98\udc83"]} |
| 159 | self.assertEqual(result, expected) |
| 160 | self.assertEqual("\u2603".encode('utf8'), |
| 161 | result["submit-name"][0].encode('utf8', 'surrogateescape')) |
| 162 | |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 163 | def test_fieldstorage_properties(self): |
| 164 | fs = cgi.FieldStorage() |
| 165 | self.assertFalse(fs) |
| 166 | self.assertIn("FieldStorage", repr(fs)) |
| 167 | self.assertEqual(list(fs), list(fs.keys())) |
| 168 | fs.list.append(namedtuple('MockFieldStorage', 'name')('fieldvalue')) |
| 169 | self.assertTrue(fs) |
| 170 | |
Senthil Kumaran | b4cbb92 | 2014-01-11 22:20:16 -0800 | [diff] [blame] | 171 | def test_fieldstorage_invalid(self): |
| 172 | self.assertRaises(TypeError, cgi.FieldStorage, "not-a-file-obj", |
| 173 | environ={"REQUEST_METHOD":"PUT"}) |
| 174 | self.assertRaises(TypeError, cgi.FieldStorage, "foo", "bar") |
| 175 | fs = cgi.FieldStorage(headers={'content-type':'text/plain'}) |
| 176 | self.assertRaises(TypeError, bool, fs) |
| 177 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 178 | def test_strict(self): |
| 179 | for orig, expect in parse_strict_test_cases: |
| 180 | # Test basic parsing |
| 181 | d = do_test(orig, "GET") |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 182 | self.assertEqual(d, expect, "Error parsing %s method GET" % repr(orig)) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 183 | d = do_test(orig, "POST") |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 184 | self.assertEqual(d, expect, "Error parsing %s method POST" % repr(orig)) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 185 | |
| 186 | env = {'QUERY_STRING': orig} |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 187 | fs = cgi.FieldStorage(environ=env) |
Florent Xicluna | 8fbddf1 | 2010-03-17 20:29:51 +0000 | [diff] [blame] | 188 | if isinstance(expect, dict): |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 189 | # test dict interface |
Georg Brandl | 49d1b4f | 2008-05-11 21:42:51 +0000 | [diff] [blame] | 190 | self.assertEqual(len(expect), len(fs)) |
Ezio Melotti | 263cbdf | 2010-11-29 02:02:10 +0000 | [diff] [blame] | 191 | self.assertCountEqual(expect.keys(), fs.keys()) |
Georg Brandl | 49d1b4f | 2008-05-11 21:42:51 +0000 | [diff] [blame] | 192 | ##self.assertEqual(norm(expect.values()), norm(fs.values())) |
| 193 | ##self.assertEqual(norm(expect.items()), norm(fs.items())) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 194 | self.assertEqual(fs.getvalue("nonexistent field", "default"), "default") |
| 195 | # test individual fields |
| 196 | for key in expect.keys(): |
| 197 | expect_val = expect[key] |
Benjamin Peterson | 577473f | 2010-01-19 00:09:57 +0000 | [diff] [blame] | 198 | self.assertIn(key, fs) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 199 | if len(expect_val) > 1: |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 200 | self.assertEqual(fs.getvalue(key), expect_val) |
| 201 | else: |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 202 | self.assertEqual(fs.getvalue(key), expect_val[0]) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 203 | |
| 204 | def test_log(self): |
| 205 | cgi.log("Testing") |
| 206 | |
| 207 | cgi.logfp = StringIO() |
| 208 | cgi.initlog("%s", "Testing initlog 1") |
| 209 | cgi.log("%s", "Testing log 2") |
| 210 | self.assertEqual(cgi.logfp.getvalue(), "Testing initlog 1\nTesting log 2\n") |
Serhiy Storchaka | 85c3033 | 2015-02-15 13:58:23 +0200 | [diff] [blame] | 211 | if os.path.exists(os.devnull): |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 212 | cgi.logfp = None |
Serhiy Storchaka | 85c3033 | 2015-02-15 13:58:23 +0200 | [diff] [blame] | 213 | cgi.logfile = os.devnull |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 214 | cgi.initlog("%s", "Testing log 3") |
Victor Stinner | d33344a | 2011-07-14 22:28:36 +0200 | [diff] [blame] | 215 | self.addCleanup(cgi.closelog) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 216 | cgi.log("Testing log 4") |
| 217 | |
| 218 | def test_fieldstorage_readline(self): |
| 219 | # FieldStorage uses readline, which has the capacity to read all |
| 220 | # contents of the input file into memory; we use readline's size argument |
| 221 | # to prevent that for files that do not contain any newlines in |
| 222 | # non-GET/HEAD requests |
| 223 | class TestReadlineFile: |
| 224 | def __init__(self, file): |
| 225 | self.file = file |
| 226 | self.numcalls = 0 |
| 227 | |
| 228 | def readline(self, size=None): |
| 229 | self.numcalls += 1 |
| 230 | if size: |
| 231 | return self.file.readline(size) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 232 | else: |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 233 | return self.file.readline() |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 234 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 235 | def __getattr__(self, name): |
| 236 | file = self.__dict__['file'] |
| 237 | a = getattr(file, name) |
| 238 | if not isinstance(a, int): |
| 239 | setattr(self, name, a) |
| 240 | return a |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 241 | |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 242 | f = TestReadlineFile(tempfile.TemporaryFile("wb+")) |
Benjamin Peterson | 807a5a1 | 2010-10-30 22:59:37 +0000 | [diff] [blame] | 243 | self.addCleanup(f.close) |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 244 | f.write(b'x' * 256 * 1024) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 245 | f.seek(0) |
| 246 | env = {'REQUEST_METHOD':'PUT'} |
| 247 | fs = cgi.FieldStorage(fp=f, environ=env) |
Benjamin Peterson | 807a5a1 | 2010-10-30 22:59:37 +0000 | [diff] [blame] | 248 | self.addCleanup(fs.file.close) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 249 | # if we're not chunking properly, readline is only called twice |
| 250 | # (by read_binary); if we are chunking properly, it will be called 5 times |
| 251 | # as long as the chunksize is 1 << 16. |
Serhiy Storchaka | 25d8aea | 2014-02-08 14:50:08 +0200 | [diff] [blame] | 252 | self.assertGreater(f.numcalls, 2) |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 253 | f.close() |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 254 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 255 | def test_fieldstorage_multipart(self): |
| 256 | #Test basic FieldStorage multipart parsing |
Victor Stinner | f0e293c | 2011-03-01 23:09:57 +0000 | [diff] [blame] | 257 | env = { |
| 258 | 'REQUEST_METHOD': 'POST', |
| 259 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 260 | 'CONTENT_LENGTH': '558'} |
| 261 | fp = BytesIO(POSTDATA.encode('latin-1')) |
| 262 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 263 | self.assertEqual(len(fs.list), 4) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 264 | expect = [{'name':'id', 'filename':None, 'value':'1234'}, |
| 265 | {'name':'title', 'filename':None, 'value':''}, |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 266 | {'name':'file', 'filename':'test.txt', 'value':b'Testing 123.\n'}, |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 267 | {'name':'submit', 'filename':None, 'value':' Add '}] |
| 268 | for x in range(len(fs.list)): |
| 269 | for k, exp in expect[x].items(): |
| 270 | got = getattr(fs.list[x], k) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 271 | self.assertEqual(got, exp) |
Thomas Wouters | 00ee7ba | 2006-08-21 19:07:27 +0000 | [diff] [blame] | 272 | |
Donald Stufft | d90f8d1 | 2015-03-29 16:43:23 -0400 | [diff] [blame] | 273 | def test_fieldstorage_multipart_leading_whitespace(self): |
| 274 | env = { |
| 275 | 'REQUEST_METHOD': 'POST', |
| 276 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 277 | 'CONTENT_LENGTH': '560'} |
| 278 | # Add some leading whitespace to our post data that will cause the |
| 279 | # first line to not be the innerboundary. |
| 280 | fp = BytesIO(b"\r\n" + POSTDATA.encode('latin-1')) |
| 281 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
| 282 | self.assertEqual(len(fs.list), 4) |
| 283 | expect = [{'name':'id', 'filename':None, 'value':'1234'}, |
| 284 | {'name':'title', 'filename':None, 'value':''}, |
| 285 | {'name':'file', 'filename':'test.txt', 'value':b'Testing 123.\n'}, |
| 286 | {'name':'submit', 'filename':None, 'value':' Add '}] |
| 287 | for x in range(len(fs.list)): |
| 288 | for k, exp in expect[x].items(): |
| 289 | got = getattr(fs.list[x], k) |
| 290 | self.assertEqual(got, exp) |
| 291 | |
Victor Stinner | f0e293c | 2011-03-01 23:09:57 +0000 | [diff] [blame] | 292 | def test_fieldstorage_multipart_non_ascii(self): |
| 293 | #Test basic FieldStorage multipart parsing |
| 294 | env = {'REQUEST_METHOD':'POST', |
| 295 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 296 | 'CONTENT_LENGTH':'558'} |
| 297 | for encoding in ['iso-8859-1','utf-8']: |
| 298 | fp = BytesIO(POSTDATA_NON_ASCII.encode(encoding)) |
| 299 | fs = cgi.FieldStorage(fp, environ=env,encoding=encoding) |
| 300 | self.assertEqual(len(fs.list), 1) |
| 301 | expect = [{'name':'id', 'filename':None, 'value':'\xe7\xf1\x80'}] |
| 302 | for x in range(len(fs.list)): |
| 303 | for k, exp in expect[x].items(): |
| 304 | got = getattr(fs.list[x], k) |
| 305 | self.assertEqual(got, exp) |
| 306 | |
Serhiy Storchaka | c7bfe0e | 2013-06-17 16:34:41 +0300 | [diff] [blame] | 307 | def test_fieldstorage_multipart_maxline(self): |
| 308 | # Issue #18167 |
| 309 | maxline = 1 << 16 |
| 310 | self.maxDiff = None |
| 311 | def check(content): |
| 312 | data = """---123 |
| 313 | Content-Disposition: form-data; name="upload"; filename="fake.txt" |
| 314 | Content-Type: text/plain |
| 315 | |
| 316 | %s |
| 317 | ---123-- |
| 318 | """.replace('\n', '\r\n') % content |
| 319 | environ = { |
| 320 | 'CONTENT_LENGTH': str(len(data)), |
| 321 | 'CONTENT_TYPE': 'multipart/form-data; boundary=-123', |
| 322 | 'REQUEST_METHOD': 'POST', |
| 323 | } |
| 324 | self.assertEqual(gen_result(data, environ), |
| 325 | {'upload': content.encode('latin1')}) |
| 326 | check('x' * (maxline - 1)) |
| 327 | check('x' * (maxline - 1) + '\r') |
| 328 | check('x' * (maxline - 1) + '\r' + 'y' * (maxline - 1)) |
| 329 | |
Florent Xicluna | 331c3fd | 2013-07-07 12:44:28 +0200 | [diff] [blame] | 330 | def test_fieldstorage_multipart_w3c(self): |
| 331 | # Test basic FieldStorage multipart parsing (W3C sample) |
| 332 | env = { |
| 333 | 'REQUEST_METHOD': 'POST', |
| 334 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY_W3), |
| 335 | 'CONTENT_LENGTH': str(len(POSTDATA_W3))} |
| 336 | fp = BytesIO(POSTDATA_W3.encode('latin-1')) |
| 337 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
| 338 | self.assertEqual(len(fs.list), 2) |
| 339 | self.assertEqual(fs.list[0].name, 'submit-name') |
| 340 | self.assertEqual(fs.list[0].value, 'Larry') |
| 341 | self.assertEqual(fs.list[1].name, 'files') |
| 342 | files = fs.list[1].value |
| 343 | self.assertEqual(len(files), 2) |
| 344 | expect = [{'name': None, 'filename': 'file1.txt', 'value': b'... contents of file1.txt ...'}, |
| 345 | {'name': None, 'filename': 'file2.gif', 'value': b'...contents of file2.gif...'}] |
| 346 | for x in range(len(files)): |
| 347 | for k, exp in expect[x].items(): |
| 348 | got = getattr(files[x], k) |
| 349 | self.assertEqual(got, exp) |
| 350 | |
Victor Stinner | 6579459 | 2015-08-18 10:21:10 -0700 | [diff] [blame] | 351 | def test_fieldstorage_part_content_length(self): |
| 352 | BOUNDARY = "JfISa01" |
| 353 | POSTDATA = """--JfISa01 |
| 354 | Content-Disposition: form-data; name="submit-name" |
| 355 | Content-Length: 5 |
| 356 | |
| 357 | Larry |
| 358 | --JfISa01""" |
| 359 | env = { |
| 360 | 'REQUEST_METHOD': 'POST', |
| 361 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 362 | 'CONTENT_LENGTH': str(len(POSTDATA))} |
| 363 | fp = BytesIO(POSTDATA.encode('latin-1')) |
| 364 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
| 365 | self.assertEqual(len(fs.list), 1) |
| 366 | self.assertEqual(fs.list[0].name, 'submit-name') |
| 367 | self.assertEqual(fs.list[0].value, 'Larry') |
| 368 | |
Pierre Quentel | 2d7caca | 2019-09-11 13:05:53 +0200 | [diff] [blame] | 369 | def test_field_storage_multipart_no_content_length(self): |
| 370 | fp = BytesIO(b"""--MyBoundary |
| 371 | Content-Disposition: form-data; name="my-arg"; filename="foo" |
| 372 | |
| 373 | Test |
| 374 | |
| 375 | --MyBoundary-- |
| 376 | """) |
| 377 | env = { |
| 378 | "REQUEST_METHOD": "POST", |
| 379 | "CONTENT_TYPE": "multipart/form-data; boundary=MyBoundary", |
| 380 | "wsgi.input": fp, |
| 381 | } |
| 382 | fields = cgi.FieldStorage(fp, environ=env) |
| 383 | |
| 384 | self.assertEqual(len(fields["my-arg"].file.read()), 5) |
| 385 | |
Berker Peksag | bf5e960 | 2015-02-06 10:21:37 +0200 | [diff] [blame] | 386 | def test_fieldstorage_as_context_manager(self): |
| 387 | fp = BytesIO(b'x' * 10) |
| 388 | env = {'REQUEST_METHOD': 'PUT'} |
| 389 | with cgi.FieldStorage(fp=fp, environ=env) as fs: |
| 390 | content = fs.file.read() |
| 391 | self.assertFalse(fs.file.closed) |
| 392 | self.assertTrue(fs.file.closed) |
| 393 | self.assertEqual(content, 'x' * 10) |
| 394 | with self.assertRaisesRegex(ValueError, 'I/O operation on closed file'): |
| 395 | fs.file.read() |
| 396 | |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 397 | _qs_result = { |
| 398 | 'key1': 'value1', |
| 399 | 'key2': ['value2x', 'value2y'], |
| 400 | 'key3': 'value3', |
| 401 | 'key4': 'value4' |
| 402 | } |
| 403 | def testQSAndUrlEncode(self): |
| 404 | data = "key2=value2x&key3=value3&key4=value4" |
| 405 | environ = { |
| 406 | 'CONTENT_LENGTH': str(len(data)), |
| 407 | 'CONTENT_TYPE': 'application/x-www-form-urlencoded', |
| 408 | 'QUERY_STRING': 'key1=value1&key2=value2y', |
| 409 | 'REQUEST_METHOD': 'POST', |
| 410 | } |
| 411 | v = gen_result(data, environ) |
| 412 | self.assertEqual(self._qs_result, v) |
| 413 | |
matthewbelisle-wf | 2091448 | 2018-10-19 05:52:59 -0500 | [diff] [blame] | 414 | def test_max_num_fields(self): |
| 415 | # For application/x-www-form-urlencoded |
| 416 | data = '&'.join(['a=a']*11) |
| 417 | environ = { |
| 418 | 'CONTENT_LENGTH': str(len(data)), |
| 419 | 'CONTENT_TYPE': 'application/x-www-form-urlencoded', |
| 420 | 'REQUEST_METHOD': 'POST', |
| 421 | } |
| 422 | |
| 423 | with self.assertRaises(ValueError): |
| 424 | cgi.FieldStorage( |
| 425 | fp=BytesIO(data.encode()), |
| 426 | environ=environ, |
| 427 | max_num_fields=10, |
| 428 | ) |
| 429 | |
| 430 | # For multipart/form-data |
| 431 | data = """---123 |
| 432 | Content-Disposition: form-data; name="a" |
| 433 | |
matthewbelisle-wf | b79b5c0 | 2018-10-23 03:14:35 -0500 | [diff] [blame] | 434 | 3 |
matthewbelisle-wf | 2091448 | 2018-10-19 05:52:59 -0500 | [diff] [blame] | 435 | ---123 |
| 436 | Content-Type: application/x-www-form-urlencoded |
| 437 | |
matthewbelisle-wf | b79b5c0 | 2018-10-23 03:14:35 -0500 | [diff] [blame] | 438 | a=4 |
| 439 | ---123 |
| 440 | Content-Type: application/x-www-form-urlencoded |
| 441 | |
| 442 | a=5 |
matthewbelisle-wf | 2091448 | 2018-10-19 05:52:59 -0500 | [diff] [blame] | 443 | ---123-- |
| 444 | """ |
| 445 | environ = { |
| 446 | 'CONTENT_LENGTH': str(len(data)), |
| 447 | 'CONTENT_TYPE': 'multipart/form-data; boundary=-123', |
matthewbelisle-wf | b79b5c0 | 2018-10-23 03:14:35 -0500 | [diff] [blame] | 448 | 'QUERY_STRING': 'a=1&a=2', |
matthewbelisle-wf | 2091448 | 2018-10-19 05:52:59 -0500 | [diff] [blame] | 449 | 'REQUEST_METHOD': 'POST', |
| 450 | } |
| 451 | |
| 452 | # 2 GET entities |
matthewbelisle-wf | b79b5c0 | 2018-10-23 03:14:35 -0500 | [diff] [blame] | 453 | # 1 top level POST entities |
| 454 | # 1 entity within the second POST entity |
| 455 | # 1 entity within the third POST entity |
matthewbelisle-wf | 2091448 | 2018-10-19 05:52:59 -0500 | [diff] [blame] | 456 | with self.assertRaises(ValueError): |
| 457 | cgi.FieldStorage( |
| 458 | fp=BytesIO(data.encode()), |
| 459 | environ=environ, |
matthewbelisle-wf | b79b5c0 | 2018-10-23 03:14:35 -0500 | [diff] [blame] | 460 | max_num_fields=4, |
matthewbelisle-wf | 2091448 | 2018-10-19 05:52:59 -0500 | [diff] [blame] | 461 | ) |
| 462 | cgi.FieldStorage( |
| 463 | fp=BytesIO(data.encode()), |
| 464 | environ=environ, |
matthewbelisle-wf | b79b5c0 | 2018-10-23 03:14:35 -0500 | [diff] [blame] | 465 | max_num_fields=5, |
matthewbelisle-wf | 2091448 | 2018-10-19 05:52:59 -0500 | [diff] [blame] | 466 | ) |
| 467 | |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 468 | def testQSAndFormData(self): |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 469 | data = """---123 |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 470 | Content-Disposition: form-data; name="key2" |
| 471 | |
| 472 | value2y |
| 473 | ---123 |
| 474 | Content-Disposition: form-data; name="key3" |
| 475 | |
| 476 | value3 |
| 477 | ---123 |
| 478 | Content-Disposition: form-data; name="key4" |
| 479 | |
| 480 | value4 |
| 481 | ---123-- |
| 482 | """ |
| 483 | environ = { |
| 484 | 'CONTENT_LENGTH': str(len(data)), |
| 485 | 'CONTENT_TYPE': 'multipart/form-data; boundary=-123', |
| 486 | 'QUERY_STRING': 'key1=value1&key2=value2x', |
| 487 | 'REQUEST_METHOD': 'POST', |
| 488 | } |
| 489 | v = gen_result(data, environ) |
| 490 | self.assertEqual(self._qs_result, v) |
| 491 | |
| 492 | def testQSAndFormDataFile(self): |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 493 | data = """---123 |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 494 | Content-Disposition: form-data; name="key2" |
| 495 | |
| 496 | value2y |
| 497 | ---123 |
| 498 | Content-Disposition: form-data; name="key3" |
| 499 | |
| 500 | value3 |
| 501 | ---123 |
| 502 | Content-Disposition: form-data; name="key4" |
| 503 | |
| 504 | value4 |
| 505 | ---123 |
| 506 | Content-Disposition: form-data; name="upload"; filename="fake.txt" |
| 507 | Content-Type: text/plain |
| 508 | |
| 509 | this is the content of the fake file |
| 510 | |
| 511 | ---123-- |
| 512 | """ |
| 513 | environ = { |
| 514 | 'CONTENT_LENGTH': str(len(data)), |
| 515 | 'CONTENT_TYPE': 'multipart/form-data; boundary=-123', |
| 516 | 'QUERY_STRING': 'key1=value1&key2=value2x', |
| 517 | 'REQUEST_METHOD': 'POST', |
| 518 | } |
| 519 | result = self._qs_result.copy() |
| 520 | result.update({ |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 521 | 'upload': b'this is the content of the fake file\n' |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 522 | }) |
| 523 | v = gen_result(data, environ) |
| 524 | self.assertEqual(result, v) |
| 525 | |
Fred Drake | 9a0a65b | 2008-12-04 19:24:50 +0000 | [diff] [blame] | 526 | def test_parse_header(self): |
| 527 | self.assertEqual( |
| 528 | cgi.parse_header("text/plain"), |
| 529 | ("text/plain", {})) |
| 530 | self.assertEqual( |
| 531 | cgi.parse_header("text/vnd.just.made.this.up ; "), |
| 532 | ("text/vnd.just.made.this.up", {})) |
| 533 | self.assertEqual( |
| 534 | cgi.parse_header("text/plain;charset=us-ascii"), |
| 535 | ("text/plain", {"charset": "us-ascii"})) |
| 536 | self.assertEqual( |
| 537 | cgi.parse_header('text/plain ; charset="us-ascii"'), |
| 538 | ("text/plain", {"charset": "us-ascii"})) |
| 539 | self.assertEqual( |
| 540 | cgi.parse_header('text/plain ; charset="us-ascii"; another=opt'), |
| 541 | ("text/plain", {"charset": "us-ascii", "another": "opt"})) |
| 542 | self.assertEqual( |
| 543 | cgi.parse_header('attachment; filename="silly.txt"'), |
| 544 | ("attachment", {"filename": "silly.txt"})) |
| 545 | self.assertEqual( |
| 546 | cgi.parse_header('attachment; filename="strange;name"'), |
| 547 | ("attachment", {"filename": "strange;name"})) |
| 548 | self.assertEqual( |
| 549 | cgi.parse_header('attachment; filename="strange;name";size=123;'), |
| 550 | ("attachment", {"filename": "strange;name", "size": "123"})) |
Senthil Kumaran | 1ef0c03 | 2011-10-20 01:05:44 +0800 | [diff] [blame] | 551 | self.assertEqual( |
| 552 | cgi.parse_header('form-data; name="files"; filename="fo\\"o;bar"'), |
| 553 | ("form-data", {"name": "files", "filename": 'fo"o;bar'})) |
| 554 | |
Martin Panter | 1cd2772 | 2016-06-06 01:53:28 +0000 | [diff] [blame] | 555 | def test_all(self): |
Victor Stinner | fbf43f0 | 2020-08-17 07:20:40 +0200 | [diff] [blame^] | 556 | not_exported = { |
| 557 | "logfile", "logfp", "initlog", "dolog", "nolog", "closelog", "log", |
| 558 | "maxlen", "valid_boundary"} |
| 559 | support.check__all__(self, cgi, not_exported=not_exported) |
Martin Panter | 1cd2772 | 2016-06-06 01:53:28 +0000 | [diff] [blame] | 560 | |
Fred Drake | 9a0a65b | 2008-12-04 19:24:50 +0000 | [diff] [blame] | 561 | |
Victor Stinner | f0e293c | 2011-03-01 23:09:57 +0000 | [diff] [blame] | 562 | BOUNDARY = "---------------------------721837373350705526688164684" |
| 563 | |
| 564 | POSTDATA = """-----------------------------721837373350705526688164684 |
| 565 | Content-Disposition: form-data; name="id" |
| 566 | |
| 567 | 1234 |
| 568 | -----------------------------721837373350705526688164684 |
| 569 | Content-Disposition: form-data; name="title" |
| 570 | |
| 571 | |
| 572 | -----------------------------721837373350705526688164684 |
| 573 | Content-Disposition: form-data; name="file"; filename="test.txt" |
| 574 | Content-Type: text/plain |
| 575 | |
| 576 | Testing 123. |
| 577 | |
| 578 | -----------------------------721837373350705526688164684 |
| 579 | Content-Disposition: form-data; name="submit" |
| 580 | |
| 581 | Add\x20 |
| 582 | -----------------------------721837373350705526688164684-- |
| 583 | """ |
| 584 | |
| 585 | POSTDATA_NON_ASCII = """-----------------------------721837373350705526688164684 |
| 586 | Content-Disposition: form-data; name="id" |
| 587 | |
| 588 | \xe7\xf1\x80 |
| 589 | -----------------------------721837373350705526688164684 |
| 590 | """ |
| 591 | |
Florent Xicluna | 331c3fd | 2013-07-07 12:44:28 +0200 | [diff] [blame] | 592 | # http://www.w3.org/TR/html401/interact/forms.html#h-17.13.4 |
| 593 | BOUNDARY_W3 = "AaB03x" |
| 594 | POSTDATA_W3 = """--AaB03x |
| 595 | Content-Disposition: form-data; name="submit-name" |
| 596 | |
| 597 | Larry |
| 598 | --AaB03x |
| 599 | Content-Disposition: form-data; name="files" |
| 600 | Content-Type: multipart/mixed; boundary=BbC04y |
| 601 | |
| 602 | --BbC04y |
| 603 | Content-Disposition: file; filename="file1.txt" |
| 604 | Content-Type: text/plain |
| 605 | |
| 606 | ... contents of file1.txt ... |
| 607 | --BbC04y |
| 608 | Content-Disposition: file; filename="file2.gif" |
| 609 | Content-Type: image/gif |
| 610 | Content-Transfer-Encoding: binary |
| 611 | |
| 612 | ...contents of file2.gif... |
| 613 | --BbC04y-- |
| 614 | --AaB03x-- |
| 615 | """ |
| 616 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 617 | if __name__ == '__main__': |
Berker Peksag | bf5e960 | 2015-02-06 10:21:37 +0200 | [diff] [blame] | 618 | unittest.main() |