Berker Peksag | bf5e960 | 2015-02-06 10:21:37 +0200 | [diff] [blame] | 1 | from test.support import check_warnings |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 2 | import cgi |
| 3 | import os |
| 4 | import sys |
Thomas Wouters | 00ee7ba | 2006-08-21 19:07:27 +0000 | [diff] [blame] | 5 | import tempfile |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 6 | import unittest |
Brett Cannon | 8f79dd5 | 2012-04-25 20:49:19 -0400 | [diff] [blame] | 7 | import warnings |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 8 | from collections import namedtuple |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 9 | from io import StringIO, BytesIO |
Martin Panter | 1cd2772 | 2016-06-06 01:53:28 +0000 | [diff] [blame] | 10 | from test import support |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 11 | |
| 12 | class HackedSysModule: |
| 13 | # The regression test will have real values in sys.argv, which |
Fred Drake | 004d5e6 | 2000-10-23 17:22:08 +0000 | [diff] [blame] | 14 | # will completely confuse the test of the cgi module |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 15 | argv = [] |
| 16 | stdin = sys.stdin |
| 17 | |
| 18 | cgi.sys = HackedSysModule() |
| 19 | |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 20 | class ComparableException: |
| 21 | def __init__(self, err): |
| 22 | self.err = err |
| 23 | |
| 24 | def __str__(self): |
| 25 | return str(self.err) |
| 26 | |
Guido van Rossum | 47b9ff6 | 2006-08-24 00:41:19 +0000 | [diff] [blame] | 27 | def __eq__(self, anExc): |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 28 | if not isinstance(anExc, Exception): |
Guido van Rossum | 47b9ff6 | 2006-08-24 00:41:19 +0000 | [diff] [blame] | 29 | return NotImplemented |
| 30 | return (self.err.__class__ == anExc.__class__ and |
| 31 | self.err.args == anExc.args) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 32 | |
| 33 | def __getattr__(self, attr): |
Guido van Rossum | 846d6db | 2001-01-17 15:08:37 +0000 | [diff] [blame] | 34 | return getattr(self.err, attr) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 35 | |
| 36 | def do_test(buf, method): |
| 37 | env = {} |
| 38 | if method == "GET": |
| 39 | fp = None |
| 40 | env['REQUEST_METHOD'] = 'GET' |
| 41 | env['QUERY_STRING'] = buf |
| 42 | elif method == "POST": |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 43 | fp = BytesIO(buf.encode('latin-1')) # FieldStorage expects bytes |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 44 | env['REQUEST_METHOD'] = 'POST' |
| 45 | env['CONTENT_TYPE'] = 'application/x-www-form-urlencoded' |
| 46 | env['CONTENT_LENGTH'] = str(len(buf)) |
| 47 | else: |
Collin Winter | 3add4d7 | 2007-08-29 23:37:32 +0000 | [diff] [blame] | 48 | raise ValueError("unknown method: %s" % method) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 49 | try: |
| 50 | return cgi.parse(fp, env, strict_parsing=1) |
Guido van Rossum | cd16bf6 | 2007-06-13 18:07:49 +0000 | [diff] [blame] | 51 | except Exception as err: |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 52 | return ComparableException(err) |
| 53 | |
Neil Schemenauer | 66edb62 | 2004-07-19 15:38:11 +0000 | [diff] [blame] | 54 | parse_strict_test_cases = [ |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 55 | ("", ValueError("bad query field: ''")), |
| 56 | ("&", ValueError("bad query field: ''")), |
| 57 | ("&&", ValueError("bad query field: ''")), |
Jeremy Hylton | afde7e2 | 2000-09-15 20:06:57 +0000 | [diff] [blame] | 58 | (";", ValueError("bad query field: ''")), |
| 59 | (";&;", ValueError("bad query field: ''")), |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 60 | # Should the next few really be valid? |
| 61 | ("=", {}), |
| 62 | ("=&=", {}), |
Jeremy Hylton | afde7e2 | 2000-09-15 20:06:57 +0000 | [diff] [blame] | 63 | ("=;=", {}), |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 64 | # This rest seem to make sense |
| 65 | ("=a", {'': ['a']}), |
| 66 | ("&=a", ValueError("bad query field: ''")), |
| 67 | ("=a&", ValueError("bad query field: ''")), |
| 68 | ("=&a", ValueError("bad query field: 'a'")), |
| 69 | ("b=a", {'b': ['a']}), |
| 70 | ("b+=a", {'b ': ['a']}), |
| 71 | ("a=b=a", {'a': ['b=a']}), |
| 72 | ("a=+b=a", {'a': [' b=a']}), |
| 73 | ("&b=a", ValueError("bad query field: ''")), |
| 74 | ("b&=a", ValueError("bad query field: 'b'")), |
| 75 | ("a=a+b&b=b+c", {'a': ['a b'], 'b': ['b c']}), |
| 76 | ("a=a+b&a=b+a", {'a': ['a b', 'b a']}), |
| 77 | ("x=1&y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}), |
Jeremy Hylton | afde7e2 | 2000-09-15 20:06:57 +0000 | [diff] [blame] | 78 | ("x=1;y=2.0&z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}), |
| 79 | ("x=1;y=2.0;z=2-3.%2b0", {'x': ['1'], 'y': ['2.0'], 'z': ['2-3.+0']}), |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 80 | ("Hbc5161168c542333633315dee1182227:key_store_seqid=400006&cuyer=r&view=bustomer&order_id=0bb2e248638833d48cb7fed300000f1b&expire=964546263&lobale=en-US&kid=130003.300038&ss=env", |
| 81 | {'Hbc5161168c542333633315dee1182227:key_store_seqid': ['400006'], |
| 82 | 'cuyer': ['r'], |
| 83 | 'expire': ['964546263'], |
| 84 | 'kid': ['130003.300038'], |
| 85 | 'lobale': ['en-US'], |
| 86 | 'order_id': ['0bb2e248638833d48cb7fed300000f1b'], |
| 87 | 'ss': ['env'], |
| 88 | 'view': ['bustomer'], |
| 89 | }), |
Fred Drake | 004d5e6 | 2000-10-23 17:22:08 +0000 | [diff] [blame] | 90 | |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 91 | ("group_id=5470&set=custom&_assigned_to=31392&_status=1&_category=100&SUBMIT=Browse", |
| 92 | {'SUBMIT': ['Browse'], |
| 93 | '_assigned_to': ['31392'], |
| 94 | '_category': ['100'], |
| 95 | '_status': ['1'], |
| 96 | 'group_id': ['5470'], |
| 97 | 'set': ['custom'], |
| 98 | }) |
| 99 | ] |
| 100 | |
Guido van Rossum | 47b9ff6 | 2006-08-24 00:41:19 +0000 | [diff] [blame] | 101 | def norm(seq): |
Guido van Rossum | cc2b016 | 2007-02-11 06:12:03 +0000 | [diff] [blame] | 102 | return sorted(seq, key=repr) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 103 | |
| 104 | def first_elts(list): |
Guido van Rossum | c1f779c | 2007-07-03 08:25:58 +0000 | [diff] [blame] | 105 | return [p[0] for p in list] |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 106 | |
| 107 | def first_second_elts(list): |
Guido van Rossum | c1f779c | 2007-07-03 08:25:58 +0000 | [diff] [blame] | 108 | return [(p[0], p[1][0]) for p in list] |
| 109 | |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 110 | def gen_result(data, environ): |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 111 | encoding = 'latin-1' |
| 112 | fake_stdin = BytesIO(data.encode(encoding)) |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 113 | fake_stdin.seek(0) |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 114 | form = cgi.FieldStorage(fp=fake_stdin, environ=environ, encoding=encoding) |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 115 | |
| 116 | result = {} |
| 117 | for k, v in dict(form).items(): |
Florent Xicluna | 8fbddf1 | 2010-03-17 20:29:51 +0000 | [diff] [blame] | 118 | result[k] = isinstance(v, list) and form.getlist(k) or v.value |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 119 | |
| 120 | return result |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 121 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 122 | class CgiTests(unittest.TestCase): |
Neil Schemenauer | 66edb62 | 2004-07-19 15:38:11 +0000 | [diff] [blame] | 123 | |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 124 | def test_parse_multipart(self): |
| 125 | fp = BytesIO(POSTDATA.encode('latin1')) |
| 126 | env = {'boundary': BOUNDARY.encode('latin1'), |
| 127 | 'CONTENT-LENGTH': '558'} |
| 128 | result = cgi.parse_multipart(fp, env) |
Pierre Quentel | cc3fa20 | 2017-05-08 14:08:34 +0200 | [diff] [blame] | 129 | expected = {'submit': [' Add '], 'id': ['1234'], |
| 130 | 'file': [b'Testing 123.\n'], 'title': ['']} |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 131 | self.assertEqual(result, expected) |
| 132 | |
Amber Brown | 545c955 | 2018-05-14 18:11:55 -0400 | [diff] [blame^] | 133 | def test_parse_multipart_invalid_encoding(self): |
| 134 | BOUNDARY = "JfISa01" |
| 135 | POSTDATA = """--JfISa01 |
| 136 | Content-Disposition: form-data; name="submit-name" |
| 137 | Content-Length: 3 |
| 138 | |
| 139 | \u2603 |
| 140 | --JfISa01""" |
| 141 | fp = BytesIO(POSTDATA.encode('utf8')) |
| 142 | env = {'boundary': BOUNDARY.encode('latin1'), |
| 143 | 'CONTENT-LENGTH': str(len(POSTDATA.encode('utf8')))} |
| 144 | result = cgi.parse_multipart(fp, env, encoding="ascii", |
| 145 | errors="surrogateescape") |
| 146 | expected = {'submit-name': ["\udce2\udc98\udc83"]} |
| 147 | self.assertEqual(result, expected) |
| 148 | self.assertEqual("\u2603".encode('utf8'), |
| 149 | result["submit-name"][0].encode('utf8', 'surrogateescape')) |
| 150 | |
Senthil Kumaran | 6b102f2 | 2013-01-23 02:50:15 -0800 | [diff] [blame] | 151 | def test_fieldstorage_properties(self): |
| 152 | fs = cgi.FieldStorage() |
| 153 | self.assertFalse(fs) |
| 154 | self.assertIn("FieldStorage", repr(fs)) |
| 155 | self.assertEqual(list(fs), list(fs.keys())) |
| 156 | fs.list.append(namedtuple('MockFieldStorage', 'name')('fieldvalue')) |
| 157 | self.assertTrue(fs) |
| 158 | |
Senthil Kumaran | b4cbb92 | 2014-01-11 22:20:16 -0800 | [diff] [blame] | 159 | def test_fieldstorage_invalid(self): |
| 160 | self.assertRaises(TypeError, cgi.FieldStorage, "not-a-file-obj", |
| 161 | environ={"REQUEST_METHOD":"PUT"}) |
| 162 | self.assertRaises(TypeError, cgi.FieldStorage, "foo", "bar") |
| 163 | fs = cgi.FieldStorage(headers={'content-type':'text/plain'}) |
| 164 | self.assertRaises(TypeError, bool, fs) |
| 165 | |
Senthil Kumaran | 47b5ddb | 2012-03-13 01:50:27 -0700 | [diff] [blame] | 166 | def test_escape(self): |
Brett Cannon | 8f79dd5 | 2012-04-25 20:49:19 -0400 | [diff] [blame] | 167 | # cgi.escape() is deprecated. |
| 168 | with warnings.catch_warnings(): |
R David Murray | 44b548d | 2016-09-08 13:59:53 -0400 | [diff] [blame] | 169 | warnings.filterwarnings('ignore', r'cgi\.escape', |
Brett Cannon | 8f79dd5 | 2012-04-25 20:49:19 -0400 | [diff] [blame] | 170 | DeprecationWarning) |
| 171 | self.assertEqual("test & string", cgi.escape("test & string")) |
| 172 | self.assertEqual("<test string>", cgi.escape("<test string>")) |
| 173 | self.assertEqual(""test string"", cgi.escape('"test string"', True)) |
Senthil Kumaran | 47b5ddb | 2012-03-13 01:50:27 -0700 | [diff] [blame] | 174 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 175 | def test_strict(self): |
| 176 | for orig, expect in parse_strict_test_cases: |
| 177 | # Test basic parsing |
| 178 | d = do_test(orig, "GET") |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 179 | self.assertEqual(d, expect, "Error parsing %s method GET" % repr(orig)) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 180 | d = do_test(orig, "POST") |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 181 | self.assertEqual(d, expect, "Error parsing %s method POST" % repr(orig)) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 182 | |
| 183 | env = {'QUERY_STRING': orig} |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 184 | fs = cgi.FieldStorage(environ=env) |
Florent Xicluna | 8fbddf1 | 2010-03-17 20:29:51 +0000 | [diff] [blame] | 185 | if isinstance(expect, dict): |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 186 | # test dict interface |
Georg Brandl | 49d1b4f | 2008-05-11 21:42:51 +0000 | [diff] [blame] | 187 | self.assertEqual(len(expect), len(fs)) |
Ezio Melotti | 263cbdf | 2010-11-29 02:02:10 +0000 | [diff] [blame] | 188 | self.assertCountEqual(expect.keys(), fs.keys()) |
Georg Brandl | 49d1b4f | 2008-05-11 21:42:51 +0000 | [diff] [blame] | 189 | ##self.assertEqual(norm(expect.values()), norm(fs.values())) |
| 190 | ##self.assertEqual(norm(expect.items()), norm(fs.items())) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 191 | self.assertEqual(fs.getvalue("nonexistent field", "default"), "default") |
| 192 | # test individual fields |
| 193 | for key in expect.keys(): |
| 194 | expect_val = expect[key] |
Benjamin Peterson | 577473f | 2010-01-19 00:09:57 +0000 | [diff] [blame] | 195 | self.assertIn(key, fs) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 196 | if len(expect_val) > 1: |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 197 | self.assertEqual(fs.getvalue(key), expect_val) |
| 198 | else: |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 199 | self.assertEqual(fs.getvalue(key), expect_val[0]) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 200 | |
| 201 | def test_log(self): |
| 202 | cgi.log("Testing") |
| 203 | |
| 204 | cgi.logfp = StringIO() |
| 205 | cgi.initlog("%s", "Testing initlog 1") |
| 206 | cgi.log("%s", "Testing log 2") |
| 207 | self.assertEqual(cgi.logfp.getvalue(), "Testing initlog 1\nTesting log 2\n") |
Serhiy Storchaka | 85c3033 | 2015-02-15 13:58:23 +0200 | [diff] [blame] | 208 | if os.path.exists(os.devnull): |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 209 | cgi.logfp = None |
Serhiy Storchaka | 85c3033 | 2015-02-15 13:58:23 +0200 | [diff] [blame] | 210 | cgi.logfile = os.devnull |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 211 | cgi.initlog("%s", "Testing log 3") |
Victor Stinner | d33344a | 2011-07-14 22:28:36 +0200 | [diff] [blame] | 212 | self.addCleanup(cgi.closelog) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 213 | cgi.log("Testing log 4") |
| 214 | |
| 215 | def test_fieldstorage_readline(self): |
| 216 | # FieldStorage uses readline, which has the capacity to read all |
| 217 | # contents of the input file into memory; we use readline's size argument |
| 218 | # to prevent that for files that do not contain any newlines in |
| 219 | # non-GET/HEAD requests |
| 220 | class TestReadlineFile: |
| 221 | def __init__(self, file): |
| 222 | self.file = file |
| 223 | self.numcalls = 0 |
| 224 | |
| 225 | def readline(self, size=None): |
| 226 | self.numcalls += 1 |
| 227 | if size: |
| 228 | return self.file.readline(size) |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 229 | else: |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 230 | return self.file.readline() |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 231 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 232 | def __getattr__(self, name): |
| 233 | file = self.__dict__['file'] |
| 234 | a = getattr(file, name) |
| 235 | if not isinstance(a, int): |
| 236 | setattr(self, name, a) |
| 237 | return a |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 238 | |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 239 | f = TestReadlineFile(tempfile.TemporaryFile("wb+")) |
Benjamin Peterson | 807a5a1 | 2010-10-30 22:59:37 +0000 | [diff] [blame] | 240 | self.addCleanup(f.close) |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 241 | f.write(b'x' * 256 * 1024) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 242 | f.seek(0) |
| 243 | env = {'REQUEST_METHOD':'PUT'} |
| 244 | fs = cgi.FieldStorage(fp=f, environ=env) |
Benjamin Peterson | 807a5a1 | 2010-10-30 22:59:37 +0000 | [diff] [blame] | 245 | self.addCleanup(fs.file.close) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 246 | # if we're not chunking properly, readline is only called twice |
| 247 | # (by read_binary); if we are chunking properly, it will be called 5 times |
| 248 | # as long as the chunksize is 1 << 16. |
Serhiy Storchaka | 25d8aea | 2014-02-08 14:50:08 +0200 | [diff] [blame] | 249 | self.assertGreater(f.numcalls, 2) |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 250 | f.close() |
Jeremy Hylton | d9827c4 | 2000-08-03 22:11:43 +0000 | [diff] [blame] | 251 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 252 | def test_fieldstorage_multipart(self): |
| 253 | #Test basic FieldStorage multipart parsing |
Victor Stinner | f0e293c | 2011-03-01 23:09:57 +0000 | [diff] [blame] | 254 | env = { |
| 255 | 'REQUEST_METHOD': 'POST', |
| 256 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 257 | 'CONTENT_LENGTH': '558'} |
| 258 | fp = BytesIO(POSTDATA.encode('latin-1')) |
| 259 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 260 | self.assertEqual(len(fs.list), 4) |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 261 | expect = [{'name':'id', 'filename':None, 'value':'1234'}, |
| 262 | {'name':'title', 'filename':None, 'value':''}, |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 263 | {'name':'file', 'filename':'test.txt', 'value':b'Testing 123.\n'}, |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 264 | {'name':'submit', 'filename':None, 'value':' Add '}] |
| 265 | for x in range(len(fs.list)): |
| 266 | for k, exp in expect[x].items(): |
| 267 | got = getattr(fs.list[x], k) |
Ezio Melotti | b3aedd4 | 2010-11-20 19:04:17 +0000 | [diff] [blame] | 268 | self.assertEqual(got, exp) |
Thomas Wouters | 00ee7ba | 2006-08-21 19:07:27 +0000 | [diff] [blame] | 269 | |
Donald Stufft | d90f8d1 | 2015-03-29 16:43:23 -0400 | [diff] [blame] | 270 | def test_fieldstorage_multipart_leading_whitespace(self): |
| 271 | env = { |
| 272 | 'REQUEST_METHOD': 'POST', |
| 273 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 274 | 'CONTENT_LENGTH': '560'} |
| 275 | # Add some leading whitespace to our post data that will cause the |
| 276 | # first line to not be the innerboundary. |
| 277 | fp = BytesIO(b"\r\n" + POSTDATA.encode('latin-1')) |
| 278 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
| 279 | self.assertEqual(len(fs.list), 4) |
| 280 | expect = [{'name':'id', 'filename':None, 'value':'1234'}, |
| 281 | {'name':'title', 'filename':None, 'value':''}, |
| 282 | {'name':'file', 'filename':'test.txt', 'value':b'Testing 123.\n'}, |
| 283 | {'name':'submit', 'filename':None, 'value':' Add '}] |
| 284 | for x in range(len(fs.list)): |
| 285 | for k, exp in expect[x].items(): |
| 286 | got = getattr(fs.list[x], k) |
| 287 | self.assertEqual(got, exp) |
| 288 | |
Victor Stinner | f0e293c | 2011-03-01 23:09:57 +0000 | [diff] [blame] | 289 | def test_fieldstorage_multipart_non_ascii(self): |
| 290 | #Test basic FieldStorage multipart parsing |
| 291 | env = {'REQUEST_METHOD':'POST', |
| 292 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 293 | 'CONTENT_LENGTH':'558'} |
| 294 | for encoding in ['iso-8859-1','utf-8']: |
| 295 | fp = BytesIO(POSTDATA_NON_ASCII.encode(encoding)) |
| 296 | fs = cgi.FieldStorage(fp, environ=env,encoding=encoding) |
| 297 | self.assertEqual(len(fs.list), 1) |
| 298 | expect = [{'name':'id', 'filename':None, 'value':'\xe7\xf1\x80'}] |
| 299 | for x in range(len(fs.list)): |
| 300 | for k, exp in expect[x].items(): |
| 301 | got = getattr(fs.list[x], k) |
| 302 | self.assertEqual(got, exp) |
| 303 | |
Serhiy Storchaka | c7bfe0e | 2013-06-17 16:34:41 +0300 | [diff] [blame] | 304 | def test_fieldstorage_multipart_maxline(self): |
| 305 | # Issue #18167 |
| 306 | maxline = 1 << 16 |
| 307 | self.maxDiff = None |
| 308 | def check(content): |
| 309 | data = """---123 |
| 310 | Content-Disposition: form-data; name="upload"; filename="fake.txt" |
| 311 | Content-Type: text/plain |
| 312 | |
| 313 | %s |
| 314 | ---123-- |
| 315 | """.replace('\n', '\r\n') % content |
| 316 | environ = { |
| 317 | 'CONTENT_LENGTH': str(len(data)), |
| 318 | 'CONTENT_TYPE': 'multipart/form-data; boundary=-123', |
| 319 | 'REQUEST_METHOD': 'POST', |
| 320 | } |
| 321 | self.assertEqual(gen_result(data, environ), |
| 322 | {'upload': content.encode('latin1')}) |
| 323 | check('x' * (maxline - 1)) |
| 324 | check('x' * (maxline - 1) + '\r') |
| 325 | check('x' * (maxline - 1) + '\r' + 'y' * (maxline - 1)) |
| 326 | |
Florent Xicluna | 331c3fd | 2013-07-07 12:44:28 +0200 | [diff] [blame] | 327 | def test_fieldstorage_multipart_w3c(self): |
| 328 | # Test basic FieldStorage multipart parsing (W3C sample) |
| 329 | env = { |
| 330 | 'REQUEST_METHOD': 'POST', |
| 331 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY_W3), |
| 332 | 'CONTENT_LENGTH': str(len(POSTDATA_W3))} |
| 333 | fp = BytesIO(POSTDATA_W3.encode('latin-1')) |
| 334 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
| 335 | self.assertEqual(len(fs.list), 2) |
| 336 | self.assertEqual(fs.list[0].name, 'submit-name') |
| 337 | self.assertEqual(fs.list[0].value, 'Larry') |
| 338 | self.assertEqual(fs.list[1].name, 'files') |
| 339 | files = fs.list[1].value |
| 340 | self.assertEqual(len(files), 2) |
| 341 | expect = [{'name': None, 'filename': 'file1.txt', 'value': b'... contents of file1.txt ...'}, |
| 342 | {'name': None, 'filename': 'file2.gif', 'value': b'...contents of file2.gif...'}] |
| 343 | for x in range(len(files)): |
| 344 | for k, exp in expect[x].items(): |
| 345 | got = getattr(files[x], k) |
| 346 | self.assertEqual(got, exp) |
| 347 | |
Victor Stinner | 6579459 | 2015-08-18 10:21:10 -0700 | [diff] [blame] | 348 | def test_fieldstorage_part_content_length(self): |
| 349 | BOUNDARY = "JfISa01" |
| 350 | POSTDATA = """--JfISa01 |
| 351 | Content-Disposition: form-data; name="submit-name" |
| 352 | Content-Length: 5 |
| 353 | |
| 354 | Larry |
| 355 | --JfISa01""" |
| 356 | env = { |
| 357 | 'REQUEST_METHOD': 'POST', |
| 358 | 'CONTENT_TYPE': 'multipart/form-data; boundary={}'.format(BOUNDARY), |
| 359 | 'CONTENT_LENGTH': str(len(POSTDATA))} |
| 360 | fp = BytesIO(POSTDATA.encode('latin-1')) |
| 361 | fs = cgi.FieldStorage(fp, environ=env, encoding="latin-1") |
| 362 | self.assertEqual(len(fs.list), 1) |
| 363 | self.assertEqual(fs.list[0].name, 'submit-name') |
| 364 | self.assertEqual(fs.list[0].value, 'Larry') |
| 365 | |
Berker Peksag | bf5e960 | 2015-02-06 10:21:37 +0200 | [diff] [blame] | 366 | def test_fieldstorage_as_context_manager(self): |
| 367 | fp = BytesIO(b'x' * 10) |
| 368 | env = {'REQUEST_METHOD': 'PUT'} |
| 369 | with cgi.FieldStorage(fp=fp, environ=env) as fs: |
| 370 | content = fs.file.read() |
| 371 | self.assertFalse(fs.file.closed) |
| 372 | self.assertTrue(fs.file.closed) |
| 373 | self.assertEqual(content, 'x' * 10) |
| 374 | with self.assertRaisesRegex(ValueError, 'I/O operation on closed file'): |
| 375 | fs.file.read() |
| 376 | |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 377 | _qs_result = { |
| 378 | 'key1': 'value1', |
| 379 | 'key2': ['value2x', 'value2y'], |
| 380 | 'key3': 'value3', |
| 381 | 'key4': 'value4' |
| 382 | } |
| 383 | def testQSAndUrlEncode(self): |
| 384 | data = "key2=value2x&key3=value3&key4=value4" |
| 385 | environ = { |
| 386 | 'CONTENT_LENGTH': str(len(data)), |
| 387 | 'CONTENT_TYPE': 'application/x-www-form-urlencoded', |
| 388 | 'QUERY_STRING': 'key1=value1&key2=value2y', |
| 389 | 'REQUEST_METHOD': 'POST', |
| 390 | } |
| 391 | v = gen_result(data, environ) |
| 392 | self.assertEqual(self._qs_result, v) |
| 393 | |
| 394 | def testQSAndFormData(self): |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 395 | data = """---123 |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 396 | Content-Disposition: form-data; name="key2" |
| 397 | |
| 398 | value2y |
| 399 | ---123 |
| 400 | Content-Disposition: form-data; name="key3" |
| 401 | |
| 402 | value3 |
| 403 | ---123 |
| 404 | Content-Disposition: form-data; name="key4" |
| 405 | |
| 406 | value4 |
| 407 | ---123-- |
| 408 | """ |
| 409 | environ = { |
| 410 | 'CONTENT_LENGTH': str(len(data)), |
| 411 | 'CONTENT_TYPE': 'multipart/form-data; boundary=-123', |
| 412 | 'QUERY_STRING': 'key1=value1&key2=value2x', |
| 413 | 'REQUEST_METHOD': 'POST', |
| 414 | } |
| 415 | v = gen_result(data, environ) |
| 416 | self.assertEqual(self._qs_result, v) |
| 417 | |
| 418 | def testQSAndFormDataFile(self): |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 419 | data = """---123 |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 420 | Content-Disposition: form-data; name="key2" |
| 421 | |
| 422 | value2y |
| 423 | ---123 |
| 424 | Content-Disposition: form-data; name="key3" |
| 425 | |
| 426 | value3 |
| 427 | ---123 |
| 428 | Content-Disposition: form-data; name="key4" |
| 429 | |
| 430 | value4 |
| 431 | ---123 |
| 432 | Content-Disposition: form-data; name="upload"; filename="fake.txt" |
| 433 | Content-Type: text/plain |
| 434 | |
| 435 | this is the content of the fake file |
| 436 | |
| 437 | ---123-- |
| 438 | """ |
| 439 | environ = { |
| 440 | 'CONTENT_LENGTH': str(len(data)), |
| 441 | 'CONTENT_TYPE': 'multipart/form-data; boundary=-123', |
| 442 | 'QUERY_STRING': 'key1=value1&key2=value2x', |
| 443 | 'REQUEST_METHOD': 'POST', |
| 444 | } |
| 445 | result = self._qs_result.copy() |
| 446 | result.update({ |
Victor Stinner | 5c23b8e | 2011-01-14 13:05:21 +0000 | [diff] [blame] | 447 | 'upload': b'this is the content of the fake file\n' |
Benjamin Peterson | dcf97b9 | 2008-07-02 17:30:14 +0000 | [diff] [blame] | 448 | }) |
| 449 | v = gen_result(data, environ) |
| 450 | self.assertEqual(result, v) |
| 451 | |
Facundo Batista | bd18fd6 | 2008-09-08 00:23:29 +0000 | [diff] [blame] | 452 | def test_deprecated_parse_qs(self): |
Florent Xicluna | 8fbddf1 | 2010-03-17 20:29:51 +0000 | [diff] [blame] | 453 | # this func is moved to urllib.parse, this is just a sanity check |
| 454 | with check_warnings(('cgi.parse_qs is deprecated, use urllib.parse.' |
| 455 | 'parse_qs instead', DeprecationWarning)): |
Facundo Batista | a27244b | 2008-09-09 02:43:19 +0000 | [diff] [blame] | 456 | self.assertEqual({'a': ['A1'], 'B': ['B3'], 'b': ['B2']}, |
| 457 | cgi.parse_qs('a=A1&b=B2&B=B3')) |
Facundo Batista | bd18fd6 | 2008-09-08 00:23:29 +0000 | [diff] [blame] | 458 | |
| 459 | def test_deprecated_parse_qsl(self): |
Florent Xicluna | 8fbddf1 | 2010-03-17 20:29:51 +0000 | [diff] [blame] | 460 | # this func is moved to urllib.parse, this is just a sanity check |
| 461 | with check_warnings(('cgi.parse_qsl is deprecated, use urllib.parse.' |
| 462 | 'parse_qsl instead', DeprecationWarning)): |
Facundo Batista | a27244b | 2008-09-09 02:43:19 +0000 | [diff] [blame] | 463 | self.assertEqual([('a', 'A1'), ('b', 'B2'), ('B', 'B3')], |
| 464 | cgi.parse_qsl('a=A1&b=B2&B=B3')) |
Facundo Batista | bd18fd6 | 2008-09-08 00:23:29 +0000 | [diff] [blame] | 465 | |
Fred Drake | 9a0a65b | 2008-12-04 19:24:50 +0000 | [diff] [blame] | 466 | def test_parse_header(self): |
| 467 | self.assertEqual( |
| 468 | cgi.parse_header("text/plain"), |
| 469 | ("text/plain", {})) |
| 470 | self.assertEqual( |
| 471 | cgi.parse_header("text/vnd.just.made.this.up ; "), |
| 472 | ("text/vnd.just.made.this.up", {})) |
| 473 | self.assertEqual( |
| 474 | cgi.parse_header("text/plain;charset=us-ascii"), |
| 475 | ("text/plain", {"charset": "us-ascii"})) |
| 476 | self.assertEqual( |
| 477 | cgi.parse_header('text/plain ; charset="us-ascii"'), |
| 478 | ("text/plain", {"charset": "us-ascii"})) |
| 479 | self.assertEqual( |
| 480 | cgi.parse_header('text/plain ; charset="us-ascii"; another=opt'), |
| 481 | ("text/plain", {"charset": "us-ascii", "another": "opt"})) |
| 482 | self.assertEqual( |
| 483 | cgi.parse_header('attachment; filename="silly.txt"'), |
| 484 | ("attachment", {"filename": "silly.txt"})) |
| 485 | self.assertEqual( |
| 486 | cgi.parse_header('attachment; filename="strange;name"'), |
| 487 | ("attachment", {"filename": "strange;name"})) |
| 488 | self.assertEqual( |
| 489 | cgi.parse_header('attachment; filename="strange;name";size=123;'), |
| 490 | ("attachment", {"filename": "strange;name", "size": "123"})) |
Senthil Kumaran | 1ef0c03 | 2011-10-20 01:05:44 +0800 | [diff] [blame] | 491 | self.assertEqual( |
| 492 | cgi.parse_header('form-data; name="files"; filename="fo\\"o;bar"'), |
| 493 | ("form-data", {"name": "files", "filename": 'fo"o;bar'})) |
| 494 | |
Martin Panter | 1cd2772 | 2016-06-06 01:53:28 +0000 | [diff] [blame] | 495 | def test_all(self): |
| 496 | blacklist = {"logfile", "logfp", "initlog", "dolog", "nolog", |
| 497 | "closelog", "log", "maxlen", "valid_boundary"} |
| 498 | support.check__all__(self, cgi, blacklist=blacklist) |
| 499 | |
Fred Drake | 9a0a65b | 2008-12-04 19:24:50 +0000 | [diff] [blame] | 500 | |
Victor Stinner | f0e293c | 2011-03-01 23:09:57 +0000 | [diff] [blame] | 501 | BOUNDARY = "---------------------------721837373350705526688164684" |
| 502 | |
| 503 | POSTDATA = """-----------------------------721837373350705526688164684 |
| 504 | Content-Disposition: form-data; name="id" |
| 505 | |
| 506 | 1234 |
| 507 | -----------------------------721837373350705526688164684 |
| 508 | Content-Disposition: form-data; name="title" |
| 509 | |
| 510 | |
| 511 | -----------------------------721837373350705526688164684 |
| 512 | Content-Disposition: form-data; name="file"; filename="test.txt" |
| 513 | Content-Type: text/plain |
| 514 | |
| 515 | Testing 123. |
| 516 | |
| 517 | -----------------------------721837373350705526688164684 |
| 518 | Content-Disposition: form-data; name="submit" |
| 519 | |
| 520 | Add\x20 |
| 521 | -----------------------------721837373350705526688164684-- |
| 522 | """ |
| 523 | |
| 524 | POSTDATA_NON_ASCII = """-----------------------------721837373350705526688164684 |
| 525 | Content-Disposition: form-data; name="id" |
| 526 | |
| 527 | \xe7\xf1\x80 |
| 528 | -----------------------------721837373350705526688164684 |
| 529 | """ |
| 530 | |
Florent Xicluna | 331c3fd | 2013-07-07 12:44:28 +0200 | [diff] [blame] | 531 | # http://www.w3.org/TR/html401/interact/forms.html#h-17.13.4 |
| 532 | BOUNDARY_W3 = "AaB03x" |
| 533 | POSTDATA_W3 = """--AaB03x |
| 534 | Content-Disposition: form-data; name="submit-name" |
| 535 | |
| 536 | Larry |
| 537 | --AaB03x |
| 538 | Content-Disposition: form-data; name="files" |
| 539 | Content-Type: multipart/mixed; boundary=BbC04y |
| 540 | |
| 541 | --BbC04y |
| 542 | Content-Disposition: file; filename="file1.txt" |
| 543 | Content-Type: text/plain |
| 544 | |
| 545 | ... contents of file1.txt ... |
| 546 | --BbC04y |
| 547 | Content-Disposition: file; filename="file2.gif" |
| 548 | Content-Type: image/gif |
| 549 | Content-Transfer-Encoding: binary |
| 550 | |
| 551 | ...contents of file2.gif... |
| 552 | --BbC04y-- |
| 553 | --AaB03x-- |
| 554 | """ |
| 555 | |
Thomas Wouters | 89f507f | 2006-12-13 04:49:30 +0000 | [diff] [blame] | 556 | if __name__ == '__main__': |
Berker Peksag | bf5e960 | 2015-02-06 10:21:37 +0200 | [diff] [blame] | 557 | unittest.main() |