blob: 86426cde1a72c065f8dffcc8033747ca103e2515 [file] [log] [blame]
Benjamin Petersonc6b607d2009-05-02 12:36:44 +00001"""JSON token scanner
Christian Heimes90540002008-05-08 14:29:10 +00002"""
Christian Heimes90540002008-05-08 14:29:10 +00003import re
Benjamin Petersonc6b607d2009-05-02 12:36:44 +00004try:
5 from _json import make_scanner as c_make_scanner
6except ImportError:
7 c_make_scanner = None
Christian Heimes90540002008-05-08 14:29:10 +00008
Benjamin Petersonc6b607d2009-05-02 12:36:44 +00009__all__ = ['make_scanner']
Christian Heimes90540002008-05-08 14:29:10 +000010
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000011NUMBER_RE = re.compile(
12 r'(-?(?:0|[1-9]\d*))(\.\d+)?([eE][-+]?\d+)?',
13 (re.VERBOSE | re.MULTILINE | re.DOTALL))
Christian Heimes90540002008-05-08 14:29:10 +000014
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000015def py_make_scanner(context):
16 parse_object = context.parse_object
17 parse_array = context.parse_array
18 parse_string = context.parse_string
19 match_number = NUMBER_RE.match
20 strict = context.strict
21 parse_float = context.parse_float
22 parse_int = context.parse_int
23 parse_constant = context.parse_constant
24 object_hook = context.object_hook
Antoine Pitrou7d6e0762010-09-04 20:16:53 +000025 object_pairs_hook = context.object_pairs_hook
26 memo = context.memo
Christian Heimes90540002008-05-08 14:29:10 +000027
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000028 def _scan_once(string, idx):
29 try:
30 nextchar = string[idx]
31 except IndexError:
Ezio Melotti37623ab2013-01-03 08:44:15 +020032 raise StopIteration(idx)
Christian Heimes90540002008-05-08 14:29:10 +000033
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000034 if nextchar == '"':
35 return parse_string(string, idx + 1, strict)
36 elif nextchar == '{':
37 return parse_object((string, idx + 1), strict,
Antoine Pitrou7d6e0762010-09-04 20:16:53 +000038 _scan_once, object_hook, object_pairs_hook, memo)
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000039 elif nextchar == '[':
40 return parse_array((string, idx + 1), _scan_once)
41 elif nextchar == 'n' and string[idx:idx + 4] == 'null':
42 return None, idx + 4
43 elif nextchar == 't' and string[idx:idx + 4] == 'true':
44 return True, idx + 4
45 elif nextchar == 'f' and string[idx:idx + 5] == 'false':
46 return False, idx + 5
Christian Heimes90540002008-05-08 14:29:10 +000047
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000048 m = match_number(string, idx)
49 if m is not None:
50 integer, frac, exp = m.groups()
51 if frac or exp:
52 res = parse_float(integer + (frac or '') + (exp or ''))
53 else:
54 res = parse_int(integer)
55 return res, m.end()
56 elif nextchar == 'N' and string[idx:idx + 3] == 'NaN':
57 return parse_constant('NaN'), idx + 3
58 elif nextchar == 'I' and string[idx:idx + 8] == 'Infinity':
59 return parse_constant('Infinity'), idx + 8
60 elif nextchar == '-' and string[idx:idx + 9] == '-Infinity':
61 return parse_constant('-Infinity'), idx + 9
62 else:
Ezio Melotti37623ab2013-01-03 08:44:15 +020063 raise StopIteration(idx)
Christian Heimes90540002008-05-08 14:29:10 +000064
Antoine Pitrou7d6e0762010-09-04 20:16:53 +000065 def scan_once(string, idx):
66 try:
67 return _scan_once(string, idx)
68 finally:
69 memo.clear()
70
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000071 return _scan_once
Christian Heimes90540002008-05-08 14:29:10 +000072
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000073make_scanner = c_make_scanner or py_make_scanner