blob: b4f356146fed58f9513bf23e1f786f0511bbac6c [file] [log] [blame]
Benjamin Petersonc6b607d2009-05-02 12:36:44 +00001"""JSON token scanner
Christian Heimes90540002008-05-08 14:29:10 +00002"""
Christian Heimes90540002008-05-08 14:29:10 +00003import re
Benjamin Petersonc6b607d2009-05-02 12:36:44 +00004try:
5 from _json import make_scanner as c_make_scanner
6except ImportError:
7 c_make_scanner = None
Christian Heimes90540002008-05-08 14:29:10 +00008
Benjamin Petersonc6b607d2009-05-02 12:36:44 +00009__all__ = ['make_scanner']
Christian Heimes90540002008-05-08 14:29:10 +000010
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000011NUMBER_RE = re.compile(
12 r'(-?(?:0|[1-9]\d*))(\.\d+)?([eE][-+]?\d+)?',
13 (re.VERBOSE | re.MULTILINE | re.DOTALL))
Christian Heimes90540002008-05-08 14:29:10 +000014
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000015def py_make_scanner(context):
16 parse_object = context.parse_object
17 parse_array = context.parse_array
18 parse_string = context.parse_string
19 match_number = NUMBER_RE.match
20 strict = context.strict
21 parse_float = context.parse_float
22 parse_int = context.parse_int
23 parse_constant = context.parse_constant
24 object_hook = context.object_hook
Christian Heimes90540002008-05-08 14:29:10 +000025
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000026 def _scan_once(string, idx):
27 try:
28 nextchar = string[idx]
29 except IndexError:
30 raise StopIteration
Christian Heimes90540002008-05-08 14:29:10 +000031
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000032 if nextchar == '"':
33 return parse_string(string, idx + 1, strict)
34 elif nextchar == '{':
35 return parse_object((string, idx + 1), strict,
36 _scan_once, object_hook, object_pairs_hook)
37 elif nextchar == '[':
38 return parse_array((string, idx + 1), _scan_once)
39 elif nextchar == 'n' and string[idx:idx + 4] == 'null':
40 return None, idx + 4
41 elif nextchar == 't' and string[idx:idx + 4] == 'true':
42 return True, idx + 4
43 elif nextchar == 'f' and string[idx:idx + 5] == 'false':
44 return False, idx + 5
Christian Heimes90540002008-05-08 14:29:10 +000045
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000046 m = match_number(string, idx)
47 if m is not None:
48 integer, frac, exp = m.groups()
49 if frac or exp:
50 res = parse_float(integer + (frac or '') + (exp or ''))
51 else:
52 res = parse_int(integer)
53 return res, m.end()
54 elif nextchar == 'N' and string[idx:idx + 3] == 'NaN':
55 return parse_constant('NaN'), idx + 3
56 elif nextchar == 'I' and string[idx:idx + 8] == 'Infinity':
57 return parse_constant('Infinity'), idx + 8
58 elif nextchar == '-' and string[idx:idx + 9] == '-Infinity':
59 return parse_constant('-Infinity'), idx + 9
60 else:
61 raise StopIteration
Christian Heimes90540002008-05-08 14:29:10 +000062
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000063 return _scan_once
Christian Heimes90540002008-05-08 14:29:10 +000064
Benjamin Petersonc6b607d2009-05-02 12:36:44 +000065make_scanner = c_make_scanner or py_make_scanner