eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 1 | #----------------------------------------------------------------- |
| 2 | # pycparser: cdecl.py |
| 3 | # |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 4 | # Example of the CDECL tool using pycparser. CDECL "explains" C type |
| 5 | # declarations in plain English. |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 6 | # |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 7 | # The AST generated by pycparser from the given declaration is traversed |
| 8 | # recursively to build the explanation. Note that the declaration must be a |
| 9 | # valid external declaration in C. All the types used in it must be defined with |
| 10 | # typedef, or parsing will fail. The definition can be arbitrary - pycparser |
| 11 | # doesn't really care what the type is defined to be, only that it's a type. |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 12 | # |
| 13 | # For example: |
| 14 | # |
Hart Chu | b23e267 | 2017-02-26 21:56:44 +0800 | [diff] [blame^] | 15 | # c_decl = 'typedef int Node; const Node* (*ar)[10];' |
| 16 | # |
| 17 | # explain_c_declaration(c_decl) |
| 18 | # => ar is a pointer to array[10] of pointer to const Node |
| 19 | # |
| 20 | # struct and typedef are expanded when according arguments are set: |
| 21 | # |
| 22 | # explain_c_declaration(c_decl, expand_typedef=True) |
| 23 | # => ar is a pointer to array[10] of pointer to const int |
| 24 | # |
| 25 | # c_decl = 'struct P {int x; int y;} p;' |
| 26 | # |
| 27 | # explain_c_declaration(c_decl) |
| 28 | # => p is a struct P |
| 29 | # |
| 30 | # explain_c_declaration(c_decl, expand_struct=True) |
| 31 | # => p is a struct P containing {x is a int, y is a int} |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 32 | # |
Eli Bendersky | 6d45ff7 | 2017-02-02 05:59:50 -0800 | [diff] [blame] | 33 | # Eli Bendersky [http://eli.thegreenplace.net] |
eli.bendersky | 84a6a63 | 2011-04-29 09:00:43 +0300 | [diff] [blame] | 34 | # License: BSD |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 35 | #----------------------------------------------------------------- |
Hart Chu | b23e267 | 2017-02-26 21:56:44 +0800 | [diff] [blame^] | 36 | import copy |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 37 | import sys |
| 38 | |
| 39 | # This is not required if you've installed pycparser into |
| 40 | # your site-packages/ with setup.py |
| 41 | # |
Ben | f86dea1 | 2012-02-03 06:24:55 +0200 | [diff] [blame] | 42 | sys.path.extend(['.', '..']) |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 43 | |
| 44 | from pycparser import c_parser, c_ast |
| 45 | |
| 46 | |
Hart Chu | b23e267 | 2017-02-26 21:56:44 +0800 | [diff] [blame^] | 47 | def explain_c_declaration(c_decl, expand_struct=False, expand_typedef=False): |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 48 | """ Parses the declaration in c_decl and returns a text |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 49 | explanation as a string. |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 50 | |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 51 | The last external node of the string is used, to allow |
Eli Bendersky | 3921e8e | 2010-05-21 09:05:39 +0300 | [diff] [blame] | 52 | earlier typedefs for used types. |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 53 | """ |
| 54 | parser = c_parser.CParser() |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 55 | |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 56 | try: |
| 57 | node = parser.parse(c_decl, filename='<stdin>') |
| 58 | except c_parser.ParseError: |
| 59 | e = sys.exc_info()[1] |
| 60 | return "Parse error:" + str(e) |
| 61 | |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 62 | if (not isinstance(node, c_ast.FileAST) or |
| 63 | not isinstance(node.ext[-1], c_ast.Decl) |
| 64 | ): |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 65 | return "Not a valid declaration" |
| 66 | |
Hart Chu | b23e267 | 2017-02-26 21:56:44 +0800 | [diff] [blame^] | 67 | try: |
| 68 | expanded = expand_struct_typedef(node.ext[-1], node, |
| 69 | expand_struct=expand_struct, |
| 70 | expand_typedef=expand_typedef) |
| 71 | except Exception as e: |
| 72 | return "Not a valid declaration: " + str(e) |
| 73 | |
| 74 | return _explain_decl_node(expanded) |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 75 | |
| 76 | |
Eli Bendersky | 3921e8e | 2010-05-21 09:05:39 +0300 | [diff] [blame] | 77 | def _explain_decl_node(decl_node): |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 78 | """ Receives a c_ast.Decl note and returns its explanation in |
Eli Bendersky | 3921e8e | 2010-05-21 09:05:39 +0300 | [diff] [blame] | 79 | English. |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 80 | """ |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 81 | storage = ' '.join(decl_node.storage) + ' ' if decl_node.storage else '' |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 82 | |
| 83 | return (decl_node.name + |
| 84 | " is a " + |
| 85 | storage + |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 86 | _explain_type(decl_node.type)) |
| 87 | |
| 88 | |
Eli Bendersky | 3921e8e | 2010-05-21 09:05:39 +0300 | [diff] [blame] | 89 | def _explain_type(decl): |
| 90 | """ Recursively explains a type decl node |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 91 | """ |
| 92 | typ = type(decl) |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 93 | |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 94 | if typ == c_ast.TypeDecl: |
| 95 | quals = ' '.join(decl.quals) + ' ' if decl.quals else '' |
| 96 | return quals + _explain_type(decl.type) |
| 97 | elif typ == c_ast.Typename or typ == c_ast.Decl: |
| 98 | return _explain_type(decl.type) |
| 99 | elif typ == c_ast.IdentifierType: |
| 100 | return ' '.join(decl.names) |
| 101 | elif typ == c_ast.PtrDecl: |
| 102 | quals = ' '.join(decl.quals) + ' ' if decl.quals else '' |
| 103 | return quals + 'pointer to ' + _explain_type(decl.type) |
| 104 | elif typ == c_ast.ArrayDecl: |
| 105 | arr = 'array' |
| 106 | if decl.dim: arr += '[%s]' % decl.dim.value |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 107 | |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 108 | return arr + " of " + _explain_type(decl.type) |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 109 | |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 110 | elif typ == c_ast.FuncDecl: |
| 111 | if decl.args: |
| 112 | params = [_explain_type(param) for param in decl.args.params] |
| 113 | args = ', '.join(params) |
| 114 | else: |
| 115 | args = '' |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 116 | |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 117 | return ('function(%s) returning ' % (args) + |
| 118 | _explain_type(decl.type)) |
| 119 | |
Hart Chu | b23e267 | 2017-02-26 21:56:44 +0800 | [diff] [blame^] | 120 | elif typ == c_ast.Struct: |
| 121 | decls = [_explain_decl_node(mem_decl) for mem_decl in decl.decls] |
| 122 | members = ', '.join(decls) |
| 123 | |
| 124 | return ('struct%s ' % (' ' + decl.name if decl.name else '') + |
| 125 | ('containing {%s}' % members if members else '')) |
| 126 | |
| 127 | |
| 128 | def expand_struct_typedef(cdecl, file_ast, expand_struct=False, expand_typedef=False): |
| 129 | """Expand struct & typedef in context of file_ast and return a new expanded node""" |
| 130 | decl_copy = copy.deepcopy(cdecl) |
| 131 | _expand_in_place(decl_copy, file_ast, expand_struct, expand_typedef) |
| 132 | return decl_copy |
| 133 | |
| 134 | |
| 135 | def _expand_in_place(decl, file_ast, expand_struct=False, expand_typedef=False): |
| 136 | """Recursively expand struct & typedef in place, throw Exception if |
| 137 | undeclared struct or typedef are used |
| 138 | """ |
| 139 | typ = type(decl) |
| 140 | |
| 141 | if typ in (c_ast.Decl, c_ast.TypeDecl, c_ast.PtrDecl, c_ast.ArrayDecl): |
| 142 | decl.type = _expand_in_place(decl.type, file_ast, expand_struct, expand_typedef) |
| 143 | |
| 144 | elif typ == c_ast.Struct: |
| 145 | if not decl.decls: |
| 146 | struct = _find_struct(decl.name, file_ast) |
| 147 | if not struct: |
| 148 | raise Exception('using undeclared struct %s' % decl.name) |
| 149 | decl.decls = struct.decls |
| 150 | |
| 151 | for i, mem_decl in enumerate(decl.decls): |
| 152 | decl.decls[i] = _expand_in_place(mem_decl, file_ast, expand_struct, expand_typedef) |
| 153 | |
| 154 | if not expand_struct: |
| 155 | decl.decls = [] |
| 156 | |
| 157 | elif (typ == c_ast.IdentifierType and |
| 158 | decl.names[0] not in ('int', 'char')): |
| 159 | typedef = _find_typedef(decl.names[0], file_ast) |
| 160 | if not typedef: |
| 161 | raise Exception('using undeclared type %s' % decl.names[0]) |
| 162 | |
| 163 | if expand_typedef: |
| 164 | return typedef.type |
| 165 | |
| 166 | return decl |
| 167 | |
| 168 | |
| 169 | def _find_struct(name, file_ast): |
| 170 | """Receives a struct name and return declared struct object in file_ast |
| 171 | """ |
| 172 | for node in file_ast.ext: |
| 173 | if (type(node) == c_ast.Decl and |
| 174 | type(node.type) == c_ast.Struct and |
| 175 | node.type.name == name): |
| 176 | return node.type |
| 177 | |
| 178 | |
| 179 | def _find_typedef(name, file_ast): |
| 180 | """Receives a type name and return typedef object in file_ast |
| 181 | """ |
| 182 | for node in file_ast.ext: |
| 183 | if type(node) == c_ast.Typedef and node.name == name: |
| 184 | return node |
| 185 | |
eli.bendersky | fe5c2bb | 2010-12-04 17:38:11 +0200 | [diff] [blame] | 186 | |
| 187 | if __name__ == "__main__": |
| 188 | if len(sys.argv) > 1: |
| 189 | c_decl = sys.argv[1] |
| 190 | else: |
| 191 | c_decl = "char *(*(**foo[][8])())[];" |
| 192 | |
| 193 | print("Explaining the declaration: " + c_decl + "\n") |
Eli Bendersky | 27797e8 | 2013-09-25 06:30:17 -0700 | [diff] [blame] | 194 | print(explain_c_declaration(c_decl) + "\n") |