blob: a3abe858d10cc3da171ed00df7e25b85f56d844b [file] [log] [blame]
Nguyen Anh Quynhac6d1da2013-12-02 17:44:48 +08001# Capstone Disassembler Engine
2# By Dang Hoang Vu, 2013
fenuks110ab1d2014-04-11 11:00:33 +02003from __future__ import print_function
danghvu8054c9e2013-12-01 13:24:11 -06004import sys, re
5
# Directory holding the Capstone C headers, relative to where the script runs.
INCL_DIR = '../include/capstone/'

# Header files to scan; each one produces one constants file per binding.
include = ['arm.h', 'arm64.h', 'mips.h', 'x86.h', 'ppc.h', 'sparc.h', 'systemz.h', 'xcore.h']

# Prefixes for constant filenames of all archs - case sensitive.
# The Java binding uses these spellings as-is; the Python and OCaml bindings
# use the same names in lower case.
_ARCH_CLASS_NAMES = {
    'arm.h': 'Arm',
    'arm64.h': 'Arm64',
    'mips.h': 'Mips',
    'x86.h': 'X86',
    'ppc.h': 'Ppc',
    'sparc.h': 'Sparc',
    'systemz.h': 'Sysz',
    'xcore.h': 'Xcore',
}
_ARCH_MODULE_NAMES = {
    header: name.lower() for header, name in _ARCH_CLASS_NAMES.items()
}


def _binding(header, footer, line_format, out_file,
             comment_open, comment_close, prefixes):
    """Assemble the settings table for one language binding.

    The returned dict holds the formatting entries plus one
    ``'<arch>.h' -> prefix`` entry for every item of *prefixes*.
    """
    settings = {
        'header': header,
        'footer': footer,
        'line_format': line_format,
        'out_file': out_file,
        'comment_open': comment_open,
        'comment_close': comment_close,
    }
    settings.update(prefixes)
    return settings


# Per-language output settings, keyed by the binding name given on the
# command line.
template = {
    'java': _binding(
        header="// For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT\npackage capstone;\n\npublic class %s_const {\n",
        footer="}",
        line_format='\tpublic static final int %s = %s;\n',
        out_file='./java/capstone/%s_const.java',
        comment_open='\t//',
        comment_close='',
        prefixes=_ARCH_CLASS_NAMES,
    ),
    'python': _binding(
        header="# For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.py]\n",
        footer="",
        line_format='%s = %s\n',
        out_file='./python/capstone/%s_const.py',
        comment_open='#',
        comment_close='',
        prefixes=_ARCH_MODULE_NAMES,
    ),
    'ocaml': _binding(
        header="(* For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.ml] *)\n",
        footer="",
        line_format='let _%s = %s;;\n',
        out_file='./ocaml/%s_const.ml',
        comment_open='(*',
        comment_close=' *)',
        prefixes=_ARCH_MODULE_NAMES,
    ),
}

# markup for comments to be added to autogen files
MARKUP = '//>'
66
def _define_to_assignment(line):
    """Rewrite a stripped ``#define NAME VALUE`` line as ``NAME = VALUE``.

    Returns None when the line has no value part or when NAME contains a
    parenthesis (i.e. it looks like a function-like macro).
    """
    parts = re.split(r'\s+', line[8:], 1)  # cut off '#define ', split in at most 2
    if len(parts) != 2:
        return None
    if '(' in parts[0] or ')' in parts[0]:  # does it look like a function
        return None
    # insert an '=' so the enum-entry parsing in gen() can handle it
    return ' '.join((parts[0], '=', parts[1]))


def gen(lang):
    """Generate the constants files of one language binding.

    For every header listed in ``include`` the header is read from
    ``INCL_DIR`` and a file named after ``template[lang]['out_file']`` is
    written.  Lines starting with ``MARKUP`` are copied as comments; enum
    entries and ``#define`` constants whose name starts with the upper-cased
    architecture prefix are emitted through ``template[lang]['line_format']``.
    Entries without an explicit value get the running counter, which restarts
    after every entry whose value is a plain decimal integer.

    Args:
        lang: key of ``template`` selecting the binding ('java', 'python', ...).

    Raises:
        KeyError: if ``lang`` is not a key of ``template``.
        IOError/OSError: if a header cannot be read or an output file cannot
            be written.
    """
    templ = template[lang]
    print('Generating bindings for', lang)
    for target in include:
        prefix = templ[target]
        const_prefix = prefix.upper()

        # open as binary prevents windows newlines
        with open(templ['out_file'] % prefix, 'wb') as outfile:

            def emit(text):
                outfile.write(text.encode("utf-8"))

            emit(templ['header'] % prefix)

            with open(INCL_DIR + target) as header:
                lines = header.readlines()

            count = 0
            for line in lines:
                line = line.strip()

                if line.startswith(MARKUP):  # markup for comments
                    emit("\n%s%s%s\n" % (templ['comment_open'],
                                         line.replace(MARKUP, ''),
                                         templ['comment_close']))
                    continue

                if line == '' or line.startswith('//'):
                    continue

                if line.startswith('#define '):
                    line = _define_to_assignment(line)
                    if line is None:
                        continue

                if not line.startswith(const_prefix):
                    continue

                for t in line.strip().split(','):
                    t = t.strip()
                    if not t or t.startswith('//'):
                        continue
                    # hacky: remove type cast (uint64_t)
                    t = t.replace('(uint64_t)', '')
                    # (1ULL << 1) to 1 << 1
                    t = re.sub(r'\((\d+)ULL << (\d+)\)', r'\1 << \2', t)
                    f = re.split(r'\s+', t)

                    if not f[0].startswith(const_prefix):
                        continue

                    # Only "NAME", "NAME = value" and "NAME // ..." are understood.
                    if len(f) > 1 and f[1] not in ('//', '='):
                        print("Error: Unable to convert %s" % f)
                        continue

                    if len(f) > 1 and f[1] == '=':
                        rhs = ''.join(f[2:])
                        if not rhs:
                            # "NAME =" with nothing after it: nothing to emit
                            print("Error: Unable to convert %s" % f)
                            continue
                    else:
                        rhs = str(count)

                    try:
                        # NOTE: only plain decimal values advance the counter;
                        # anything else (hex, shifts, other names) raises
                        # ValueError and leaves it untouched.
                        count = int(rhs) + 1
                    except ValueError:
                        if lang == 'ocaml':
                            # ocaml uses lsl for '<<', lor for '|'
                            rhs = rhs.replace('<<', ' lsl ')
                            rhs = rhs.replace('|', ' lor ')
                            # ocaml variable has _ as prefix
                            if rhs[0].isalpha():
                                rhs = '_' + rhs
                    else:
                        if count == 1:
                            # value 0: blank line before this entry
                            emit("\n")

                    emit(templ['line_format'] % (f[0].strip(), rhs))

            emit(templ['footer'])
140
def main():
    """Run the generator for the binding named by the first CLI argument.

    ``all`` generates every binding listed in ``template``; any other value
    must be one of its keys.

    Raises:
        RuntimeError: if the requested binding is not a key of ``template``.
    """
    binding = sys.argv[1]
    if binding == 'all':
        for key in template:
            gen(key)
    elif binding in template:
        # Errors raised while generating (missing header, unwritable output
        # file, ...) propagate unchanged instead of being reported as an
        # unsupported binding.
        gen(binding)
    else:
        raise RuntimeError("Unsupported binding %s" % binding)
danghvu8054c9e2013-12-01 13:24:11 -0600150
if __name__ == "__main__":
    # The binding name is mandatory: run only when it was supplied,
    # otherwise show the usage line and exit with status 1.
    if len(sys.argv) >= 2:
        main()
    else:
        print("Usage:", sys.argv[0], " <bindings: java|python|ocaml|all>")
        sys.exit(1)
155 main()