blob: 8c49dbf45e65e2e7152649a157cd8946ca3223a2 [file] [log] [blame]
# Capstone Disassembler Engine
# By Dang Hoang Vu, 2013
fenuks110ab1d2014-04-11 11:00:33 +02003from __future__ import print_function
danghvu8054c9e2013-12-01 13:24:11 -06004import sys, re
5
# Directory the C headers are read from (a relative path, so it is resolved
# against the current working directory).
INCL_DIR = '../include/capstone/'

# Header files processed by gen(), in order.
include = [
    'arm.h',
    'arm64.h',
    'm68k.h',
    'mips.h',
    'x86.h',
    'ppc.h',
    'sparc.h',
    'systemz.h',
    'xcore.h',
]

# prefixes for constant filenames of all archs - case sensitive
_JAVA_PREFIXES = {
    'arm.h': 'Arm',
    'arm64.h': 'Arm64',
    'm68k.h': 'M68k',
    'mips.h': 'Mips',
    'x86.h': 'X86',
    'ppc.h': 'Ppc',
    'sparc.h': 'Sparc',
    'systemz.h': 'Sysz',
    'xcore.h': 'Xcore',
}

# The python and ocaml bindings use the same all-lowercase prefixes.
_LOWERCASE_PREFIXES = {
    'arm.h': 'arm',
    'arm64.h': 'arm64',
    'm68k.h': 'm68k',
    'mips.h': 'mips',
    'x86.h': 'x86',
    'ppc.h': 'ppc',
    'sparc.h': 'sparc',
    'systemz.h': 'sysz',
    'xcore.h': 'xcore',
}


def _language_template(settings, prefixes):
    """Return one flat dict holding the output settings plus the header prefixes."""
    merged = dict(settings)
    merged.update(prefixes)
    return merged


# Per-binding output description. Each entry holds the file header/footer,
# the format of one constant line, the output path pattern, the comment
# delimiters, and (keyed by header file name) the prefix of that architecture.
template = {
    'java': _language_template(
        {
            'header': "// For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT\npackage capstone;\n\npublic class %s_const {\n",
            'footer': "}",
            'line_format': '\tpublic static final int %s = %s;\n',
            'out_file': './java/capstone/%s_const.java',
            'comment_open': '\t//',
            'comment_close': '',
        },
        _JAVA_PREFIXES,
    ),
    'python': _language_template(
        {
            'header': "# For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.py]\n",
            'footer': "",
            'line_format': '%s = %s\n',
            'out_file': './python/capstone/%s_const.py',
            'comment_open': '#',
            'comment_close': '',
        },
        _LOWERCASE_PREFIXES,
    ),
    'ocaml': _language_template(
        {
            'header': "(* For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.ml] *)\n",
            'footer': "",
            'line_format': 'let _%s = %s;;\n',
            'out_file': './ocaml/%s_const.ml',
            'comment_open': '(*',
            'comment_close': ' *)',
        },
        _LOWERCASE_PREFIXES,
    ),
}

# markup for comments to be added to autogen files
MARKUP = '//>'
69
def _parse_c_int(text):
    """Return the value of a plain integer literal, or None if it is not one.

    Decimal is tried first so text that used to parse keeps its old value;
    base 0 then adds prefixed literals such as '0x10'.
    """
    for base in (10, 0):
        try:
            return int(text, base)
        except ValueError:
            pass
    return None


def gen(lang):
    """Generate the constant files of one binding from the C headers.

    For every header listed in ``include`` the file ``INCL_DIR + header`` is
    read and the file named by ``template[lang]['out_file']`` is rewritten:

    * lines starting with ``MARKUP`` are copied as comments of the target
      language;
    * ``#define NAME value`` lines (not function-like macros) are treated as
      ``NAME = value``;
    * lines starting with the upper-cased architecture prefix are split on
      commas and each ``NAME`` / ``NAME = value`` item becomes one constant.
      Items without a value are numbered from the last integer literal seen.

    Values that are expressions (e.g. shifts) are emitted as text and do not
    update the implicit counter.

    Args:
        lang: key of ``template`` selecting the binding ('java', 'python',
            'ocaml').

    Raises:
        KeyError: if ``lang`` is not a key of ``template``.
        IOError/OSError: if a header cannot be read or an output file cannot
            be written.
    """
    templ = template[lang]
    print('Generating bindings for', lang)

    # Compiled once; raw strings avoid the invalid-escape warning of '\s+'.
    whitespace = re.compile(r'\s+')
    ull_shift = re.compile(r'\((\d+)ULL << (\d+)\)')

    for target in include:
        prefix = templ[target]
        const_prefix = prefix.upper()

        # Read the header before touching the output, so a missing header
        # does not truncate a previously generated file.
        with open(INCL_DIR + target) as header:
            lines = header.readlines()

        # open as binary prevents windows newlines
        with open(templ['out_file'] % prefix, 'wb') as outfile:
            outfile.write((templ['header'] % prefix).encode("utf-8"))

            count = 0  # value the next enumerator without '=' will get
            for line in lines:
                line = line.strip()

                if line.startswith(MARKUP):  # markup for comments
                    comment = "\n%s%s%s\n" % (templ['comment_open'],
                                              line.replace(MARKUP, ''),
                                              templ['comment_close'])
                    outfile.write(comment.encode("utf-8"))
                    continue

                if line == '' or line.startswith('//'):
                    continue

                if line.startswith('#define '):
                    # cut off "#define " and split into at most name + value
                    xline = whitespace.split(line[8:], 1)
                    if len(xline) != 2:
                        continue
                    if '(' in xline[0] or ')' in xline[0]:  # looks like a function
                        continue
                    # rewrite as "NAME = value" so the code below can parse it
                    line = ' '.join((xline[0], '=', xline[1]))

                if not line.startswith(const_prefix):
                    continue

                for t in line.split(','):
                    t = t.strip()
                    if not t or t.startswith('//'):
                        continue
                    # hacky: remove type cast (uint64_t)
                    t = t.replace('(uint64_t)', '')
                    t = ull_shift.sub(r'\1 << \2', t)  # (1ULL << 1) to 1 << 1
                    f = whitespace.split(t)

                    if not f[0].startswith(const_prefix):
                        continue

                    # NOTE: substring test kept as-is; it accepts '=' and '//'
                    # (and any other substring of '//=') as the second token.
                    if len(f) > 1 and f[1] not in '//=':
                        print("Error: Unable to convert %s" % f)
                        continue

                    if len(f) > 1 and f[1] == '=':
                        rhs = ''.join(f[2:])
                    else:
                        rhs = str(count)

                    value = _parse_c_int(rhs)
                    if value is not None:
                        count = value + 1
                        if count == 1:
                            # a constant equal to 0 is preceded by a blank line
                            outfile.write(b"\n")
                    elif lang == 'ocaml':
                        # ocaml uses lsl for '<<', lor for '|'
                        rhs = rhs.replace('<<', ' lsl ')
                        rhs = rhs.replace('|', ' lor ')
                        # ocaml variable has _ as prefix; the slice keeps an
                        # empty right-hand side from raising IndexError
                        if rhs[:1].isalpha():
                            rhs = '_' + rhs

                    outfile.write((templ['line_format'] % (f[0], rhs)).encode("utf-8"))

            outfile.write(templ['footer'].encode("utf-8"))
143
def main():
    """Generate the binding named by the first command-line argument.

    ``sys.argv[1]`` is either a key of ``template`` or ``'all'``, which
    generates every binding in ``template``.

    Raises:
        RuntimeError: if the requested binding is not known.

    Errors raised while generating (missing headers, unwritable output, ...)
    propagate unchanged instead of being reported as an unsupported binding.
    """
    binding = sys.argv[1]
    if binding == 'all':
        for key in template:
            gen(key)
    elif binding in template:
        gen(binding)
    else:
        raise RuntimeError("Unsupported binding %s" % binding)
danghvu8054c9e2013-12-01 13:24:11 -0600153
# Script entry point: the binding name is required as the first argument.
if __name__ == "__main__":
    if len(sys.argv) >= 2:
        main()
    else:
        print("Usage:", sys.argv[0], " <bindings: java|python|ocaml|all>")
        sys.exit(1)
158 main()