blob: 91c50eaabd1a019a78aee96b88e75fabfe922b86 [file] [log] [blame]
# Capstone Disassembler Engine
# By Dang Hoang Vu, 2013
fenuks110ab1d2014-04-11 11:00:33 +02003from __future__ import print_function
danghvu8054c9e2013-12-01 13:24:11 -06004import sys, re
5
# Directory holding the Capstone C headers, relative to the directory this
# script is run from.
INCL_DIR = '../include/capstone/'

# Header files (one per architecture) that constants are extracted from.
include = [
    'arm.h',
    'arm64.h',
    'm68k.h',
    'mips.h',
    'x86.h',
    'ppc.h',
    'sparc.h',
    'systemz.h',
    'xcore.h',
    'tms320c64x.h',
]
danghvu8054c9e2013-12-01 13:24:11 -06009
# Per-binding output description, keyed by binding name.
#
# Each entry holds:
#   'header' / 'footer'  - text written at the start / end of every generated
#                          file ('header' is %-formatted with the arch prefix)
#   'line_format'        - %-format taking (constant name, value)
#   'out_file'           - %-format taking the arch prefix, giving the path
#                          of the generated file
#   '<arch>.h'           - prefix used for that header's constants file
#                          (case sensitive)
#   'comment_open' / 'comment_close'
#                        - text wrapped around comments copied from headers
template = {
    'java': {
        'header': "// For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT\npackage capstone;\n\npublic class %s_const {\n",
        'footer': "}",
        'line_format': '\tpublic static final int %s = %s;\n',
        'out_file': './java/capstone/%s_const.java',
        # prefixes for constant filenames of all archs - case sensitive
        'arm.h': 'Arm',
        'arm64.h': 'Arm64',
        'm68k.h': 'M68k',
        'mips.h': 'Mips',
        'x86.h': 'X86',
        'ppc.h': 'Ppc',
        'sparc.h': 'Sparc',
        'systemz.h': 'Sysz',
        'xcore.h': 'Xcore',
        'tms320c64x.h': 'TMS320C64x',
        'comment_open': '\t//',
        'comment_close': '',
    },
    'python': {
        'header': "# For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.py]\n",
        'footer': "",
        'line_format': '%s = %s\n',
        'out_file': './python/capstone/%s_const.py',
        # prefixes for constant filenames of all archs - case sensitive
        'arm.h': 'arm',
        'arm64.h': 'arm64',
        'm68k.h': 'm68k',
        'mips.h': 'mips',
        'x86.h': 'x86',
        'ppc.h': 'ppc',
        'sparc.h': 'sparc',
        'systemz.h': 'sysz',
        'xcore.h': 'xcore',
        'tms320c64x.h': 'tms320c64x',
        'comment_open': '#',
        'comment_close': '',
    },
    'ocaml': {
        'header': "(* For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.ml] *)\n",
        'footer': "",
        'line_format': 'let _%s = %s;;\n',
        'out_file': './ocaml/%s_const.ml',
        # prefixes for constant filenames of all archs - case sensitive
        'arm.h': 'arm',
        'arm64.h': 'arm64',
        'mips.h': 'mips',
        'm68k.h': 'm68k',
        'x86.h': 'x86',
        'ppc.h': 'ppc',
        'sparc.h': 'sparc',
        'systemz.h': 'sysz',
        'xcore.h': 'xcore',
        'tms320c64x.h': 'tms320c64x',
        'comment_open': '(*',
        'comment_close': ' *)',
    },
}
69
# Header lines starting with this marker are copied into the generated files
# as comments (with the marker itself removed).
MARKUP = '//>'
72
def gen(lang):
    """Generate the constant files of one binding from the Capstone headers.

    For every header named in ``include`` the file ``INCL_DIR + header`` is
    read, and each enum member or object-like ``#define`` whose name starts
    with the upper-cased architecture prefix is written to the file named by
    the binding's ``out_file`` pattern, using the binding's ``line_format``.
    Header lines starting with ``MARKUP`` are copied over as comments.

    Args:
        lang: key of ``template`` selecting the binding to generate.

    Raises:
        KeyError: if ``lang`` is not a key of ``template``.
        IOError: if a header or an output file cannot be opened
            (``OSError`` on Python 3).
    """
    templ = template[lang]
    print('Generating bindings for', lang)
    for target in include:
        prefix = templ[target]
        # Only names starting with the upper-cased prefix are exported.
        const_prefix = prefix.upper()

        # Binary mode prevents newline translation on Windows; the context
        # manager closes the file even when parsing fails half-way.
        with open(templ['out_file'] % prefix, 'wb') as outfile:
            outfile.write((templ['header'] % prefix).encode("utf-8"))

            with open(INCL_DIR + target) as header:
                lines = header.readlines()

            # Value the next enum member gets when it has no explicit '= ...'.
            count = 0
            for line in lines:
                line = line.strip()

                if line.startswith(MARKUP):  # markup for comments
                    comment = "\n%s%s%s\n" % (
                        templ['comment_open'],
                        line.replace(MARKUP, ''),
                        templ['comment_close'],
                    )
                    outfile.write(comment.encode("utf-8"))
                    continue

                if line == '' or line.startswith('//'):
                    continue

                if line.startswith('#define '):
                    line = line[8:]  # cut off '#define '
                    # split into at most 2 parts: name and expression
                    xline = re.split(r'\s+', line, maxsplit=1)
                    if len(xline) != 2:
                        continue
                    if '(' in xline[0] or ')' in xline[0]:
                        # looks like a function-like macro
                        continue
                    # insert an '=' so the enum parsing below can handle it
                    xline.insert(1, '=')
                    line = ' '.join(xline)

                if not line.startswith(const_prefix):
                    continue

                for t in line.strip().split(','):
                    t = t.strip()
                    if not t or t.startswith('//'):
                        continue
                    # hacky: remove type cast (uint64_t)
                    t = t.replace('(uint64_t)', '')
                    # (1ULL << 1) to 1 << 1
                    t = re.sub(r'\((\d+)ULL << (\d+)\)', r'\1 << \2', t)
                    f = re.split(r'\s+', t)

                    if not f[0].startswith(const_prefix):
                        continue

                    # NOTE: this is a substring test against '//=', so the
                    # tokens '=', '/', '//', '/=' and '//=' are all accepted.
                    if len(f) > 1 and f[1] not in '//=':
                        print("Error: Unable to convert %s" % f)
                        continue
                    elif len(f) > 1 and f[1] == '=':
                        rhs = ''.join(f[2:])
                    else:
                        rhs = str(count)
                        count += 1

                    try:
                        # Only base-10 literals reset the running counter;
                        # anything else (hex, expressions, other names)
                        # raises ValueError and leaves the counter untouched.
                        count = int(rhs) + 1
                        if count == 1:
                            # blank line before a group that starts at 0
                            outfile.write("\n".encode("utf-8"))
                    except ValueError:
                        if lang == 'ocaml':
                            # ocaml uses lsl for '<<', lor for '|'
                            rhs = rhs.replace('<<', ' lsl ')
                            rhs = rhs.replace('|', ' lor ')
                            # ocaml variable has _ as prefix; rhs[:1] keeps
                            # an empty right-hand side from raising IndexError
                            if rhs[:1].isalpha():
                                rhs = '_' + rhs

                    outfile.write(
                        (templ['line_format'] % (f[0].strip(), rhs)).encode("utf-8")
                    )

            outfile.write(templ['footer'].encode("utf-8"))
146
def main():
    """Generate the binding named by ``sys.argv[1]``, or all of them.

    ``'all'`` generates every binding in ``template``; any other value must
    be a key of ``template``.

    Raises:
        RuntimeError: if ``sys.argv[1]`` names an unknown binding.
        IndexError: if no binding was given on the command line.

    Errors raised while generating (e.g. a missing header file) propagate
    unchanged instead of being reported as an unsupported binding.
    """
    binding = sys.argv[1]
    if binding == 'all':
        for key in template:
            gen(key)
    elif binding in template:
        gen(binding)
    else:
        raise RuntimeError("Unsupported binding %s" % binding)
danghvu8054c9e2013-12-01 13:24:11 -0600156
# Script entry point: require a binding name, then generate it.
if __name__ == "__main__":
    if len(sys.argv) < 2:
        print("Usage:", sys.argv[0], " <bindings: java|python|ocaml|all>")
        sys.exit(1)
    main()