blob: f36d8a5ecc5cd63eccfcea28912fb3a422a49a50 [file] [log] [blame]
# Capstone Disassembler Engine
# By Dang Hoang Vu, 2013
from __future__ import print_function
import sys
import re

# Location of the Capstone C headers; gen() opens INCL_DIR + <header name>.
INCL_DIR = '../include/capstone/'

# Architecture headers that gen() scans for constants, in processing order.
include = [ 'arm.h', 'arm64.h', 'm68k.h', 'mips.h', 'x86.h', 'ppc.h', 'sparc.h', 'systemz.h', 'xcore.h', 'tms320c64x.h', 'm680x.h', 'evm.h' ]
# Per-language output templates, keyed by binding name.
#
# Each entry provides:
#   'header'        - text written first; formatted with the arch file prefix
#   'footer'        - text written last
#   'line_format'   - format for one constant; formatted with (name, value)
#   'out_file'      - output path pattern; formatted with the arch file prefix
#   '<arch>.h'      - file prefix for that header; gen() also upper-cases it
#                     to recognise the constant names belonging to the arch
#   'comment_open'  - text emitted before a copied markup comment
#   'comment_close' - text emitted after a copied markup comment
template = {
    'java': {
        'header': "// For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT\npackage capstone;\n\npublic class %s_const {\n",
        'footer': "}",
        'line_format': '\tpublic static final int %s = %s;\n',
        'out_file': './java/capstone/%s_const.java',
        # prefixes for constant filenames of all archs - case sensitive
        'arm.h': 'Arm',
        'arm64.h': 'Arm64',
        'm68k.h': 'M68k',
        'mips.h': 'Mips',
        'x86.h': 'X86',
        'ppc.h': 'Ppc',
        'sparc.h': 'Sparc',
        'systemz.h': 'Sysz',
        'xcore.h': 'Xcore',
        'tms320c64x.h': 'TMS320C64x',
        'm680x.h': 'M680x',
        'evm.h': 'Evm',
        'comment_open': '\t//',
        'comment_close': '',
    },
    'python': {
        'header': "# For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.py]\n",
        'footer': "",
        'line_format': '%s = %s\n',
        'out_file': './python/capstone/%s_const.py',
        # prefixes for constant filenames of all archs - case sensitive
        'arm.h': 'arm',
        'arm64.h': 'arm64',
        'm68k.h': 'm68k',
        'mips.h': 'mips',
        'x86.h': 'x86',
        'ppc.h': 'ppc',
        'sparc.h': 'sparc',
        'systemz.h': 'sysz',
        'xcore.h': 'xcore',
        'tms320c64x.h': 'tms320c64x',
        'm680x.h': 'm680x',
        'evm.h': 'evm',
        'comment_open': '#',
        'comment_close': '',
    },
    'ocaml': {
        'header': "(* For Capstone Engine. AUTO-GENERATED FILE, DO NOT EDIT [%s_const.ml] *)\n",
        'footer': "",
        'line_format': 'let _%s = %s;;\n',
        'out_file': './ocaml/%s_const.ml',
        # prefixes for constant filenames of all archs - case sensitive
        'arm.h': 'arm',
        'arm64.h': 'arm64',
        'mips.h': 'mips',
        'm68k.h': 'm68k',
        'x86.h': 'x86',
        'ppc.h': 'ppc',
        'sparc.h': 'sparc',
        'systemz.h': 'sysz',
        'xcore.h': 'xcore',
        'tms320c64x.h': 'tms320c64x',
        'm680x.h': 'm680x',
        'evm.h': 'evm',
        'comment_open': '(*',
        'comment_close': ' *)',
    },
}
75
# Header lines starting with this marker are copied into the generated
# files as comments (wrapped in the language's comment_open/comment_close).
MARKUP = '//>'
78
def gen(lang):
    """Generate the per-architecture constant files for one binding language.

    For every header named in ``include`` this reads ``INCL_DIR + header``,
    picks out the enum members and object-like ``#define`` constants whose
    names start with the upper-cased architecture prefix, and writes them to
    the file named by the language template's ``out_file`` pattern.

    Args:
        lang: key into ``template`` ('java', 'python' or 'ocaml').

    Raises:
        KeyError: if ``lang`` is not a key of ``template``.
        IOError / OSError: if a header cannot be read or an output file
            cannot be opened or written.
    """
    templ = template[lang]
    print('Generating bindings for', lang)

    # Compiled once; raw strings avoid the invalid '\s' escape of a plain literal.
    whitespace = re.compile(r'\s+')
    ull_shift = re.compile(r'\((\d+)ULL << (\d+)\)')

    for target in include:
        prefix = templ[target]
        const_prefix = prefix.upper()

        # Read the header first so a missing header does not leave a
        # truncated output file behind, and so the handle is closed promptly.
        with open(INCL_DIR + target) as header:
            lines = header.readlines()

        # open as binary prevents windows newlines
        with open(templ['out_file'] % prefix, 'wb') as outfile:
            outfile.write((templ['header'] % prefix).encode("utf-8"))

            # Value the next enum member gets when it has no explicit '= value'.
            count = 0
            for line in lines:
                line = line.strip()

                if line.startswith(MARKUP):  # markup for comments
                    comment = "\n%s%s%s\n" % (templ['comment_open'],
                                              line.replace(MARKUP, ''),
                                              templ['comment_close'])
                    outfile.write(comment.encode("utf-8"))
                    continue

                if not line or line.startswith('//'):
                    continue

                if line.startswith('#define '):
                    # cut off '#define ' and split into at most name + value
                    parts = whitespace.split(line[8:], 1)
                    if len(parts) != 2:
                        continue
                    if '(' in parts[0] or ')' in parts[0]:  # looks like a function-like macro
                        continue
                    # rewrite as 'NAME = VALUE' so the enum parsing below handles it
                    line = '%s = %s' % (parts[0], parts[1])

                if not line.startswith(const_prefix):
                    continue

                for item in line.split(','):
                    item = item.strip()
                    if not item or item.startswith('//'):
                        continue
                    # hacky: remove type cast (uint64_t)
                    item = item.replace('(uint64_t)', '')
                    item = ull_shift.sub(r'\1 << \2', item)  # (1ULL << 1) to 1 << 1
                    fields = whitespace.split(item)

                    name = fields[0]
                    if not name.startswith(const_prefix):
                        continue

                    marker = fields[1] if len(fields) > 1 else None
                    if marker == '=':
                        rhs = ''.join(fields[2:])
                    elif marker in (None, '//', '///<'):
                        # no explicit value: use the running enum counter
                        rhs = str(count)
                    else:
                        print("Error: Unable to convert %s" % (fields,))
                        continue

                    try:
                        # NOTE: int() without a base only accepts decimal text, so
                        # hex or expression values leave the counter unchanged.
                        value = int(rhs)
                    except ValueError:
                        if lang == 'ocaml':
                            # ocaml uses lsl for '<<', lor for '|'
                            rhs = rhs.replace('<<', ' lsl ').replace('|', ' lor ')
                            # ocaml variable has _ as prefix; the slice keeps an
                            # empty right-hand side from raising IndexError
                            if rhs[:1].isalpha():
                                rhs = '_' + rhs
                    else:
                        count = value + 1
                        if count == 1:
                            # a member with value 0 starts a new group: separate it
                            outfile.write("\n".encode("utf-8"))

                    outfile.write((templ['line_format'] % (name, rhs)).encode("utf-8"))

            outfile.write(templ['footer'].encode("utf-8"))
153
def main():
    """Generate constants for the binding named by the first command-line argument.

    ``sys.argv[1]`` is either a key of ``template`` or the word 'all', which
    generates every binding in ``template``.

    Raises:
        RuntimeError: if the requested binding is neither 'all' nor a key of
            ``template``.
        IndexError: if no argument was supplied.

    Errors raised while generating (for example a missing header file) are
    propagated unchanged instead of being reported as an unsupported binding.
    """
    binding = sys.argv[1]
    if binding == 'all':
        for key in template:
            gen(key)
    elif binding in template:
        gen(binding)
    else:
        raise RuntimeError("Unsupported binding %s" % binding)
danghvu8054c9e2013-12-01 13:24:11 -0600163
if __name__ == "__main__":
    # A binding name (or 'all') is required as the first argument.
    if len(sys.argv) < 2:
        print("Usage:", sys.argv[0], " <bindings: java|python|ocaml|all>")
        sys.exit(1)
    main()