blob: 093a892026f95060876d9433c5606e7934290bab [file] [log] [blame]
#!/bin/awk -f
# gen-insn-attr-x86.awk: Instruction attribute table generator
# Written by Masami Hiramatsu <mhiramat@redhat.com>
#
# Usage: awk -f gen-insn-attr-x86.awk x86-opcode-map.txt > inat-tables.c
6
# Awk implementation sanity check
# Probe the running awk for a known printf-format incompatibility.
# Returns "" when sprintf("%x", 0) yields "0" as expected, otherwise a
# human-readable error message describing the problem.
function check_awk_implement() {
	if (sprintf("%x", 0) == "0")
		return ""
	return "Your awk has a printf-format problem."
}
13
# Clear working vars
# Reset all per-table working state so that the next table section
# starts from scratch.
function clear_vars() {
	# attribute maps collected for the table currently being parsed
	delete table
	delete lptable1
	delete lptable2
	delete lptable3

	# no table name yet
	tname = ""

	# -1 means "not set": escape id, group id and AVX id respectively
	eid = gid = aid = -1
}
25
# One-time setup: verify the awk implementation, emit the generated-file
# banner, and initialise the id counters, lookup tables and regular
# expressions used by the parsing rules below.
BEGIN {
	# Implementation error checking
	awkchecked = check_awk_implement()
	if (awkchecked != "") {
		print "Error: " awkchecked > "/dev/stderr"
		print "Please try to use gawk." > "/dev/stderr"
		# END still runs after exit; it re-checks awkchecked and bails out
		exit 1
	}

	# Setup generating tables
	print "/* x86 opcode map generated from x86-opcode-map.txt */"
	print "/* Do not change this code. */\n"
	# next free group / escape id, and upper bound of the AVX ids seen
	ggid = 1
	geid = 1
	gaid = 0
	# names of the emitted tables, indexed by [id, last-prefix variant]
	delete etable
	delete gtable
	delete atable

	# token classifiers used while parsing an opcode line
	opnd_expr = "^[A-Za-z/]"
	ext_expr = "^\\("
	sep_expr = "^\\|$"
	group_expr = "^Grp[0-9A-Za-z]+"

	# immediate operand codes and the attribute each one maps to
	imm_expr = "^[IJAOL][a-z]"
	imm_flag["Ib"] = "INAT_MAKE_IMM(INAT_IMM_BYTE)"
	imm_flag["Jb"] = "INAT_MAKE_IMM(INAT_IMM_BYTE)"
	imm_flag["Iw"] = "INAT_MAKE_IMM(INAT_IMM_WORD)"
	imm_flag["Id"] = "INAT_MAKE_IMM(INAT_IMM_DWORD)"
	imm_flag["Iq"] = "INAT_MAKE_IMM(INAT_IMM_QWORD)"
	imm_flag["Ap"] = "INAT_MAKE_IMM(INAT_IMM_PTR)"
	imm_flag["Iz"] = "INAT_MAKE_IMM(INAT_IMM_VWORD32)"
	imm_flag["Jz"] = "INAT_MAKE_IMM(INAT_IMM_VWORD32)"
	imm_flag["Iv"] = "INAT_MAKE_IMM(INAT_IMM_VWORD)"
	imm_flag["Ob"] = "INAT_MOFFSET"
	imm_flag["Ov"] = "INAT_MOFFSET"
	imm_flag["Lx"] = "INAT_MAKE_IMM(INAT_IMM_BYTE)"

	modrm_expr = "^([CDEGMNPQRSUVW/][a-z]+|NTA|T[012])"
	force64_expr = "\\([df]64\\)"
	rex_expr = "^REX(\\.[XRWB]+)*"
	fpu_expr = "^ESC" # TODO

	# Last-prefix superscripts; each lprefixN_expr selects lptableN.
	# '&' is not a regexp metacharacter, so it is written unescaped:
	# "\\&" would produce the undefined escape sequence \& that newer
	# gawk versions warn about.
	lprefix1_expr = "\\((66|!F3)\\)"
	lprefix2_expr = "\\(F3\\)"
	lprefix3_expr = "\\((F2|!F3|66&F2)\\)"
	lprefix_expr = "\\((66|F2|F3)\\)"
	# number of last-prefix columns walked when printing the map arrays
	max_lprefix = 4

	# All opcodes starting with lower-case 'v' or with (v1) superscript
	# accepts VEX prefix
	vexok_opcode_expr = "^v.*"
	vexok_expr = "\\(v1\\)"
	# All opcodes with (v) superscript supports *only* VEX prefix
	vexonly_expr = "\\(v\\)"

	# prefix mnemonics and the attribute constant each one maps to
	prefix_expr = "\\(Prefix\\)"
	prefix_num["Operand-Size"] = "INAT_PFX_OPNDSZ"
	prefix_num["REPNE"] = "INAT_PFX_REPNE"
	prefix_num["REP/REPE"] = "INAT_PFX_REPE"
	prefix_num["XACQUIRE"] = "INAT_PFX_REPNE"
	prefix_num["XRELEASE"] = "INAT_PFX_REPE"
	prefix_num["LOCK"] = "INAT_PFX_LOCK"
	prefix_num["SEG=CS"] = "INAT_PFX_CS"
	prefix_num["SEG=DS"] = "INAT_PFX_DS"
	prefix_num["SEG=ES"] = "INAT_PFX_ES"
	prefix_num["SEG=FS"] = "INAT_PFX_FS"
	prefix_num["SEG=GS"] = "INAT_PFX_GS"
	prefix_num["SEG=SS"] = "INAT_PFX_SS"
	prefix_num["Address-Size"] = "INAT_PFX_ADDRSZ"
	prefix_num["VEX+1byte"] = "INAT_PFX_VEX2"
	prefix_num["VEX+2byte"] = "INAT_PFX_VEX3"

	clear_vars()
}
101
# Report a problem in the input map on stderr, tagged with the current
# input record number, and terminate with exit status 1.
function semantic_error(msg) {
	printf("%s%s%s%s\n", "Semantic error at ", NR, ": ", msg) > "/dev/stderr"
	exit 1
}
106
# Print a diagnostic message, prefixed with "DEBUG: ", on standard output.
function debug(msg) {
	printf("%s%s\n", "DEBUG: ", msg)
}
110
# Return the number of elements stored in the array arr.
# key and total are locals (extra parameters, awk convention).
function array_size(arr,    key, total) {
	total = 0
	for (key in arr)
		total += 1
	return total
}
117
# "Table:" opens a new table section: echo the line into the output as a
# C comment and make sure the previous section was closed first.
/^Table:/ {
	print "/* " $0 " */"
	# a table name that is still set means EndTable never reset it
	if (length(tname) > 0) {
		semantic_error("Hit Table: before EndTable:.");
	}
}
123
# "Referrer: <escape name>" marks the current table as the target of an
# escape opcode. The name (all fields after the keyword, joined without
# separators) must match an "escape" entry seen earlier; its id selects
# the escape table name. A bare "Referrer:" line changes nothing.
/^Referrer:/ {
	if (NF != 1) {
		# escape opcode table
		ref = ""
		for (i = 2; i <= NF; i++)
			ref = ref $i
		# Reject unknown names explicitly: reading escape[ref] would
		# silently create an empty entry and name the table
		# inat_escape_table_0.
		if (!(ref in escape))
			semantic_error("No escape: " ref)
		eid = escape[ref]
		tname = sprintf("inat_escape_table_%d", eid)
	}
}
134
# "AVXcode: [n]" optionally assigns an AVX id to the current table and
# finalises the table name when nothing else has claimed it.
/^AVXcode:/ {
	if (NF > 1) {
		# AVX/escape opcode table: remember its id and keep gaid
		# one past the largest id seen so far
		aid = $2
		if (aid >= gaid)
			gaid = aid + 1
		# AVX only opcode table (no name was set before this line)
		if (tname == "")
			tname = sprintf("inat_avx_table_%d", $2)
	}
	# neither an escape id nor an AVX id: primary opcode table
	if (eid == -1 && aid == -1)
		tname = "inat_primary_table"
}
147
# "GrpTable: <GrpN>" opens a group table: echo the line as a C comment,
# then look up the id registered for that group and derive the table name.
/^GrpTable:/ {
	print "/* " $0 " */"
	if ($2 in group) {
		gid = group[$2]
		tname = "inat_group_table_" gid
	} else {
		# the group must have been referenced by an earlier opcode line
		semantic_error("No group: " $2 )
	}
}
155
# Emit one attribute table as a C array with designated initializers.
#   tbl  - attribute strings indexed by formatted opcode (e.g. "0x0f")
#   name - array declarator, including its "[SIZE]" suffix
#   fmt  - sprintf format that turns a slot number into a tbl index
#   n    - number of slots to scan (0 .. n-1)
# Slots whose entry is empty are skipped. i and id are locals (extra
# parameters, awk convention) so that callers' globals of the same
# name are not clobbered.
function print_table(tbl,name,fmt,n,    i,id)
{
	print "const insn_attr_t " name " = {"
	for (i = 0; i < n; i++) {
		id = sprintf(fmt, i)
		if (tbl[id])
			print " [" id "] = " tbl[id] ","
	}
	print "};"
}
166
# Print one collected attribute map (skipped when empty) and record the
# name of the emitted C array under last-prefix column lp.
#   tbl    - the map to emit (table or one of lptable1..3)
#   suffix - appended to tname to form the C array name
#   lp     - last-prefix column the array is registered under
function flush_table(tbl, suffix, lp,    name) {
	if (array_size(tbl) == 0)
		return
	name = tname suffix
	if (gid != -1) {
		# group tables
		print_table(tbl, name "[INAT_GROUP_TABLE_SIZE]", "0x%x", 8)
		gtable[gid,lp] = name
	} else {
		# primary/escaped tables, also registered as AVX tables
		# when an AVX id is set
		print_table(tbl, name "[INAT_OPCODE_TABLE_SIZE]", "0x%02x", 256)
		etable[eid,lp] = name
		if (aid >= 0)
			atable[aid,lp] = name
	}
}

# "EndTable" closes the current section: emit the base table and its
# three last-prefix variants, then reset the working state.
/^EndTable/ {
	flush_table(table, "", 0)
	flush_table(lptable1, "_1", 1)
	flush_table(lptable2, "_2", 2)
	flush_table(lptable3, "_3", 3)
	print ""
	clear_vars()
}
224
# Combine two attribute expressions into one C expression.
# When both are non-empty they are joined with " | "; otherwise whichever
# one is set is returned (new when old is empty).
function add_flags(old,new) {
	if (!old)
		return new
	if (!new)
		return old
	return old " | " new
}
233
# Convert operands to flags.
# Translate the operand list of one opcode into attribute flags.
#   count - number of entries in opnd
#   opnd  - operand codes, indexed 1..count
# Returns the immediate attribute (if any) combined with INAT_MODRM (if
# any operand matches modrm_expr). The remaining parameters are locals.
function convert_operands(count,opnd,       k,operand,imm_attr,modrm_attr)
{
	imm_attr = ""
	modrm_attr = ""
	for (k = 1; k <= count; k++) {
		operand = opnd[k]
		if (match(operand, imm_expr) == 1) {
			if (!imm_flag[operand])
				semantic_error("Unknown imm opnd: " operand)
			if (!imm_attr) {
				# first immediate operand
				imm_attr = imm_flag[operand]
				continue
			}
			# a second immediate is accepted only when it is "Ib"
			if (operand != "Ib")
				semantic_error("Second IMM error")
			imm_attr = add_flags(imm_attr, "INAT_SCNDIMM")
		} else if (match(operand, modrm_expr)) {
			modrm_attr = "INAT_MODRM"
		}
	}
	return add_flags(imm_attr, modrm_attr)
}
255
# Opcode line: "<hex>: <opcode> [operands] [(ext)] | <opcode> ...".
# Parses every '|'-separated alternative, converts it to attribute flags
# and stores them in table[] and/or the last-prefix tables lptable1..3,
# all indexed by "0x<hex>".
# The ':' in the pattern is a plain character; escaping it as "\:" is an
# undefined regexp escape that newer gawk versions warn about.
/^[0-9a-f]+:/ {
	# NOTE(review): a match on the very first input line is skipped;
	# the reason is not visible here -- confirm before changing.
	if (NR == 1)
		next
	# get index
	idx = "0x" substr($1, 1, index($1,":") - 1)
	if (idx in table)
		semantic_error("Redefine " idx " in " tname)

	# check if escaped opcode
	if ("escape" == $2) {
		if ($3 != "#")
			semantic_error("No escaped name")
		# the escape name is every field after '#', joined together
		ref = ""
		for (i = 4; i <= NF; i++)
			ref = ref $i
		if (ref in escape)
			semantic_error("Redefine escape (" ref ")")
		escape[ref] = geid
		geid++
		table[idx] = "INAT_MAKE_ESCAPE(" escape[ref] ")"
		next
	}

	# "null" is never assigned, so it serves as the empty value
	variant = null
	# converts
	i = 2
	while (i <= NF) {
		opcode = $(i++)
		delete opnds
		ext = null
		flags = null
		opnd = null
		# parse one opcode
		if (match($i, opnd_expr)) {
			opnd = $i
			count = split($(i++), opnds, ",")
			flags = convert_operands(count, opnds)
		}
		if (match($i, ext_expr))
			ext = $(i++)
		if (match($i, sep_expr))
			i++
		else if (i < NF)
			semantic_error($i " is not a separator")

		# check if group opcode
		if (match(opcode, group_expr)) {
			# first reference to a group allocates its id
			if (!(opcode in group)) {
				group[opcode] = ggid
				ggid++
			}
			flags = add_flags(flags, "INAT_MAKE_GROUP(" group[opcode] ")")
		}
		# check force(or default) 64bit
		if (match(ext, force64_expr))
			flags = add_flags(flags, "INAT_FORCE64")

		# check REX prefix
		if (match(opcode, rex_expr))
			flags = add_flags(flags, "INAT_MAKE_PREFIX(INAT_PFX_REX)")

		# check coprocessor escape : TODO
		if (match(opcode, fpu_expr))
			flags = add_flags(flags, "INAT_MODRM")

		# check VEX codes
		if (match(ext, vexonly_expr))
			flags = add_flags(flags, "INAT_VEXOK | INAT_VEXONLY")
		else if (match(ext, vexok_expr) || match(opcode, vexok_opcode_expr))
			flags = add_flags(flags, "INAT_VEXOK")

		# check prefixes
		if (match(ext, prefix_expr)) {
			if (!prefix_num[opcode])
				semantic_error("Unknown prefix: " opcode)
			flags = add_flags(flags, "INAT_MAKE_PREFIX(" prefix_num[opcode] ")")
		}
		# nothing to record for this alternative
		if (length(flags) == 0)
			continue
		# check if last prefix
		# (the three tests are independent: one ext may match several)
		if (match(ext, lprefix1_expr)) {
			lptable1[idx] = add_flags(lptable1[idx],flags)
			variant = "INAT_VARIANT"
		}
		if (match(ext, lprefix2_expr)) {
			lptable2[idx] = add_flags(lptable2[idx],flags)
			variant = "INAT_VARIANT"
		}
		if (match(ext, lprefix3_expr)) {
			lptable3[idx] = add_flags(lptable3[idx],flags)
			variant = "INAT_VARIANT"
		}
		# no (66)/(F2)/(F3) superscript: goes into the base table
		if (!match(ext, lprefix_expr)){
			table[idx] = add_flags(table[idx],flags)
		}
	}
	# mark the base entry when any last-prefix variant was recorded
	if (variant)
		table[idx] = add_flags(table[idx],variant)
}
355
# Print the initializer rows of one table-of-tables: for every id below
# rows and every last-prefix column below max_lprefix, emit the recorded
# table name, skipping empty slots.
function print_map_rows(map, rows,    r, c) {
	for (r = 0; r < rows; r++) {
		for (c = 0; c < max_lprefix; c++) {
			if (map[r,c])
				print " ["r"]["c"] = "map[r,c]","
		}
	}
}

# After all input has been read, emit the three arrays that map escape,
# group and AVX ids to the tables printed earlier.
END {
	# the awk sanity check failed in BEGIN: emit nothing
	if (awkchecked != "")
		exit 1

	# print escape opcode map's array
	print "/* Escape opcode map array */"
	print "const insn_attr_t * const inat_escape_tables[INAT_ESC_MAX + 1]" \
	      "[INAT_LSTPFX_MAX + 1] = {"
	print_map_rows(etable, geid)
	print "};\n"

	# print group opcode map's array
	print "/* Group opcode map array */"
	print "const insn_attr_t * const inat_group_tables[INAT_GRP_MAX + 1]"\
	      "[INAT_LSTPFX_MAX + 1] = {"
	print_map_rows(gtable, ggid)
	print "};\n"

	# print AVX opcode map's array
	print "/* AVX opcode map array */"
	print "const insn_attr_t * const inat_avx_tables[X86_VEX_M_MAX + 1]"\
	      "[INAT_LSTPFX_MAX + 1] = {"
	print_map_rows(atable, gaid)
	print "};"
}
Masami Hiramatsue0e492e2009-10-27 16:42:27 -0400387