blob: 1a7801c92bd703703861c6559833bb48106a826e [file] [log] [blame]
Marek Olsak5df00d62014-12-07 12:18:57 +00001//===-- VIInstructions.td - VI Instruction Definitions --------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9// Instruction definitions for VI and newer.
10//===----------------------------------------------------------------------===//
11
Tom Stellardd1f0f022015-04-23 19:33:54 +000012let SIAssemblerPredicate = DisableInst, SubtargetPredicate = isVI in {
13
14//===----------------------------------------------------------------------===//
15// VOP1 Instructions
16//===----------------------------------------------------------------------===//
17
// 16-bit VOP1 definitions. Each record instantiates the VOP1Inst multiclass
// with three arguments: a vop1<0, N> value, an assembly name string, and a
// VOP_<dst>_<src> profile. N runs consecutively from 0x39 to 0x4a with no
// gaps.
// NOTE(review): the first vop1 argument is 0 for every entry; presumably this
// is the slot for the pre-VI opcode and 0 means "not available" -- confirm
// against the vop1 class definition, which is not part of this file.
//
// Conversions between f16 and 16-bit integers.
18defm V_CVT_F16_U16 : VOP1Inst <vop1<0, 0x39>, "v_cvt_f16_u16", VOP_F16_I16>;
19defm V_CVT_F16_I16 : VOP1Inst <vop1<0, 0x3a>, "v_cvt_f16_i16", VOP_F16_I16>;
20defm V_CVT_U16_F16 : VOP1Inst <vop1<0, 0x3b>, "v_cvt_u16_f16", VOP_I16_F16>;
21defm V_CVT_I16_F16 : VOP1Inst <vop1<0, 0x3c>, "v_cvt_i16_f16", VOP_I16_F16>;
// f16 -> f16 operations (all use the VOP_F16_F16 profile).
22defm V_RCP_F16 : VOP1Inst <vop1<0, 0x3d>, "v_rcp_f16", VOP_F16_F16>;
23defm V_SQRT_F16 : VOP1Inst <vop1<0, 0x3e>, "v_sqrt_f16", VOP_F16_F16>;
24defm V_RSQ_F16 : VOP1Inst <vop1<0, 0x3f>, "v_rsq_f16", VOP_F16_F16>;
25defm V_LOG_F16 : VOP1Inst <vop1<0, 0x40>, "v_log_f16", VOP_F16_F16>;
26defm V_EXP_F16 : VOP1Inst <vop1<0, 0x41>, "v_exp_f16", VOP_F16_F16>;
27defm V_FREXP_MANT_F16 : VOP1Inst <vop1<0, 0x42>, "v_frexp_mant_f16",
28 VOP_F16_F16
29>;
// Unlike the neighbouring f16 -> f16 entries, this one uses the VOP_I16_F16
// profile.
30defm V_FREXP_EXP_I16_F16 : VOP1Inst <vop1<0, 0x43>, "v_frexp_exp_i16_f16",
31 VOP_I16_F16
32>;
33defm V_FLOOR_F16 : VOP1Inst <vop1<0, 0x44>, "v_floor_f16", VOP_F16_F16>;
34defm V_CEIL_F16 : VOP1Inst <vop1<0, 0x45>, "v_ceil_f16", VOP_F16_F16>;
35defm V_TRUNC_F16 : VOP1Inst <vop1<0, 0x46>, "v_trunc_f16", VOP_F16_F16>;
36defm V_RNDNE_F16 : VOP1Inst <vop1<0, 0x47>, "v_rndne_f16", VOP_F16_F16>;
37defm V_FRACT_F16 : VOP1Inst <vop1<0, 0x48>, "v_fract_f16", VOP_F16_F16>;
38defm V_SIN_F16 : VOP1Inst <vop1<0, 0x49>, "v_sin_f16", VOP_F16_F16>;
39defm V_COS_F16 : VOP1Inst <vop1<0, 0x4a>, "v_cos_f16", VOP_F16_F16>;
40
Tom Stellard245c15f2015-05-26 15:55:52 +000041//===----------------------------------------------------------------------===//
42// VOP2 Instructions
43//===----------------------------------------------------------------------===//
44
// 16-bit VOP2 definitions. The second vop2 argument runs consecutively from
// 0x1f to 0x33. Records are grouped into `let isCommutable = 1` scopes; the
// records defined outside those scopes (V_MADMK_F16, the three *REV_B16
// shifts and V_LDEXP_F16) do not get isCommutable set here.
45let isCommutable = 1 in {
46
47defm V_ADD_F16 : VOP2Inst <vop2<0, 0x1f>, "v_add_f16", VOP_F16_F16_F16>;
48defm V_SUB_F16 : VOP2Inst <vop2<0, 0x20>, "v_sub_f16", VOP_F16_F16_F16>;
// The only record in this section that passes the two extra VOP2Inst
// arguments: null_frag and the name "v_sub_f16".
// NOTE(review): presumably the string names the instruction this one is the
// operand-reversed form of -- confirm against the VOP2Inst multiclass.
49defm V_SUBREV_F16 : VOP2Inst <vop2<0, 0x21>, "v_subrev_f16", VOP_F16_F16_F16,
50 null_frag, "v_sub_f16"
51>;
52defm V_MUL_F16 : VOP2Inst <vop2<0, 0x22>, "v_mul_f16", VOP_F16_F16_F16>;
53defm V_MAC_F16 : VOP2Inst <vop2<0, 0x23>, "v_mac_f16", VOP_F16_F16_F16>;
54} // End isCommutable = 1
// V_MADMK_F16 sits between two commutable scopes and is deliberately outside
// both, while V_MADAK_F16 just below is inside one. Both use VOP2MADK, which
// takes no profile argument here.
55defm V_MADMK_F16 : VOP2MADK <vop2<0,0x24>, "v_madmk_f16">;
56let isCommutable = 1 in {
57defm V_MADAK_F16 : VOP2MADK <vop2<0,0x25>, "v_madak_f16">;
58defm V_ADD_U16 : VOP2Inst <vop2<0,0x26>, "v_add_u16", VOP_I16_I16_I16>;
59defm V_SUB_U16 : VOP2Inst <vop2<0,0x27>, "v_sub_u16" , VOP_I16_I16_I16>;
// NOTE(review): unlike V_SUBREV_F16 above, this record does not pass
// null_frag / "v_sub_u16" as trailing arguments even though V_SUB_U16 is
// marked commutable in the same scope -- confirm whether the omission is
// intentional.
60defm V_SUBREV_U16 : VOP2Inst <vop2<0,0x28>, "v_subrev_u16", VOP_I16_I16_I16>;
61defm V_MUL_LO_U16 : VOP2Inst <vop2<0,0x29>, "v_mul_lo_u16", VOP_I16_I16_I16>;
62} // End isCommutable = 1
// 16-bit "rev" shifts; defined outside any isCommutable scope.
63defm V_LSHLREV_B16 : VOP2Inst <vop2<0,0x2a>, "v_lshlrev_b16", VOP_I16_I16_I16>;
64defm V_LSHRREV_B16 : VOP2Inst <vop2<0,0x2b>, "v_lshrrev_b16", VOP_I16_I16_I16>;
65defm V_ASHRREV_B16 : VOP2Inst <vop2<0,0x2c>, "v_ashrrev_b16", VOP_I16_I16_I16>;
// Min/max for f16, u16 and i16.
66let isCommutable = 1 in {
67defm V_MAX_F16 : VOP2Inst <vop2<0,0x2d>, "v_max_f16", VOP_F16_F16_F16>;
68defm V_MIN_F16 : VOP2Inst <vop2<0,0x2e>, "v_min_f16", VOP_F16_F16_F16>;
69defm V_MAX_U16 : VOP2Inst <vop2<0,0x2f>, "v_max_u16", VOP_I16_I16_I16>;
70defm V_MAX_I16 : VOP2Inst <vop2<0,0x30>, "v_max_i16", VOP_I16_I16_I16>;
71defm V_MIN_U16 : VOP2Inst <vop2<0,0x31>, "v_min_u16", VOP_I16_I16_I16>;
72defm V_MIN_I16 : VOP2Inst <vop2<0,0x32>, "v_min_i16", VOP_I16_I16_I16>;
73} // End isCommutable = 1
// Mixed-type profile (VOP_F16_F16_I16); not marked commutable.
74defm V_LDEXP_F16 : VOP2Inst <vop2<0,0x33>, "v_ldexp_f16", VOP_F16_F16_I16>;
75
Matt Arsenault6c2e2002015-11-05 01:03:08 +000076// Aliases to simplify matching of floating-point instructions that
77// are VOP2 on SI and VOP3 on VI.
Tom Stellard245c15f2015-05-26 15:55:52 +000078
// SI2_VI3Alias <name, inst>: an InstAlias (also deriving from
// PredicateControl) that accepts the three-operand assembly form
//   <name> $dst, $src0, $src1
// and maps it to `inst`, passing a VGPR_32 destination, two VCSrc_32
// sources, and a literal 0 for each remaining operand of `inst`.
// NOTE(review): the four literal zeros presumably fill the source-modifier,
// clamp and omod operands of the _e64 form -- confirm against the operand
// list of the target instructions.
79class SI2_VI3Alias <string name, Instruction inst> : InstAlias <
80 name#" $dst, $src0, $src1",
81 (inst VGPR_32:$dst, 0, VCSrc_32:$src0, 0, VCSrc_32:$src1, 0, 0)
82>, PredicateControl {
// Turns the UseInstAsmMatchConverter setting off for this alias.
83 let UseInstAsmMatchConverter = 0;
84}
85
// Anonymous SI2_VI3Alias records: each pairs an assembly name with the
// correspondingly named *_e64_vi instruction record.
86def : SI2_VI3Alias <"v_ldexp_f32", V_LDEXP_F32_e64_vi>;
87def : SI2_VI3Alias <"v_cvt_pkaccum_u8_f32", V_CVT_PKACCUM_U8_F32_e64_vi>;
88def : SI2_VI3Alias <"v_cvt_pknorm_i16_f32", V_CVT_PKNORM_I16_F32_e64_vi>;
89def : SI2_VI3Alias <"v_cvt_pknorm_u16_f32", V_CVT_PKNORM_U16_F32_e64_vi>;
90def : SI2_VI3Alias <"v_cvt_pkrtz_f16_f32", V_CVT_PKRTZ_F16_F32_e64_vi>;
91
Matt Arsenaulte66621b2015-09-24 19:52:27 +000092//===----------------------------------------------------------------------===//
93// SMEM Instructions
94//===----------------------------------------------------------------------===//
95
// Two SMEM_Inval records. Each passes a numeric value (0x21 / 0x23), an
// assembly name string, and the int_amdgcn_* record of the same name.
// NOTE(review): the numeric argument is presumably the SMEM opcode -- confirm
// against the SMEM_Inval class definition.
96def S_DCACHE_WB : SMEM_Inval <0x21,
97 "s_dcache_wb", int_amdgcn_s_dcache_wb>;
98
99def S_DCACHE_WB_VOL : SMEM_Inval <0x23,
100 "s_dcache_wb_vol", int_amdgcn_s_dcache_wb_vol>;
101
Tom Stellardd1f0f022015-04-23 19:33:54 +0000102} // End SIAssemblerPredicate = DisableInst, SubtargetPredicate = isVI
Marek Olsak5df00d62014-12-07 12:18:57 +0000103
Tom Stellard3da56722016-01-04 20:23:10 +0000104let Predicates = [isVI] in {
105
106// 1. Offset as 20bit DWORD immediate
// Selection pattern: an SIload_constant node whose base is a v4i32 ($sbase)
// and whose offset matches IMM20bit is replaced by S_BUFFER_LOAD_DWORD_IMM,
// with the offset passed through as_i32imm.
107def : Pat <
108 (SIload_constant v4i32:$sbase, IMM20bit:$offset),
109 (S_BUFFER_LOAD_DWORD_IMM $sbase, (as_i32imm $offset))
110>;
111
112} // End Predicates = [isVI]