| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1 | //===-- SOPInstructions.td - SOP Instruction Defintions -------------------===// | 
|  | 2 | // | 
| Chandler Carruth | 2946cd7 | 2019-01-19 08:50:56 +0000 | [diff] [blame] | 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|  | 4 | // See https://llvm.org/LICENSE.txt for license information. | 
|  | 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 6 | // | 
|  | 7 | //===----------------------------------------------------------------------===// | 
|  | 8 |  | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 9 | def GPRIdxModeMatchClass : AsmOperandClass { | 
|  | 10 | let Name = "GPRIdxMode"; | 
|  | 11 | let PredicateMethod = "isGPRIdxMode"; | 
| Dmitry Preobrazhensky | ef92035 | 2019-02-27 13:12:12 +0000 | [diff] [blame] | 12 | let ParserMethod = "parseGPRIdxMode"; | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 13 | let RenderMethod = "addImmOperands"; | 
|  | 14 | } | 
|  | 15 |  | 
|  | 16 | def GPRIdxMode : Operand<i32> { | 
|  | 17 | let PrintMethod = "printVGPRIndexMode"; | 
|  | 18 | let ParserMatchClass = GPRIdxModeMatchClass; | 
|  | 19 | let OperandType = "OPERAND_IMMEDIATE"; | 
|  | 20 | } | 
|  | 21 |  | 
| Nicolai Haehnle | 4f850ea | 2018-03-26 13:56:53 +0000 | [diff] [blame] | 22 | class SOP_Pseudo<string opName, dag outs, dag ins, string asmOps, | 
|  | 23 | list<dag> pattern=[]> : | 
|  | 24 | InstSI<outs, ins, "", pattern>, | 
|  | 25 | SIMCInstr<opName, SIEncodingFamily.NONE> { | 
|  | 26 |  | 
|  | 27 | let isPseudo = 1; | 
|  | 28 | let isCodeGenOnly = 1; | 
| Nicolai Haehnle | 4f850ea | 2018-03-26 13:56:53 +0000 | [diff] [blame] | 29 |  | 
|  | 30 | string Mnemonic = opName; | 
|  | 31 | string AsmOperands = asmOps; | 
|  | 32 |  | 
|  | 33 | bits<1> has_sdst = 0; | 
|  | 34 | } | 
|  | 35 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 36 | //===----------------------------------------------------------------------===// | 
|  | 37 | // SOP1 Instructions | 
|  | 38 | //===----------------------------------------------------------------------===// | 
|  | 39 |  | 
|  | 40 | class SOP1_Pseudo <string opName, dag outs, dag ins, | 
|  | 41 | string asmOps, list<dag> pattern=[]> : | 
| Nicolai Haehnle | 4f850ea | 2018-03-26 13:56:53 +0000 | [diff] [blame] | 42 | SOP_Pseudo<opName, outs, ins, asmOps, pattern> { | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 43 |  | 
|  | 44 | let mayLoad = 0; | 
|  | 45 | let mayStore = 0; | 
|  | 46 | let hasSideEffects = 0; | 
|  | 47 | let SALU = 1; | 
|  | 48 | let SOP1 = 1; | 
|  | 49 | let SchedRW = [WriteSALU]; | 
| Matt Arsenault | 6bc43d8 | 2016-10-06 16:20:41 +0000 | [diff] [blame] | 50 | let Size = 4; | 
| Tom Stellard | 2add8a1 | 2016-09-06 20:00:26 +0000 | [diff] [blame] | 51 | let UseNamedOperandTable = 1; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 52 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 53 | bits<1> has_src0 = 1; | 
|  | 54 | bits<1> has_sdst = 1; | 
|  | 55 | } | 
|  | 56 |  | 
|  | 57 | class SOP1_Real<bits<8> op, SOP1_Pseudo ps> : | 
|  | 58 | InstSI <ps.OutOperandList, ps.InOperandList, | 
|  | 59 | ps.Mnemonic # " " # ps.AsmOperands, []>, | 
|  | 60 | Enc32 { | 
|  | 61 |  | 
|  | 62 | let isPseudo = 0; | 
|  | 63 | let isCodeGenOnly = 0; | 
| Matt Arsenault | 6bc43d8 | 2016-10-06 16:20:41 +0000 | [diff] [blame] | 64 | let Size = 4; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 65 |  | 
|  | 66 | // copy relevant pseudo op flags | 
|  | 67 | let SubtargetPredicate = ps.SubtargetPredicate; | 
|  | 68 | let AsmMatchConverter  = ps.AsmMatchConverter; | 
|  | 69 |  | 
|  | 70 | // encoding | 
|  | 71 | bits<7> sdst; | 
|  | 72 | bits<8> src0; | 
|  | 73 |  | 
|  | 74 | let Inst{7-0} = !if(ps.has_src0, src0, ?); | 
|  | 75 | let Inst{15-8} = op; | 
|  | 76 | let Inst{22-16} = !if(ps.has_sdst, sdst, ?); | 
|  | 77 | let Inst{31-23} = 0x17d; //encoding; | 
|  | 78 | } | 
|  | 79 |  | 
| Matt Arsenault | fd6fd00 | 2019-02-25 19:24:46 +0000 | [diff] [blame] | 80 | class SOP1_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo < | 
|  | 81 | opName, (outs SReg_32:$sdst), | 
|  | 82 | !if(tied_in, (ins SSrc_b32:$src0, SReg_32:$sdst_in), | 
|  | 83 | (ins SSrc_b32:$src0)), | 
|  | 84 | "$sdst, $src0", pattern> { | 
|  | 85 | let Constraints = !if(tied_in, "$sdst = $sdst_in", ""); | 
|  | 86 | } | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 87 |  | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 88 | // 32-bit input, no output. | 
|  | 89 | class SOP1_0_32 <string opName, list<dag> pattern = []> : SOP1_Pseudo < | 
|  | 90 | opName, (outs), (ins SSrc_b32:$src0), | 
|  | 91 | "$src0", pattern> { | 
|  | 92 | let has_sdst = 0; | 
|  | 93 | } | 
|  | 94 |  | 
| Dmitry Preobrazhensky | 12194e9 | 2017-04-12 12:40:19 +0000 | [diff] [blame] | 95 | class SOP1_0_32R <string opName, list<dag> pattern = []> : SOP1_Pseudo < | 
|  | 96 | opName, (outs), (ins SReg_32:$src0), | 
|  | 97 | "$src0", pattern> { | 
|  | 98 | let has_sdst = 0; | 
|  | 99 | } | 
|  | 100 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 101 | class SOP1_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 102 | opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 103 | "$sdst, $src0", pattern | 
|  | 104 | >; | 
|  | 105 |  | 
|  | 106 | // 64-bit input, 32-bit output. | 
|  | 107 | class SOP1_32_64 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 108 | opName, (outs SReg_32:$sdst), (ins SSrc_b64:$src0), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 109 | "$sdst, $src0", pattern | 
|  | 110 | >; | 
|  | 111 |  | 
|  | 112 | // 32-bit input, 64-bit output. | 
| Matt Arsenault | fd6fd00 | 2019-02-25 19:24:46 +0000 | [diff] [blame] | 113 | class SOP1_64_32 <string opName, list<dag> pattern=[], bit tied_in = 0> : SOP1_Pseudo < | 
|  | 114 | opName, (outs SReg_64:$sdst), | 
|  | 115 | !if(tied_in, (ins SSrc_b32:$src0, SReg_64:$sdst_in), | 
|  | 116 | (ins SSrc_b32:$src0)), | 
|  | 117 | "$sdst, $src0", pattern> { | 
|  | 118 | let Constraints = !if(tied_in, "$sdst = $sdst_in", ""); | 
|  | 119 | } | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 120 |  | 
|  | 121 | // no input, 64-bit output. | 
|  | 122 | class SOP1_64_0 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < | 
|  | 123 | opName, (outs SReg_64:$sdst), (ins), "$sdst", pattern> { | 
|  | 124 | let has_src0 = 0; | 
|  | 125 | } | 
|  | 126 |  | 
|  | 127 | // 64-bit input, no output | 
|  | 128 | class SOP1_1 <string opName, list<dag> pattern=[]> : SOP1_Pseudo < | 
|  | 129 | opName, (outs), (ins SReg_64:$src0), "$src0", pattern> { | 
|  | 130 | let has_sdst = 0; | 
|  | 131 | } | 
|  | 132 |  | 
|  | 133 |  | 
|  | 134 | let isMoveImm = 1 in { | 
|  | 135 | let isReMaterializable = 1, isAsCheapAsAMove = 1 in { | 
|  | 136 | def S_MOV_B32 : SOP1_32 <"s_mov_b32">; | 
|  | 137 | def S_MOV_B64 : SOP1_64 <"s_mov_b64">; | 
|  | 138 | } // End isRematerializeable = 1 | 
|  | 139 |  | 
|  | 140 | let Uses = [SCC] in { | 
|  | 141 | def S_CMOV_B32 : SOP1_32 <"s_cmov_b32">; | 
|  | 142 | def S_CMOV_B64 : SOP1_64 <"s_cmov_b64">; | 
|  | 143 | } // End Uses = [SCC] | 
|  | 144 | } // End isMoveImm = 1 | 
|  | 145 |  | 
|  | 146 | let Defs = [SCC] in { | 
|  | 147 | def S_NOT_B32 : SOP1_32 <"s_not_b32", | 
|  | 148 | [(set i32:$sdst, (not i32:$src0))] | 
|  | 149 | >; | 
|  | 150 |  | 
|  | 151 | def S_NOT_B64 : SOP1_64 <"s_not_b64", | 
|  | 152 | [(set i64:$sdst, (not i64:$src0))] | 
|  | 153 | >; | 
|  | 154 | def S_WQM_B32 : SOP1_32 <"s_wqm_b32">; | 
| Marek Olsak | 2114fc3 | 2017-10-24 10:26:59 +0000 | [diff] [blame] | 155 | def S_WQM_B64 : SOP1_64 <"s_wqm_b64", | 
|  | 156 | [(set i1:$sdst, (int_amdgcn_wqm_vote i1:$src0))] | 
|  | 157 | >; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 158 | } // End Defs = [SCC] | 
|  | 159 |  | 
|  | 160 |  | 
|  | 161 | def S_BREV_B32 : SOP1_32 <"s_brev_b32", | 
|  | 162 | [(set i32:$sdst, (bitreverse i32:$src0))] | 
|  | 163 | >; | 
|  | 164 | def S_BREV_B64 : SOP1_64 <"s_brev_b64">; | 
|  | 165 |  | 
|  | 166 | let Defs = [SCC] in { | 
|  | 167 | def S_BCNT0_I32_B32 : SOP1_32 <"s_bcnt0_i32_b32">; | 
|  | 168 | def S_BCNT0_I32_B64 : SOP1_32_64 <"s_bcnt0_i32_b64">; | 
|  | 169 | def S_BCNT1_I32_B32 : SOP1_32 <"s_bcnt1_i32_b32", | 
|  | 170 | [(set i32:$sdst, (ctpop i32:$src0))] | 
|  | 171 | >; | 
|  | 172 | def S_BCNT1_I32_B64 : SOP1_32_64 <"s_bcnt1_i32_b64">; | 
|  | 173 | } // End Defs = [SCC] | 
|  | 174 |  | 
|  | 175 | def S_FF0_I32_B32 : SOP1_32 <"s_ff0_i32_b32">; | 
|  | 176 | def S_FF0_I32_B64 : SOP1_32_64 <"s_ff0_i32_b64">; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 177 | def S_FF1_I32_B64 : SOP1_32_64 <"s_ff1_i32_b64">; | 
|  | 178 |  | 
| Wei Ding | 5676aca | 2017-10-12 19:37:14 +0000 | [diff] [blame] | 179 | def S_FF1_I32_B32 : SOP1_32 <"s_ff1_i32_b32", | 
|  | 180 | [(set i32:$sdst, (AMDGPUffbl_b32 i32:$src0))] | 
|  | 181 | >; | 
|  | 182 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 183 | def S_FLBIT_I32_B32 : SOP1_32 <"s_flbit_i32_b32", | 
|  | 184 | [(set i32:$sdst, (AMDGPUffbh_u32 i32:$src0))] | 
|  | 185 | >; | 
|  | 186 |  | 
|  | 187 | def S_FLBIT_I32_B64 : SOP1_32_64 <"s_flbit_i32_b64">; | 
|  | 188 | def S_FLBIT_I32 : SOP1_32 <"s_flbit_i32", | 
|  | 189 | [(set i32:$sdst, (AMDGPUffbh_i32 i32:$src0))] | 
|  | 190 | >; | 
|  | 191 | def S_FLBIT_I32_I64 : SOP1_32_64 <"s_flbit_i32_i64">; | 
|  | 192 | def S_SEXT_I32_I8 : SOP1_32 <"s_sext_i32_i8", | 
|  | 193 | [(set i32:$sdst, (sext_inreg i32:$src0, i8))] | 
|  | 194 | >; | 
|  | 195 | def S_SEXT_I32_I16 : SOP1_32 <"s_sext_i32_i16", | 
|  | 196 | [(set i32:$sdst, (sext_inreg i32:$src0, i16))] | 
|  | 197 | >; | 
|  | 198 |  | 
| Matt Arsenault | fd6fd00 | 2019-02-25 19:24:46 +0000 | [diff] [blame] | 199 | def S_BITSET0_B32 : SOP1_32    <"s_bitset0_b32", [], 1>; | 
|  | 200 | def S_BITSET0_B64 : SOP1_64_32 <"s_bitset0_b64", [], 1>; | 
|  | 201 | def S_BITSET1_B32 : SOP1_32    <"s_bitset1_b32", [], 1>; | 
|  | 202 | def S_BITSET1_B64 : SOP1_64_32 <"s_bitset1_b64", [], 1>; | 
| Konstantin Zhuravlyov | b2ff8df | 2017-05-26 20:38:26 +0000 | [diff] [blame] | 203 | def S_GETPC_B64 : SOP1_64_0  <"s_getpc_b64", | 
|  | 204 | [(set i64:$sdst, (int_amdgcn_s_getpc))] | 
|  | 205 | >; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 206 |  | 
| Matt Arsenault | 2b1f9aa | 2017-05-17 21:56:25 +0000 | [diff] [blame] | 207 | let isTerminator = 1, isBarrier = 1, SchedRW = [WriteBranch] in { | 
|  | 208 |  | 
|  | 209 | let isBranch = 1, isIndirectBranch = 1 in { | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 210 | def S_SETPC_B64 : SOP1_1  <"s_setpc_b64">; | 
| Matt Arsenault | 2b1f9aa | 2017-05-17 21:56:25 +0000 | [diff] [blame] | 211 | } // End isBranch = 1, isIndirectBranch = 1 | 
|  | 212 |  | 
|  | 213 | let isReturn = 1 in { | 
|  | 214 | // Define variant marked as return rather than branch. | 
|  | 215 | def S_SETPC_B64_return : SOP1_1<"", [(AMDGPUret_flag i64:$src0)]>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 216 | } | 
| Matt Arsenault | 2b1f9aa | 2017-05-17 21:56:25 +0000 | [diff] [blame] | 217 | } // End isTerminator = 1, isBarrier = 1 | 
|  | 218 |  | 
|  | 219 | let isCall = 1 in { | 
|  | 220 | def S_SWAPPC_B64 : SOP1_64 <"s_swappc_b64" | 
|  | 221 | >; | 
|  | 222 | } | 
|  | 223 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 224 | def S_RFE_B64 : SOP1_1  <"s_rfe_b64">; | 
|  | 225 |  | 
|  | 226 | let hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] in { | 
|  | 227 |  | 
|  | 228 | def S_AND_SAVEEXEC_B64 : SOP1_64 <"s_and_saveexec_b64">; | 
|  | 229 | def S_OR_SAVEEXEC_B64 : SOP1_64 <"s_or_saveexec_b64">; | 
|  | 230 | def S_XOR_SAVEEXEC_B64 : SOP1_64 <"s_xor_saveexec_b64">; | 
|  | 231 | def S_ANDN2_SAVEEXEC_B64 : SOP1_64 <"s_andn2_saveexec_b64">; | 
|  | 232 | def S_ORN2_SAVEEXEC_B64 : SOP1_64 <"s_orn2_saveexec_b64">; | 
|  | 233 | def S_NAND_SAVEEXEC_B64 : SOP1_64 <"s_nand_saveexec_b64">; | 
|  | 234 | def S_NOR_SAVEEXEC_B64 : SOP1_64 <"s_nor_saveexec_b64">; | 
|  | 235 | def S_XNOR_SAVEEXEC_B64 : SOP1_64 <"s_xnor_saveexec_b64">; | 
|  | 236 |  | 
|  | 237 | } // End hasSideEffects = 1, Uses = [EXEC], Defs = [EXEC, SCC] | 
|  | 238 |  | 
|  | 239 | def S_QUADMASK_B32 : SOP1_32 <"s_quadmask_b32">; | 
|  | 240 | def S_QUADMASK_B64 : SOP1_64 <"s_quadmask_b64">; | 
|  | 241 |  | 
|  | 242 | let Uses = [M0] in { | 
|  | 243 | def S_MOVRELS_B32 : SOP1_32 <"s_movrels_b32">; | 
|  | 244 | def S_MOVRELS_B64 : SOP1_64 <"s_movrels_b64">; | 
|  | 245 | def S_MOVRELD_B32 : SOP1_32 <"s_movreld_b32">; | 
|  | 246 | def S_MOVRELD_B64 : SOP1_64 <"s_movreld_b64">; | 
|  | 247 | } // End Uses = [M0] | 
|  | 248 |  | 
| Dmitry Preobrazhensky | 12194e9 | 2017-04-12 12:40:19 +0000 | [diff] [blame] | 249 | def S_CBRANCH_JOIN : SOP1_0_32R <"s_cbranch_join">; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 250 | def S_MOV_REGRD_B32 : SOP1_32 <"s_mov_regrd_b32">; | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 251 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 252 | let Defs = [SCC] in { | 
|  | 253 | def S_ABS_I32 : SOP1_32 <"s_abs_i32">; | 
|  | 254 | } // End Defs = [SCC] | 
|  | 255 | def S_MOV_FED_B32 : SOP1_32 <"s_mov_fed_b32">; | 
|  | 256 |  | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 257 | let SubtargetPredicate = HasVGPRIndexMode in { | 
|  | 258 | def S_SET_GPR_IDX_IDX : SOP1_0_32<"s_set_gpr_idx_idx"> { | 
|  | 259 | let Uses = [M0]; | 
|  | 260 | let Defs = [M0]; | 
|  | 261 | } | 
|  | 262 | } | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 263 |  | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 264 | let SubtargetPredicate = isGFX9Plus in { | 
| Dmitry Preobrazhensky | f20aff5 | 2018-04-06 16:35:11 +0000 | [diff] [blame] | 265 | let hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] in { | 
|  | 266 | def S_ANDN1_SAVEEXEC_B64 : SOP1_64<"s_andn1_saveexec_b64">; | 
|  | 267 | def S_ORN1_SAVEEXEC_B64  : SOP1_64<"s_orn1_saveexec_b64">; | 
|  | 268 | def S_ANDN1_WREXEC_B64   : SOP1_64<"s_andn1_wrexec_b64">; | 
|  | 269 | def S_ANDN2_WREXEC_B64   : SOP1_64<"s_andn2_wrexec_b64">; | 
|  | 270 | } // End hasSideEffects = 1, Defs = [EXEC, SCC], Uses = [EXEC] | 
|  | 271 |  | 
|  | 272 | def S_BITREPLICATE_B64_B32 : SOP1_64_32<"s_bitreplicate_b64_b32">; | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 273 | } // End SubtargetPredicate = isGFX9Plus | 
| Dmitry Preobrazhensky | f20aff5 | 2018-04-06 16:35:11 +0000 | [diff] [blame] | 274 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 275 | //===----------------------------------------------------------------------===// | 
|  | 276 | // SOP2 Instructions | 
|  | 277 | //===----------------------------------------------------------------------===// | 
|  | 278 |  | 
|  | 279 | class SOP2_Pseudo<string opName, dag outs, dag ins, | 
|  | 280 | string asmOps, list<dag> pattern=[]> : | 
| Nicolai Haehnle | 4f850ea | 2018-03-26 13:56:53 +0000 | [diff] [blame] | 281 | SOP_Pseudo<opName, outs, ins, asmOps, pattern> { | 
|  | 282 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 283 | let mayLoad = 0; | 
|  | 284 | let mayStore = 0; | 
|  | 285 | let hasSideEffects = 0; | 
|  | 286 | let SALU = 1; | 
|  | 287 | let SOP2 = 1; | 
|  | 288 | let SchedRW = [WriteSALU]; | 
|  | 289 | let UseNamedOperandTable = 1; | 
|  | 290 |  | 
| Nicolai Haehnle | 4f850ea | 2018-03-26 13:56:53 +0000 | [diff] [blame] | 291 | let has_sdst = 1; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 292 |  | 
|  | 293 | // Pseudo instructions have no encodings, but adding this field here allows | 
|  | 294 | // us to do: | 
|  | 295 | // let sdst = xxx in { | 
|  | 296 | // for multiclasses that include both real and pseudo instructions. | 
|  | 297 | // field bits<7> sdst = 0; | 
|  | 298 | // let Size = 4; // Do we need size here? | 
|  | 299 | } | 
|  | 300 |  | 
| Nicolai Haehnle | 4f850ea | 2018-03-26 13:56:53 +0000 | [diff] [blame] | 301 | class SOP2_Real<bits<7> op, SOP_Pseudo ps> : | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 302 | InstSI <ps.OutOperandList, ps.InOperandList, | 
|  | 303 | ps.Mnemonic # " " # ps.AsmOperands, []>, | 
|  | 304 | Enc32 { | 
|  | 305 | let isPseudo = 0; | 
|  | 306 | let isCodeGenOnly = 0; | 
|  | 307 |  | 
|  | 308 | // copy relevant pseudo op flags | 
|  | 309 | let SubtargetPredicate = ps.SubtargetPredicate; | 
|  | 310 | let AsmMatchConverter  = ps.AsmMatchConverter; | 
| Dmitry Preobrazhensky | 61105ba | 2019-01-18 13:57:43 +0000 | [diff] [blame] | 311 | let UseNamedOperandTable = ps.UseNamedOperandTable; | 
|  | 312 | let TSFlags = ps.TSFlags; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 313 |  | 
|  | 314 | // encoding | 
|  | 315 | bits<7> sdst; | 
|  | 316 | bits<8> src0; | 
|  | 317 | bits<8> src1; | 
|  | 318 |  | 
|  | 319 | let Inst{7-0}   = src0; | 
|  | 320 | let Inst{15-8}  = src1; | 
|  | 321 | let Inst{22-16} = !if(ps.has_sdst, sdst, ?); | 
|  | 322 | let Inst{29-23} = op; | 
|  | 323 | let Inst{31-30} = 0x2; // encoding | 
|  | 324 | } | 
|  | 325 |  | 
|  | 326 |  | 
|  | 327 | class SOP2_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 328 | opName, (outs SReg_32:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 329 | "$sdst, $src0, $src1", pattern | 
|  | 330 | >; | 
|  | 331 |  | 
|  | 332 | class SOP2_64 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 333 | opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b64:$src1), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 334 | "$sdst, $src0, $src1", pattern | 
|  | 335 | >; | 
|  | 336 |  | 
|  | 337 | class SOP2_64_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 338 | opName, (outs SReg_64:$sdst), (ins SSrc_b64:$src0, SSrc_b32:$src1), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 339 | "$sdst, $src0, $src1", pattern | 
|  | 340 | >; | 
|  | 341 |  | 
|  | 342 | class SOP2_64_32_32 <string opName, list<dag> pattern=[]> : SOP2_Pseudo < | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 343 | opName, (outs SReg_64:$sdst), (ins SSrc_b32:$src0, SSrc_b32:$src1), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 344 | "$sdst, $src0, $src1", pattern | 
|  | 345 | >; | 
|  | 346 |  | 
| Graham Sellers | 04f7a4d | 2018-11-29 16:05:38 +0000 | [diff] [blame] | 347 | class UniformUnaryFrag<SDPatternOperator Op> : PatFrag < | 
|  | 348 | (ops node:$src0), | 
|  | 349 | (Op $src0), | 
|  | 350 | [{ return !N->isDivergent(); }] | 
|  | 351 | >; | 
|  | 352 |  | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 353 | class UniformBinFrag<SDPatternOperator Op> : PatFrag < | 
|  | 354 | (ops node:$src0, node:$src1), | 
|  | 355 | (Op $src0, $src1), | 
|  | 356 | [{ return !N->isDivergent(); }] | 
|  | 357 | >; | 
|  | 358 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 359 | let Defs = [SCC] in { // Carry out goes to SCC | 
|  | 360 | let isCommutable = 1 in { | 
|  | 361 | def S_ADD_U32 : SOP2_32 <"s_add_u32">; | 
|  | 362 | def S_ADD_I32 : SOP2_32 <"s_add_i32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 363 | [(set i32:$sdst, (UniformBinFrag<add> SSrc_b32:$src0, SSrc_b32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 364 | >; | 
|  | 365 | } // End isCommutable = 1 | 
|  | 366 |  | 
|  | 367 | def S_SUB_U32 : SOP2_32 <"s_sub_u32">; | 
|  | 368 | def S_SUB_I32 : SOP2_32 <"s_sub_i32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 369 | [(set i32:$sdst, (UniformBinFrag<sub> SSrc_b32:$src0, SSrc_b32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 370 | >; | 
|  | 371 |  | 
|  | 372 | let Uses = [SCC] in { // Carry in comes from SCC | 
|  | 373 | let isCommutable = 1 in { | 
|  | 374 | def S_ADDC_U32 : SOP2_32 <"s_addc_u32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 375 | [(set i32:$sdst, (UniformBinFrag<adde> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 376 | } // End isCommutable = 1 | 
|  | 377 |  | 
|  | 378 | def S_SUBB_U32 : SOP2_32 <"s_subb_u32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 379 | [(set i32:$sdst, (UniformBinFrag<sube> (i32 SSrc_b32:$src0), (i32 SSrc_b32:$src1)))]>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 380 | } // End Uses = [SCC] | 
|  | 381 |  | 
| Matt Arsenault | 479ba3a | 2016-09-07 06:25:55 +0000 | [diff] [blame] | 382 |  | 
|  | 383 | let isCommutable = 1 in { | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 384 | def S_MIN_I32 : SOP2_32 <"s_min_i32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 385 | [(set i32:$sdst, (UniformBinFrag<smin> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 386 | >; | 
|  | 387 | def S_MIN_U32 : SOP2_32 <"s_min_u32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 388 | [(set i32:$sdst, (UniformBinFrag<umin> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 389 | >; | 
|  | 390 | def S_MAX_I32 : SOP2_32 <"s_max_i32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 391 | [(set i32:$sdst, (UniformBinFrag<smax> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 392 | >; | 
|  | 393 | def S_MAX_U32 : SOP2_32 <"s_max_u32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 394 | [(set i32:$sdst, (UniformBinFrag<umax> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 395 | >; | 
| Matt Arsenault | 479ba3a | 2016-09-07 06:25:55 +0000 | [diff] [blame] | 396 | } // End isCommutable = 1 | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 397 | } // End Defs = [SCC] | 
|  | 398 |  | 
|  | 399 |  | 
|  | 400 | let Uses = [SCC] in { | 
|  | 401 | def S_CSELECT_B32 : SOP2_32 <"s_cselect_b32">; | 
|  | 402 | def S_CSELECT_B64 : SOP2_64 <"s_cselect_b64">; | 
|  | 403 | } // End Uses = [SCC] | 
|  | 404 |  | 
|  | 405 | let Defs = [SCC] in { | 
| Matt Arsenault | 479ba3a | 2016-09-07 06:25:55 +0000 | [diff] [blame] | 406 | let isCommutable = 1 in { | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 407 | def S_AND_B32 : SOP2_32 <"s_and_b32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 408 | [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 409 | >; | 
|  | 410 |  | 
|  | 411 | def S_AND_B64 : SOP2_64 <"s_and_b64", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 412 | [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, i64:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 413 | >; | 
|  | 414 |  | 
|  | 415 | def S_OR_B32 : SOP2_32 <"s_or_b32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 416 | [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 417 | >; | 
|  | 418 |  | 
|  | 419 | def S_OR_B64 : SOP2_64 <"s_or_b64", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 420 | [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, i64:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 421 | >; | 
|  | 422 |  | 
|  | 423 | def S_XOR_B32 : SOP2_32 <"s_xor_b32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 424 | [(set i32:$sdst, (UniformBinFrag<xor> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 425 | >; | 
|  | 426 |  | 
|  | 427 | def S_XOR_B64 : SOP2_64 <"s_xor_b64", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 428 | [(set i64:$sdst, (UniformBinFrag<xor> i64:$src0, i64:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 429 | >; | 
| Konstantin Zhuravlyov | ca8946a | 2017-09-18 21:22:45 +0000 | [diff] [blame] | 430 |  | 
|  | 431 | def S_XNOR_B32 : SOP2_32 <"s_xnor_b32", | 
|  | 432 | [(set i32:$sdst, (not (xor_oneuse i32:$src0, i32:$src1)))] | 
|  | 433 | >; | 
|  | 434 |  | 
|  | 435 | def S_XNOR_B64 : SOP2_64 <"s_xnor_b64", | 
|  | 436 | [(set i64:$sdst, (not (xor_oneuse i64:$src0, i64:$src1)))] | 
|  | 437 | >; | 
| Graham Sellers | 04f7a4d | 2018-11-29 16:05:38 +0000 | [diff] [blame] | 438 |  | 
|  | 439 | def S_NAND_B32 : SOP2_32 <"s_nand_b32", | 
|  | 440 | [(set i32:$sdst, (not (and_oneuse i32:$src0, i32:$src1)))] | 
|  | 441 | >; | 
|  | 442 |  | 
|  | 443 | def S_NAND_B64 : SOP2_64 <"s_nand_b64", | 
|  | 444 | [(set i64:$sdst, (not (and_oneuse i64:$src0, i64:$src1)))] | 
|  | 445 | >; | 
|  | 446 |  | 
|  | 447 | def S_NOR_B32 : SOP2_32 <"s_nor_b32", | 
|  | 448 | [(set i32:$sdst, (not (or_oneuse i32:$src0, i32:$src1)))] | 
|  | 449 | >; | 
|  | 450 |  | 
|  | 451 | def S_NOR_B64 : SOP2_64 <"s_nor_b64", | 
|  | 452 | [(set i64:$sdst, (not (or_oneuse i64:$src0, i64:$src1)))] | 
|  | 453 | >; | 
| Matt Arsenault | 479ba3a | 2016-09-07 06:25:55 +0000 | [diff] [blame] | 454 | } // End isCommutable = 1 | 
|  | 455 |  | 
| Graham Sellers | 04f7a4d | 2018-11-29 16:05:38 +0000 | [diff] [blame] | 456 | def S_ANDN2_B32 : SOP2_32 <"s_andn2_b32", | 
|  | 457 | [(set i32:$sdst, (UniformBinFrag<and> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))] | 
|  | 458 | >; | 
|  | 459 |  | 
|  | 460 | def S_ANDN2_B64 : SOP2_64 <"s_andn2_b64", | 
|  | 461 | [(set i64:$sdst, (UniformBinFrag<and> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))] | 
|  | 462 | >; | 
|  | 463 |  | 
|  | 464 | def S_ORN2_B32 : SOP2_32 <"s_orn2_b32", | 
|  | 465 | [(set i32:$sdst, (UniformBinFrag<or> i32:$src0, (UniformUnaryFrag<not> i32:$src1)))] | 
|  | 466 | >; | 
|  | 467 |  | 
|  | 468 | def S_ORN2_B64 : SOP2_64 <"s_orn2_b64", | 
|  | 469 | [(set i64:$sdst, (UniformBinFrag<or> i64:$src0, (UniformUnaryFrag<not> i64:$src1)))] | 
|  | 470 | >; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 471 | } // End Defs = [SCC] | 
|  | 472 |  | 
|  | 473 | // Use added complexity so these patterns are preferred to the VALU patterns. | 
|  | 474 | let AddedComplexity = 1 in { | 
|  | 475 |  | 
|  | 476 | let Defs = [SCC] in { | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 477 | // TODO: b64 versions require VOP3 change since v_lshlrev_b64 is VOP3 | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 478 | def S_LSHL_B32 : SOP2_32 <"s_lshl_b32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 479 | [(set i32:$sdst, (UniformBinFrag<shl> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 480 | >; | 
|  | 481 | def S_LSHL_B64 : SOP2_64_32 <"s_lshl_b64", | 
| Alexander Timofeev | b048fa3 | 2018-10-01 11:06:35 +0000 | [diff] [blame] | 482 | [(set i64:$sdst, (UniformBinFrag<shl> i64:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 483 | >; | 
|  | 484 | def S_LSHR_B32 : SOP2_32 <"s_lshr_b32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 485 | [(set i32:$sdst, (UniformBinFrag<srl> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 486 | >; | 
|  | 487 | def S_LSHR_B64 : SOP2_64_32 <"s_lshr_b64", | 
| Alexander Timofeev | b048fa3 | 2018-10-01 11:06:35 +0000 | [diff] [blame] | 488 | [(set i64:$sdst, (UniformBinFrag<srl> i64:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 489 | >; | 
|  | 490 | def S_ASHR_I32 : SOP2_32 <"s_ashr_i32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 491 | [(set i32:$sdst, (UniformBinFrag<sra> i32:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 492 | >; | 
|  | 493 | def S_ASHR_I64 : SOP2_64_32 <"s_ashr_i64", | 
| Alexander Timofeev | b048fa3 | 2018-10-01 11:06:35 +0000 | [diff] [blame] | 494 | [(set i64:$sdst, (UniformBinFrag<sra> i64:$src0, i32:$src1))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 495 | >; | 
|  | 496 | } // End Defs = [SCC] | 
|  | 497 |  | 
|  | 498 | def S_BFM_B32 : SOP2_32 <"s_bfm_b32", | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 499 | [(set i32:$sdst, (UniformBinFrag<AMDGPUbfm> i32:$src0, i32:$src1))]>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 500 | def S_BFM_B64 : SOP2_64_32_32 <"s_bfm_b64">; | 
| Alexander Timofeev | 36617f01 | 2018-09-21 10:31:22 +0000 | [diff] [blame] | 501 |  | 
|  | 502 | // TODO: S_MUL_I32 require V_MUL_LO_I32 from VOP3 change | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 503 | def S_MUL_I32 : SOP2_32 <"s_mul_i32", | 
| Matt Arsenault | 479ba3a | 2016-09-07 06:25:55 +0000 | [diff] [blame] | 504 | [(set i32:$sdst, (mul i32:$src0, i32:$src1))]> { | 
|  | 505 | let isCommutable = 1; | 
|  | 506 | } | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 507 |  | 
|  | 508 | } // End AddedComplexity = 1 | 
|  | 509 |  | 
|  | 510 | let Defs = [SCC] in { | 
|  | 511 | def S_BFE_U32 : SOP2_32 <"s_bfe_u32">; | 
|  | 512 | def S_BFE_I32 : SOP2_32 <"s_bfe_i32">; | 
|  | 513 | def S_BFE_U64 : SOP2_64_32 <"s_bfe_u64">; | 
|  | 514 | def S_BFE_I64 : SOP2_64_32 <"s_bfe_i64">; | 
|  | 515 | } // End Defs = [SCC] | 
|  | 516 |  | 
|  | 517 | def S_CBRANCH_G_FORK : SOP2_Pseudo < | 
|  | 518 | "s_cbranch_g_fork", (outs), | 
| Dmitry Preobrazhensky | 5714860 | 2017-04-14 11:52:26 +0000 | [diff] [blame] | 519 | (ins SCSrc_b64:$src0, SCSrc_b64:$src1), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 520 | "$src0, $src1" | 
|  | 521 | > { | 
|  | 522 | let has_sdst = 0; | 
|  | 523 | } | 
|  | 524 |  | 
|  | 525 | let Defs = [SCC] in { | 
|  | 526 | def S_ABSDIFF_I32 : SOP2_32 <"s_absdiff_i32">; | 
|  | 527 | } // End Defs = [SCC] | 
|  | 528 |  | 
| Stanislav Mekhanoshin | 5182302 | 2019-04-06 09:20:48 +0000 | [diff] [blame^] | 529 | let SubtargetPredicate = isGFX8GFX9 in { | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 530 | def S_RFE_RESTORE_B64 : SOP2_Pseudo < | 
|  | 531 | "s_rfe_restore_b64", (outs), | 
|  | 532 | (ins SSrc_b64:$src0, SSrc_b32:$src1), | 
|  | 533 | "$src0, $src1" | 
|  | 534 | > { | 
|  | 535 | let hasSideEffects = 1; | 
|  | 536 | let has_sdst = 0; | 
|  | 537 | } | 
|  | 538 | } | 
|  | 539 |  | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 540 | let SubtargetPredicate = isGFX9Plus in { | 
| Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 541 | def S_PACK_LL_B32_B16 : SOP2_32<"s_pack_ll_b32_b16">; | 
|  | 542 | def S_PACK_LH_B32_B16 : SOP2_32<"s_pack_lh_b32_b16">; | 
|  | 543 | def S_PACK_HH_B32_B16 : SOP2_32<"s_pack_hh_b32_b16">; | 
| Dmitry Preobrazhensky | 2f8e146 | 2018-04-09 13:10:33 +0000 | [diff] [blame] | 544 |  | 
|  | 545 | let Defs = [SCC] in { | 
|  | 546 | def S_LSHL1_ADD_U32 : SOP2_32<"s_lshl1_add_u32">; | 
|  | 547 | def S_LSHL2_ADD_U32 : SOP2_32<"s_lshl2_add_u32">; | 
|  | 548 | def S_LSHL3_ADD_U32 : SOP2_32<"s_lshl3_add_u32">; | 
|  | 549 | def S_LSHL4_ADD_U32 : SOP2_32<"s_lshl4_add_u32">; | 
|  | 550 | } // End Defs = [SCC] | 
|  | 551 |  | 
| Michael Liao | efb4f9e | 2019-03-18 20:40:09 +0000 | [diff] [blame] | 552 | let isCommutable = 1 in { | 
|  | 553 | def S_MUL_HI_U32 : SOP2_32<"s_mul_hi_u32", | 
|  | 554 | [(set i32:$sdst, (UniformBinFrag<mulhu> SSrc_b32:$src0, SSrc_b32:$src1))]>; | 
|  | 555 | def S_MUL_HI_I32 : SOP2_32<"s_mul_hi_i32", | 
|  | 556 | [(set i32:$sdst, (UniformBinFrag<mulhs> SSrc_b32:$src0, SSrc_b32:$src1))]>; | 
|  | 557 | } | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 558 | } // End SubtargetPredicate = isGFX9Plus | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 559 |  | 
|  | 560 | //===----------------------------------------------------------------------===// | 
|  | 561 | // SOPK Instructions | 
|  | 562 | //===----------------------------------------------------------------------===// | 
|  | 563 |  | 
|  | 564 | class SOPK_Pseudo <string opName, dag outs, dag ins, | 
|  | 565 | string asmOps, list<dag> pattern=[]> : | 
|  | 566 | InstSI <outs, ins, "", pattern>, | 
|  | 567 | SIMCInstr<opName, SIEncodingFamily.NONE> { | 
|  | 568 | let isPseudo = 1; | 
|  | 569 | let isCodeGenOnly = 1; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 570 | let mayLoad = 0; | 
|  | 571 | let mayStore = 0; | 
|  | 572 | let hasSideEffects = 0; | 
|  | 573 | let SALU = 1; | 
|  | 574 | let SOPK = 1; | 
|  | 575 | let SchedRW = [WriteSALU]; | 
|  | 576 | let UseNamedOperandTable = 1; | 
|  | 577 | string Mnemonic = opName; | 
|  | 578 | string AsmOperands = asmOps; | 
|  | 579 |  | 
|  | 580 | bits<1> has_sdst = 1; | 
|  | 581 | } | 
|  | 582 |  | 
|  | 583 | class SOPK_Real<bits<5> op, SOPK_Pseudo ps> : | 
|  | 584 | InstSI <ps.OutOperandList, ps.InOperandList, | 
|  | 585 | ps.Mnemonic # " " # ps.AsmOperands, []> { | 
|  | 586 | let isPseudo = 0; | 
|  | 587 | let isCodeGenOnly = 0; | 
|  | 588 |  | 
|  | 589 | // copy relevant pseudo op flags | 
|  | 590 | let SubtargetPredicate = ps.SubtargetPredicate; | 
|  | 591 | let AsmMatchConverter  = ps.AsmMatchConverter; | 
|  | 592 | let DisableEncoding    = ps.DisableEncoding; | 
|  | 593 | let Constraints        = ps.Constraints; | 
|  | 594 |  | 
|  | 595 | // encoding | 
|  | 596 | bits<7>  sdst; | 
|  | 597 | bits<16> simm16; | 
|  | 598 | bits<32> imm; | 
|  | 599 | } | 
|  | 600 |  | 
|  | 601 | class SOPK_Real32<bits<5> op, SOPK_Pseudo ps> : | 
|  | 602 | SOPK_Real <op, ps>, | 
|  | 603 | Enc32 { | 
|  | 604 | let Inst{15-0}  = simm16; | 
|  | 605 | let Inst{22-16} = !if(ps.has_sdst, sdst, ?); | 
|  | 606 | let Inst{27-23} = op; | 
|  | 607 | let Inst{31-28} = 0xb; //encoding | 
|  | 608 | } | 
|  | 609 |  | 
|  | 610 | class SOPK_Real64<bits<5> op, SOPK_Pseudo ps> : | 
|  | 611 | SOPK_Real<op, ps>, | 
|  | 612 | Enc64 { | 
|  | 613 | let Inst{15-0}  = simm16; | 
|  | 614 | let Inst{22-16} = !if(ps.has_sdst, sdst, ?); | 
|  | 615 | let Inst{27-23} = op; | 
|  | 616 | let Inst{31-28} = 0xb; //encoding | 
|  | 617 | let Inst{63-32} = imm; | 
|  | 618 | } | 
|  | 619 |  | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 620 | class SOPKInstTable <bit is_sopk, string cmpOp = ""> { | 
|  | 621 | bit IsSOPK = is_sopk; | 
|  | 622 | string BaseCmpOp = cmpOp; | 
|  | 623 | } | 
|  | 624 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 625 | class SOPK_32 <string opName, list<dag> pattern=[]> : SOPK_Pseudo < | 
|  | 626 | opName, | 
|  | 627 | (outs SReg_32:$sdst), | 
| Dmitry Preobrazhensky | c7d35a0 | 2017-04-26 15:34:19 +0000 | [diff] [blame] | 628 | (ins s16imm:$simm16), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 629 | "$sdst, $simm16", | 
|  | 630 | pattern>; | 
|  | 631 |  | 
| Dmitry Preobrazhensky | c7d35a0 | 2017-04-26 15:34:19 +0000 | [diff] [blame] | 632 | class SOPK_SCC <string opName, string base_op, bit isSignExt> : SOPK_Pseudo < | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 633 | opName, | 
|  | 634 | (outs), | 
| Dmitry Preobrazhensky | c7d35a0 | 2017-04-26 15:34:19 +0000 | [diff] [blame] | 635 | !if(isSignExt, | 
|  | 636 | (ins SReg_32:$sdst, s16imm:$simm16), | 
|  | 637 | (ins SReg_32:$sdst, u16imm:$simm16)), | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 638 | "$sdst, $simm16", []>, | 
|  | 639 | SOPKInstTable<1, base_op>{ | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 640 | let Defs = [SCC]; | 
|  | 641 | } | 
|  | 642 |  | 
|  | 643 | class SOPK_32TIE <string opName, list<dag> pattern=[]> : SOPK_Pseudo < | 
|  | 644 | opName, | 
|  | 645 | (outs SReg_32:$sdst), | 
| Dmitry Preobrazhensky | c7d35a0 | 2017-04-26 15:34:19 +0000 | [diff] [blame] | 646 | (ins SReg_32:$src0, s16imm:$simm16), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 647 | "$sdst, $simm16", | 
|  | 648 | pattern | 
|  | 649 | >; | 
|  | 650 |  | 
|  | 651 | let isReMaterializable = 1, isMoveImm = 1 in { | 
|  | 652 | def S_MOVK_I32 : SOPK_32 <"s_movk_i32">; | 
|  | 653 | } // End isReMaterializable = 1 | 
|  | 654 | let Uses = [SCC] in { | 
|  | 655 | def S_CMOVK_I32 : SOPK_32 <"s_cmovk_i32">; | 
|  | 656 | } | 
|  | 657 |  | 
|  | 658 | let isCompare = 1 in { | 
|  | 659 |  | 
|  | 660 | // This instruction is disabled for now until we can figure out how to teach | 
|  | 661 | // the instruction selector to correctly use the  S_CMP* vs V_CMP* | 
|  | 662 | // instructions. | 
|  | 663 | // | 
|  | 664 | // When this instruction is enabled the code generator sometimes produces this | 
|  | 665 | // invalid sequence: | 
|  | 666 | // | 
|  | 667 | // SCC = S_CMPK_EQ_I32 SGPR0, imm | 
|  | 668 | // VCC = COPY SCC | 
|  | 669 | // VGPR0 = V_CNDMASK VCC, VGPR0, VGPR1 | 
|  | 670 | // | 
|  | 671 | // def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", | 
|  | 672 | //   [(set i1:$dst, (setcc i32:$src0, imm:$src1, SETEQ))] | 
|  | 673 | // >; | 
|  | 674 |  | 
| Dmitry Preobrazhensky | c7d35a0 | 2017-04-26 15:34:19 +0000 | [diff] [blame] | 675 | def S_CMPK_EQ_I32 : SOPK_SCC <"s_cmpk_eq_i32", "s_cmp_eq_i32", 1>; | 
|  | 676 | def S_CMPK_LG_I32 : SOPK_SCC <"s_cmpk_lg_i32", "s_cmp_lg_i32", 1>; | 
|  | 677 | def S_CMPK_GT_I32 : SOPK_SCC <"s_cmpk_gt_i32", "s_cmp_gt_i32", 1>; | 
|  | 678 | def S_CMPK_GE_I32 : SOPK_SCC <"s_cmpk_ge_i32", "s_cmp_ge_i32", 1>; | 
|  | 679 | def S_CMPK_LT_I32 : SOPK_SCC <"s_cmpk_lt_i32", "s_cmp_lt_i32", 1>; | 
|  | 680 | def S_CMPK_LE_I32 : SOPK_SCC <"s_cmpk_le_i32", "s_cmp_le_i32", 1>; | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 681 |  | 
|  | 682 | let SOPKZext = 1 in { | 
| Dmitry Preobrazhensky | c7d35a0 | 2017-04-26 15:34:19 +0000 | [diff] [blame] | 683 | def S_CMPK_EQ_U32 : SOPK_SCC <"s_cmpk_eq_u32", "s_cmp_eq_u32", 0>; | 
|  | 684 | def S_CMPK_LG_U32 : SOPK_SCC <"s_cmpk_lg_u32", "s_cmp_lg_u32", 0>; | 
|  | 685 | def S_CMPK_GT_U32 : SOPK_SCC <"s_cmpk_gt_u32", "s_cmp_gt_u32", 0>; | 
|  | 686 | def S_CMPK_GE_U32 : SOPK_SCC <"s_cmpk_ge_u32", "s_cmp_ge_u32", 0>; | 
|  | 687 | def S_CMPK_LT_U32 : SOPK_SCC <"s_cmpk_lt_u32", "s_cmp_lt_u32", 0>; | 
|  | 688 | def S_CMPK_LE_U32 : SOPK_SCC <"s_cmpk_le_u32", "s_cmp_le_u32", 0>; | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 689 | } // End SOPKZext = 1 | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 690 | } // End isCompare = 1 | 
|  | 691 |  | 
|  | 692 | let Defs = [SCC], isCommutable = 1, DisableEncoding = "$src0", | 
|  | 693 | Constraints = "$sdst = $src0" in { | 
|  | 694 | def S_ADDK_I32 : SOPK_32TIE <"s_addk_i32">; | 
|  | 695 | def S_MULK_I32 : SOPK_32TIE <"s_mulk_i32">; | 
|  | 696 | } | 
|  | 697 |  | 
|  | 698 | def S_CBRANCH_I_FORK : SOPK_Pseudo < | 
|  | 699 | "s_cbranch_i_fork", | 
| Dmitry Preobrazhensky | c7d35a0 | 2017-04-26 15:34:19 +0000 | [diff] [blame] | 700 | (outs), (ins SReg_64:$sdst, s16imm:$simm16), | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 701 | "$sdst, $simm16" | 
|  | 702 | >; | 
|  | 703 |  | 
|  | 704 | let mayLoad = 1 in { | 
|  | 705 | def S_GETREG_B32 : SOPK_Pseudo < | 
|  | 706 | "s_getreg_b32", | 
|  | 707 | (outs SReg_32:$sdst), (ins hwreg:$simm16), | 
|  | 708 | "$sdst, $simm16" | 
|  | 709 | >; | 
|  | 710 | } | 
|  | 711 |  | 
| Tom Stellard | 8485fa0 | 2016-12-07 02:42:15 +0000 | [diff] [blame] | 712 | let hasSideEffects = 1 in { | 
|  | 713 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 714 | def S_SETREG_B32 : SOPK_Pseudo < | 
|  | 715 | "s_setreg_b32", | 
|  | 716 | (outs), (ins SReg_32:$sdst, hwreg:$simm16), | 
| Tom Stellard | 8485fa0 | 2016-12-07 02:42:15 +0000 | [diff] [blame] | 717 | "$simm16, $sdst", | 
|  | 718 | [(AMDGPUsetreg i32:$sdst, (i16 timm:$simm16))] | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 719 | >; | 
|  | 720 |  | 
|  | 721 | // FIXME: Not on SI? | 
|  | 722 | //def S_GETREG_REGRD_B32 : SOPK_32 <sopk<0x14, 0x13>, "s_getreg_regrd_b32">; | 
|  | 723 |  | 
|  | 724 | def S_SETREG_IMM32_B32 : SOPK_Pseudo < | 
|  | 725 | "s_setreg_imm32_b32", | 
|  | 726 | (outs), (ins i32imm:$imm, hwreg:$simm16), | 
| Matt Arsenault | 10c17ca | 2016-10-06 10:13:23 +0000 | [diff] [blame] | 727 | "$simm16, $imm"> { | 
|  | 728 | let Size = 8; // Unlike every other SOPK instruction. | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 729 | let has_sdst = 0; | 
|  | 730 | } | 
|  | 731 |  | 
| Tom Stellard | 8485fa0 | 2016-12-07 02:42:15 +0000 | [diff] [blame] | 732 | } // End hasSideEffects = 1 | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 733 |  | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 734 | let SubtargetPredicate = isGFX9Plus in { | 
| Dmitry Preobrazhensky | ae31223 | 2018-04-06 18:24:49 +0000 | [diff] [blame] | 735 | def S_CALL_B64 : SOPK_Pseudo< | 
|  | 736 | "s_call_b64", | 
|  | 737 | (outs SReg_64:$sdst), | 
|  | 738 | (ins s16imm:$simm16), | 
|  | 739 | "$sdst, $simm16"> { | 
|  | 740 | let isCall = 1; | 
|  | 741 | } | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 742 | } // End SubtargetPredicate = isGFX9Plus | 
| Dmitry Preobrazhensky | ae31223 | 2018-04-06 18:24:49 +0000 | [diff] [blame] | 743 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 744 | //===----------------------------------------------------------------------===// | 
|  | 745 | // SOPC Instructions | 
|  | 746 | //===----------------------------------------------------------------------===// | 
|  | 747 |  | 
|  | 748 | class SOPCe <bits<7> op> : Enc32 { | 
|  | 749 | bits<8> src0; | 
|  | 750 | bits<8> src1; | 
|  | 751 |  | 
|  | 752 | let Inst{7-0} = src0; | 
|  | 753 | let Inst{15-8} = src1; | 
|  | 754 | let Inst{22-16} = op; | 
|  | 755 | let Inst{31-23} = 0x17e; | 
|  | 756 | } | 
|  | 757 |  | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 758 | class SOPC <bits<7> op, dag outs, dag ins, string asm, | 
|  | 759 | list<dag> pattern = []> : | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 760 | InstSI<outs, ins, asm, pattern>, SOPCe <op> { | 
|  | 761 | let mayLoad = 0; | 
|  | 762 | let mayStore = 0; | 
|  | 763 | let hasSideEffects = 0; | 
|  | 764 | let SALU = 1; | 
|  | 765 | let SOPC = 1; | 
|  | 766 | let isCodeGenOnly = 0; | 
|  | 767 | let Defs = [SCC]; | 
|  | 768 | let SchedRW = [WriteSALU]; | 
|  | 769 | let UseNamedOperandTable = 1; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 770 | } | 
|  | 771 |  | 
|  | 772 | class SOPC_Base <bits<7> op, RegisterOperand rc0, RegisterOperand rc1, | 
|  | 773 | string opName, list<dag> pattern = []> : SOPC < | 
|  | 774 | op, (outs), (ins rc0:$src0, rc1:$src1), | 
|  | 775 | opName#" $src0, $src1", pattern > { | 
|  | 776 | let Defs = [SCC]; | 
|  | 777 | } | 
|  | 778 | class SOPC_Helper <bits<7> op, RegisterOperand rc, ValueType vt, | 
|  | 779 | string opName, PatLeaf cond> : SOPC_Base < | 
|  | 780 | op, rc, rc, opName, | 
|  | 781 | [(set SCC, (si_setcc_uniform vt:$src0, vt:$src1, cond))] > { | 
|  | 782 | } | 
|  | 783 |  | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 784 | class SOPC_CMP_32<bits<7> op, string opName, | 
|  | 785 | PatLeaf cond = COND_NULL, string revOp = opName> | 
|  | 786 | : SOPC_Helper<op, SSrc_b32, i32, opName, cond>, | 
|  | 787 | Commutable_REV<revOp, !eq(revOp, opName)>, | 
|  | 788 | SOPKInstTable<0, opName> { | 
|  | 789 | let isCompare = 1; | 
|  | 790 | let isCommutable = 1; | 
|  | 791 | } | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 792 |  | 
| Matt Arsenault | 7b1dc2c | 2016-09-17 02:02:19 +0000 | [diff] [blame] | 793 | class SOPC_CMP_64<bits<7> op, string opName, | 
|  | 794 | PatLeaf cond = COND_NULL, string revOp = opName> | 
|  | 795 | : SOPC_Helper<op, SSrc_b64, i64, opName, cond>, | 
|  | 796 | Commutable_REV<revOp, !eq(revOp, opName)> { | 
|  | 797 | let isCompare = 1; | 
|  | 798 | let isCommutable = 1; | 
|  | 799 | } | 
|  | 800 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 801 | class SOPC_32<bits<7> op, string opName, list<dag> pattern = []> | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 802 | : SOPC_Base<op, SSrc_b32, SSrc_b32, opName, pattern>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 803 |  | 
|  | 804 | class SOPC_64_32<bits<7> op, string opName, list<dag> pattern = []> | 
| Sam Kolton | 1eeb11b | 2016-09-09 14:44:04 +0000 | [diff] [blame] | 805 | : SOPC_Base<op, SSrc_b64, SSrc_b32, opName, pattern>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 806 |  | 
| Matt Arsenault | 5d8eb25 | 2016-09-30 01:50:20 +0000 | [diff] [blame] | 807 | def S_CMP_EQ_I32 : SOPC_CMP_32 <0x00, "s_cmp_eq_i32">; | 
|  | 808 | def S_CMP_LG_I32 : SOPC_CMP_32 <0x01, "s_cmp_lg_i32">; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 809 | def S_CMP_GT_I32 : SOPC_CMP_32 <0x02, "s_cmp_gt_i32", COND_SGT>; | 
|  | 810 | def S_CMP_GE_I32 : SOPC_CMP_32 <0x03, "s_cmp_ge_i32", COND_SGE>; | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 811 | def S_CMP_LT_I32 : SOPC_CMP_32 <0x04, "s_cmp_lt_i32", COND_SLT, "s_cmp_gt_i32">; | 
|  | 812 | def S_CMP_LE_I32 : SOPC_CMP_32 <0x05, "s_cmp_le_i32", COND_SLE, "s_cmp_ge_i32">; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 813 | def S_CMP_EQ_U32 : SOPC_CMP_32 <0x06, "s_cmp_eq_u32", COND_EQ>; | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 814 | def S_CMP_LG_U32 : SOPC_CMP_32 <0x07, "s_cmp_lg_u32", COND_NE>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 815 | def S_CMP_GT_U32 : SOPC_CMP_32 <0x08, "s_cmp_gt_u32", COND_UGT>; | 
|  | 816 | def S_CMP_GE_U32 : SOPC_CMP_32 <0x09, "s_cmp_ge_u32", COND_UGE>; | 
| Matt Arsenault | 7ccf6cd | 2016-09-16 21:41:16 +0000 | [diff] [blame] | 817 | def S_CMP_LT_U32 : SOPC_CMP_32 <0x0a, "s_cmp_lt_u32", COND_ULT, "s_cmp_gt_u32">; | 
|  | 818 | def S_CMP_LE_U32 : SOPC_CMP_32 <0x0b, "s_cmp_le_u32", COND_ULE, "s_cmp_ge_u32">; | 
|  | 819 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 820 | def S_BITCMP0_B32 : SOPC_32 <0x0c, "s_bitcmp0_b32">; | 
|  | 821 | def S_BITCMP1_B32 : SOPC_32 <0x0d, "s_bitcmp1_b32">; | 
|  | 822 | def S_BITCMP0_B64 : SOPC_64_32 <0x0e, "s_bitcmp0_b64">; | 
|  | 823 | def S_BITCMP1_B64 : SOPC_64_32 <0x0f, "s_bitcmp1_b64">; | 
|  | 824 | def S_SETVSKIP : SOPC_32 <0x10, "s_setvskip">; | 
|  | 825 |  | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 826 | let SubtargetPredicate = isGFX8Plus in { | 
| Matt Arsenault | 7b1dc2c | 2016-09-17 02:02:19 +0000 | [diff] [blame] | 827 | def S_CMP_EQ_U64 : SOPC_CMP_64 <0x12, "s_cmp_eq_u64", COND_EQ>; | 
|  | 828 | def S_CMP_LG_U64 : SOPC_CMP_64 <0x13, "s_cmp_lg_u64", COND_NE>; | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 829 | } // End SubtargetPredicate = isGFX8Plus | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 830 |  | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 831 | let SubtargetPredicate = HasVGPRIndexMode in { | 
|  | 832 | def S_SET_GPR_IDX_ON : SOPC <0x11, | 
|  | 833 | (outs), | 
|  | 834 | (ins SSrc_b32:$src0, GPRIdxMode:$src1), | 
|  | 835 | "s_set_gpr_idx_on $src0,$src1"> { | 
|  | 836 | let Defs = [M0]; // No scc def | 
|  | 837 | let Uses = [M0]; // Other bits of m0 unmodified. | 
|  | 838 | let hasSideEffects = 1; // Sets mode.gpr_idx_en | 
| Matt Arsenault | 2d8c289 | 2016-11-01 20:42:24 +0000 | [diff] [blame] | 839 | let FixedSize = 1; | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 840 | } | 
|  | 841 | } | 
|  | 842 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 843 | //===----------------------------------------------------------------------===// | 
|  | 844 | // SOPP Instructions | 
|  | 845 | //===----------------------------------------------------------------------===// | 
|  | 846 |  | 
|  | 847 | class SOPPe <bits<7> op> : Enc32 { | 
|  | 848 | bits <16> simm16; | 
|  | 849 |  | 
|  | 850 | let Inst{15-0} = simm16; | 
|  | 851 | let Inst{22-16} = op; | 
|  | 852 | let Inst{31-23} = 0x17f; // encoding | 
|  | 853 | } | 
|  | 854 |  | 
|  | 855 | class SOPP <bits<7> op, dag ins, string asm, list<dag> pattern = []> : | 
|  | 856 | InstSI <(outs), ins, asm, pattern >, SOPPe <op> { | 
|  | 857 |  | 
|  | 858 | let mayLoad = 0; | 
|  | 859 | let mayStore = 0; | 
|  | 860 | let hasSideEffects = 0; | 
|  | 861 | let SALU = 1; | 
|  | 862 | let SOPP = 1; | 
| Matt Arsenault | 10c17ca | 2016-10-06 10:13:23 +0000 | [diff] [blame] | 863 | let Size = 4; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 864 | let SchedRW = [WriteSALU]; | 
|  | 865 |  | 
|  | 866 | let UseNamedOperandTable = 1; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 867 | } | 
|  | 868 |  | 
|  | 869 |  | 
|  | 870 | def S_NOP : SOPP <0x00000000, (ins i16imm:$simm16), "s_nop $simm16">; | 
|  | 871 |  | 
|  | 872 | let isTerminator = 1 in { | 
|  | 873 |  | 
| David Stuttard | 20ea21c | 2019-03-12 09:52:58 +0000 | [diff] [blame] | 874 | def S_ENDPGM : SOPP <0x00000001, (ins EndpgmImm:$simm16), "s_endpgm $simm16"> { | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 875 | let isBarrier = 1; | 
| Matt Arsenault | 4e9c1e3 | 2016-10-28 23:00:38 +0000 | [diff] [blame] | 876 | let isReturn = 1; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 877 | } | 
|  | 878 |  | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 879 | def S_ENDPGM_SAVED : SOPP <0x0000001B, (ins), "s_endpgm_saved"> { | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 880 | let SubtargetPredicate = isGFX8Plus; | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 881 | let simm16 = 0; | 
|  | 882 | let isBarrier = 1; | 
|  | 883 | let isReturn = 1; | 
|  | 884 | } | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 885 |  | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 886 | let SubtargetPredicate = isGFX9Plus in { | 
| Dmitry Preobrazhensky | 306b1a0 | 2018-04-06 17:25:00 +0000 | [diff] [blame] | 887 | let isBarrier = 1, isReturn = 1, simm16 = 0 in { | 
|  | 888 | def S_ENDPGM_ORDERED_PS_DONE : | 
|  | 889 | SOPP<0x01e, (ins), "s_endpgm_ordered_ps_done">; | 
|  | 890 | } // End isBarrier = 1, isReturn = 1, simm16 = 0 | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 891 | } // End SubtargetPredicate = isGFX9Plus | 
| Dmitry Preobrazhensky | 306b1a0 | 2018-04-06 17:25:00 +0000 | [diff] [blame] | 892 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 893 | let isBranch = 1, SchedRW = [WriteBranch] in { | 
|  | 894 | def S_BRANCH : SOPP < | 
|  | 895 | 0x00000002, (ins sopp_brtarget:$simm16), "s_branch $simm16", | 
|  | 896 | [(br bb:$simm16)]> { | 
|  | 897 | let isBarrier = 1; | 
|  | 898 | } | 
|  | 899 |  | 
|  | 900 | let Uses = [SCC] in { | 
|  | 901 | def S_CBRANCH_SCC0 : SOPP < | 
|  | 902 | 0x00000004, (ins sopp_brtarget:$simm16), | 
|  | 903 | "s_cbranch_scc0 $simm16" | 
|  | 904 | >; | 
|  | 905 | def S_CBRANCH_SCC1 : SOPP < | 
|  | 906 | 0x00000005, (ins sopp_brtarget:$simm16), | 
| Matt Arsenault | d674e0a | 2017-10-10 20:34:49 +0000 | [diff] [blame] | 907 | "s_cbranch_scc1 $simm16" | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 908 | >; | 
|  | 909 | } // End Uses = [SCC] | 
|  | 910 |  | 
|  | 911 | let Uses = [VCC] in { | 
|  | 912 | def S_CBRANCH_VCCZ : SOPP < | 
|  | 913 | 0x00000006, (ins sopp_brtarget:$simm16), | 
|  | 914 | "s_cbranch_vccz $simm16" | 
|  | 915 | >; | 
|  | 916 | def S_CBRANCH_VCCNZ : SOPP < | 
|  | 917 | 0x00000007, (ins sopp_brtarget:$simm16), | 
|  | 918 | "s_cbranch_vccnz $simm16" | 
|  | 919 | >; | 
|  | 920 | } // End Uses = [VCC] | 
|  | 921 |  | 
|  | 922 | let Uses = [EXEC] in { | 
|  | 923 | def S_CBRANCH_EXECZ : SOPP < | 
|  | 924 | 0x00000008, (ins sopp_brtarget:$simm16), | 
|  | 925 | "s_cbranch_execz $simm16" | 
|  | 926 | >; | 
|  | 927 | def S_CBRANCH_EXECNZ : SOPP < | 
|  | 928 | 0x00000009, (ins sopp_brtarget:$simm16), | 
|  | 929 | "s_cbranch_execnz $simm16" | 
|  | 930 | >; | 
|  | 931 | } // End Uses = [EXEC] | 
|  | 932 |  | 
| Dmitry Preobrazhensky | 3ac6311 | 2017-04-05 17:26:45 +0000 | [diff] [blame] | 933 | def S_CBRANCH_CDBGSYS : SOPP < | 
|  | 934 | 0x00000017, (ins sopp_brtarget:$simm16), | 
|  | 935 | "s_cbranch_cdbgsys $simm16" | 
|  | 936 | >; | 
|  | 937 |  | 
|  | 938 | def S_CBRANCH_CDBGSYS_AND_USER : SOPP < | 
|  | 939 | 0x0000001A, (ins sopp_brtarget:$simm16), | 
|  | 940 | "s_cbranch_cdbgsys_and_user $simm16" | 
|  | 941 | >; | 
|  | 942 |  | 
|  | 943 | def S_CBRANCH_CDBGSYS_OR_USER : SOPP < | 
|  | 944 | 0x00000019, (ins sopp_brtarget:$simm16), | 
|  | 945 | "s_cbranch_cdbgsys_or_user $simm16" | 
|  | 946 | >; | 
|  | 947 |  | 
|  | 948 | def S_CBRANCH_CDBGUSER : SOPP < | 
|  | 949 | 0x00000018, (ins sopp_brtarget:$simm16), | 
|  | 950 | "s_cbranch_cdbguser $simm16" | 
|  | 951 | >; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 952 |  | 
|  | 953 | } // End isBranch = 1 | 
|  | 954 | } // End isTerminator = 1 | 
|  | 955 |  | 
|  | 956 | let hasSideEffects = 1 in { | 
|  | 957 | def S_BARRIER : SOPP <0x0000000a, (ins), "s_barrier", | 
|  | 958 | [(int_amdgcn_s_barrier)]> { | 
|  | 959 | let SchedRW = [WriteBarrier]; | 
|  | 960 | let simm16 = 0; | 
|  | 961 | let mayLoad = 1; | 
|  | 962 | let mayStore = 1; | 
|  | 963 | let isConvergent = 1; | 
|  | 964 | } | 
|  | 965 |  | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 966 | def S_WAKEUP : SOPP <0x00000003, (ins), "s_wakeup"> { | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 967 | let SubtargetPredicate = isGFX8Plus; | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 968 | let simm16 = 0; | 
|  | 969 | let mayLoad = 1; | 
|  | 970 | let mayStore = 1; | 
|  | 971 | } | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 972 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 973 | let mayLoad = 1, mayStore = 1, hasSideEffects = 1 in | 
|  | 974 | def S_WAITCNT : SOPP <0x0000000c, (ins WAIT_FLAG:$simm16), "s_waitcnt $simm16">; | 
|  | 975 | def S_SETHALT : SOPP <0x0000000d, (ins i16imm:$simm16), "s_sethalt $simm16">; | 
| Dmitry Preobrazhensky | 3ac6311 | 2017-04-05 17:26:45 +0000 | [diff] [blame] | 976 | def S_SETKILL : SOPP <0x0000000b, (ins i16imm:$simm16), "s_setkill $simm16">; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 977 |  | 
|  | 978 | // On SI the documentation says sleep for approximately 64 * low 2 | 
|  | 979 | // bits, consistent with the reported maximum of 448. On VI the | 
|  | 980 | // maximum reported is 960 cycles, so 960 / 64 = 15 max, so is the | 
|  | 981 | // maximum really 15 on VI? | 
|  | 982 | def S_SLEEP : SOPP <0x0000000e, (ins i32imm:$simm16), | 
|  | 983 | "s_sleep $simm16", [(int_amdgcn_s_sleep SIMM16bit:$simm16)]> { | 
|  | 984 | let hasSideEffects = 1; | 
|  | 985 | let mayLoad = 1; | 
|  | 986 | let mayStore = 1; | 
|  | 987 | } | 
|  | 988 |  | 
|  | 989 | def S_SETPRIO : SOPP <0x0000000f, (ins i16imm:$simm16), "s_setprio $simm16">; | 
|  | 990 |  | 
|  | 991 | let Uses = [EXEC, M0] in { | 
|  | 992 | // FIXME: Should this be mayLoad+mayStore? | 
|  | 993 | def S_SENDMSG : SOPP <0x00000010, (ins SendMsgImm:$simm16), "s_sendmsg $simm16", | 
|  | 994 | [(AMDGPUsendmsg (i32 imm:$simm16))] | 
|  | 995 | >; | 
| Jan Vesely | d48445d | 2017-01-04 18:06:55 +0000 | [diff] [blame] | 996 |  | 
|  | 997 | def S_SENDMSGHALT : SOPP <0x00000011, (ins SendMsgImm:$simm16), "s_sendmsghalt $simm16", | 
|  | 998 | [(AMDGPUsendmsghalt (i32 imm:$simm16))] | 
|  | 999 | >; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1000 | } // End Uses = [EXEC, M0] | 
|  | 1001 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1002 | def S_TRAP : SOPP <0x00000012, (ins i16imm:$simm16), "s_trap $simm16">; | 
|  | 1003 | def S_ICACHE_INV : SOPP <0x00000013, (ins), "s_icache_inv"> { | 
|  | 1004 | let simm16 = 0; | 
|  | 1005 | } | 
|  | 1006 | def S_INCPERFLEVEL : SOPP <0x00000014, (ins i32imm:$simm16), "s_incperflevel $simm16", | 
|  | 1007 | [(int_amdgcn_s_incperflevel SIMM16bit:$simm16)]> { | 
|  | 1008 | let hasSideEffects = 1; | 
|  | 1009 | let mayLoad = 1; | 
|  | 1010 | let mayStore = 1; | 
|  | 1011 | } | 
|  | 1012 | def S_DECPERFLEVEL : SOPP <0x00000015, (ins i32imm:$simm16), "s_decperflevel $simm16", | 
|  | 1013 | [(int_amdgcn_s_decperflevel SIMM16bit:$simm16)]> { | 
|  | 1014 | let hasSideEffects = 1; | 
|  | 1015 | let mayLoad = 1; | 
|  | 1016 | let mayStore = 1; | 
|  | 1017 | } | 
|  | 1018 | def S_TTRACEDATA : SOPP <0x00000016, (ins), "s_ttracedata"> { | 
|  | 1019 | let simm16 = 0; | 
|  | 1020 | } | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 1021 |  | 
|  | 1022 | let SubtargetPredicate = HasVGPRIndexMode in { | 
|  | 1023 | def S_SET_GPR_IDX_OFF : SOPP<0x1c, (ins), "s_set_gpr_idx_off"> { | 
|  | 1024 | let simm16 = 0; | 
|  | 1025 | } | 
|  | 1026 | } | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1027 | } // End hasSideEffects | 
|  | 1028 |  | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 1029 | let SubtargetPredicate = HasVGPRIndexMode in { | 
|  | 1030 | def S_SET_GPR_IDX_MODE : SOPP<0x1d, (ins GPRIdxMode:$simm16), | 
|  | 1031 | "s_set_gpr_idx_mode$simm16"> { | 
|  | 1032 | let Defs = [M0]; | 
|  | 1033 | } | 
|  | 1034 | } | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1035 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1036 | //===----------------------------------------------------------------------===// | 
|  | 1037 | // S_GETREG_B32 Intrinsic Pattern. | 
|  | 1038 | //===----------------------------------------------------------------------===// | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1039 | def : GCNPat < | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1040 | (int_amdgcn_s_getreg imm:$simm16), | 
|  | 1041 | (S_GETREG_B32 (as_i16imm $simm16)) | 
|  | 1042 | >; | 
|  | 1043 |  | 
|  | 1044 | //===----------------------------------------------------------------------===// | 
|  | 1045 | // SOP1 Patterns | 
|  | 1046 | //===----------------------------------------------------------------------===// | 
|  | 1047 |  | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1048 | def : GCNPat < | 
| David Stuttard | 20ea21c | 2019-03-12 09:52:58 +0000 | [diff] [blame] | 1049 | (AMDGPUendpgm), | 
|  | 1050 | (S_ENDPGM (i16 0)) | 
|  | 1051 | >; | 
|  | 1052 |  | 
|  | 1053 | def : GCNPat < | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1054 | (i64 (ctpop i64:$src)), | 
|  | 1055 | (i64 (REG_SEQUENCE SReg_64, | 
|  | 1056 | (i32 (COPY_TO_REGCLASS (S_BCNT1_I32_B64 $src), SReg_32)), sub0, | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 1057 | (S_MOV_B32 (i32 0)), sub1)) | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1058 | >; | 
|  | 1059 |  | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1060 | def : GCNPat < | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1061 | (i32 (smax i32:$x, (i32 (ineg i32:$x)))), | 
|  | 1062 | (S_ABS_I32 $x) | 
|  | 1063 | >; | 
|  | 1064 |  | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1065 | def : GCNPat < | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 1066 | (i16 imm:$imm), | 
|  | 1067 | (S_MOV_B32 imm:$imm) | 
|  | 1068 | >; | 
|  | 1069 |  | 
|  | 1070 | // Same as a 32-bit inreg | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1071 | def : GCNPat< | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 1072 | (i32 (sext i16:$src)), | 
|  | 1073 | (S_SEXT_I32_I16 $src) | 
|  | 1074 | >; | 
|  | 1075 |  | 
|  | 1076 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1077 | //===----------------------------------------------------------------------===// | 
|  | 1078 | // SOP2 Patterns | 
|  | 1079 | //===----------------------------------------------------------------------===// | 
|  | 1080 |  | 
|  | 1081 | // V_ADD_I32_e32/S_ADD_U32 produces carry in VCC/SCC. For the vector | 
|  | 1082 | // case, the sgpr-copies pass will fix this to use the vector version. | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1083 | def : GCNPat < | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1084 | (i32 (addc i32:$src0, i32:$src1)), | 
|  | 1085 | (S_ADD_U32 $src0, $src1) | 
|  | 1086 | >; | 
|  | 1087 |  | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 1088 | // FIXME: We need to use COPY_TO_REGCLASS to work-around the fact that | 
|  | 1089 | // REG_SEQUENCE patterns don't support instructions with multiple | 
|  | 1090 | // outputs. | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1091 | def : GCNPat< | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 1092 | (i64 (zext i16:$src)), | 
|  | 1093 | (REG_SEQUENCE SReg_64, | 
|  | 1094 | (i32 (COPY_TO_REGCLASS (S_AND_B32 $src, (S_MOV_B32 (i32 0xffff))), SGPR_32)), sub0, | 
|  | 1095 | (S_MOV_B32 (i32 0)), sub1) | 
|  | 1096 | >; | 
|  | 1097 |  | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1098 | def : GCNPat < | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 1099 | (i64 (sext i16:$src)), | 
|  | 1100 | (REG_SEQUENCE SReg_64, (i32 (S_SEXT_I32_I16 $src)), sub0, | 
|  | 1101 | (i32 (COPY_TO_REGCLASS (S_ASHR_I32 (i32 (S_SEXT_I32_I16 $src)), (S_MOV_B32 (i32 31))), SGPR_32)), sub1) | 
|  | 1102 | >; | 
|  | 1103 |  | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1104 | def : GCNPat< | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 1105 | (i32 (zext i16:$src)), | 
|  | 1106 | (S_AND_B32 (S_MOV_B32 (i32 0xffff)), $src) | 
|  | 1107 | >; | 
|  | 1108 |  | 
|  | 1109 |  | 
|  | 1110 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1111 | //===----------------------------------------------------------------------===// | 
|  | 1112 | // SOPP Patterns | 
|  | 1113 | //===----------------------------------------------------------------------===// | 
|  | 1114 |  | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 1115 | def : GCNPat < | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1116 | (int_amdgcn_s_waitcnt i32:$simm16), | 
|  | 1117 | (S_WAITCNT (as_i16imm $simm16)) | 
|  | 1118 | >; | 
|  | 1119 |  | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1120 |  | 
|  | 1121 | //===----------------------------------------------------------------------===// | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 1122 | // Target-specific instruction encodings. | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1123 | //===----------------------------------------------------------------------===// | 
|  | 1124 |  | 
|  | 1125 | class Select_si<string opName> : | 
|  | 1126 | SIMCInstr<opName, SIEncodingFamily.SI> { | 
| Stanislav Mekhanoshin | 7895c03 | 2019-04-05 18:24:34 +0000 | [diff] [blame] | 1127 | list<Predicate> AssemblerPredicates = [isGFX6GFX7]; | 
|  | 1128 | string DecoderNamespace = "GFX6GFX7"; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1129 | } | 
|  | 1130 |  | 
|  | 1131 | class SOP1_Real_si<bits<8> op, SOP1_Pseudo ps> : | 
|  | 1132 | SOP1_Real<op, ps>, | 
|  | 1133 | Select_si<ps.Mnemonic>; | 
|  | 1134 |  | 
|  | 1135 | class SOP2_Real_si<bits<7> op, SOP2_Pseudo ps> : | 
|  | 1136 | SOP2_Real<op, ps>, | 
|  | 1137 | Select_si<ps.Mnemonic>; | 
|  | 1138 |  | 
|  | 1139 | class SOPK_Real_si<bits<5> op, SOPK_Pseudo ps> : | 
|  | 1140 | SOPK_Real32<op, ps>, | 
|  | 1141 | Select_si<ps.Mnemonic>; | 
|  | 1142 |  | 
|  | 1143 | def S_MOV_B32_si           : SOP1_Real_si <0x03, S_MOV_B32>; | 
|  | 1144 | def S_MOV_B64_si           : SOP1_Real_si <0x04, S_MOV_B64>; | 
|  | 1145 | def S_CMOV_B32_si          : SOP1_Real_si <0x05, S_CMOV_B32>; | 
|  | 1146 | def S_CMOV_B64_si          : SOP1_Real_si <0x06, S_CMOV_B64>; | 
|  | 1147 | def S_NOT_B32_si           : SOP1_Real_si <0x07, S_NOT_B32>; | 
|  | 1148 | def S_NOT_B64_si           : SOP1_Real_si <0x08, S_NOT_B64>; | 
|  | 1149 | def S_WQM_B32_si           : SOP1_Real_si <0x09, S_WQM_B32>; | 
|  | 1150 | def S_WQM_B64_si           : SOP1_Real_si <0x0a, S_WQM_B64>; | 
|  | 1151 | def S_BREV_B32_si          : SOP1_Real_si <0x0b, S_BREV_B32>; | 
|  | 1152 | def S_BREV_B64_si          : SOP1_Real_si <0x0c, S_BREV_B64>; | 
|  | 1153 | def S_BCNT0_I32_B32_si     : SOP1_Real_si <0x0d, S_BCNT0_I32_B32>; | 
|  | 1154 | def S_BCNT0_I32_B64_si     : SOP1_Real_si <0x0e, S_BCNT0_I32_B64>; | 
|  | 1155 | def S_BCNT1_I32_B32_si     : SOP1_Real_si <0x0f, S_BCNT1_I32_B32>; | 
|  | 1156 | def S_BCNT1_I32_B64_si     : SOP1_Real_si <0x10, S_BCNT1_I32_B64>; | 
|  | 1157 | def S_FF0_I32_B32_si       : SOP1_Real_si <0x11, S_FF0_I32_B32>; | 
|  | 1158 | def S_FF0_I32_B64_si       : SOP1_Real_si <0x12, S_FF0_I32_B64>; | 
|  | 1159 | def S_FF1_I32_B32_si       : SOP1_Real_si <0x13, S_FF1_I32_B32>; | 
|  | 1160 | def S_FF1_I32_B64_si       : SOP1_Real_si <0x14, S_FF1_I32_B64>; | 
|  | 1161 | def S_FLBIT_I32_B32_si     : SOP1_Real_si <0x15, S_FLBIT_I32_B32>; | 
|  | 1162 | def S_FLBIT_I32_B64_si     : SOP1_Real_si <0x16, S_FLBIT_I32_B64>; | 
|  | 1163 | def S_FLBIT_I32_si         : SOP1_Real_si <0x17, S_FLBIT_I32>; | 
|  | 1164 | def S_FLBIT_I32_I64_si     : SOP1_Real_si <0x18, S_FLBIT_I32_I64>; | 
|  | 1165 | def S_SEXT_I32_I8_si       : SOP1_Real_si <0x19, S_SEXT_I32_I8>; | 
|  | 1166 | def S_SEXT_I32_I16_si      : SOP1_Real_si <0x1a, S_SEXT_I32_I16>; | 
|  | 1167 | def S_BITSET0_B32_si       : SOP1_Real_si <0x1b, S_BITSET0_B32>; | 
|  | 1168 | def S_BITSET0_B64_si       : SOP1_Real_si <0x1c, S_BITSET0_B64>; | 
|  | 1169 | def S_BITSET1_B32_si       : SOP1_Real_si <0x1d, S_BITSET1_B32>; | 
|  | 1170 | def S_BITSET1_B64_si       : SOP1_Real_si <0x1e, S_BITSET1_B64>; | 
|  | 1171 | def S_GETPC_B64_si         : SOP1_Real_si <0x1f, S_GETPC_B64>; | 
|  | 1172 | def S_SETPC_B64_si         : SOP1_Real_si <0x20, S_SETPC_B64>; | 
|  | 1173 | def S_SWAPPC_B64_si        : SOP1_Real_si <0x21, S_SWAPPC_B64>; | 
|  | 1174 | def S_RFE_B64_si           : SOP1_Real_si <0x22, S_RFE_B64>; | 
|  | 1175 | def S_AND_SAVEEXEC_B64_si  : SOP1_Real_si <0x24, S_AND_SAVEEXEC_B64>; | 
|  | 1176 | def S_OR_SAVEEXEC_B64_si   : SOP1_Real_si <0x25, S_OR_SAVEEXEC_B64>; | 
|  | 1177 | def S_XOR_SAVEEXEC_B64_si  : SOP1_Real_si <0x26, S_XOR_SAVEEXEC_B64>; | 
|  | 1178 | def S_ANDN2_SAVEEXEC_B64_si: SOP1_Real_si <0x27, S_ANDN2_SAVEEXEC_B64>; | 
|  | 1179 | def S_ORN2_SAVEEXEC_B64_si : SOP1_Real_si <0x28, S_ORN2_SAVEEXEC_B64>; | 
|  | 1180 | def S_NAND_SAVEEXEC_B64_si : SOP1_Real_si <0x29, S_NAND_SAVEEXEC_B64>; | 
|  | 1181 | def S_NOR_SAVEEXEC_B64_si  : SOP1_Real_si <0x2a, S_NOR_SAVEEXEC_B64>; | 
|  | 1182 | def S_XNOR_SAVEEXEC_B64_si : SOP1_Real_si <0x2b, S_XNOR_SAVEEXEC_B64>; | 
|  | 1183 | def S_QUADMASK_B32_si      : SOP1_Real_si <0x2c, S_QUADMASK_B32>; | 
|  | 1184 | def S_QUADMASK_B64_si      : SOP1_Real_si <0x2d, S_QUADMASK_B64>; | 
|  | 1185 | def S_MOVRELS_B32_si       : SOP1_Real_si <0x2e, S_MOVRELS_B32>; | 
|  | 1186 | def S_MOVRELS_B64_si       : SOP1_Real_si <0x2f, S_MOVRELS_B64>; | 
|  | 1187 | def S_MOVRELD_B32_si       : SOP1_Real_si <0x30, S_MOVRELD_B32>; | 
|  | 1188 | def S_MOVRELD_B64_si       : SOP1_Real_si <0x31, S_MOVRELD_B64>; | 
|  | 1189 | def S_CBRANCH_JOIN_si      : SOP1_Real_si <0x32, S_CBRANCH_JOIN>; | 
|  | 1190 | def S_MOV_REGRD_B32_si     : SOP1_Real_si <0x33, S_MOV_REGRD_B32>; | 
|  | 1191 | def S_ABS_I32_si           : SOP1_Real_si <0x34, S_ABS_I32>; | 
|  | 1192 | def S_MOV_FED_B32_si       : SOP1_Real_si <0x35, S_MOV_FED_B32>; | 
|  | 1193 |  | 
|  | 1194 | def S_ADD_U32_si           : SOP2_Real_si <0x00, S_ADD_U32>; | 
|  | 1195 | def S_ADD_I32_si           : SOP2_Real_si <0x02, S_ADD_I32>; | 
|  | 1196 | def S_SUB_U32_si           : SOP2_Real_si <0x01, S_SUB_U32>; | 
|  | 1197 | def S_SUB_I32_si           : SOP2_Real_si <0x03, S_SUB_I32>; | 
|  | 1198 | def S_ADDC_U32_si          : SOP2_Real_si <0x04, S_ADDC_U32>; | 
|  | 1199 | def S_SUBB_U32_si          : SOP2_Real_si <0x05, S_SUBB_U32>; | 
|  | 1200 | def S_MIN_I32_si           : SOP2_Real_si <0x06, S_MIN_I32>; | 
|  | 1201 | def S_MIN_U32_si           : SOP2_Real_si <0x07, S_MIN_U32>; | 
|  | 1202 | def S_MAX_I32_si           : SOP2_Real_si <0x08, S_MAX_I32>; | 
|  | 1203 | def S_MAX_U32_si           : SOP2_Real_si <0x09, S_MAX_U32>; | 
|  | 1204 | def S_CSELECT_B32_si       : SOP2_Real_si <0x0a, S_CSELECT_B32>; | 
|  | 1205 | def S_CSELECT_B64_si       : SOP2_Real_si <0x0b, S_CSELECT_B64>; | 
|  | 1206 | def S_AND_B32_si           : SOP2_Real_si <0x0e, S_AND_B32>; | 
|  | 1207 | def S_AND_B64_si           : SOP2_Real_si <0x0f, S_AND_B64>; | 
|  | 1208 | def S_OR_B32_si            : SOP2_Real_si <0x10, S_OR_B32>; | 
|  | 1209 | def S_OR_B64_si            : SOP2_Real_si <0x11, S_OR_B64>; | 
|  | 1210 | def S_XOR_B32_si           : SOP2_Real_si <0x12, S_XOR_B32>; | 
|  | 1211 | def S_XOR_B64_si           : SOP2_Real_si <0x13, S_XOR_B64>; | 
|  | 1212 | def S_ANDN2_B32_si         : SOP2_Real_si <0x14, S_ANDN2_B32>; | 
|  | 1213 | def S_ANDN2_B64_si         : SOP2_Real_si <0x15, S_ANDN2_B64>; | 
|  | 1214 | def S_ORN2_B32_si          : SOP2_Real_si <0x16, S_ORN2_B32>; | 
|  | 1215 | def S_ORN2_B64_si          : SOP2_Real_si <0x17, S_ORN2_B64>; | 
|  | 1216 | def S_NAND_B32_si          : SOP2_Real_si <0x18, S_NAND_B32>; | 
|  | 1217 | def S_NAND_B64_si          : SOP2_Real_si <0x19, S_NAND_B64>; | 
|  | 1218 | def S_NOR_B32_si           : SOP2_Real_si <0x1a, S_NOR_B32>; | 
|  | 1219 | def S_NOR_B64_si           : SOP2_Real_si <0x1b, S_NOR_B64>; | 
|  | 1220 | def S_XNOR_B32_si          : SOP2_Real_si <0x1c, S_XNOR_B32>; | 
|  | 1221 | def S_XNOR_B64_si          : SOP2_Real_si <0x1d, S_XNOR_B64>; | 
|  | 1222 | def S_LSHL_B32_si          : SOP2_Real_si <0x1e, S_LSHL_B32>; | 
|  | 1223 | def S_LSHL_B64_si          : SOP2_Real_si <0x1f, S_LSHL_B64>; | 
|  | 1224 | def S_LSHR_B32_si          : SOP2_Real_si <0x20, S_LSHR_B32>; | 
|  | 1225 | def S_LSHR_B64_si          : SOP2_Real_si <0x21, S_LSHR_B64>; | 
|  | 1226 | def S_ASHR_I32_si          : SOP2_Real_si <0x22, S_ASHR_I32>; | 
|  | 1227 | def S_ASHR_I64_si          : SOP2_Real_si <0x23, S_ASHR_I64>; | 
|  | 1228 | def S_BFM_B32_si           : SOP2_Real_si <0x24, S_BFM_B32>; | 
|  | 1229 | def S_BFM_B64_si           : SOP2_Real_si <0x25, S_BFM_B64>; | 
|  | 1230 | def S_MUL_I32_si           : SOP2_Real_si <0x26, S_MUL_I32>; | 
|  | 1231 | def S_BFE_U32_si           : SOP2_Real_si <0x27, S_BFE_U32>; | 
|  | 1232 | def S_BFE_I32_si           : SOP2_Real_si <0x28, S_BFE_I32>; | 
|  | 1233 | def S_BFE_U64_si           : SOP2_Real_si <0x29, S_BFE_U64>; | 
|  | 1234 | def S_BFE_I64_si           : SOP2_Real_si <0x2a, S_BFE_I64>; | 
|  | 1235 | def S_CBRANCH_G_FORK_si    : SOP2_Real_si <0x2b, S_CBRANCH_G_FORK>; | 
|  | 1236 | def S_ABSDIFF_I32_si       : SOP2_Real_si <0x2c, S_ABSDIFF_I32>; | 
|  | 1237 |  | 
|  | 1238 | def S_MOVK_I32_si          : SOPK_Real_si <0x00, S_MOVK_I32>; | 
|  | 1239 | def S_CMOVK_I32_si         : SOPK_Real_si <0x02, S_CMOVK_I32>; | 
|  | 1240 | def S_CMPK_EQ_I32_si       : SOPK_Real_si <0x03, S_CMPK_EQ_I32>; | 
|  | 1241 | def S_CMPK_LG_I32_si       : SOPK_Real_si <0x04, S_CMPK_LG_I32>; | 
|  | 1242 | def S_CMPK_GT_I32_si       : SOPK_Real_si <0x05, S_CMPK_GT_I32>; | 
|  | 1243 | def S_CMPK_GE_I32_si       : SOPK_Real_si <0x06, S_CMPK_GE_I32>; | 
|  | 1244 | def S_CMPK_LT_I32_si       : SOPK_Real_si <0x07, S_CMPK_LT_I32>; | 
|  | 1245 | def S_CMPK_LE_I32_si       : SOPK_Real_si <0x08, S_CMPK_LE_I32>; | 
|  | 1246 | def S_CMPK_EQ_U32_si       : SOPK_Real_si <0x09, S_CMPK_EQ_U32>; | 
|  | 1247 | def S_CMPK_LG_U32_si       : SOPK_Real_si <0x0a, S_CMPK_LG_U32>; | 
|  | 1248 | def S_CMPK_GT_U32_si       : SOPK_Real_si <0x0b, S_CMPK_GT_U32>; | 
|  | 1249 | def S_CMPK_GE_U32_si       : SOPK_Real_si <0x0c, S_CMPK_GE_U32>; | 
|  | 1250 | def S_CMPK_LT_U32_si       : SOPK_Real_si <0x0d, S_CMPK_LT_U32>; | 
|  | 1251 | def S_CMPK_LE_U32_si       : SOPK_Real_si <0x0e, S_CMPK_LE_U32>; | 
|  | 1252 | def S_ADDK_I32_si          : SOPK_Real_si <0x0f, S_ADDK_I32>; | 
|  | 1253 | def S_MULK_I32_si          : SOPK_Real_si <0x10, S_MULK_I32>; | 
|  | 1254 | def S_CBRANCH_I_FORK_si    : SOPK_Real_si <0x11, S_CBRANCH_I_FORK>; | 
|  | 1255 | def S_GETREG_B32_si        : SOPK_Real_si <0x12, S_GETREG_B32>; | 
|  | 1256 | def S_SETREG_B32_si        : SOPK_Real_si <0x13, S_SETREG_B32>; | 
|  | 1257 | //def S_GETREG_REGRD_B32_si  : SOPK_Real_si <0x14, S_GETREG_REGRD_B32>; // see pseudo for comments | 
|  | 1258 | def S_SETREG_IMM32_B32_si  : SOPK_Real64<0x15, S_SETREG_IMM32_B32>, | 
|  | 1259 | Select_si<S_SETREG_IMM32_B32.Mnemonic>; | 
|  | 1260 |  | 
|  | 1261 |  | 
|  | 1262 | class Select_vi<string opName> : | 
|  | 1263 | SIMCInstr<opName, SIEncodingFamily.VI> { | 
| Stanislav Mekhanoshin | 5182302 | 2019-04-06 09:20:48 +0000 | [diff] [blame^] | 1264 | list<Predicate> AssemblerPredicates = [isGFX8GFX9]; | 
|  | 1265 | string DecoderNamespace = "GFX8"; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1266 | } | 
|  | 1267 |  | 
|  | 1268 | class SOP1_Real_vi<bits<8> op, SOP1_Pseudo ps> : | 
|  | 1269 | SOP1_Real<op, ps>, | 
|  | 1270 | Select_vi<ps.Mnemonic>; | 
|  | 1271 |  | 
|  | 1272 |  | 
|  | 1273 | class SOP2_Real_vi<bits<7> op, SOP2_Pseudo ps> : | 
|  | 1274 | SOP2_Real<op, ps>, | 
|  | 1275 | Select_vi<ps.Mnemonic>; | 
|  | 1276 |  | 
|  | 1277 | class SOPK_Real_vi<bits<5> op, SOPK_Pseudo ps> : | 
|  | 1278 | SOPK_Real32<op, ps>, | 
|  | 1279 | Select_vi<ps.Mnemonic>; | 
|  | 1280 |  | 
|  | 1281 | def S_MOV_B32_vi           : SOP1_Real_vi <0x00, S_MOV_B32>; | 
|  | 1282 | def S_MOV_B64_vi           : SOP1_Real_vi <0x01, S_MOV_B64>; | 
|  | 1283 | def S_CMOV_B32_vi          : SOP1_Real_vi <0x02, S_CMOV_B32>; | 
|  | 1284 | def S_CMOV_B64_vi          : SOP1_Real_vi <0x03, S_CMOV_B64>; | 
|  | 1285 | def S_NOT_B32_vi           : SOP1_Real_vi <0x04, S_NOT_B32>; | 
|  | 1286 | def S_NOT_B64_vi           : SOP1_Real_vi <0x05, S_NOT_B64>; | 
|  | 1287 | def S_WQM_B32_vi           : SOP1_Real_vi <0x06, S_WQM_B32>; | 
|  | 1288 | def S_WQM_B64_vi           : SOP1_Real_vi <0x07, S_WQM_B64>; | 
|  | 1289 | def S_BREV_B32_vi          : SOP1_Real_vi <0x08, S_BREV_B32>; | 
|  | 1290 | def S_BREV_B64_vi          : SOP1_Real_vi <0x09, S_BREV_B64>; | 
|  | 1291 | def S_BCNT0_I32_B32_vi     : SOP1_Real_vi <0x0a, S_BCNT0_I32_B32>; | 
|  | 1292 | def S_BCNT0_I32_B64_vi     : SOP1_Real_vi <0x0b, S_BCNT0_I32_B64>; | 
|  | 1293 | def S_BCNT1_I32_B32_vi     : SOP1_Real_vi <0x0c, S_BCNT1_I32_B32>; | 
|  | 1294 | def S_BCNT1_I32_B64_vi     : SOP1_Real_vi <0x0d, S_BCNT1_I32_B64>; | 
|  | 1295 | def S_FF0_I32_B32_vi       : SOP1_Real_vi <0x0e, S_FF0_I32_B32>; | 
|  | 1296 | def S_FF0_I32_B64_vi       : SOP1_Real_vi <0x0f, S_FF0_I32_B64>; | 
|  | 1297 | def S_FF1_I32_B32_vi       : SOP1_Real_vi <0x10, S_FF1_I32_B32>; | 
|  | 1298 | def S_FF1_I32_B64_vi       : SOP1_Real_vi <0x11, S_FF1_I32_B64>; | 
|  | 1299 | def S_FLBIT_I32_B32_vi     : SOP1_Real_vi <0x12, S_FLBIT_I32_B32>; | 
|  | 1300 | def S_FLBIT_I32_B64_vi     : SOP1_Real_vi <0x13, S_FLBIT_I32_B64>; | 
|  | 1301 | def S_FLBIT_I32_vi         : SOP1_Real_vi <0x14, S_FLBIT_I32>; | 
|  | 1302 | def S_FLBIT_I32_I64_vi     : SOP1_Real_vi <0x15, S_FLBIT_I32_I64>; | 
|  | 1303 | def S_SEXT_I32_I8_vi       : SOP1_Real_vi <0x16, S_SEXT_I32_I8>; | 
|  | 1304 | def S_SEXT_I32_I16_vi      : SOP1_Real_vi <0x17, S_SEXT_I32_I16>; | 
|  | 1305 | def S_BITSET0_B32_vi       : SOP1_Real_vi <0x18, S_BITSET0_B32>; | 
|  | 1306 | def S_BITSET0_B64_vi       : SOP1_Real_vi <0x19, S_BITSET0_B64>; | 
|  | 1307 | def S_BITSET1_B32_vi       : SOP1_Real_vi <0x1a, S_BITSET1_B32>; | 
|  | 1308 | def S_BITSET1_B64_vi       : SOP1_Real_vi <0x1b, S_BITSET1_B64>; | 
|  | 1309 | def S_GETPC_B64_vi         : SOP1_Real_vi <0x1c, S_GETPC_B64>; | 
|  | 1310 | def S_SETPC_B64_vi         : SOP1_Real_vi <0x1d, S_SETPC_B64>; | 
|  | 1311 | def S_SWAPPC_B64_vi        : SOP1_Real_vi <0x1e, S_SWAPPC_B64>; | 
|  | 1312 | def S_RFE_B64_vi           : SOP1_Real_vi <0x1f, S_RFE_B64>; | 
|  | 1313 | def S_AND_SAVEEXEC_B64_vi  : SOP1_Real_vi <0x20, S_AND_SAVEEXEC_B64>; | 
|  | 1314 | def S_OR_SAVEEXEC_B64_vi   : SOP1_Real_vi <0x21, S_OR_SAVEEXEC_B64>; | 
|  | 1315 | def S_XOR_SAVEEXEC_B64_vi  : SOP1_Real_vi <0x22, S_XOR_SAVEEXEC_B64>; | 
|  | 1316 | def S_ANDN2_SAVEEXEC_B64_vi: SOP1_Real_vi <0x23, S_ANDN2_SAVEEXEC_B64>; | 
|  | 1317 | def S_ORN2_SAVEEXEC_B64_vi : SOP1_Real_vi <0x24, S_ORN2_SAVEEXEC_B64>; | 
|  | 1318 | def S_NAND_SAVEEXEC_B64_vi : SOP1_Real_vi <0x25, S_NAND_SAVEEXEC_B64>; | 
|  | 1319 | def S_NOR_SAVEEXEC_B64_vi  : SOP1_Real_vi <0x26, S_NOR_SAVEEXEC_B64>; | 
|  | 1320 | def S_XNOR_SAVEEXEC_B64_vi : SOP1_Real_vi <0x27, S_XNOR_SAVEEXEC_B64>; | 
|  | 1321 | def S_QUADMASK_B32_vi      : SOP1_Real_vi <0x28, S_QUADMASK_B32>; | 
|  | 1322 | def S_QUADMASK_B64_vi      : SOP1_Real_vi <0x29, S_QUADMASK_B64>; | 
|  | 1323 | def S_MOVRELS_B32_vi       : SOP1_Real_vi <0x2a, S_MOVRELS_B32>; | 
|  | 1324 | def S_MOVRELS_B64_vi       : SOP1_Real_vi <0x2b, S_MOVRELS_B64>; | 
|  | 1325 | def S_MOVRELD_B32_vi       : SOP1_Real_vi <0x2c, S_MOVRELD_B32>; | 
|  | 1326 | def S_MOVRELD_B64_vi       : SOP1_Real_vi <0x2d, S_MOVRELD_B64>; | 
|  | 1327 | def S_CBRANCH_JOIN_vi      : SOP1_Real_vi <0x2e, S_CBRANCH_JOIN>; | 
|  | 1328 | def S_MOV_REGRD_B32_vi     : SOP1_Real_vi <0x2f, S_MOV_REGRD_B32>; | 
|  | 1329 | def S_ABS_I32_vi           : SOP1_Real_vi <0x30, S_ABS_I32>; | 
|  | 1330 | def S_MOV_FED_B32_vi       : SOP1_Real_vi <0x31, S_MOV_FED_B32>; | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 1331 | def S_SET_GPR_IDX_IDX_vi   : SOP1_Real_vi <0x32, S_SET_GPR_IDX_IDX>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1332 |  | 
|  | 1333 | def S_ADD_U32_vi           : SOP2_Real_vi <0x00, S_ADD_U32>; | 
|  | 1334 | def S_ADD_I32_vi           : SOP2_Real_vi <0x02, S_ADD_I32>; | 
|  | 1335 | def S_SUB_U32_vi           : SOP2_Real_vi <0x01, S_SUB_U32>; | 
|  | 1336 | def S_SUB_I32_vi           : SOP2_Real_vi <0x03, S_SUB_I32>; | 
|  | 1337 | def S_ADDC_U32_vi          : SOP2_Real_vi <0x04, S_ADDC_U32>; | 
|  | 1338 | def S_SUBB_U32_vi          : SOP2_Real_vi <0x05, S_SUBB_U32>; | 
|  | 1339 | def S_MIN_I32_vi           : SOP2_Real_vi <0x06, S_MIN_I32>; | 
|  | 1340 | def S_MIN_U32_vi           : SOP2_Real_vi <0x07, S_MIN_U32>; | 
|  | 1341 | def S_MAX_I32_vi           : SOP2_Real_vi <0x08, S_MAX_I32>; | 
|  | 1342 | def S_MAX_U32_vi           : SOP2_Real_vi <0x09, S_MAX_U32>; | 
|  | 1343 | def S_CSELECT_B32_vi       : SOP2_Real_vi <0x0a, S_CSELECT_B32>; | 
|  | 1344 | def S_CSELECT_B64_vi       : SOP2_Real_vi <0x0b, S_CSELECT_B64>; | 
|  | 1345 | def S_AND_B32_vi           : SOP2_Real_vi <0x0c, S_AND_B32>; | 
|  | 1346 | def S_AND_B64_vi           : SOP2_Real_vi <0x0d, S_AND_B64>; | 
|  | 1347 | def S_OR_B32_vi            : SOP2_Real_vi <0x0e, S_OR_B32>; | 
|  | 1348 | def S_OR_B64_vi            : SOP2_Real_vi <0x0f, S_OR_B64>; | 
|  | 1349 | def S_XOR_B32_vi           : SOP2_Real_vi <0x10, S_XOR_B32>; | 
|  | 1350 | def S_XOR_B64_vi           : SOP2_Real_vi <0x11, S_XOR_B64>; | 
|  | 1351 | def S_ANDN2_B32_vi         : SOP2_Real_vi <0x12, S_ANDN2_B32>; | 
|  | 1352 | def S_ANDN2_B64_vi         : SOP2_Real_vi <0x13, S_ANDN2_B64>; | 
|  | 1353 | def S_ORN2_B32_vi          : SOP2_Real_vi <0x14, S_ORN2_B32>; | 
|  | 1354 | def S_ORN2_B64_vi          : SOP2_Real_vi <0x15, S_ORN2_B64>; | 
|  | 1355 | def S_NAND_B32_vi          : SOP2_Real_vi <0x16, S_NAND_B32>; | 
|  | 1356 | def S_NAND_B64_vi          : SOP2_Real_vi <0x17, S_NAND_B64>; | 
|  | 1357 | def S_NOR_B32_vi           : SOP2_Real_vi <0x18, S_NOR_B32>; | 
|  | 1358 | def S_NOR_B64_vi           : SOP2_Real_vi <0x19, S_NOR_B64>; | 
|  | 1359 | def S_XNOR_B32_vi          : SOP2_Real_vi <0x1a, S_XNOR_B32>; | 
|  | 1360 | def S_XNOR_B64_vi          : SOP2_Real_vi <0x1b, S_XNOR_B64>; | 
|  | 1361 | def S_LSHL_B32_vi          : SOP2_Real_vi <0x1c, S_LSHL_B32>; | 
|  | 1362 | def S_LSHL_B64_vi          : SOP2_Real_vi <0x1d, S_LSHL_B64>; | 
|  | 1363 | def S_LSHR_B32_vi          : SOP2_Real_vi <0x1e, S_LSHR_B32>; | 
|  | 1364 | def S_LSHR_B64_vi          : SOP2_Real_vi <0x1f, S_LSHR_B64>; | 
|  | 1365 | def S_ASHR_I32_vi          : SOP2_Real_vi <0x20, S_ASHR_I32>; | 
|  | 1366 | def S_ASHR_I64_vi          : SOP2_Real_vi <0x21, S_ASHR_I64>; | 
|  | 1367 | def S_BFM_B32_vi           : SOP2_Real_vi <0x22, S_BFM_B32>; | 
|  | 1368 | def S_BFM_B64_vi           : SOP2_Real_vi <0x23, S_BFM_B64>; | 
|  | 1369 | def S_MUL_I32_vi           : SOP2_Real_vi <0x24, S_MUL_I32>; | 
|  | 1370 | def S_BFE_U32_vi           : SOP2_Real_vi <0x25, S_BFE_U32>; | 
|  | 1371 | def S_BFE_I32_vi           : SOP2_Real_vi <0x26, S_BFE_I32>; | 
|  | 1372 | def S_BFE_U64_vi           : SOP2_Real_vi <0x27, S_BFE_U64>; | 
|  | 1373 | def S_BFE_I64_vi           : SOP2_Real_vi <0x28, S_BFE_I64>; | 
|  | 1374 | def S_CBRANCH_G_FORK_vi    : SOP2_Real_vi <0x29, S_CBRANCH_G_FORK>; | 
|  | 1375 | def S_ABSDIFF_I32_vi       : SOP2_Real_vi <0x2a, S_ABSDIFF_I32>; | 
| Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 1376 | def S_PACK_LL_B32_B16_vi   : SOP2_Real_vi <0x32, S_PACK_LL_B32_B16>; | 
|  | 1377 | def S_PACK_LH_B32_B16_vi   : SOP2_Real_vi <0x33, S_PACK_LH_B32_B16>; | 
|  | 1378 | def S_PACK_HH_B32_B16_vi   : SOP2_Real_vi <0x34, S_PACK_HH_B32_B16>; | 
| Dmitry Preobrazhensky | 14104e0 | 2017-04-12 17:10:07 +0000 | [diff] [blame] | 1379 | def S_RFE_RESTORE_B64_vi   : SOP2_Real_vi <0x2b, S_RFE_RESTORE_B64>; | 
| Valery Pykhtin | a34fb49 | 2016-08-30 15:20:31 +0000 | [diff] [blame] | 1380 |  | 
|  | 1381 | def S_MOVK_I32_vi          : SOPK_Real_vi <0x00, S_MOVK_I32>; | 
|  | 1382 | def S_CMOVK_I32_vi         : SOPK_Real_vi <0x01, S_CMOVK_I32>; | 
|  | 1383 | def S_CMPK_EQ_I32_vi       : SOPK_Real_vi <0x02, S_CMPK_EQ_I32>; | 
|  | 1384 | def S_CMPK_LG_I32_vi       : SOPK_Real_vi <0x03, S_CMPK_LG_I32>; | 
|  | 1385 | def S_CMPK_GT_I32_vi       : SOPK_Real_vi <0x04, S_CMPK_GT_I32>; | 
|  | 1386 | def S_CMPK_GE_I32_vi       : SOPK_Real_vi <0x05, S_CMPK_GE_I32>; | 
|  | 1387 | def S_CMPK_LT_I32_vi       : SOPK_Real_vi <0x06, S_CMPK_LT_I32>; | 
|  | 1388 | def S_CMPK_LE_I32_vi       : SOPK_Real_vi <0x07, S_CMPK_LE_I32>; | 
|  | 1389 | def S_CMPK_EQ_U32_vi       : SOPK_Real_vi <0x08, S_CMPK_EQ_U32>; | 
|  | 1390 | def S_CMPK_LG_U32_vi       : SOPK_Real_vi <0x09, S_CMPK_LG_U32>; | 
|  | 1391 | def S_CMPK_GT_U32_vi       : SOPK_Real_vi <0x0A, S_CMPK_GT_U32>; | 
|  | 1392 | def S_CMPK_GE_U32_vi       : SOPK_Real_vi <0x0B, S_CMPK_GE_U32>; | 
|  | 1393 | def S_CMPK_LT_U32_vi       : SOPK_Real_vi <0x0C, S_CMPK_LT_U32>; | 
|  | 1394 | def S_CMPK_LE_U32_vi       : SOPK_Real_vi <0x0D, S_CMPK_LE_U32>; | 
|  | 1395 | def S_ADDK_I32_vi          : SOPK_Real_vi <0x0E, S_ADDK_I32>; | 
|  | 1396 | def S_MULK_I32_vi          : SOPK_Real_vi <0x0F, S_MULK_I32>; | 
|  | 1397 | def S_CBRANCH_I_FORK_vi    : SOPK_Real_vi <0x10, S_CBRANCH_I_FORK>; | 
|  | 1398 | def S_GETREG_B32_vi        : SOPK_Real_vi <0x11, S_GETREG_B32>; | 
|  | 1399 | def S_SETREG_B32_vi        : SOPK_Real_vi <0x12, S_SETREG_B32>; | 
|  | 1400 | //def S_GETREG_REGRD_B32_vi  : SOPK_Real_vi <0x13, S_GETREG_REGRD_B32>; // see pseudo for comments | 
|  | 1401 | def S_SETREG_IMM32_B32_vi  : SOPK_Real64<0x14, S_SETREG_IMM32_B32>, | 
| Tom Stellard | 2add8a1 | 2016-09-06 20:00:26 +0000 | [diff] [blame] | 1402 | Select_vi<S_SETREG_IMM32_B32.Mnemonic>; | 
| Dmitry Preobrazhensky | f20aff5 | 2018-04-06 16:35:11 +0000 | [diff] [blame] | 1403 |  | 
| Dmitry Preobrazhensky | ae31223 | 2018-04-06 18:24:49 +0000 | [diff] [blame] | 1404 | def S_CALL_B64_vi          : SOPK_Real_vi <0x15, S_CALL_B64>; | 
|  | 1405 |  | 
| Dmitry Preobrazhensky | f20aff5 | 2018-04-06 16:35:11 +0000 | [diff] [blame] | 1406 | //===----------------------------------------------------------------------===// | 
|  | 1407 | // SOP1 - GFX9. | 
|  | 1408 | //===----------------------------------------------------------------------===// | 
|  | 1409 |  | 
|  | 1410 | def S_ANDN1_SAVEEXEC_B64_vi   : SOP1_Real_vi<0x33, S_ANDN1_SAVEEXEC_B64>; | 
|  | 1411 | def S_ORN1_SAVEEXEC_B64_vi    : SOP1_Real_vi<0x34, S_ORN1_SAVEEXEC_B64>; | 
|  | 1412 | def S_ANDN1_WREXEC_B64_vi     : SOP1_Real_vi<0x35, S_ANDN1_WREXEC_B64>; | 
|  | 1413 | def S_ANDN2_WREXEC_B64_vi     : SOP1_Real_vi<0x36, S_ANDN2_WREXEC_B64>; | 
|  | 1414 | def S_BITREPLICATE_B64_B32_vi : SOP1_Real_vi<0x37, S_BITREPLICATE_B64_B32>; | 
| Dmitry Preobrazhensky | 2f8e146 | 2018-04-09 13:10:33 +0000 | [diff] [blame] | 1415 |  | 
|  | 1416 | //===----------------------------------------------------------------------===// | 
|  | 1417 | // SOP2 - GFX9. | 
|  | 1418 | //===----------------------------------------------------------------------===// | 
|  | 1419 |  | 
|  | 1420 | def S_LSHL1_ADD_U32_vi   : SOP2_Real_vi<0x2e, S_LSHL1_ADD_U32>; | 
|  | 1421 | def S_LSHL2_ADD_U32_vi   : SOP2_Real_vi<0x2f, S_LSHL2_ADD_U32>; | 
|  | 1422 | def S_LSHL3_ADD_U32_vi   : SOP2_Real_vi<0x30, S_LSHL3_ADD_U32>; | 
|  | 1423 | def S_LSHL4_ADD_U32_vi   : SOP2_Real_vi<0x31, S_LSHL4_ADD_U32>; | 
|  | 1424 | def S_MUL_HI_U32_vi      : SOP2_Real_vi<0x2c, S_MUL_HI_U32>; | 
|  | 1425 | def S_MUL_HI_I32_vi      : SOP2_Real_vi<0x2d, S_MUL_HI_I32>; |