Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 1 | //===- AMDGPUDisassembler.cpp - Disassembler for AMDGPU ISA ---------------===// |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | //===----------------------------------------------------------------------===// |
| 11 | // |
| 12 | /// \file |
| 13 | /// |
| 14 | /// This file contains definition for AMDGPU ISA disassembler |
| 15 | // |
| 16 | //===----------------------------------------------------------------------===// |
| 17 | |
| 18 | // ToDo: What to do with instruction suffixes (v_mov_b32 vs v_mov_b32_e32)? |
| 19 | |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 20 | #include "Disassembler/AMDGPUDisassembler.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 21 | #include "AMDGPU.h" |
| 22 | #include "AMDGPURegisterInfo.h" |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 23 | #include "SIDefines.h" |
Tom Stellard | 44b30b4 | 2018-05-22 02:03:23 +0000 | [diff] [blame] | 24 | #include "MCTargetDesc/AMDGPUMCTargetDesc.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 25 | #include "Utils/AMDGPUBaseInfo.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 26 | #include "llvm-c/Disassembler.h" |
| 27 | #include "llvm/ADT/APInt.h" |
| 28 | #include "llvm/ADT/ArrayRef.h" |
| 29 | #include "llvm/ADT/Twine.h" |
Zachary Turner | 264b5d9 | 2017-06-07 03:48:56 +0000 | [diff] [blame] | 30 | #include "llvm/BinaryFormat/ELF.h" |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 31 | #include "llvm/MC/MCContext.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 32 | #include "llvm/MC/MCDisassembler/MCDisassembler.h" |
| 33 | #include "llvm/MC/MCExpr.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 34 | #include "llvm/MC/MCFixedLenDisassembler.h" |
| 35 | #include "llvm/MC/MCInst.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 36 | #include "llvm/MC/MCSubtargetInfo.h" |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 37 | #include "llvm/Support/Endian.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 38 | #include "llvm/Support/ErrorHandling.h" |
| 39 | #include "llvm/Support/MathExtras.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 40 | #include "llvm/Support/TargetRegistry.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 41 | #include "llvm/Support/raw_ostream.h" |
| 42 | #include <algorithm> |
| 43 | #include <cassert> |
| 44 | #include <cstddef> |
| 45 | #include <cstdint> |
| 46 | #include <iterator> |
| 47 | #include <tuple> |
| 48 | #include <vector> |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 49 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 50 | using namespace llvm; |
| 51 | |
| 52 | #define DEBUG_TYPE "amdgpu-disassembler" |
| 53 | |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 54 | using DecodeStatus = llvm::MCDisassembler::DecodeStatus; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 55 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 56 | inline static MCDisassembler::DecodeStatus |
| 57 | addOperand(MCInst &Inst, const MCOperand& Opnd) { |
| 58 | Inst.addOperand(Opnd); |
| 59 | return Opnd.isValid() ? |
| 60 | MCDisassembler::Success : |
| 61 | MCDisassembler::SoftFail; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 62 | } |
| 63 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 64 | static int insertNamedMCOperand(MCInst &MI, const MCOperand &Op, |
| 65 | uint16_t NameIdx) { |
| 66 | int OpIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), NameIdx); |
| 67 | if (OpIdx != -1) { |
| 68 | auto I = MI.begin(); |
| 69 | std::advance(I, OpIdx); |
| 70 | MI.insert(I, Op); |
| 71 | } |
| 72 | return OpIdx; |
| 73 | } |
| 74 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 75 | static DecodeStatus decodeSoppBrTarget(MCInst &Inst, unsigned Imm, |
| 76 | uint64_t Addr, const void *Decoder) { |
| 77 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 78 | |
| 79 | APInt SignedOffset(18, Imm * 4, true); |
| 80 | int64_t Offset = (SignedOffset.sext(64) + 4 + Addr).getSExtValue(); |
| 81 | |
| 82 | if (DAsm->tryAddingSymbolicOperand(Inst, Offset, Addr, true, 2, 2)) |
| 83 | return MCDisassembler::Success; |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 84 | return addOperand(Inst, MCOperand::createImm(Imm)); |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 85 | } |
| 86 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 87 | #define DECODE_OPERAND(StaticDecoderName, DecoderName) \ |
| 88 | static DecodeStatus StaticDecoderName(MCInst &Inst, \ |
| 89 | unsigned Imm, \ |
| 90 | uint64_t /*Addr*/, \ |
| 91 | const void *Decoder) { \ |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 92 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); \ |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 93 | return addOperand(Inst, DAsm->DecoderName(Imm)); \ |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 94 | } |
| 95 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 96 | #define DECODE_OPERAND_REG(RegClass) \ |
| 97 | DECODE_OPERAND(Decode##RegClass##RegisterClass, decodeOperand_##RegClass) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 98 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 99 | DECODE_OPERAND_REG(VGPR_32) |
| 100 | DECODE_OPERAND_REG(VS_32) |
| 101 | DECODE_OPERAND_REG(VS_64) |
Dmitry Preobrazhensky | 30fc523 | 2017-07-18 13:12:48 +0000 | [diff] [blame] | 102 | DECODE_OPERAND_REG(VS_128) |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 103 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 104 | DECODE_OPERAND_REG(VReg_64) |
| 105 | DECODE_OPERAND_REG(VReg_96) |
| 106 | DECODE_OPERAND_REG(VReg_128) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 107 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 108 | DECODE_OPERAND_REG(SReg_32) |
| 109 | DECODE_OPERAND_REG(SReg_32_XM0_XEXEC) |
Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 110 | DECODE_OPERAND_REG(SReg_32_XEXEC_HI) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 111 | DECODE_OPERAND_REG(SReg_64) |
| 112 | DECODE_OPERAND_REG(SReg_64_XEXEC) |
| 113 | DECODE_OPERAND_REG(SReg_128) |
| 114 | DECODE_OPERAND_REG(SReg_256) |
| 115 | DECODE_OPERAND_REG(SReg_512) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 116 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 117 | static DecodeStatus decodeOperand_VSrc16(MCInst &Inst, |
| 118 | unsigned Imm, |
| 119 | uint64_t Addr, |
| 120 | const void *Decoder) { |
| 121 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 122 | return addOperand(Inst, DAsm->decodeOperand_VSrc16(Imm)); |
| 123 | } |
| 124 | |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 125 | static DecodeStatus decodeOperand_VSrcV216(MCInst &Inst, |
| 126 | unsigned Imm, |
| 127 | uint64_t Addr, |
| 128 | const void *Decoder) { |
| 129 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 130 | return addOperand(Inst, DAsm->decodeOperand_VSrcV216(Imm)); |
| 131 | } |
| 132 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 133 | #define DECODE_SDWA(DecName) \ |
| 134 | DECODE_OPERAND(decodeSDWA##DecName, decodeSDWA##DecName) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 135 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 136 | DECODE_SDWA(Src32) |
| 137 | DECODE_SDWA(Src16) |
| 138 | DECODE_SDWA(VopcDst) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 139 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 140 | #include "AMDGPUGenDisassemblerTables.inc" |
| 141 | |
| 142 | //===----------------------------------------------------------------------===// |
| 143 | // |
| 144 | //===----------------------------------------------------------------------===// |
| 145 | |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 146 | template <typename T> static inline T eatBytes(ArrayRef<uint8_t>& Bytes) { |
| 147 | assert(Bytes.size() >= sizeof(T)); |
| 148 | const auto Res = support::endian::read<T, support::endianness::little>(Bytes.data()); |
| 149 | Bytes = Bytes.slice(sizeof(T)); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 150 | return Res; |
| 151 | } |
| 152 | |
| 153 | DecodeStatus AMDGPUDisassembler::tryDecodeInst(const uint8_t* Table, |
| 154 | MCInst &MI, |
| 155 | uint64_t Inst, |
| 156 | uint64_t Address) const { |
| 157 | assert(MI.getOpcode() == 0); |
| 158 | assert(MI.getNumOperands() == 0); |
| 159 | MCInst TmpInst; |
Dmitry Preobrazhensky | ce941c9 | 2017-05-19 14:27:52 +0000 | [diff] [blame] | 160 | HasLiteral = false; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 161 | const auto SavedBytes = Bytes; |
| 162 | if (decodeInstruction(Table, TmpInst, Inst, Address, this, STI)) { |
| 163 | MI = TmpInst; |
| 164 | return MCDisassembler::Success; |
| 165 | } |
| 166 | Bytes = SavedBytes; |
| 167 | return MCDisassembler::Fail; |
| 168 | } |
| 169 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 170 | DecodeStatus AMDGPUDisassembler::getInstruction(MCInst &MI, uint64_t &Size, |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 171 | ArrayRef<uint8_t> Bytes_, |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 172 | uint64_t Address, |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 173 | raw_ostream &WS, |
| 174 | raw_ostream &CS) const { |
| 175 | CommentStream = &CS; |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 176 | bool IsSDWA = false; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 177 | |
| 178 | // ToDo: AMDGPUDisassembler supports only VI ISA. |
Matt Arsenault | d122abe | 2017-02-15 21:50:34 +0000 | [diff] [blame] | 179 | if (!STI.getFeatureBits()[AMDGPU::FeatureGCN3Encoding]) |
| 180 | report_fatal_error("Disassembly not yet supported for subtarget"); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 181 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 182 | const unsigned MaxInstBytesNum = (std::min)((size_t)8, Bytes_.size()); |
| 183 | Bytes = Bytes_.slice(0, MaxInstBytesNum); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 184 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 185 | DecodeStatus Res = MCDisassembler::Fail; |
| 186 | do { |
Valery Pykhtin | 824e804 | 2016-03-04 10:59:50 +0000 | [diff] [blame] | 187 | // ToDo: better to switch encoding length using some bit predicate |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 188 | // but it is unknown yet, so try all we can |
Matt Arsenault | 37fefd6 | 2016-06-10 02:18:02 +0000 | [diff] [blame] | 189 | |
Sam Kolton | c9bdcb7 | 2016-06-09 11:04:45 +0000 | [diff] [blame] | 190 | // Try to decode DPP and SDWA first to solve conflict with VOP1 and VOP2 |
| 191 | // encodings |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 192 | if (Bytes.size() >= 8) { |
| 193 | const uint64_t QW = eatBytes<uint64_t>(Bytes); |
| 194 | Res = tryDecodeInst(DecoderTableDPP64, MI, QW, Address); |
| 195 | if (Res) break; |
Sam Kolton | c9bdcb7 | 2016-06-09 11:04:45 +0000 | [diff] [blame] | 196 | |
| 197 | Res = tryDecodeInst(DecoderTableSDWA64, MI, QW, Address); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 198 | if (Res) { IsSDWA = true; break; } |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 199 | |
| 200 | Res = tryDecodeInst(DecoderTableSDWA964, MI, QW, Address); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 201 | if (Res) { IsSDWA = true; break; } |
Changpeng Fang | 0905870 | 2018-01-30 16:42:40 +0000 | [diff] [blame] | 202 | |
| 203 | if (STI.getFeatureBits()[AMDGPU::FeatureUnpackedD16VMem]) { |
| 204 | Res = tryDecodeInst(DecoderTableGFX80_UNPACKED64, MI, QW, Address); |
Matt Arsenault | 0084adc | 2018-04-30 19:08:16 +0000 | [diff] [blame] | 205 | if (Res) |
| 206 | break; |
| 207 | } |
| 208 | |
| 209 | // Some GFX9 subtargets repurposed the v_mad_mix_f32, v_mad_mixlo_f16 and |
| 210 | // v_mad_mixhi_f16 for FMA variants. Try to decode using this special |
| 211 | // table first so we print the correct name. |
| 212 | if (STI.getFeatureBits()[AMDGPU::FeatureFmaMixInsts]) { |
| 213 | Res = tryDecodeInst(DecoderTableGFX9_DL64, MI, QW, Address); |
| 214 | if (Res) |
| 215 | break; |
Changpeng Fang | 0905870 | 2018-01-30 16:42:40 +0000 | [diff] [blame] | 216 | } |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 217 | } |
| 218 | |
| 219 | // Reinitialize Bytes as DPP64 could have eaten too much |
| 220 | Bytes = Bytes_.slice(0, MaxInstBytesNum); |
| 221 | |
| 222 | // Try decode 32-bit instruction |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 223 | if (Bytes.size() < 4) break; |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 224 | const uint32_t DW = eatBytes<uint32_t>(Bytes); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 225 | Res = tryDecodeInst(DecoderTableVI32, MI, DW, Address); |
| 226 | if (Res) break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 227 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 228 | Res = tryDecodeInst(DecoderTableAMDGPU32, MI, DW, Address); |
| 229 | if (Res) break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 230 | |
Dmitry Preobrazhensky | a0342dc | 2017-11-20 18:24:21 +0000 | [diff] [blame] | 231 | Res = tryDecodeInst(DecoderTableGFX932, MI, DW, Address); |
| 232 | if (Res) break; |
| 233 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 234 | if (Bytes.size() < 4) break; |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 235 | const uint64_t QW = ((uint64_t)eatBytes<uint32_t>(Bytes) << 32) | DW; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 236 | Res = tryDecodeInst(DecoderTableVI64, MI, QW, Address); |
| 237 | if (Res) break; |
| 238 | |
| 239 | Res = tryDecodeInst(DecoderTableAMDGPU64, MI, QW, Address); |
Dmitry Preobrazhensky | 1e32550 | 2017-08-09 17:10:47 +0000 | [diff] [blame] | 240 | if (Res) break; |
| 241 | |
| 242 | Res = tryDecodeInst(DecoderTableGFX964, MI, QW, Address); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 243 | } while (false); |
| 244 | |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 245 | if (Res && (MI.getOpcode() == AMDGPU::V_MAC_F32_e64_vi || |
| 246 | MI.getOpcode() == AMDGPU::V_MAC_F32_e64_si || |
Konstantin Zhuravlyov | 603a43f | 2018-05-15 17:39:13 +0000 | [diff] [blame] | 247 | MI.getOpcode() == AMDGPU::V_MAC_F16_e64_vi || |
| 248 | MI.getOpcode() == AMDGPU::V_FMAC_F32_e64_vi)) { |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 249 | // Insert dummy unused src2_modifiers. |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 250 | insertNamedMCOperand(MI, MCOperand::createImm(0), |
| 251 | AMDGPU::OpName::src2_modifiers); |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 252 | } |
| 253 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 254 | if (Res && (MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::MIMG)) { |
| 255 | Res = convertMIMGInst(MI); |
| 256 | } |
| 257 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 258 | if (Res && IsSDWA) |
| 259 | Res = convertSDWAInst(MI); |
| 260 | |
Tim Corringham | 7116e89 | 2018-03-26 17:06:33 +0000 | [diff] [blame] | 261 | // if the opcode was not recognized we'll assume a Size of 4 bytes |
| 262 | // (unless there are fewer bytes left) |
| 263 | Size = Res ? (MaxInstBytesNum - Bytes.size()) |
| 264 | : std::min((size_t)4, Bytes_.size()); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 265 | return Res; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 266 | } |
| 267 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 268 | DecodeStatus AMDGPUDisassembler::convertSDWAInst(MCInst &MI) const { |
| 269 | if (STI.getFeatureBits()[AMDGPU::FeatureGFX9]) { |
| 270 | if (AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::sdst) != -1) |
| 271 | // VOPC - insert clamp |
| 272 | insertNamedMCOperand(MI, MCOperand::createImm(0), AMDGPU::OpName::clamp); |
| 273 | } else if (STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]) { |
| 274 | int SDst = AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::sdst); |
| 275 | if (SDst != -1) { |
| 276 | // VOPC - insert VCC register as sdst |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 277 | insertNamedMCOperand(MI, createRegOperand(AMDGPU::VCC), |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 278 | AMDGPU::OpName::sdst); |
| 279 | } else { |
| 280 | // VOP1/2 - insert omod if present in instruction |
| 281 | insertNamedMCOperand(MI, MCOperand::createImm(0), AMDGPU::OpName::omod); |
| 282 | } |
| 283 | } |
| 284 | return MCDisassembler::Success; |
| 285 | } |
| 286 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 287 | // Note that MIMG format provides no information about VADDR size. |
| 288 | // Consequently, decoded instructions always show address |
| 289 | // as if it has 1 dword, which could be not really so. |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 290 | DecodeStatus AMDGPUDisassembler::convertMIMGInst(MCInst &MI) const { |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 291 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 292 | int VDstIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 293 | AMDGPU::OpName::vdst); |
| 294 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 295 | int VDataIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 296 | AMDGPU::OpName::vdata); |
| 297 | |
| 298 | int DMaskIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 299 | AMDGPU::OpName::dmask); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 300 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 301 | int TFEIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 302 | AMDGPU::OpName::tfe); |
Nicolai Haehnle | f267431 | 2018-06-21 13:36:01 +0000 | [diff] [blame^] | 303 | int D16Idx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 304 | AMDGPU::OpName::d16); |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 305 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 306 | assert(VDataIdx != -1); |
| 307 | assert(DMaskIdx != -1); |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 308 | assert(TFEIdx != -1); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 309 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 310 | bool IsAtomic = (VDstIdx != -1); |
Nicolai Haehnle | f267431 | 2018-06-21 13:36:01 +0000 | [diff] [blame^] | 311 | bool IsGather4 = MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::Gather4; |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 312 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 313 | unsigned DMask = MI.getOperand(DMaskIdx).getImm() & 0xf; |
| 314 | if (DMask == 0) |
| 315 | return MCDisassembler::Success; |
| 316 | |
Nicolai Haehnle | f267431 | 2018-06-21 13:36:01 +0000 | [diff] [blame^] | 317 | unsigned DstSize = IsGather4 ? 4 : countPopulation(DMask); |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 318 | if (DstSize == 1) |
| 319 | return MCDisassembler::Success; |
| 320 | |
Nicolai Haehnle | f267431 | 2018-06-21 13:36:01 +0000 | [diff] [blame^] | 321 | bool D16 = D16Idx >= 0 && MI.getOperand(D16Idx).getImm(); |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 322 | if (D16 && AMDGPU::hasPackedD16(STI)) { |
| 323 | DstSize = (DstSize + 1) / 2; |
| 324 | } |
| 325 | |
| 326 | // FIXME: Add tfe support |
| 327 | if (MI.getOperand(TFEIdx).getImm()) |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 328 | return MCDisassembler::Success; |
| 329 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 330 | int NewOpcode = -1; |
| 331 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 332 | if (IsAtomic) { |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 333 | if (DMask == 0x1 || DMask == 0x3 || DMask == 0xF) { |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 334 | NewOpcode = AMDGPU::getMaskedMIMGAtomicOp(*MCII, MI.getOpcode(), DstSize); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 335 | } |
| 336 | if (NewOpcode == -1) return MCDisassembler::Success; |
Nicolai Haehnle | f267431 | 2018-06-21 13:36:01 +0000 | [diff] [blame^] | 337 | } else if (IsGather4) { |
| 338 | if (D16 && AMDGPU::hasPackedD16(STI)) |
| 339 | NewOpcode = AMDGPU::getMIMGGatherOpPackedD16(MI.getOpcode()); |
| 340 | else |
| 341 | return MCDisassembler::Success; |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 342 | } else { |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 343 | NewOpcode = AMDGPU::getMaskedMIMGOp(*MCII, MI.getOpcode(), DstSize); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 344 | assert(NewOpcode != -1 && "could not find matching mimg channel instruction"); |
| 345 | } |
| 346 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 347 | auto RCID = MCII->get(NewOpcode).OpInfo[VDataIdx].RegClass; |
| 348 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 349 | // Get first subregister of VData |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 350 | unsigned Vdata0 = MI.getOperand(VDataIdx).getReg(); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 351 | unsigned VdataSub0 = MRI.getSubReg(Vdata0, AMDGPU::sub0); |
| 352 | Vdata0 = (VdataSub0 != 0)? VdataSub0 : Vdata0; |
| 353 | |
| 354 | // Widen the register to the correct number of enabled channels. |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 355 | auto NewVdata = MRI.getMatchingSuperReg(Vdata0, AMDGPU::sub0, |
| 356 | &MRI.getRegClass(RCID)); |
| 357 | if (NewVdata == AMDGPU::NoRegister) { |
| 358 | // It's possible to encode this such that the low register + enabled |
| 359 | // components exceeds the register count. |
| 360 | return MCDisassembler::Success; |
| 361 | } |
| 362 | |
| 363 | MI.setOpcode(NewOpcode); |
| 364 | // vaddr will be always appear as a single VGPR. This will look different than |
| 365 | // how it is usually emitted because the number of register components is not |
| 366 | // in the instruction encoding. |
| 367 | MI.getOperand(VDataIdx) = MCOperand::createReg(NewVdata); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 368 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 369 | if (IsAtomic) { |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 370 | // Atomic operations have an additional operand (a copy of data) |
| 371 | MI.getOperand(VDstIdx) = MCOperand::createReg(NewVdata); |
| 372 | } |
| 373 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 374 | return MCDisassembler::Success; |
| 375 | } |
| 376 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 377 | const char* AMDGPUDisassembler::getRegClassName(unsigned RegClassID) const { |
| 378 | return getContext().getRegisterInfo()-> |
| 379 | getRegClassName(&AMDGPUMCRegisterClasses[RegClassID]); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 380 | } |
| 381 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 382 | inline |
| 383 | MCOperand AMDGPUDisassembler::errOperand(unsigned V, |
| 384 | const Twine& ErrMsg) const { |
| 385 | *CommentStream << "Error: " + ErrMsg; |
| 386 | |
| 387 | // ToDo: add support for error operands to MCInst.h |
| 388 | // return MCOperand::createError(V); |
| 389 | return MCOperand(); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 390 | } |
| 391 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 392 | inline |
| 393 | MCOperand AMDGPUDisassembler::createRegOperand(unsigned int RegId) const { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 394 | return MCOperand::createReg(AMDGPU::getMCReg(RegId, STI)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 395 | } |
| 396 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 397 | inline |
| 398 | MCOperand AMDGPUDisassembler::createRegOperand(unsigned RegClassID, |
| 399 | unsigned Val) const { |
| 400 | const auto& RegCl = AMDGPUMCRegisterClasses[RegClassID]; |
| 401 | if (Val >= RegCl.getNumRegs()) |
| 402 | return errOperand(Val, Twine(getRegClassName(RegClassID)) + |
| 403 | ": unknown register " + Twine(Val)); |
| 404 | return createRegOperand(RegCl.getRegister(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 405 | } |
| 406 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 407 | inline |
| 408 | MCOperand AMDGPUDisassembler::createSRegOperand(unsigned SRegClassID, |
| 409 | unsigned Val) const { |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 410 | // ToDo: SI/CI have 104 SGPRs, VI - 102 |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 411 | // Valery: here we accepting as much as we can, let assembler sort it out |
| 412 | int shift = 0; |
| 413 | switch (SRegClassID) { |
| 414 | case AMDGPU::SGPR_32RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 415 | case AMDGPU::TTMP_32RegClassID: |
| 416 | break; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 417 | case AMDGPU::SGPR_64RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 418 | case AMDGPU::TTMP_64RegClassID: |
| 419 | shift = 1; |
| 420 | break; |
| 421 | case AMDGPU::SGPR_128RegClassID: |
| 422 | case AMDGPU::TTMP_128RegClassID: |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 423 | // ToDo: unclear if s[100:104] is available on VI. Can we use VCC as SGPR in |
| 424 | // this bundle? |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 425 | case AMDGPU::SGPR_256RegClassID: |
| 426 | case AMDGPU::TTMP_256RegClassID: |
| 427 | // ToDo: unclear if s[96:104] is available on VI. Can we use VCC as SGPR in |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 428 | // this bundle? |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 429 | case AMDGPU::SGPR_512RegClassID: |
| 430 | case AMDGPU::TTMP_512RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 431 | shift = 2; |
| 432 | break; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 433 | // ToDo: unclear if s[88:104] is available on VI. Can we use VCC as SGPR in |
| 434 | // this bundle? |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 435 | default: |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 436 | llvm_unreachable("unhandled register class"); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 437 | } |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 438 | |
| 439 | if (Val % (1 << shift)) { |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 440 | *CommentStream << "Warning: " << getRegClassName(SRegClassID) |
| 441 | << ": scalar reg isn't aligned " << Val; |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 442 | } |
| 443 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 444 | return createRegOperand(SRegClassID, Val >> shift); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 445 | } |
| 446 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 447 | MCOperand AMDGPUDisassembler::decodeOperand_VS_32(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 448 | return decodeSrcOp(OPW32, Val); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 449 | } |
| 450 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 451 | MCOperand AMDGPUDisassembler::decodeOperand_VS_64(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 452 | return decodeSrcOp(OPW64, Val); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 453 | } |
| 454 | |
Dmitry Preobrazhensky | 30fc523 | 2017-07-18 13:12:48 +0000 | [diff] [blame] | 455 | MCOperand AMDGPUDisassembler::decodeOperand_VS_128(unsigned Val) const { |
| 456 | return decodeSrcOp(OPW128, Val); |
| 457 | } |
| 458 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 459 | MCOperand AMDGPUDisassembler::decodeOperand_VSrc16(unsigned Val) const { |
| 460 | return decodeSrcOp(OPW16, Val); |
| 461 | } |
| 462 | |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 463 | MCOperand AMDGPUDisassembler::decodeOperand_VSrcV216(unsigned Val) const { |
| 464 | return decodeSrcOp(OPWV216, Val); |
| 465 | } |
| 466 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 467 | MCOperand AMDGPUDisassembler::decodeOperand_VGPR_32(unsigned Val) const { |
Matt Arsenault | cb540bc | 2016-07-19 00:35:03 +0000 | [diff] [blame] | 468 | // Some instructions have operand restrictions beyond what the encoding |
| 469 | // allows. Some ordinarily VSrc_32 operands are VGPR_32, so clear the extra |
| 470 | // high bit. |
| 471 | Val &= 255; |
| 472 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 473 | return createRegOperand(AMDGPU::VGPR_32RegClassID, Val); |
| 474 | } |
| 475 | |
| 476 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_64(unsigned Val) const { |
| 477 | return createRegOperand(AMDGPU::VReg_64RegClassID, Val); |
| 478 | } |
| 479 | |
| 480 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_96(unsigned Val) const { |
| 481 | return createRegOperand(AMDGPU::VReg_96RegClassID, Val); |
| 482 | } |
| 483 | |
| 484 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_128(unsigned Val) const { |
| 485 | return createRegOperand(AMDGPU::VReg_128RegClassID, Val); |
| 486 | } |
| 487 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 488 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32(unsigned Val) const { |
| 489 | // table-gen generated disassembler doesn't care about operand types |
| 490 | // leaving only registry class so SSrc_32 operand turns into SReg_32 |
| 491 | // and therefore we accept immediates and literals here as well |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 492 | return decodeSrcOp(OPW32, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 493 | } |
| 494 | |
Matt Arsenault | 640c44b | 2016-11-29 19:39:53 +0000 | [diff] [blame] | 495 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32_XM0_XEXEC( |
| 496 | unsigned Val) const { |
| 497 | // SReg_32_XM0 is SReg_32 without M0 or EXEC_LO/EXEC_HI |
Artem Tamazov | 38e496b | 2016-04-29 17:04:50 +0000 | [diff] [blame] | 498 | return decodeOperand_SReg_32(Val); |
| 499 | } |
| 500 | |
Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 501 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32_XEXEC_HI( |
| 502 | unsigned Val) const { |
| 503 | // SReg_32_XM0 is SReg_32 without EXEC_HI |
| 504 | return decodeOperand_SReg_32(Val); |
| 505 | } |
| 506 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 507 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_64(unsigned Val) const { |
Matt Arsenault | 640c44b | 2016-11-29 19:39:53 +0000 | [diff] [blame] | 508 | return decodeSrcOp(OPW64, Val); |
| 509 | } |
| 510 | |
| 511 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_64_XEXEC(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 512 | return decodeSrcOp(OPW64, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 513 | } |
| 514 | |
| 515 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_128(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 516 | return decodeSrcOp(OPW128, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 517 | } |
| 518 | |
| 519 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_256(unsigned Val) const { |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 520 | return decodeDstOp(OPW256, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 521 | } |
| 522 | |
| 523 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_512(unsigned Val) const { |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 524 | return decodeDstOp(OPW512, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 525 | } |
| 526 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 527 | MCOperand AMDGPUDisassembler::decodeLiteralConstant() const { |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 528 | // For now all literal constants are supposed to be unsigned integer |
| 529 | // ToDo: deal with signed/unsigned 64-bit integer constants |
| 530 | // ToDo: deal with float/double constants |
Dmitry Preobrazhensky | ce941c9 | 2017-05-19 14:27:52 +0000 | [diff] [blame] | 531 | if (!HasLiteral) { |
| 532 | if (Bytes.size() < 4) { |
| 533 | return errOperand(0, "cannot read literal, inst bytes left " + |
| 534 | Twine(Bytes.size())); |
| 535 | } |
| 536 | HasLiteral = true; |
| 537 | Literal = eatBytes<uint32_t>(Bytes); |
| 538 | } |
| 539 | return MCOperand::createImm(Literal); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 540 | } |
| 541 | |
| 542 | MCOperand AMDGPUDisassembler::decodeIntImmed(unsigned Imm) { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 543 | using namespace AMDGPU::EncValues; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 544 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 545 | assert(Imm >= INLINE_INTEGER_C_MIN && Imm <= INLINE_INTEGER_C_MAX); |
| 546 | return MCOperand::createImm((Imm <= INLINE_INTEGER_C_POSITIVE_MAX) ? |
| 547 | (static_cast<int64_t>(Imm) - INLINE_INTEGER_C_MIN) : |
| 548 | (INLINE_INTEGER_C_POSITIVE_MAX - static_cast<int64_t>(Imm))); |
| 549 | // Cast prevents negative overflow. |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 550 | } |
| 551 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 552 | static int64_t getInlineImmVal32(unsigned Imm) { |
| 553 | switch (Imm) { |
| 554 | case 240: |
| 555 | return FloatToBits(0.5f); |
| 556 | case 241: |
| 557 | return FloatToBits(-0.5f); |
| 558 | case 242: |
| 559 | return FloatToBits(1.0f); |
| 560 | case 243: |
| 561 | return FloatToBits(-1.0f); |
| 562 | case 244: |
| 563 | return FloatToBits(2.0f); |
| 564 | case 245: |
| 565 | return FloatToBits(-2.0f); |
| 566 | case 246: |
| 567 | return FloatToBits(4.0f); |
| 568 | case 247: |
| 569 | return FloatToBits(-4.0f); |
| 570 | case 248: // 1 / (2 * PI) |
| 571 | return 0x3e22f983; |
| 572 | default: |
| 573 | llvm_unreachable("invalid fp inline imm"); |
| 574 | } |
| 575 | } |
| 576 | |
| 577 | static int64_t getInlineImmVal64(unsigned Imm) { |
| 578 | switch (Imm) { |
| 579 | case 240: |
| 580 | return DoubleToBits(0.5); |
| 581 | case 241: |
| 582 | return DoubleToBits(-0.5); |
| 583 | case 242: |
| 584 | return DoubleToBits(1.0); |
| 585 | case 243: |
| 586 | return DoubleToBits(-1.0); |
| 587 | case 244: |
| 588 | return DoubleToBits(2.0); |
| 589 | case 245: |
| 590 | return DoubleToBits(-2.0); |
| 591 | case 246: |
| 592 | return DoubleToBits(4.0); |
| 593 | case 247: |
| 594 | return DoubleToBits(-4.0); |
| 595 | case 248: // 1 / (2 * PI) |
| 596 | return 0x3fc45f306dc9c882; |
| 597 | default: |
| 598 | llvm_unreachable("invalid fp inline imm"); |
| 599 | } |
| 600 | } |
| 601 | |
| 602 | static int64_t getInlineImmVal16(unsigned Imm) { |
| 603 | switch (Imm) { |
| 604 | case 240: |
| 605 | return 0x3800; |
| 606 | case 241: |
| 607 | return 0xB800; |
| 608 | case 242: |
| 609 | return 0x3C00; |
| 610 | case 243: |
| 611 | return 0xBC00; |
| 612 | case 244: |
| 613 | return 0x4000; |
| 614 | case 245: |
| 615 | return 0xC000; |
| 616 | case 246: |
| 617 | return 0x4400; |
| 618 | case 247: |
| 619 | return 0xC400; |
| 620 | case 248: // 1 / (2 * PI) |
| 621 | return 0x3118; |
| 622 | default: |
| 623 | llvm_unreachable("invalid fp inline imm"); |
| 624 | } |
| 625 | } |
| 626 | |
| 627 | MCOperand AMDGPUDisassembler::decodeFPImmed(OpWidthTy Width, unsigned Imm) { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 628 | assert(Imm >= AMDGPU::EncValues::INLINE_FLOATING_C_MIN |
| 629 | && Imm <= AMDGPU::EncValues::INLINE_FLOATING_C_MAX); |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 630 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 631 | // ToDo: case 248: 1/(2*PI) - is allowed only on VI |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 632 | switch (Width) { |
| 633 | case OPW32: |
| 634 | return MCOperand::createImm(getInlineImmVal32(Imm)); |
| 635 | case OPW64: |
| 636 | return MCOperand::createImm(getInlineImmVal64(Imm)); |
| 637 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 638 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 639 | return MCOperand::createImm(getInlineImmVal16(Imm)); |
| 640 | default: |
| 641 | llvm_unreachable("implement me"); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 642 | } |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 643 | } |
| 644 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 645 | unsigned AMDGPUDisassembler::getVgprClassId(const OpWidthTy Width) const { |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 646 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 647 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 648 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 649 | switch (Width) { |
| 650 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 651 | case OPW32: |
| 652 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 653 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 654 | return VGPR_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 655 | case OPW64: return VReg_64RegClassID; |
| 656 | case OPW128: return VReg_128RegClassID; |
| 657 | } |
| 658 | } |
| 659 | |
| 660 | unsigned AMDGPUDisassembler::getSgprClassId(const OpWidthTy Width) const { |
| 661 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 662 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 663 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 664 | switch (Width) { |
| 665 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 666 | case OPW32: |
| 667 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 668 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 669 | return SGPR_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 670 | case OPW64: return SGPR_64RegClassID; |
| 671 | case OPW128: return SGPR_128RegClassID; |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 672 | case OPW256: return SGPR_256RegClassID; |
| 673 | case OPW512: return SGPR_512RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 674 | } |
| 675 | } |
| 676 | |
| 677 | unsigned AMDGPUDisassembler::getTtmpClassId(const OpWidthTy Width) const { |
| 678 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 679 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 680 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 681 | switch (Width) { |
| 682 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 683 | case OPW32: |
| 684 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 685 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 686 | return TTMP_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 687 | case OPW64: return TTMP_64RegClassID; |
| 688 | case OPW128: return TTMP_128RegClassID; |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 689 | case OPW256: return TTMP_256RegClassID; |
| 690 | case OPW512: return TTMP_512RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 691 | } |
| 692 | } |
| 693 | |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 694 | int AMDGPUDisassembler::getTTmpIdx(unsigned Val) const { |
| 695 | using namespace AMDGPU::EncValues; |
| 696 | |
| 697 | unsigned TTmpMin = isGFX9() ? TTMP_GFX9_MIN : TTMP_VI_MIN; |
| 698 | unsigned TTmpMax = isGFX9() ? TTMP_GFX9_MAX : TTMP_VI_MAX; |
| 699 | |
| 700 | return (TTmpMin <= Val && Val <= TTmpMax)? Val - TTmpMin : -1; |
| 701 | } |
| 702 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 703 | MCOperand AMDGPUDisassembler::decodeSrcOp(const OpWidthTy Width, unsigned Val) const { |
| 704 | using namespace AMDGPU::EncValues; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 705 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 706 | assert(Val < 512); // enum9 |
| 707 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 708 | if (VGPR_MIN <= Val && Val <= VGPR_MAX) { |
| 709 | return createRegOperand(getVgprClassId(Width), Val - VGPR_MIN); |
| 710 | } |
Artem Tamazov | b49c336 | 2016-05-26 15:52:16 +0000 | [diff] [blame] | 711 | if (Val <= SGPR_MAX) { |
| 712 | assert(SGPR_MIN == 0); // "SGPR_MIN <= Val" is always true and causes compilation warning. |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 713 | return createSRegOperand(getSgprClassId(Width), Val - SGPR_MIN); |
| 714 | } |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 715 | |
| 716 | int TTmpIdx = getTTmpIdx(Val); |
| 717 | if (TTmpIdx >= 0) { |
| 718 | return createSRegOperand(getTtmpClassId(Width), TTmpIdx); |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 719 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 720 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 721 | if (INLINE_INTEGER_C_MIN <= Val && Val <= INLINE_INTEGER_C_MAX) |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 722 | return decodeIntImmed(Val); |
| 723 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 724 | if (INLINE_FLOATING_C_MIN <= Val && Val <= INLINE_FLOATING_C_MAX) |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 725 | return decodeFPImmed(Width, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 726 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 727 | if (Val == LITERAL_CONST) |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 728 | return decodeLiteralConstant(); |
| 729 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 730 | switch (Width) { |
| 731 | case OPW32: |
| 732 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 733 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 734 | return decodeSpecialReg32(Val); |
| 735 | case OPW64: |
| 736 | return decodeSpecialReg64(Val); |
| 737 | default: |
| 738 | llvm_unreachable("unexpected immediate type"); |
| 739 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 740 | } |
| 741 | |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 742 | MCOperand AMDGPUDisassembler::decodeDstOp(const OpWidthTy Width, unsigned Val) const { |
| 743 | using namespace AMDGPU::EncValues; |
| 744 | |
| 745 | assert(Val < 128); |
| 746 | assert(Width == OPW256 || Width == OPW512); |
| 747 | |
| 748 | if (Val <= SGPR_MAX) { |
| 749 | assert(SGPR_MIN == 0); // "SGPR_MIN <= Val" is always true and causes compilation warning. |
| 750 | return createSRegOperand(getSgprClassId(Width), Val - SGPR_MIN); |
| 751 | } |
| 752 | |
| 753 | int TTmpIdx = getTTmpIdx(Val); |
| 754 | if (TTmpIdx >= 0) { |
| 755 | return createSRegOperand(getTtmpClassId(Width), TTmpIdx); |
| 756 | } |
| 757 | |
| 758 | llvm_unreachable("unknown dst register"); |
| 759 | } |
| 760 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 761 | MCOperand AMDGPUDisassembler::decodeSpecialReg32(unsigned Val) const { |
| 762 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 763 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 764 | switch (Val) { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 765 | case 102: return createRegOperand(FLAT_SCR_LO); |
| 766 | case 103: return createRegOperand(FLAT_SCR_HI); |
Dmitry Preobrazhensky | 3afbd82 | 2018-01-10 14:22:19 +0000 | [diff] [blame] | 767 | case 104: return createRegOperand(XNACK_MASK_LO); |
| 768 | case 105: return createRegOperand(XNACK_MASK_HI); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 769 | case 106: return createRegOperand(VCC_LO); |
| 770 | case 107: return createRegOperand(VCC_HI); |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 771 | case 108: assert(!isGFX9()); return createRegOperand(TBA_LO); |
| 772 | case 109: assert(!isGFX9()); return createRegOperand(TBA_HI); |
| 773 | case 110: assert(!isGFX9()); return createRegOperand(TMA_LO); |
| 774 | case 111: assert(!isGFX9()); return createRegOperand(TMA_HI); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 775 | case 124: return createRegOperand(M0); |
| 776 | case 126: return createRegOperand(EXEC_LO); |
| 777 | case 127: return createRegOperand(EXEC_HI); |
Matt Arsenault | a3b3b48 | 2017-02-18 18:41:41 +0000 | [diff] [blame] | 778 | case 235: return createRegOperand(SRC_SHARED_BASE); |
| 779 | case 236: return createRegOperand(SRC_SHARED_LIMIT); |
| 780 | case 237: return createRegOperand(SRC_PRIVATE_BASE); |
| 781 | case 238: return createRegOperand(SRC_PRIVATE_LIMIT); |
| 782 | // TODO: SRC_POPS_EXITING_WAVE_ID |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 783 | // ToDo: no support for vccz register |
| 784 | case 251: break; |
| 785 | // ToDo: no support for execz register |
| 786 | case 252: break; |
| 787 | case 253: return createRegOperand(SCC); |
| 788 | default: break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 789 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 790 | return errOperand(Val, "unknown operand encoding " + Twine(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 791 | } |
| 792 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 793 | MCOperand AMDGPUDisassembler::decodeSpecialReg64(unsigned Val) const { |
| 794 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 795 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 796 | switch (Val) { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 797 | case 102: return createRegOperand(FLAT_SCR); |
Dmitry Preobrazhensky | 3afbd82 | 2018-01-10 14:22:19 +0000 | [diff] [blame] | 798 | case 104: return createRegOperand(XNACK_MASK); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 799 | case 106: return createRegOperand(VCC); |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 800 | case 108: assert(!isGFX9()); return createRegOperand(TBA); |
| 801 | case 110: assert(!isGFX9()); return createRegOperand(TMA); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 802 | case 126: return createRegOperand(EXEC); |
| 803 | default: break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 804 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 805 | return errOperand(Val, "unknown operand encoding " + Twine(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 806 | } |
| 807 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 808 | MCOperand AMDGPUDisassembler::decodeSDWASrc(const OpWidthTy Width, |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 809 | const unsigned Val) const { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 810 | using namespace AMDGPU::SDWA; |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 811 | using namespace AMDGPU::EncValues; |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 812 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 813 | if (STI.getFeatureBits()[AMDGPU::FeatureGFX9]) { |
Sam Kolton | a179d25 | 2017-06-27 15:02:23 +0000 | [diff] [blame] | 814 | // XXX: static_cast<int> is needed to avoid stupid warning: |
| 815 | // compare with unsigned is always true |
| 816 | if (SDWA9EncValues::SRC_VGPR_MIN <= static_cast<int>(Val) && |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 817 | Val <= SDWA9EncValues::SRC_VGPR_MAX) { |
| 818 | return createRegOperand(getVgprClassId(Width), |
| 819 | Val - SDWA9EncValues::SRC_VGPR_MIN); |
| 820 | } |
| 821 | if (SDWA9EncValues::SRC_SGPR_MIN <= Val && |
| 822 | Val <= SDWA9EncValues::SRC_SGPR_MAX) { |
| 823 | return createSRegOperand(getSgprClassId(Width), |
| 824 | Val - SDWA9EncValues::SRC_SGPR_MIN); |
| 825 | } |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 826 | if (SDWA9EncValues::SRC_TTMP_MIN <= Val && |
| 827 | Val <= SDWA9EncValues::SRC_TTMP_MAX) { |
| 828 | return createSRegOperand(getTtmpClassId(Width), |
| 829 | Val - SDWA9EncValues::SRC_TTMP_MIN); |
| 830 | } |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 831 | |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 832 | const unsigned SVal = Val - SDWA9EncValues::SRC_SGPR_MIN; |
| 833 | |
| 834 | if (INLINE_INTEGER_C_MIN <= SVal && SVal <= INLINE_INTEGER_C_MAX) |
| 835 | return decodeIntImmed(SVal); |
| 836 | |
| 837 | if (INLINE_FLOATING_C_MIN <= SVal && SVal <= INLINE_FLOATING_C_MAX) |
| 838 | return decodeFPImmed(Width, SVal); |
| 839 | |
| 840 | return decodeSpecialReg32(SVal); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 841 | } else if (STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]) { |
| 842 | return createRegOperand(getVgprClassId(Width), Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 843 | } |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 844 | llvm_unreachable("unsupported target"); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 845 | } |
| 846 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 847 | MCOperand AMDGPUDisassembler::decodeSDWASrc16(unsigned Val) const { |
| 848 | return decodeSDWASrc(OPW16, Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 849 | } |
| 850 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 851 | MCOperand AMDGPUDisassembler::decodeSDWASrc32(unsigned Val) const { |
| 852 | return decodeSDWASrc(OPW32, Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 853 | } |
| 854 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 855 | MCOperand AMDGPUDisassembler::decodeSDWAVopcDst(unsigned Val) const { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 856 | using namespace AMDGPU::SDWA; |
| 857 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 858 | assert(STI.getFeatureBits()[AMDGPU::FeatureGFX9] && |
| 859 | "SDWAVopcDst should be present only on GFX9"); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 860 | if (Val & SDWA9EncValues::VOPC_DST_VCC_MASK) { |
| 861 | Val &= SDWA9EncValues::VOPC_DST_SGPR_MASK; |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 862 | |
| 863 | int TTmpIdx = getTTmpIdx(Val); |
| 864 | if (TTmpIdx >= 0) { |
| 865 | return createSRegOperand(getTtmpClassId(OPW64), TTmpIdx); |
| 866 | } else if (Val > AMDGPU::EncValues::SGPR_MAX) { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 867 | return decodeSpecialReg64(Val); |
| 868 | } else { |
| 869 | return createSRegOperand(getSgprClassId(OPW64), Val); |
| 870 | } |
| 871 | } else { |
| 872 | return createRegOperand(AMDGPU::VCC); |
| 873 | } |
| 874 | } |
| 875 | |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 876 | bool AMDGPUDisassembler::isVI() const { |
| 877 | return STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]; |
| 878 | } |
| 879 | |
| 880 | bool AMDGPUDisassembler::isGFX9() const { |
| 881 | return STI.getFeatureBits()[AMDGPU::FeatureGFX9]; |
| 882 | } |
| 883 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 884 | //===----------------------------------------------------------------------===// |
| 885 | // AMDGPUSymbolizer |
| 886 | //===----------------------------------------------------------------------===// |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 887 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 888 | // Try to find symbol name for specified label |
| 889 | bool AMDGPUSymbolizer::tryAddingSymbolicOperand(MCInst &Inst, |
| 890 | raw_ostream &/*cStream*/, int64_t Value, |
| 891 | uint64_t /*Address*/, bool IsBranch, |
| 892 | uint64_t /*Offset*/, uint64_t /*InstSize*/) { |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 893 | using SymbolInfoTy = std::tuple<uint64_t, StringRef, uint8_t>; |
| 894 | using SectionSymbolsTy = std::vector<SymbolInfoTy>; |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 895 | |
| 896 | if (!IsBranch) { |
| 897 | return false; |
| 898 | } |
| 899 | |
| 900 | auto *Symbols = static_cast<SectionSymbolsTy *>(DisInfo); |
Nicolai Haehnle | b1c3b22 | 2018-04-10 15:46:43 +0000 | [diff] [blame] | 901 | if (!Symbols) |
| 902 | return false; |
| 903 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 904 | auto Result = std::find_if(Symbols->begin(), Symbols->end(), |
| 905 | [Value](const SymbolInfoTy& Val) { |
| 906 | return std::get<0>(Val) == static_cast<uint64_t>(Value) |
| 907 | && std::get<2>(Val) == ELF::STT_NOTYPE; |
| 908 | }); |
| 909 | if (Result != Symbols->end()) { |
| 910 | auto *Sym = Ctx.getOrCreateSymbol(std::get<1>(*Result)); |
| 911 | const auto *Add = MCSymbolRefExpr::create(Sym, Ctx); |
| 912 | Inst.addOperand(MCOperand::createExpr(Add)); |
| 913 | return true; |
| 914 | } |
| 915 | return false; |
| 916 | } |
| 917 | |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 918 | void AMDGPUSymbolizer::tryAddingPcLoadReferenceComment(raw_ostream &cStream, |
| 919 | int64_t Value, |
| 920 | uint64_t Address) { |
| 921 | llvm_unreachable("unimplemented"); |
| 922 | } |
| 923 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 924 | //===----------------------------------------------------------------------===// |
| 925 | // Initialization |
| 926 | //===----------------------------------------------------------------------===// |
| 927 | |
| 928 | static MCSymbolizer *createAMDGPUSymbolizer(const Triple &/*TT*/, |
| 929 | LLVMOpInfoCallback /*GetOpInfo*/, |
| 930 | LLVMSymbolLookupCallback /*SymbolLookUp*/, |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 931 | void *DisInfo, |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 932 | MCContext *Ctx, |
| 933 | std::unique_ptr<MCRelocationInfo> &&RelInfo) { |
| 934 | return new AMDGPUSymbolizer(*Ctx, std::move(RelInfo), DisInfo); |
| 935 | } |
| 936 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 937 | static MCDisassembler *createAMDGPUDisassembler(const Target &T, |
| 938 | const MCSubtargetInfo &STI, |
| 939 | MCContext &Ctx) { |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 940 | return new AMDGPUDisassembler(STI, Ctx, T.createMCInstrInfo()); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 941 | } |
| 942 | |
| 943 | extern "C" void LLVMInitializeAMDGPUDisassembler() { |
Mehdi Amini | f42454b | 2016-10-09 23:00:34 +0000 | [diff] [blame] | 944 | TargetRegistry::RegisterMCDisassembler(getTheGCNTarget(), |
| 945 | createAMDGPUDisassembler); |
| 946 | TargetRegistry::RegisterMCSymbolizer(getTheGCNTarget(), |
| 947 | createAMDGPUSymbolizer); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 948 | } |