Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 1 | //===- AMDGPUDisassembler.cpp - Disassembler for AMDGPU ISA ---------------===// |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | //===----------------------------------------------------------------------===// |
| 11 | // |
| 12 | /// \file |
| 13 | /// |
| 14 | /// This file contains definition for AMDGPU ISA disassembler |
| 15 | // |
| 16 | //===----------------------------------------------------------------------===// |
| 17 | |
| 18 | // ToDo: What to do with instruction suffixes (v_mov_b32 vs v_mov_b32_e32)? |
| 19 | |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 20 | #include "Disassembler/AMDGPUDisassembler.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 21 | #include "AMDGPU.h" |
| 22 | #include "AMDGPURegisterInfo.h" |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 23 | #include "SIDefines.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 24 | #include "Utils/AMDGPUBaseInfo.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 25 | #include "llvm-c/Disassembler.h" |
| 26 | #include "llvm/ADT/APInt.h" |
| 27 | #include "llvm/ADT/ArrayRef.h" |
| 28 | #include "llvm/ADT/Twine.h" |
Zachary Turner | 264b5d9 | 2017-06-07 03:48:56 +0000 | [diff] [blame] | 29 | #include "llvm/BinaryFormat/ELF.h" |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 30 | #include "llvm/MC/MCContext.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 31 | #include "llvm/MC/MCDisassembler/MCDisassembler.h" |
| 32 | #include "llvm/MC/MCExpr.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 33 | #include "llvm/MC/MCFixedLenDisassembler.h" |
| 34 | #include "llvm/MC/MCInst.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 35 | #include "llvm/MC/MCSubtargetInfo.h" |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 36 | #include "llvm/Support/Endian.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 37 | #include "llvm/Support/ErrorHandling.h" |
| 38 | #include "llvm/Support/MathExtras.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 39 | #include "llvm/Support/TargetRegistry.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 40 | #include "llvm/Support/raw_ostream.h" |
| 41 | #include <algorithm> |
| 42 | #include <cassert> |
| 43 | #include <cstddef> |
| 44 | #include <cstdint> |
| 45 | #include <iterator> |
| 46 | #include <tuple> |
| 47 | #include <vector> |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 48 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 49 | using namespace llvm; |
| 50 | |
| 51 | #define DEBUG_TYPE "amdgpu-disassembler" |
| 52 | |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 53 | using DecodeStatus = llvm::MCDisassembler::DecodeStatus; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 54 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 55 | inline static MCDisassembler::DecodeStatus |
| 56 | addOperand(MCInst &Inst, const MCOperand& Opnd) { |
| 57 | Inst.addOperand(Opnd); |
| 58 | return Opnd.isValid() ? |
| 59 | MCDisassembler::Success : |
| 60 | MCDisassembler::SoftFail; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 61 | } |
| 62 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 63 | static int insertNamedMCOperand(MCInst &MI, const MCOperand &Op, |
| 64 | uint16_t NameIdx) { |
| 65 | int OpIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), NameIdx); |
| 66 | if (OpIdx != -1) { |
| 67 | auto I = MI.begin(); |
| 68 | std::advance(I, OpIdx); |
| 69 | MI.insert(I, Op); |
| 70 | } |
| 71 | return OpIdx; |
| 72 | } |
| 73 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 74 | static DecodeStatus decodeSoppBrTarget(MCInst &Inst, unsigned Imm, |
| 75 | uint64_t Addr, const void *Decoder) { |
| 76 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 77 | |
| 78 | APInt SignedOffset(18, Imm * 4, true); |
| 79 | int64_t Offset = (SignedOffset.sext(64) + 4 + Addr).getSExtValue(); |
| 80 | |
| 81 | if (DAsm->tryAddingSymbolicOperand(Inst, Offset, Addr, true, 2, 2)) |
| 82 | return MCDisassembler::Success; |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 83 | return addOperand(Inst, MCOperand::createImm(Imm)); |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 84 | } |
| 85 | |
// Defines a static decoder callback called StaticDecoderName. The callback
// casts the opaque Decoder pointer to AMDGPUDisassembler, calls its member
// DecoderName(Imm) and appends the resulting operand through addOperand().
// The address argument is ignored.
#define DECODE_OPERAND(StaticDecoderName, DecoderName) \
static DecodeStatus StaticDecoderName(MCInst &Inst, \
                                      unsigned Imm, \
                                      uint64_t /*Addr*/, \
                                      const void *Decoder) { \
  return addOperand( \
      Inst, \
      static_cast<const AMDGPUDisassembler *>(Decoder)->DecoderName(Imm)); \
}
| 94 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 95 | #define DECODE_OPERAND_REG(RegClass) \ |
| 96 | DECODE_OPERAND(Decode##RegClass##RegisterClass, decodeOperand_##RegClass) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 97 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 98 | DECODE_OPERAND_REG(VGPR_32) |
| 99 | DECODE_OPERAND_REG(VS_32) |
| 100 | DECODE_OPERAND_REG(VS_64) |
Dmitry Preobrazhensky | 30fc523 | 2017-07-18 13:12:48 +0000 | [diff] [blame] | 101 | DECODE_OPERAND_REG(VS_128) |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 102 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 103 | DECODE_OPERAND_REG(VReg_64) |
| 104 | DECODE_OPERAND_REG(VReg_96) |
| 105 | DECODE_OPERAND_REG(VReg_128) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 106 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 107 | DECODE_OPERAND_REG(SReg_32) |
| 108 | DECODE_OPERAND_REG(SReg_32_XM0_XEXEC) |
Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 109 | DECODE_OPERAND_REG(SReg_32_XEXEC_HI) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 110 | DECODE_OPERAND_REG(SReg_64) |
| 111 | DECODE_OPERAND_REG(SReg_64_XEXEC) |
| 112 | DECODE_OPERAND_REG(SReg_128) |
| 113 | DECODE_OPERAND_REG(SReg_256) |
| 114 | DECODE_OPERAND_REG(SReg_512) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 115 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 116 | static DecodeStatus decodeOperand_VSrc16(MCInst &Inst, |
| 117 | unsigned Imm, |
| 118 | uint64_t Addr, |
| 119 | const void *Decoder) { |
| 120 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 121 | return addOperand(Inst, DAsm->decodeOperand_VSrc16(Imm)); |
| 122 | } |
| 123 | |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 124 | static DecodeStatus decodeOperand_VSrcV216(MCInst &Inst, |
| 125 | unsigned Imm, |
| 126 | uint64_t Addr, |
| 127 | const void *Decoder) { |
| 128 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 129 | return addOperand(Inst, DAsm->decodeOperand_VSrcV216(Imm)); |
| 130 | } |
| 131 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 132 | #define DECODE_SDWA(DecName) \ |
| 133 | DECODE_OPERAND(decodeSDWA##DecName, decodeSDWA##DecName) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 134 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 135 | DECODE_SDWA(Src32) |
| 136 | DECODE_SDWA(Src16) |
| 137 | DECODE_SDWA(VopcDst) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 138 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 139 | #include "AMDGPUGenDisassemblerTables.inc" |
| 140 | |
| 141 | //===----------------------------------------------------------------------===// |
| 142 | // |
| 143 | //===----------------------------------------------------------------------===// |
| 144 | |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 145 | template <typename T> static inline T eatBytes(ArrayRef<uint8_t>& Bytes) { |
| 146 | assert(Bytes.size() >= sizeof(T)); |
| 147 | const auto Res = support::endian::read<T, support::endianness::little>(Bytes.data()); |
| 148 | Bytes = Bytes.slice(sizeof(T)); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 149 | return Res; |
| 150 | } |
| 151 | |
| 152 | DecodeStatus AMDGPUDisassembler::tryDecodeInst(const uint8_t* Table, |
| 153 | MCInst &MI, |
| 154 | uint64_t Inst, |
| 155 | uint64_t Address) const { |
| 156 | assert(MI.getOpcode() == 0); |
| 157 | assert(MI.getNumOperands() == 0); |
| 158 | MCInst TmpInst; |
Dmitry Preobrazhensky | ce941c9 | 2017-05-19 14:27:52 +0000 | [diff] [blame] | 159 | HasLiteral = false; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 160 | const auto SavedBytes = Bytes; |
| 161 | if (decodeInstruction(Table, TmpInst, Inst, Address, this, STI)) { |
| 162 | MI = TmpInst; |
| 163 | return MCDisassembler::Success; |
| 164 | } |
| 165 | Bytes = SavedBytes; |
| 166 | return MCDisassembler::Fail; |
| 167 | } |
| 168 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 169 | DecodeStatus AMDGPUDisassembler::getInstruction(MCInst &MI, uint64_t &Size, |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 170 | ArrayRef<uint8_t> Bytes_, |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 171 | uint64_t Address, |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 172 | raw_ostream &WS, |
| 173 | raw_ostream &CS) const { |
| 174 | CommentStream = &CS; |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 175 | bool IsSDWA = false; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 176 | |
| 177 | // ToDo: AMDGPUDisassembler supports only VI ISA. |
Matt Arsenault | d122abe | 2017-02-15 21:50:34 +0000 | [diff] [blame] | 178 | if (!STI.getFeatureBits()[AMDGPU::FeatureGCN3Encoding]) |
| 179 | report_fatal_error("Disassembly not yet supported for subtarget"); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 180 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 181 | const unsigned MaxInstBytesNum = (std::min)((size_t)8, Bytes_.size()); |
| 182 | Bytes = Bytes_.slice(0, MaxInstBytesNum); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 183 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 184 | DecodeStatus Res = MCDisassembler::Fail; |
| 185 | do { |
Valery Pykhtin | 824e804 | 2016-03-04 10:59:50 +0000 | [diff] [blame] | 186 | // ToDo: better to switch encoding length using some bit predicate |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 187 | // but it is unknown yet, so try all we can |
Matt Arsenault | 37fefd6 | 2016-06-10 02:18:02 +0000 | [diff] [blame] | 188 | |
Sam Kolton | c9bdcb7 | 2016-06-09 11:04:45 +0000 | [diff] [blame] | 189 | // Try to decode DPP and SDWA first to solve conflict with VOP1 and VOP2 |
| 190 | // encodings |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 191 | if (Bytes.size() >= 8) { |
| 192 | const uint64_t QW = eatBytes<uint64_t>(Bytes); |
| 193 | Res = tryDecodeInst(DecoderTableDPP64, MI, QW, Address); |
| 194 | if (Res) break; |
Sam Kolton | c9bdcb7 | 2016-06-09 11:04:45 +0000 | [diff] [blame] | 195 | |
| 196 | Res = tryDecodeInst(DecoderTableSDWA64, MI, QW, Address); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 197 | if (Res) { IsSDWA = true; break; } |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 198 | |
| 199 | Res = tryDecodeInst(DecoderTableSDWA964, MI, QW, Address); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 200 | if (Res) { IsSDWA = true; break; } |
Changpeng Fang | 0905870 | 2018-01-30 16:42:40 +0000 | [diff] [blame] | 201 | |
| 202 | if (STI.getFeatureBits()[AMDGPU::FeatureUnpackedD16VMem]) { |
| 203 | Res = tryDecodeInst(DecoderTableGFX80_UNPACKED64, MI, QW, Address); |
| 204 | if (Res) break; |
| 205 | } |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 206 | } |
| 207 | |
| 208 | // Reinitialize Bytes as DPP64 could have eaten too much |
| 209 | Bytes = Bytes_.slice(0, MaxInstBytesNum); |
| 210 | |
| 211 | // Try decode 32-bit instruction |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 212 | if (Bytes.size() < 4) break; |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 213 | const uint32_t DW = eatBytes<uint32_t>(Bytes); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 214 | Res = tryDecodeInst(DecoderTableVI32, MI, DW, Address); |
| 215 | if (Res) break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 216 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 217 | Res = tryDecodeInst(DecoderTableAMDGPU32, MI, DW, Address); |
| 218 | if (Res) break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 219 | |
Dmitry Preobrazhensky | a0342dc | 2017-11-20 18:24:21 +0000 | [diff] [blame] | 220 | Res = tryDecodeInst(DecoderTableGFX932, MI, DW, Address); |
| 221 | if (Res) break; |
| 222 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 223 | if (Bytes.size() < 4) break; |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 224 | const uint64_t QW = ((uint64_t)eatBytes<uint32_t>(Bytes) << 32) | DW; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 225 | Res = tryDecodeInst(DecoderTableVI64, MI, QW, Address); |
| 226 | if (Res) break; |
| 227 | |
| 228 | Res = tryDecodeInst(DecoderTableAMDGPU64, MI, QW, Address); |
Dmitry Preobrazhensky | 1e32550 | 2017-08-09 17:10:47 +0000 | [diff] [blame] | 229 | if (Res) break; |
| 230 | |
| 231 | Res = tryDecodeInst(DecoderTableGFX964, MI, QW, Address); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 232 | } while (false); |
| 233 | |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 234 | if (Res && (MI.getOpcode() == AMDGPU::V_MAC_F32_e64_vi || |
| 235 | MI.getOpcode() == AMDGPU::V_MAC_F32_e64_si || |
| 236 | MI.getOpcode() == AMDGPU::V_MAC_F16_e64_vi)) { |
| 237 | // Insert dummy unused src2_modifiers. |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 238 | insertNamedMCOperand(MI, MCOperand::createImm(0), |
| 239 | AMDGPU::OpName::src2_modifiers); |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 240 | } |
| 241 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 242 | if (Res && (MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::MIMG)) { |
| 243 | Res = convertMIMGInst(MI); |
| 244 | } |
| 245 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 246 | if (Res && IsSDWA) |
| 247 | Res = convertSDWAInst(MI); |
| 248 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 249 | Size = Res ? (MaxInstBytesNum - Bytes.size()) : 0; |
| 250 | return Res; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 251 | } |
| 252 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 253 | DecodeStatus AMDGPUDisassembler::convertSDWAInst(MCInst &MI) const { |
| 254 | if (STI.getFeatureBits()[AMDGPU::FeatureGFX9]) { |
| 255 | if (AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::sdst) != -1) |
| 256 | // VOPC - insert clamp |
| 257 | insertNamedMCOperand(MI, MCOperand::createImm(0), AMDGPU::OpName::clamp); |
| 258 | } else if (STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]) { |
| 259 | int SDst = AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::sdst); |
| 260 | if (SDst != -1) { |
| 261 | // VOPC - insert VCC register as sdst |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 262 | insertNamedMCOperand(MI, createRegOperand(AMDGPU::VCC), |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 263 | AMDGPU::OpName::sdst); |
| 264 | } else { |
| 265 | // VOP1/2 - insert omod if present in instruction |
| 266 | insertNamedMCOperand(MI, MCOperand::createImm(0), AMDGPU::OpName::omod); |
| 267 | } |
| 268 | } |
| 269 | return MCDisassembler::Success; |
| 270 | } |
| 271 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 272 | // Note that MIMG format provides no information about VADDR size. |
| 273 | // Consequently, decoded instructions always show address |
| 274 | // as if it has 1 dword, which could be not really so. |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 275 | DecodeStatus AMDGPUDisassembler::convertMIMGInst(MCInst &MI) const { |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 276 | |
| 277 | if (MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::Gather4) { |
| 278 | return MCDisassembler::Success; |
| 279 | } |
| 280 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 281 | int VDstIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 282 | AMDGPU::OpName::vdst); |
| 283 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 284 | int VDataIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 285 | AMDGPU::OpName::vdata); |
| 286 | |
| 287 | int DMaskIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 288 | AMDGPU::OpName::dmask); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 289 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 290 | int TFEIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 291 | AMDGPU::OpName::tfe); |
| 292 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 293 | assert(VDataIdx != -1); |
| 294 | assert(DMaskIdx != -1); |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 295 | assert(TFEIdx != -1); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 296 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 297 | bool IsAtomic = (VDstIdx != -1); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 298 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 299 | unsigned DMask = MI.getOperand(DMaskIdx).getImm() & 0xf; |
| 300 | if (DMask == 0) |
| 301 | return MCDisassembler::Success; |
| 302 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 303 | unsigned DstSize = countPopulation(DMask); |
| 304 | if (DstSize == 1) |
| 305 | return MCDisassembler::Success; |
| 306 | |
| 307 | bool D16 = MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::D16; |
| 308 | if (D16 && AMDGPU::hasPackedD16(STI)) { |
| 309 | DstSize = (DstSize + 1) / 2; |
| 310 | } |
| 311 | |
| 312 | // FIXME: Add tfe support |
| 313 | if (MI.getOperand(TFEIdx).getImm()) |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 314 | return MCDisassembler::Success; |
| 315 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 316 | int NewOpcode = -1; |
| 317 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 318 | if (IsAtomic) { |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 319 | if (DMask == 0x1 || DMask == 0x3 || DMask == 0xF) { |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 320 | NewOpcode = AMDGPU::getMaskedMIMGAtomicOp(*MCII, MI.getOpcode(), DstSize); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 321 | } |
| 322 | if (NewOpcode == -1) return MCDisassembler::Success; |
| 323 | } else { |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 324 | NewOpcode = AMDGPU::getMaskedMIMGOp(*MCII, MI.getOpcode(), DstSize); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 325 | assert(NewOpcode != -1 && "could not find matching mimg channel instruction"); |
| 326 | } |
| 327 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 328 | auto RCID = MCII->get(NewOpcode).OpInfo[VDataIdx].RegClass; |
| 329 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 330 | // Get first subregister of VData |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 331 | unsigned Vdata0 = MI.getOperand(VDataIdx).getReg(); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 332 | unsigned VdataSub0 = MRI.getSubReg(Vdata0, AMDGPU::sub0); |
| 333 | Vdata0 = (VdataSub0 != 0)? VdataSub0 : Vdata0; |
| 334 | |
| 335 | // Widen the register to the correct number of enabled channels. |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 336 | auto NewVdata = MRI.getMatchingSuperReg(Vdata0, AMDGPU::sub0, |
| 337 | &MRI.getRegClass(RCID)); |
| 338 | if (NewVdata == AMDGPU::NoRegister) { |
| 339 | // It's possible to encode this such that the low register + enabled |
| 340 | // components exceeds the register count. |
| 341 | return MCDisassembler::Success; |
| 342 | } |
| 343 | |
| 344 | MI.setOpcode(NewOpcode); |
| 345 | // vaddr will be always appear as a single VGPR. This will look different than |
| 346 | // how it is usually emitted because the number of register components is not |
| 347 | // in the instruction encoding. |
| 348 | MI.getOperand(VDataIdx) = MCOperand::createReg(NewVdata); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 349 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 350 | if (IsAtomic) { |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 351 | // Atomic operations have an additional operand (a copy of data) |
| 352 | MI.getOperand(VDstIdx) = MCOperand::createReg(NewVdata); |
| 353 | } |
| 354 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 355 | return MCDisassembler::Success; |
| 356 | } |
| 357 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 358 | const char* AMDGPUDisassembler::getRegClassName(unsigned RegClassID) const { |
| 359 | return getContext().getRegisterInfo()-> |
| 360 | getRegClassName(&AMDGPUMCRegisterClasses[RegClassID]); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 361 | } |
| 362 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 363 | inline |
| 364 | MCOperand AMDGPUDisassembler::errOperand(unsigned V, |
| 365 | const Twine& ErrMsg) const { |
| 366 | *CommentStream << "Error: " + ErrMsg; |
| 367 | |
| 368 | // ToDo: add support for error operands to MCInst.h |
| 369 | // return MCOperand::createError(V); |
| 370 | return MCOperand(); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 371 | } |
| 372 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 373 | inline |
| 374 | MCOperand AMDGPUDisassembler::createRegOperand(unsigned int RegId) const { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 375 | return MCOperand::createReg(AMDGPU::getMCReg(RegId, STI)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 376 | } |
| 377 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 378 | inline |
| 379 | MCOperand AMDGPUDisassembler::createRegOperand(unsigned RegClassID, |
| 380 | unsigned Val) const { |
| 381 | const auto& RegCl = AMDGPUMCRegisterClasses[RegClassID]; |
| 382 | if (Val >= RegCl.getNumRegs()) |
| 383 | return errOperand(Val, Twine(getRegClassName(RegClassID)) + |
| 384 | ": unknown register " + Twine(Val)); |
| 385 | return createRegOperand(RegCl.getRegister(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 386 | } |
| 387 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 388 | inline |
| 389 | MCOperand AMDGPUDisassembler::createSRegOperand(unsigned SRegClassID, |
| 390 | unsigned Val) const { |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 391 | // ToDo: SI/CI have 104 SGPRs, VI - 102 |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 392 | // Valery: here we accepting as much as we can, let assembler sort it out |
| 393 | int shift = 0; |
| 394 | switch (SRegClassID) { |
| 395 | case AMDGPU::SGPR_32RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 396 | case AMDGPU::TTMP_32RegClassID: |
| 397 | break; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 398 | case AMDGPU::SGPR_64RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 399 | case AMDGPU::TTMP_64RegClassID: |
| 400 | shift = 1; |
| 401 | break; |
| 402 | case AMDGPU::SGPR_128RegClassID: |
| 403 | case AMDGPU::TTMP_128RegClassID: |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 404 | // ToDo: unclear if s[100:104] is available on VI. Can we use VCC as SGPR in |
| 405 | // this bundle? |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 406 | case AMDGPU::SGPR_256RegClassID: |
| 407 | case AMDGPU::TTMP_256RegClassID: |
| 408 | // ToDo: unclear if s[96:104] is available on VI. Can we use VCC as SGPR in |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 409 | // this bundle? |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 410 | case AMDGPU::SGPR_512RegClassID: |
| 411 | case AMDGPU::TTMP_512RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 412 | shift = 2; |
| 413 | break; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 414 | // ToDo: unclear if s[88:104] is available on VI. Can we use VCC as SGPR in |
| 415 | // this bundle? |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 416 | default: |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 417 | llvm_unreachable("unhandled register class"); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 418 | } |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 419 | |
| 420 | if (Val % (1 << shift)) { |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 421 | *CommentStream << "Warning: " << getRegClassName(SRegClassID) |
| 422 | << ": scalar reg isn't aligned " << Val; |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 423 | } |
| 424 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 425 | return createRegOperand(SRegClassID, Val >> shift); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 426 | } |
| 427 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 428 | MCOperand AMDGPUDisassembler::decodeOperand_VS_32(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 429 | return decodeSrcOp(OPW32, Val); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 430 | } |
| 431 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 432 | MCOperand AMDGPUDisassembler::decodeOperand_VS_64(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 433 | return decodeSrcOp(OPW64, Val); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 434 | } |
| 435 | |
Dmitry Preobrazhensky | 30fc523 | 2017-07-18 13:12:48 +0000 | [diff] [blame] | 436 | MCOperand AMDGPUDisassembler::decodeOperand_VS_128(unsigned Val) const { |
| 437 | return decodeSrcOp(OPW128, Val); |
| 438 | } |
| 439 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 440 | MCOperand AMDGPUDisassembler::decodeOperand_VSrc16(unsigned Val) const { |
| 441 | return decodeSrcOp(OPW16, Val); |
| 442 | } |
| 443 | |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 444 | MCOperand AMDGPUDisassembler::decodeOperand_VSrcV216(unsigned Val) const { |
| 445 | return decodeSrcOp(OPWV216, Val); |
| 446 | } |
| 447 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 448 | MCOperand AMDGPUDisassembler::decodeOperand_VGPR_32(unsigned Val) const { |
Matt Arsenault | cb540bc | 2016-07-19 00:35:03 +0000 | [diff] [blame] | 449 | // Some instructions have operand restrictions beyond what the encoding |
| 450 | // allows. Some ordinarily VSrc_32 operands are VGPR_32, so clear the extra |
| 451 | // high bit. |
| 452 | Val &= 255; |
| 453 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 454 | return createRegOperand(AMDGPU::VGPR_32RegClassID, Val); |
| 455 | } |
| 456 | |
| 457 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_64(unsigned Val) const { |
| 458 | return createRegOperand(AMDGPU::VReg_64RegClassID, Val); |
| 459 | } |
| 460 | |
| 461 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_96(unsigned Val) const { |
| 462 | return createRegOperand(AMDGPU::VReg_96RegClassID, Val); |
| 463 | } |
| 464 | |
| 465 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_128(unsigned Val) const { |
| 466 | return createRegOperand(AMDGPU::VReg_128RegClassID, Val); |
| 467 | } |
| 468 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 469 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32(unsigned Val) const { |
| 470 | // table-gen generated disassembler doesn't care about operand types |
| 471 | // leaving only registry class so SSrc_32 operand turns into SReg_32 |
| 472 | // and therefore we accept immediates and literals here as well |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 473 | return decodeSrcOp(OPW32, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 474 | } |
| 475 | |
Matt Arsenault | 640c44b | 2016-11-29 19:39:53 +0000 | [diff] [blame] | 476 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32_XM0_XEXEC( |
| 477 | unsigned Val) const { |
| 478 | // SReg_32_XM0 is SReg_32 without M0 or EXEC_LO/EXEC_HI |
Artem Tamazov | 38e496b | 2016-04-29 17:04:50 +0000 | [diff] [blame] | 479 | return decodeOperand_SReg_32(Val); |
| 480 | } |
| 481 | |
Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 482 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32_XEXEC_HI( |
| 483 | unsigned Val) const { |
| 484 | // SReg_32_XM0 is SReg_32 without EXEC_HI |
| 485 | return decodeOperand_SReg_32(Val); |
| 486 | } |
| 487 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 488 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_64(unsigned Val) const { |
Matt Arsenault | 640c44b | 2016-11-29 19:39:53 +0000 | [diff] [blame] | 489 | return decodeSrcOp(OPW64, Val); |
| 490 | } |
| 491 | |
| 492 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_64_XEXEC(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 493 | return decodeSrcOp(OPW64, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 494 | } |
| 495 | |
| 496 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_128(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 497 | return decodeSrcOp(OPW128, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 498 | } |
| 499 | |
| 500 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_256(unsigned Val) const { |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 501 | return decodeDstOp(OPW256, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 502 | } |
| 503 | |
| 504 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_512(unsigned Val) const { |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 505 | return decodeDstOp(OPW512, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 506 | } |
| 507 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 508 | MCOperand AMDGPUDisassembler::decodeLiteralConstant() const { |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 509 | // For now all literal constants are supposed to be unsigned integer |
| 510 | // ToDo: deal with signed/unsigned 64-bit integer constants |
| 511 | // ToDo: deal with float/double constants |
Dmitry Preobrazhensky | ce941c9 | 2017-05-19 14:27:52 +0000 | [diff] [blame] | 512 | if (!HasLiteral) { |
| 513 | if (Bytes.size() < 4) { |
| 514 | return errOperand(0, "cannot read literal, inst bytes left " + |
| 515 | Twine(Bytes.size())); |
| 516 | } |
| 517 | HasLiteral = true; |
| 518 | Literal = eatBytes<uint32_t>(Bytes); |
| 519 | } |
| 520 | return MCOperand::createImm(Literal); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 521 | } |
| 522 | |
| 523 | MCOperand AMDGPUDisassembler::decodeIntImmed(unsigned Imm) { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 524 | using namespace AMDGPU::EncValues; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 525 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 526 | assert(Imm >= INLINE_INTEGER_C_MIN && Imm <= INLINE_INTEGER_C_MAX); |
| 527 | return MCOperand::createImm((Imm <= INLINE_INTEGER_C_POSITIVE_MAX) ? |
| 528 | (static_cast<int64_t>(Imm) - INLINE_INTEGER_C_MIN) : |
| 529 | (INLINE_INTEGER_C_POSITIVE_MAX - static_cast<int64_t>(Imm))); |
| 530 | // Cast prevents negative overflow. |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 531 | } |
| 532 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 533 | static int64_t getInlineImmVal32(unsigned Imm) { |
| 534 | switch (Imm) { |
| 535 | case 240: |
| 536 | return FloatToBits(0.5f); |
| 537 | case 241: |
| 538 | return FloatToBits(-0.5f); |
| 539 | case 242: |
| 540 | return FloatToBits(1.0f); |
| 541 | case 243: |
| 542 | return FloatToBits(-1.0f); |
| 543 | case 244: |
| 544 | return FloatToBits(2.0f); |
| 545 | case 245: |
| 546 | return FloatToBits(-2.0f); |
| 547 | case 246: |
| 548 | return FloatToBits(4.0f); |
| 549 | case 247: |
| 550 | return FloatToBits(-4.0f); |
| 551 | case 248: // 1 / (2 * PI) |
| 552 | return 0x3e22f983; |
| 553 | default: |
| 554 | llvm_unreachable("invalid fp inline imm"); |
| 555 | } |
| 556 | } |
| 557 | |
| 558 | static int64_t getInlineImmVal64(unsigned Imm) { |
| 559 | switch (Imm) { |
| 560 | case 240: |
| 561 | return DoubleToBits(0.5); |
| 562 | case 241: |
| 563 | return DoubleToBits(-0.5); |
| 564 | case 242: |
| 565 | return DoubleToBits(1.0); |
| 566 | case 243: |
| 567 | return DoubleToBits(-1.0); |
| 568 | case 244: |
| 569 | return DoubleToBits(2.0); |
| 570 | case 245: |
| 571 | return DoubleToBits(-2.0); |
| 572 | case 246: |
| 573 | return DoubleToBits(4.0); |
| 574 | case 247: |
| 575 | return DoubleToBits(-4.0); |
| 576 | case 248: // 1 / (2 * PI) |
| 577 | return 0x3fc45f306dc9c882; |
| 578 | default: |
| 579 | llvm_unreachable("invalid fp inline imm"); |
| 580 | } |
| 581 | } |
| 582 | |
| 583 | static int64_t getInlineImmVal16(unsigned Imm) { |
| 584 | switch (Imm) { |
| 585 | case 240: |
| 586 | return 0x3800; |
| 587 | case 241: |
| 588 | return 0xB800; |
| 589 | case 242: |
| 590 | return 0x3C00; |
| 591 | case 243: |
| 592 | return 0xBC00; |
| 593 | case 244: |
| 594 | return 0x4000; |
| 595 | case 245: |
| 596 | return 0xC000; |
| 597 | case 246: |
| 598 | return 0x4400; |
| 599 | case 247: |
| 600 | return 0xC400; |
| 601 | case 248: // 1 / (2 * PI) |
| 602 | return 0x3118; |
| 603 | default: |
| 604 | llvm_unreachable("invalid fp inline imm"); |
| 605 | } |
| 606 | } |
| 607 | |
| 608 | MCOperand AMDGPUDisassembler::decodeFPImmed(OpWidthTy Width, unsigned Imm) { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 609 | assert(Imm >= AMDGPU::EncValues::INLINE_FLOATING_C_MIN |
| 610 | && Imm <= AMDGPU::EncValues::INLINE_FLOATING_C_MAX); |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 611 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 612 | // ToDo: case 248: 1/(2*PI) - is allowed only on VI |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 613 | switch (Width) { |
| 614 | case OPW32: |
| 615 | return MCOperand::createImm(getInlineImmVal32(Imm)); |
| 616 | case OPW64: |
| 617 | return MCOperand::createImm(getInlineImmVal64(Imm)); |
| 618 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 619 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 620 | return MCOperand::createImm(getInlineImmVal16(Imm)); |
| 621 | default: |
| 622 | llvm_unreachable("implement me"); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 623 | } |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 624 | } |
| 625 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 626 | unsigned AMDGPUDisassembler::getVgprClassId(const OpWidthTy Width) const { |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 627 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 628 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 629 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 630 | switch (Width) { |
| 631 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 632 | case OPW32: |
| 633 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 634 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 635 | return VGPR_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 636 | case OPW64: return VReg_64RegClassID; |
| 637 | case OPW128: return VReg_128RegClassID; |
| 638 | } |
| 639 | } |
| 640 | |
| 641 | unsigned AMDGPUDisassembler::getSgprClassId(const OpWidthTy Width) const { |
| 642 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 643 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 644 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 645 | switch (Width) { |
| 646 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 647 | case OPW32: |
| 648 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 649 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 650 | return SGPR_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 651 | case OPW64: return SGPR_64RegClassID; |
| 652 | case OPW128: return SGPR_128RegClassID; |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 653 | case OPW256: return SGPR_256RegClassID; |
| 654 | case OPW512: return SGPR_512RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 655 | } |
| 656 | } |
| 657 | |
| 658 | unsigned AMDGPUDisassembler::getTtmpClassId(const OpWidthTy Width) const { |
| 659 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 660 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 661 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 662 | switch (Width) { |
| 663 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 664 | case OPW32: |
| 665 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 666 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 667 | return TTMP_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 668 | case OPW64: return TTMP_64RegClassID; |
| 669 | case OPW128: return TTMP_128RegClassID; |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 670 | case OPW256: return TTMP_256RegClassID; |
| 671 | case OPW512: return TTMP_512RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 672 | } |
| 673 | } |
| 674 | |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 675 | int AMDGPUDisassembler::getTTmpIdx(unsigned Val) const { |
| 676 | using namespace AMDGPU::EncValues; |
| 677 | |
| 678 | unsigned TTmpMin = isGFX9() ? TTMP_GFX9_MIN : TTMP_VI_MIN; |
| 679 | unsigned TTmpMax = isGFX9() ? TTMP_GFX9_MAX : TTMP_VI_MAX; |
| 680 | |
| 681 | return (TTmpMin <= Val && Val <= TTmpMax)? Val - TTmpMin : -1; |
| 682 | } |
| 683 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 684 | MCOperand AMDGPUDisassembler::decodeSrcOp(const OpWidthTy Width, unsigned Val) const { |
| 685 | using namespace AMDGPU::EncValues; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 686 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 687 | assert(Val < 512); // enum9 |
| 688 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 689 | if (VGPR_MIN <= Val && Val <= VGPR_MAX) { |
| 690 | return createRegOperand(getVgprClassId(Width), Val - VGPR_MIN); |
| 691 | } |
Artem Tamazov | b49c336 | 2016-05-26 15:52:16 +0000 | [diff] [blame] | 692 | if (Val <= SGPR_MAX) { |
| 693 | assert(SGPR_MIN == 0); // "SGPR_MIN <= Val" is always true and causes compilation warning. |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 694 | return createSRegOperand(getSgprClassId(Width), Val - SGPR_MIN); |
| 695 | } |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 696 | |
| 697 | int TTmpIdx = getTTmpIdx(Val); |
| 698 | if (TTmpIdx >= 0) { |
| 699 | return createSRegOperand(getTtmpClassId(Width), TTmpIdx); |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 700 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 701 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 702 | if (INLINE_INTEGER_C_MIN <= Val && Val <= INLINE_INTEGER_C_MAX) |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 703 | return decodeIntImmed(Val); |
| 704 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 705 | if (INLINE_FLOATING_C_MIN <= Val && Val <= INLINE_FLOATING_C_MAX) |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 706 | return decodeFPImmed(Width, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 707 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 708 | if (Val == LITERAL_CONST) |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 709 | return decodeLiteralConstant(); |
| 710 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 711 | switch (Width) { |
| 712 | case OPW32: |
| 713 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 714 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 715 | return decodeSpecialReg32(Val); |
| 716 | case OPW64: |
| 717 | return decodeSpecialReg64(Val); |
| 718 | default: |
| 719 | llvm_unreachable("unexpected immediate type"); |
| 720 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 721 | } |
| 722 | |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 723 | MCOperand AMDGPUDisassembler::decodeDstOp(const OpWidthTy Width, unsigned Val) const { |
| 724 | using namespace AMDGPU::EncValues; |
| 725 | |
| 726 | assert(Val < 128); |
| 727 | assert(Width == OPW256 || Width == OPW512); |
| 728 | |
| 729 | if (Val <= SGPR_MAX) { |
| 730 | assert(SGPR_MIN == 0); // "SGPR_MIN <= Val" is always true and causes compilation warning. |
| 731 | return createSRegOperand(getSgprClassId(Width), Val - SGPR_MIN); |
| 732 | } |
| 733 | |
| 734 | int TTmpIdx = getTTmpIdx(Val); |
| 735 | if (TTmpIdx >= 0) { |
| 736 | return createSRegOperand(getTtmpClassId(Width), TTmpIdx); |
| 737 | } |
| 738 | |
| 739 | llvm_unreachable("unknown dst register"); |
| 740 | } |
| 741 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 742 | MCOperand AMDGPUDisassembler::decodeSpecialReg32(unsigned Val) const { |
| 743 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 744 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 745 | switch (Val) { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 746 | case 102: return createRegOperand(FLAT_SCR_LO); |
| 747 | case 103: return createRegOperand(FLAT_SCR_HI); |
Dmitry Preobrazhensky | 3afbd82 | 2018-01-10 14:22:19 +0000 | [diff] [blame] | 748 | case 104: return createRegOperand(XNACK_MASK_LO); |
| 749 | case 105: return createRegOperand(XNACK_MASK_HI); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 750 | case 106: return createRegOperand(VCC_LO); |
| 751 | case 107: return createRegOperand(VCC_HI); |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 752 | case 108: assert(!isGFX9()); return createRegOperand(TBA_LO); |
| 753 | case 109: assert(!isGFX9()); return createRegOperand(TBA_HI); |
| 754 | case 110: assert(!isGFX9()); return createRegOperand(TMA_LO); |
| 755 | case 111: assert(!isGFX9()); return createRegOperand(TMA_HI); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 756 | case 124: return createRegOperand(M0); |
| 757 | case 126: return createRegOperand(EXEC_LO); |
| 758 | case 127: return createRegOperand(EXEC_HI); |
Matt Arsenault | a3b3b48 | 2017-02-18 18:41:41 +0000 | [diff] [blame] | 759 | case 235: return createRegOperand(SRC_SHARED_BASE); |
| 760 | case 236: return createRegOperand(SRC_SHARED_LIMIT); |
| 761 | case 237: return createRegOperand(SRC_PRIVATE_BASE); |
| 762 | case 238: return createRegOperand(SRC_PRIVATE_LIMIT); |
| 763 | // TODO: SRC_POPS_EXITING_WAVE_ID |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 764 | // ToDo: no support for vccz register |
| 765 | case 251: break; |
| 766 | // ToDo: no support for execz register |
| 767 | case 252: break; |
| 768 | case 253: return createRegOperand(SCC); |
| 769 | default: break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 770 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 771 | return errOperand(Val, "unknown operand encoding " + Twine(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 772 | } |
| 773 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 774 | MCOperand AMDGPUDisassembler::decodeSpecialReg64(unsigned Val) const { |
| 775 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 776 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 777 | switch (Val) { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 778 | case 102: return createRegOperand(FLAT_SCR); |
Dmitry Preobrazhensky | 3afbd82 | 2018-01-10 14:22:19 +0000 | [diff] [blame] | 779 | case 104: return createRegOperand(XNACK_MASK); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 780 | case 106: return createRegOperand(VCC); |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 781 | case 108: assert(!isGFX9()); return createRegOperand(TBA); |
| 782 | case 110: assert(!isGFX9()); return createRegOperand(TMA); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 783 | case 126: return createRegOperand(EXEC); |
| 784 | default: break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 785 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 786 | return errOperand(Val, "unknown operand encoding " + Twine(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 787 | } |
| 788 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 789 | MCOperand AMDGPUDisassembler::decodeSDWASrc(const OpWidthTy Width, |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 790 | const unsigned Val) const { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 791 | using namespace AMDGPU::SDWA; |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 792 | using namespace AMDGPU::EncValues; |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 793 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 794 | if (STI.getFeatureBits()[AMDGPU::FeatureGFX9]) { |
Sam Kolton | a179d25 | 2017-06-27 15:02:23 +0000 | [diff] [blame] | 795 | // XXX: static_cast<int> is needed to avoid stupid warning: |
| 796 | // compare with unsigned is always true |
| 797 | if (SDWA9EncValues::SRC_VGPR_MIN <= static_cast<int>(Val) && |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 798 | Val <= SDWA9EncValues::SRC_VGPR_MAX) { |
| 799 | return createRegOperand(getVgprClassId(Width), |
| 800 | Val - SDWA9EncValues::SRC_VGPR_MIN); |
| 801 | } |
| 802 | if (SDWA9EncValues::SRC_SGPR_MIN <= Val && |
| 803 | Val <= SDWA9EncValues::SRC_SGPR_MAX) { |
| 804 | return createSRegOperand(getSgprClassId(Width), |
| 805 | Val - SDWA9EncValues::SRC_SGPR_MIN); |
| 806 | } |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 807 | if (SDWA9EncValues::SRC_TTMP_MIN <= Val && |
| 808 | Val <= SDWA9EncValues::SRC_TTMP_MAX) { |
| 809 | return createSRegOperand(getTtmpClassId(Width), |
| 810 | Val - SDWA9EncValues::SRC_TTMP_MIN); |
| 811 | } |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 812 | |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 813 | const unsigned SVal = Val - SDWA9EncValues::SRC_SGPR_MIN; |
| 814 | |
| 815 | if (INLINE_INTEGER_C_MIN <= SVal && SVal <= INLINE_INTEGER_C_MAX) |
| 816 | return decodeIntImmed(SVal); |
| 817 | |
| 818 | if (INLINE_FLOATING_C_MIN <= SVal && SVal <= INLINE_FLOATING_C_MAX) |
| 819 | return decodeFPImmed(Width, SVal); |
| 820 | |
| 821 | return decodeSpecialReg32(SVal); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 822 | } else if (STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]) { |
| 823 | return createRegOperand(getVgprClassId(Width), Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 824 | } |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 825 | llvm_unreachable("unsupported target"); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 826 | } |
| 827 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 828 | MCOperand AMDGPUDisassembler::decodeSDWASrc16(unsigned Val) const { |
| 829 | return decodeSDWASrc(OPW16, Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 830 | } |
| 831 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 832 | MCOperand AMDGPUDisassembler::decodeSDWASrc32(unsigned Val) const { |
| 833 | return decodeSDWASrc(OPW32, Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 834 | } |
| 835 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 836 | MCOperand AMDGPUDisassembler::decodeSDWAVopcDst(unsigned Val) const { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 837 | using namespace AMDGPU::SDWA; |
| 838 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 839 | assert(STI.getFeatureBits()[AMDGPU::FeatureGFX9] && |
| 840 | "SDWAVopcDst should be present only on GFX9"); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 841 | if (Val & SDWA9EncValues::VOPC_DST_VCC_MASK) { |
| 842 | Val &= SDWA9EncValues::VOPC_DST_SGPR_MASK; |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 843 | |
| 844 | int TTmpIdx = getTTmpIdx(Val); |
| 845 | if (TTmpIdx >= 0) { |
| 846 | return createSRegOperand(getTtmpClassId(OPW64), TTmpIdx); |
| 847 | } else if (Val > AMDGPU::EncValues::SGPR_MAX) { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 848 | return decodeSpecialReg64(Val); |
| 849 | } else { |
| 850 | return createSRegOperand(getSgprClassId(OPW64), Val); |
| 851 | } |
| 852 | } else { |
| 853 | return createRegOperand(AMDGPU::VCC); |
| 854 | } |
| 855 | } |
| 856 | |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 857 | bool AMDGPUDisassembler::isVI() const { |
| 858 | return STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]; |
| 859 | } |
| 860 | |
| 861 | bool AMDGPUDisassembler::isGFX9() const { |
| 862 | return STI.getFeatureBits()[AMDGPU::FeatureGFX9]; |
| 863 | } |
| 864 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 865 | //===----------------------------------------------------------------------===// |
| 866 | // AMDGPUSymbolizer |
| 867 | //===----------------------------------------------------------------------===// |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 868 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 869 | // Try to find symbol name for specified label |
| 870 | bool AMDGPUSymbolizer::tryAddingSymbolicOperand(MCInst &Inst, |
| 871 | raw_ostream &/*cStream*/, int64_t Value, |
| 872 | uint64_t /*Address*/, bool IsBranch, |
| 873 | uint64_t /*Offset*/, uint64_t /*InstSize*/) { |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 874 | using SymbolInfoTy = std::tuple<uint64_t, StringRef, uint8_t>; |
| 875 | using SectionSymbolsTy = std::vector<SymbolInfoTy>; |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 876 | |
| 877 | if (!IsBranch) { |
| 878 | return false; |
| 879 | } |
| 880 | |
| 881 | auto *Symbols = static_cast<SectionSymbolsTy *>(DisInfo); |
| 882 | auto Result = std::find_if(Symbols->begin(), Symbols->end(), |
| 883 | [Value](const SymbolInfoTy& Val) { |
| 884 | return std::get<0>(Val) == static_cast<uint64_t>(Value) |
| 885 | && std::get<2>(Val) == ELF::STT_NOTYPE; |
| 886 | }); |
| 887 | if (Result != Symbols->end()) { |
| 888 | auto *Sym = Ctx.getOrCreateSymbol(std::get<1>(*Result)); |
| 889 | const auto *Add = MCSymbolRefExpr::create(Sym, Ctx); |
| 890 | Inst.addOperand(MCOperand::createExpr(Add)); |
| 891 | return true; |
| 892 | } |
| 893 | return false; |
| 894 | } |
| 895 | |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 896 | void AMDGPUSymbolizer::tryAddingPcLoadReferenceComment(raw_ostream &cStream, |
| 897 | int64_t Value, |
| 898 | uint64_t Address) { |
| 899 | llvm_unreachable("unimplemented"); |
| 900 | } |
| 901 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 902 | //===----------------------------------------------------------------------===// |
| 903 | // Initialization |
| 904 | //===----------------------------------------------------------------------===// |
| 905 | |
| 906 | static MCSymbolizer *createAMDGPUSymbolizer(const Triple &/*TT*/, |
| 907 | LLVMOpInfoCallback /*GetOpInfo*/, |
| 908 | LLVMSymbolLookupCallback /*SymbolLookUp*/, |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 909 | void *DisInfo, |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 910 | MCContext *Ctx, |
| 911 | std::unique_ptr<MCRelocationInfo> &&RelInfo) { |
| 912 | return new AMDGPUSymbolizer(*Ctx, std::move(RelInfo), DisInfo); |
| 913 | } |
| 914 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 915 | static MCDisassembler *createAMDGPUDisassembler(const Target &T, |
| 916 | const MCSubtargetInfo &STI, |
| 917 | MCContext &Ctx) { |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 918 | return new AMDGPUDisassembler(STI, Ctx, T.createMCInstrInfo()); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 919 | } |
| 920 | |
| 921 | extern "C" void LLVMInitializeAMDGPUDisassembler() { |
Mehdi Amini | f42454b | 2016-10-09 23:00:34 +0000 | [diff] [blame] | 922 | TargetRegistry::RegisterMCDisassembler(getTheGCNTarget(), |
| 923 | createAMDGPUDisassembler); |
| 924 | TargetRegistry::RegisterMCSymbolizer(getTheGCNTarget(), |
| 925 | createAMDGPUSymbolizer); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 926 | } |