Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 1 | //===- AMDGPUDisassembler.cpp - Disassembler for AMDGPU ISA ---------------===// |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | //===----------------------------------------------------------------------===// |
| 11 | // |
| 12 | /// \file |
| 13 | /// |
/// This file contains the definition of the AMDGPU ISA disassembler.
| 15 | // |
| 16 | //===----------------------------------------------------------------------===// |
| 17 | |
| 18 | // ToDo: What to do with instruction suffixes (v_mov_b32 vs v_mov_b32_e32)? |
| 19 | |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 20 | #include "Disassembler/AMDGPUDisassembler.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 21 | #include "AMDGPU.h" |
| 22 | #include "AMDGPURegisterInfo.h" |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 23 | #include "SIDefines.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 24 | #include "Utils/AMDGPUBaseInfo.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 25 | #include "llvm-c/Disassembler.h" |
| 26 | #include "llvm/ADT/APInt.h" |
| 27 | #include "llvm/ADT/ArrayRef.h" |
| 28 | #include "llvm/ADT/Twine.h" |
Zachary Turner | 264b5d9 | 2017-06-07 03:48:56 +0000 | [diff] [blame] | 29 | #include "llvm/BinaryFormat/ELF.h" |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 30 | #include "llvm/MC/MCContext.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 31 | #include "llvm/MC/MCDisassembler/MCDisassembler.h" |
| 32 | #include "llvm/MC/MCExpr.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 33 | #include "llvm/MC/MCFixedLenDisassembler.h" |
| 34 | #include "llvm/MC/MCInst.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 35 | #include "llvm/MC/MCSubtargetInfo.h" |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 36 | #include "llvm/Support/Endian.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 37 | #include "llvm/Support/ErrorHandling.h" |
| 38 | #include "llvm/Support/MathExtras.h" |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 39 | #include "llvm/Support/TargetRegistry.h" |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 40 | #include "llvm/Support/raw_ostream.h" |
| 41 | #include <algorithm> |
| 42 | #include <cassert> |
| 43 | #include <cstddef> |
| 44 | #include <cstdint> |
| 45 | #include <iterator> |
| 46 | #include <tuple> |
| 47 | #include <vector> |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 48 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 49 | using namespace llvm; |
| 50 | |
| 51 | #define DEBUG_TYPE "amdgpu-disassembler" |
| 52 | |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 53 | using DecodeStatus = llvm::MCDisassembler::DecodeStatus; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 54 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 55 | inline static MCDisassembler::DecodeStatus |
| 56 | addOperand(MCInst &Inst, const MCOperand& Opnd) { |
| 57 | Inst.addOperand(Opnd); |
| 58 | return Opnd.isValid() ? |
| 59 | MCDisassembler::Success : |
| 60 | MCDisassembler::SoftFail; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 61 | } |
| 62 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 63 | static int insertNamedMCOperand(MCInst &MI, const MCOperand &Op, |
| 64 | uint16_t NameIdx) { |
| 65 | int OpIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), NameIdx); |
| 66 | if (OpIdx != -1) { |
| 67 | auto I = MI.begin(); |
| 68 | std::advance(I, OpIdx); |
| 69 | MI.insert(I, Op); |
| 70 | } |
| 71 | return OpIdx; |
| 72 | } |
| 73 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 74 | static DecodeStatus decodeSoppBrTarget(MCInst &Inst, unsigned Imm, |
| 75 | uint64_t Addr, const void *Decoder) { |
| 76 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 77 | |
| 78 | APInt SignedOffset(18, Imm * 4, true); |
| 79 | int64_t Offset = (SignedOffset.sext(64) + 4 + Addr).getSExtValue(); |
| 80 | |
| 81 | if (DAsm->tryAddingSymbolicOperand(Inst, Offset, Addr, true, 2, 2)) |
| 82 | return MCDisassembler::Success; |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 83 | return addOperand(Inst, MCOperand::createImm(Imm)); |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 84 | } |
| 85 | |
/// Defines a static decoder callback named \p StaticDecoderName.
///
/// The callback casts the opaque decoder pointer to AMDGPUDisassembler,
/// forwards the encoded value to its member function \p DecoderName, and
/// appends the resulting operand to the instruction. The address argument is
/// ignored.
#define DECODE_OPERAND(StaticDecoderName, DecoderName)                         \
  static DecodeStatus StaticDecoderName(MCInst &Inst, unsigned Imm,           \
                                        uint64_t /*Addr*/,                     \
                                        const void *Decoder) {                 \
    const auto *Disasm = static_cast<const AMDGPUDisassembler *>(Decoder);     \
    return addOperand(Inst, Disasm->DecoderName(Imm));                         \
  }
| 94 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 95 | #define DECODE_OPERAND_REG(RegClass) \ |
| 96 | DECODE_OPERAND(Decode##RegClass##RegisterClass, decodeOperand_##RegClass) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 97 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 98 | DECODE_OPERAND_REG(VGPR_32) |
| 99 | DECODE_OPERAND_REG(VS_32) |
| 100 | DECODE_OPERAND_REG(VS_64) |
Dmitry Preobrazhensky | 30fc523 | 2017-07-18 13:12:48 +0000 | [diff] [blame] | 101 | DECODE_OPERAND_REG(VS_128) |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 102 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 103 | DECODE_OPERAND_REG(VReg_64) |
| 104 | DECODE_OPERAND_REG(VReg_96) |
| 105 | DECODE_OPERAND_REG(VReg_128) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 106 | |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 107 | DECODE_OPERAND_REG(SReg_32) |
| 108 | DECODE_OPERAND_REG(SReg_32_XM0_XEXEC) |
Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 109 | DECODE_OPERAND_REG(SReg_32_XEXEC_HI) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 110 | DECODE_OPERAND_REG(SReg_64) |
| 111 | DECODE_OPERAND_REG(SReg_64_XEXEC) |
| 112 | DECODE_OPERAND_REG(SReg_128) |
| 113 | DECODE_OPERAND_REG(SReg_256) |
| 114 | DECODE_OPERAND_REG(SReg_512) |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 115 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 116 | static DecodeStatus decodeOperand_VSrc16(MCInst &Inst, |
| 117 | unsigned Imm, |
| 118 | uint64_t Addr, |
| 119 | const void *Decoder) { |
| 120 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 121 | return addOperand(Inst, DAsm->decodeOperand_VSrc16(Imm)); |
| 122 | } |
| 123 | |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 124 | static DecodeStatus decodeOperand_VSrcV216(MCInst &Inst, |
| 125 | unsigned Imm, |
| 126 | uint64_t Addr, |
| 127 | const void *Decoder) { |
| 128 | auto DAsm = static_cast<const AMDGPUDisassembler*>(Decoder); |
| 129 | return addOperand(Inst, DAsm->decodeOperand_VSrcV216(Imm)); |
| 130 | } |
| 131 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 132 | #define DECODE_SDWA(DecName) \ |
| 133 | DECODE_OPERAND(decodeSDWA##DecName, decodeSDWA##DecName) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 134 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 135 | DECODE_SDWA(Src32) |
| 136 | DECODE_SDWA(Src16) |
| 137 | DECODE_SDWA(VopcDst) |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 138 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 139 | #include "AMDGPUGenDisassemblerTables.inc" |
| 140 | |
| 141 | //===----------------------------------------------------------------------===// |
| 142 | // |
| 143 | //===----------------------------------------------------------------------===// |
| 144 | |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 145 | template <typename T> static inline T eatBytes(ArrayRef<uint8_t>& Bytes) { |
| 146 | assert(Bytes.size() >= sizeof(T)); |
| 147 | const auto Res = support::endian::read<T, support::endianness::little>(Bytes.data()); |
| 148 | Bytes = Bytes.slice(sizeof(T)); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 149 | return Res; |
| 150 | } |
| 151 | |
| 152 | DecodeStatus AMDGPUDisassembler::tryDecodeInst(const uint8_t* Table, |
| 153 | MCInst &MI, |
| 154 | uint64_t Inst, |
| 155 | uint64_t Address) const { |
| 156 | assert(MI.getOpcode() == 0); |
| 157 | assert(MI.getNumOperands() == 0); |
| 158 | MCInst TmpInst; |
Dmitry Preobrazhensky | ce941c9 | 2017-05-19 14:27:52 +0000 | [diff] [blame] | 159 | HasLiteral = false; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 160 | const auto SavedBytes = Bytes; |
| 161 | if (decodeInstruction(Table, TmpInst, Inst, Address, this, STI)) { |
| 162 | MI = TmpInst; |
| 163 | return MCDisassembler::Success; |
| 164 | } |
| 165 | Bytes = SavedBytes; |
| 166 | return MCDisassembler::Fail; |
| 167 | } |
| 168 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 169 | DecodeStatus AMDGPUDisassembler::getInstruction(MCInst &MI, uint64_t &Size, |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 170 | ArrayRef<uint8_t> Bytes_, |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 171 | uint64_t Address, |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 172 | raw_ostream &WS, |
| 173 | raw_ostream &CS) const { |
| 174 | CommentStream = &CS; |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 175 | bool IsSDWA = false; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 176 | |
| 177 | // ToDo: AMDGPUDisassembler supports only VI ISA. |
Matt Arsenault | d122abe | 2017-02-15 21:50:34 +0000 | [diff] [blame] | 178 | if (!STI.getFeatureBits()[AMDGPU::FeatureGCN3Encoding]) |
| 179 | report_fatal_error("Disassembly not yet supported for subtarget"); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 180 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 181 | const unsigned MaxInstBytesNum = (std::min)((size_t)8, Bytes_.size()); |
| 182 | Bytes = Bytes_.slice(0, MaxInstBytesNum); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 183 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 184 | DecodeStatus Res = MCDisassembler::Fail; |
| 185 | do { |
Valery Pykhtin | 824e804 | 2016-03-04 10:59:50 +0000 | [diff] [blame] | 186 | // ToDo: better to switch encoding length using some bit predicate |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 187 | // but it is unknown yet, so try all we can |
Matt Arsenault | 37fefd6 | 2016-06-10 02:18:02 +0000 | [diff] [blame] | 188 | |
Sam Kolton | c9bdcb7 | 2016-06-09 11:04:45 +0000 | [diff] [blame] | 189 | // Try to decode DPP and SDWA first to solve conflict with VOP1 and VOP2 |
| 190 | // encodings |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 191 | if (Bytes.size() >= 8) { |
| 192 | const uint64_t QW = eatBytes<uint64_t>(Bytes); |
| 193 | Res = tryDecodeInst(DecoderTableDPP64, MI, QW, Address); |
| 194 | if (Res) break; |
Sam Kolton | c9bdcb7 | 2016-06-09 11:04:45 +0000 | [diff] [blame] | 195 | |
| 196 | Res = tryDecodeInst(DecoderTableSDWA64, MI, QW, Address); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 197 | if (Res) { IsSDWA = true; break; } |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 198 | |
| 199 | Res = tryDecodeInst(DecoderTableSDWA964, MI, QW, Address); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 200 | if (Res) { IsSDWA = true; break; } |
Changpeng Fang | 0905870 | 2018-01-30 16:42:40 +0000 | [diff] [blame] | 201 | |
| 202 | if (STI.getFeatureBits()[AMDGPU::FeatureUnpackedD16VMem]) { |
| 203 | Res = tryDecodeInst(DecoderTableGFX80_UNPACKED64, MI, QW, Address); |
Matt Arsenault | 0084adc | 2018-04-30 19:08:16 +0000 | [diff] [blame] | 204 | if (Res) |
| 205 | break; |
| 206 | } |
| 207 | |
| 208 | // Some GFX9 subtargets repurposed the v_mad_mix_f32, v_mad_mixlo_f16 and |
| 209 | // v_mad_mixhi_f16 for FMA variants. Try to decode using this special |
| 210 | // table first so we print the correct name. |
| 211 | if (STI.getFeatureBits()[AMDGPU::FeatureFmaMixInsts]) { |
| 212 | Res = tryDecodeInst(DecoderTableGFX9_DL64, MI, QW, Address); |
| 213 | if (Res) |
| 214 | break; |
Changpeng Fang | 0905870 | 2018-01-30 16:42:40 +0000 | [diff] [blame] | 215 | } |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 216 | } |
| 217 | |
| 218 | // Reinitialize Bytes as DPP64 could have eaten too much |
| 219 | Bytes = Bytes_.slice(0, MaxInstBytesNum); |
| 220 | |
| 221 | // Try decode 32-bit instruction |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 222 | if (Bytes.size() < 4) break; |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 223 | const uint32_t DW = eatBytes<uint32_t>(Bytes); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 224 | Res = tryDecodeInst(DecoderTableVI32, MI, DW, Address); |
| 225 | if (Res) break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 226 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 227 | Res = tryDecodeInst(DecoderTableAMDGPU32, MI, DW, Address); |
| 228 | if (Res) break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 229 | |
Dmitry Preobrazhensky | a0342dc | 2017-11-20 18:24:21 +0000 | [diff] [blame] | 230 | Res = tryDecodeInst(DecoderTableGFX932, MI, DW, Address); |
| 231 | if (Res) break; |
| 232 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 233 | if (Bytes.size() < 4) break; |
Sam Kolton | 1048fb1 | 2016-03-31 14:15:04 +0000 | [diff] [blame] | 234 | const uint64_t QW = ((uint64_t)eatBytes<uint32_t>(Bytes) << 32) | DW; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 235 | Res = tryDecodeInst(DecoderTableVI64, MI, QW, Address); |
| 236 | if (Res) break; |
| 237 | |
| 238 | Res = tryDecodeInst(DecoderTableAMDGPU64, MI, QW, Address); |
Dmitry Preobrazhensky | 1e32550 | 2017-08-09 17:10:47 +0000 | [diff] [blame] | 239 | if (Res) break; |
| 240 | |
| 241 | Res = tryDecodeInst(DecoderTableGFX964, MI, QW, Address); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 242 | } while (false); |
| 243 | |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 244 | if (Res && (MI.getOpcode() == AMDGPU::V_MAC_F32_e64_vi || |
| 245 | MI.getOpcode() == AMDGPU::V_MAC_F32_e64_si || |
Konstantin Zhuravlyov | 603a43f | 2018-05-15 17:39:13 +0000 | [diff] [blame^] | 246 | MI.getOpcode() == AMDGPU::V_MAC_F16_e64_vi || |
| 247 | MI.getOpcode() == AMDGPU::V_FMAC_F32_e64_vi)) { |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 248 | // Insert dummy unused src2_modifiers. |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 249 | insertNamedMCOperand(MI, MCOperand::createImm(0), |
| 250 | AMDGPU::OpName::src2_modifiers); |
Matt Arsenault | 678e111 | 2017-04-10 17:58:06 +0000 | [diff] [blame] | 251 | } |
| 252 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 253 | if (Res && (MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::MIMG)) { |
| 254 | Res = convertMIMGInst(MI); |
| 255 | } |
| 256 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 257 | if (Res && IsSDWA) |
| 258 | Res = convertSDWAInst(MI); |
| 259 | |
Tim Corringham | 7116e89 | 2018-03-26 17:06:33 +0000 | [diff] [blame] | 260 | // if the opcode was not recognized we'll assume a Size of 4 bytes |
| 261 | // (unless there are fewer bytes left) |
| 262 | Size = Res ? (MaxInstBytesNum - Bytes.size()) |
| 263 | : std::min((size_t)4, Bytes_.size()); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 264 | return Res; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 265 | } |
| 266 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 267 | DecodeStatus AMDGPUDisassembler::convertSDWAInst(MCInst &MI) const { |
| 268 | if (STI.getFeatureBits()[AMDGPU::FeatureGFX9]) { |
| 269 | if (AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::sdst) != -1) |
| 270 | // VOPC - insert clamp |
| 271 | insertNamedMCOperand(MI, MCOperand::createImm(0), AMDGPU::OpName::clamp); |
| 272 | } else if (STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]) { |
| 273 | int SDst = AMDGPU::getNamedOperandIdx(MI.getOpcode(), AMDGPU::OpName::sdst); |
| 274 | if (SDst != -1) { |
| 275 | // VOPC - insert VCC register as sdst |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 276 | insertNamedMCOperand(MI, createRegOperand(AMDGPU::VCC), |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 277 | AMDGPU::OpName::sdst); |
| 278 | } else { |
| 279 | // VOP1/2 - insert omod if present in instruction |
| 280 | insertNamedMCOperand(MI, MCOperand::createImm(0), AMDGPU::OpName::omod); |
| 281 | } |
| 282 | } |
| 283 | return MCDisassembler::Success; |
| 284 | } |
| 285 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 286 | // Note that MIMG format provides no information about VADDR size. |
| 287 | // Consequently, decoded instructions always show address |
| 288 | // as if it has 1 dword, which could be not really so. |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 289 | DecodeStatus AMDGPUDisassembler::convertMIMGInst(MCInst &MI) const { |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 290 | |
| 291 | if (MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::Gather4) { |
| 292 | return MCDisassembler::Success; |
| 293 | } |
| 294 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 295 | int VDstIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 296 | AMDGPU::OpName::vdst); |
| 297 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 298 | int VDataIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 299 | AMDGPU::OpName::vdata); |
| 300 | |
| 301 | int DMaskIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 302 | AMDGPU::OpName::dmask); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 303 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 304 | int TFEIdx = AMDGPU::getNamedOperandIdx(MI.getOpcode(), |
| 305 | AMDGPU::OpName::tfe); |
| 306 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 307 | assert(VDataIdx != -1); |
| 308 | assert(DMaskIdx != -1); |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 309 | assert(TFEIdx != -1); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 310 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 311 | bool IsAtomic = (VDstIdx != -1); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 312 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 313 | unsigned DMask = MI.getOperand(DMaskIdx).getImm() & 0xf; |
| 314 | if (DMask == 0) |
| 315 | return MCDisassembler::Success; |
| 316 | |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 317 | unsigned DstSize = countPopulation(DMask); |
| 318 | if (DstSize == 1) |
| 319 | return MCDisassembler::Success; |
| 320 | |
| 321 | bool D16 = MCII->get(MI.getOpcode()).TSFlags & SIInstrFlags::D16; |
| 322 | if (D16 && AMDGPU::hasPackedD16(STI)) { |
| 323 | DstSize = (DstSize + 1) / 2; |
| 324 | } |
| 325 | |
| 326 | // FIXME: Add tfe support |
| 327 | if (MI.getOperand(TFEIdx).getImm()) |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 328 | return MCDisassembler::Success; |
| 329 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 330 | int NewOpcode = -1; |
| 331 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 332 | if (IsAtomic) { |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 333 | if (DMask == 0x1 || DMask == 0x3 || DMask == 0xF) { |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 334 | NewOpcode = AMDGPU::getMaskedMIMGAtomicOp(*MCII, MI.getOpcode(), DstSize); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 335 | } |
| 336 | if (NewOpcode == -1) return MCDisassembler::Success; |
| 337 | } else { |
Dmitry Preobrazhensky | 0a1ff46 | 2018-02-05 14:18:53 +0000 | [diff] [blame] | 338 | NewOpcode = AMDGPU::getMaskedMIMGOp(*MCII, MI.getOpcode(), DstSize); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 339 | assert(NewOpcode != -1 && "could not find matching mimg channel instruction"); |
| 340 | } |
| 341 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 342 | auto RCID = MCII->get(NewOpcode).OpInfo[VDataIdx].RegClass; |
| 343 | |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 344 | // Get first subregister of VData |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 345 | unsigned Vdata0 = MI.getOperand(VDataIdx).getReg(); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 346 | unsigned VdataSub0 = MRI.getSubReg(Vdata0, AMDGPU::sub0); |
| 347 | Vdata0 = (VdataSub0 != 0)? VdataSub0 : Vdata0; |
| 348 | |
| 349 | // Widen the register to the correct number of enabled channels. |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 350 | auto NewVdata = MRI.getMatchingSuperReg(Vdata0, AMDGPU::sub0, |
| 351 | &MRI.getRegClass(RCID)); |
| 352 | if (NewVdata == AMDGPU::NoRegister) { |
| 353 | // It's possible to encode this such that the low register + enabled |
| 354 | // components exceeds the register count. |
| 355 | return MCDisassembler::Success; |
| 356 | } |
| 357 | |
| 358 | MI.setOpcode(NewOpcode); |
| 359 | // vaddr will be always appear as a single VGPR. This will look different than |
| 360 | // how it is usually emitted because the number of register components is not |
| 361 | // in the instruction encoding. |
| 362 | MI.getOperand(VDataIdx) = MCOperand::createReg(NewVdata); |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 363 | |
Dmitry Preobrazhensky | da4a7c0 | 2018-03-12 15:03:34 +0000 | [diff] [blame] | 364 | if (IsAtomic) { |
Dmitry Preobrazhensky | 0b4eb1e | 2018-01-26 15:43:29 +0000 | [diff] [blame] | 365 | // Atomic operations have an additional operand (a copy of data) |
| 366 | MI.getOperand(VDstIdx) = MCOperand::createReg(NewVdata); |
| 367 | } |
| 368 | |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 369 | return MCDisassembler::Success; |
| 370 | } |
| 371 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 372 | const char* AMDGPUDisassembler::getRegClassName(unsigned RegClassID) const { |
| 373 | return getContext().getRegisterInfo()-> |
| 374 | getRegClassName(&AMDGPUMCRegisterClasses[RegClassID]); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 375 | } |
| 376 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 377 | inline |
| 378 | MCOperand AMDGPUDisassembler::errOperand(unsigned V, |
| 379 | const Twine& ErrMsg) const { |
| 380 | *CommentStream << "Error: " + ErrMsg; |
| 381 | |
| 382 | // ToDo: add support for error operands to MCInst.h |
| 383 | // return MCOperand::createError(V); |
| 384 | return MCOperand(); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 385 | } |
| 386 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 387 | inline |
| 388 | MCOperand AMDGPUDisassembler::createRegOperand(unsigned int RegId) const { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 389 | return MCOperand::createReg(AMDGPU::getMCReg(RegId, STI)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 390 | } |
| 391 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 392 | inline |
| 393 | MCOperand AMDGPUDisassembler::createRegOperand(unsigned RegClassID, |
| 394 | unsigned Val) const { |
| 395 | const auto& RegCl = AMDGPUMCRegisterClasses[RegClassID]; |
| 396 | if (Val >= RegCl.getNumRegs()) |
| 397 | return errOperand(Val, Twine(getRegClassName(RegClassID)) + |
| 398 | ": unknown register " + Twine(Val)); |
| 399 | return createRegOperand(RegCl.getRegister(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 400 | } |
| 401 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 402 | inline |
| 403 | MCOperand AMDGPUDisassembler::createSRegOperand(unsigned SRegClassID, |
| 404 | unsigned Val) const { |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 405 | // ToDo: SI/CI have 104 SGPRs, VI - 102 |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 406 | // Valery: here we accepting as much as we can, let assembler sort it out |
| 407 | int shift = 0; |
| 408 | switch (SRegClassID) { |
| 409 | case AMDGPU::SGPR_32RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 410 | case AMDGPU::TTMP_32RegClassID: |
| 411 | break; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 412 | case AMDGPU::SGPR_64RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 413 | case AMDGPU::TTMP_64RegClassID: |
| 414 | shift = 1; |
| 415 | break; |
| 416 | case AMDGPU::SGPR_128RegClassID: |
| 417 | case AMDGPU::TTMP_128RegClassID: |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 418 | // ToDo: unclear if s[100:104] is available on VI. Can we use VCC as SGPR in |
| 419 | // this bundle? |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 420 | case AMDGPU::SGPR_256RegClassID: |
| 421 | case AMDGPU::TTMP_256RegClassID: |
| 422 | // ToDo: unclear if s[96:104] is available on VI. Can we use VCC as SGPR in |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 423 | // this bundle? |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 424 | case AMDGPU::SGPR_512RegClassID: |
| 425 | case AMDGPU::TTMP_512RegClassID: |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 426 | shift = 2; |
| 427 | break; |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 428 | // ToDo: unclear if s[88:104] is available on VI. Can we use VCC as SGPR in |
| 429 | // this bundle? |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 430 | default: |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 431 | llvm_unreachable("unhandled register class"); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 432 | } |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 433 | |
| 434 | if (Val % (1 << shift)) { |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 435 | *CommentStream << "Warning: " << getRegClassName(SRegClassID) |
| 436 | << ": scalar reg isn't aligned " << Val; |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 437 | } |
| 438 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 439 | return createRegOperand(SRegClassID, Val >> shift); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 440 | } |
| 441 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 442 | MCOperand AMDGPUDisassembler::decodeOperand_VS_32(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 443 | return decodeSrcOp(OPW32, Val); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 444 | } |
| 445 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 446 | MCOperand AMDGPUDisassembler::decodeOperand_VS_64(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 447 | return decodeSrcOp(OPW64, Val); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 448 | } |
| 449 | |
Dmitry Preobrazhensky | 30fc523 | 2017-07-18 13:12:48 +0000 | [diff] [blame] | 450 | MCOperand AMDGPUDisassembler::decodeOperand_VS_128(unsigned Val) const { |
| 451 | return decodeSrcOp(OPW128, Val); |
| 452 | } |
| 453 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 454 | MCOperand AMDGPUDisassembler::decodeOperand_VSrc16(unsigned Val) const { |
| 455 | return decodeSrcOp(OPW16, Val); |
| 456 | } |
| 457 | |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 458 | MCOperand AMDGPUDisassembler::decodeOperand_VSrcV216(unsigned Val) const { |
| 459 | return decodeSrcOp(OPWV216, Val); |
| 460 | } |
| 461 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 462 | MCOperand AMDGPUDisassembler::decodeOperand_VGPR_32(unsigned Val) const { |
Matt Arsenault | cb540bc | 2016-07-19 00:35:03 +0000 | [diff] [blame] | 463 | // Some instructions have operand restrictions beyond what the encoding |
| 464 | // allows. Some ordinarily VSrc_32 operands are VGPR_32, so clear the extra |
| 465 | // high bit. |
| 466 | Val &= 255; |
| 467 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 468 | return createRegOperand(AMDGPU::VGPR_32RegClassID, Val); |
| 469 | } |
| 470 | |
| 471 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_64(unsigned Val) const { |
| 472 | return createRegOperand(AMDGPU::VReg_64RegClassID, Val); |
| 473 | } |
| 474 | |
| 475 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_96(unsigned Val) const { |
| 476 | return createRegOperand(AMDGPU::VReg_96RegClassID, Val); |
| 477 | } |
| 478 | |
| 479 | MCOperand AMDGPUDisassembler::decodeOperand_VReg_128(unsigned Val) const { |
| 480 | return createRegOperand(AMDGPU::VReg_128RegClassID, Val); |
| 481 | } |
| 482 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 483 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32(unsigned Val) const { |
| 484 | // table-gen generated disassembler doesn't care about operand types |
| 485 | // leaving only registry class so SSrc_32 operand turns into SReg_32 |
| 486 | // and therefore we accept immediates and literals here as well |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 487 | return decodeSrcOp(OPW32, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 488 | } |
| 489 | |
Matt Arsenault | 640c44b | 2016-11-29 19:39:53 +0000 | [diff] [blame] | 490 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32_XM0_XEXEC( |
| 491 | unsigned Val) const { |
| 492 | // SReg_32_XM0 is SReg_32 without M0 or EXEC_LO/EXEC_HI |
Artem Tamazov | 38e496b | 2016-04-29 17:04:50 +0000 | [diff] [blame] | 493 | return decodeOperand_SReg_32(Val); |
| 494 | } |
| 495 | |
Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 496 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_32_XEXEC_HI( |
| 497 | unsigned Val) const { |
| 498 | // SReg_32_XM0 is SReg_32 without EXEC_HI |
| 499 | return decodeOperand_SReg_32(Val); |
| 500 | } |
| 501 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 502 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_64(unsigned Val) const { |
Matt Arsenault | 640c44b | 2016-11-29 19:39:53 +0000 | [diff] [blame] | 503 | return decodeSrcOp(OPW64, Val); |
| 504 | } |
| 505 | |
| 506 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_64_XEXEC(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 507 | return decodeSrcOp(OPW64, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 508 | } |
| 509 | |
| 510 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_128(unsigned Val) const { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 511 | return decodeSrcOp(OPW128, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 512 | } |
| 513 | |
| 514 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_256(unsigned Val) const { |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 515 | return decodeDstOp(OPW256, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 516 | } |
| 517 | |
| 518 | MCOperand AMDGPUDisassembler::decodeOperand_SReg_512(unsigned Val) const { |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 519 | return decodeDstOp(OPW512, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 520 | } |
| 521 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 522 | MCOperand AMDGPUDisassembler::decodeLiteralConstant() const { |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 523 | // For now all literal constants are supposed to be unsigned integer |
| 524 | // ToDo: deal with signed/unsigned 64-bit integer constants |
| 525 | // ToDo: deal with float/double constants |
Dmitry Preobrazhensky | ce941c9 | 2017-05-19 14:27:52 +0000 | [diff] [blame] | 526 | if (!HasLiteral) { |
| 527 | if (Bytes.size() < 4) { |
| 528 | return errOperand(0, "cannot read literal, inst bytes left " + |
| 529 | Twine(Bytes.size())); |
| 530 | } |
| 531 | HasLiteral = true; |
| 532 | Literal = eatBytes<uint32_t>(Bytes); |
| 533 | } |
| 534 | return MCOperand::createImm(Literal); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 535 | } |
| 536 | |
| 537 | MCOperand AMDGPUDisassembler::decodeIntImmed(unsigned Imm) { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 538 | using namespace AMDGPU::EncValues; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 539 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 540 | assert(Imm >= INLINE_INTEGER_C_MIN && Imm <= INLINE_INTEGER_C_MAX); |
| 541 | return MCOperand::createImm((Imm <= INLINE_INTEGER_C_POSITIVE_MAX) ? |
| 542 | (static_cast<int64_t>(Imm) - INLINE_INTEGER_C_MIN) : |
| 543 | (INLINE_INTEGER_C_POSITIVE_MAX - static_cast<int64_t>(Imm))); |
| 544 | // Cast prevents negative overflow. |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 545 | } |
| 546 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 547 | static int64_t getInlineImmVal32(unsigned Imm) { |
| 548 | switch (Imm) { |
| 549 | case 240: |
| 550 | return FloatToBits(0.5f); |
| 551 | case 241: |
| 552 | return FloatToBits(-0.5f); |
| 553 | case 242: |
| 554 | return FloatToBits(1.0f); |
| 555 | case 243: |
| 556 | return FloatToBits(-1.0f); |
| 557 | case 244: |
| 558 | return FloatToBits(2.0f); |
| 559 | case 245: |
| 560 | return FloatToBits(-2.0f); |
| 561 | case 246: |
| 562 | return FloatToBits(4.0f); |
| 563 | case 247: |
| 564 | return FloatToBits(-4.0f); |
| 565 | case 248: // 1 / (2 * PI) |
| 566 | return 0x3e22f983; |
| 567 | default: |
| 568 | llvm_unreachable("invalid fp inline imm"); |
| 569 | } |
| 570 | } |
| 571 | |
| 572 | static int64_t getInlineImmVal64(unsigned Imm) { |
| 573 | switch (Imm) { |
| 574 | case 240: |
| 575 | return DoubleToBits(0.5); |
| 576 | case 241: |
| 577 | return DoubleToBits(-0.5); |
| 578 | case 242: |
| 579 | return DoubleToBits(1.0); |
| 580 | case 243: |
| 581 | return DoubleToBits(-1.0); |
| 582 | case 244: |
| 583 | return DoubleToBits(2.0); |
| 584 | case 245: |
| 585 | return DoubleToBits(-2.0); |
| 586 | case 246: |
| 587 | return DoubleToBits(4.0); |
| 588 | case 247: |
| 589 | return DoubleToBits(-4.0); |
| 590 | case 248: // 1 / (2 * PI) |
| 591 | return 0x3fc45f306dc9c882; |
| 592 | default: |
| 593 | llvm_unreachable("invalid fp inline imm"); |
| 594 | } |
| 595 | } |
| 596 | |
| 597 | static int64_t getInlineImmVal16(unsigned Imm) { |
| 598 | switch (Imm) { |
| 599 | case 240: |
| 600 | return 0x3800; |
| 601 | case 241: |
| 602 | return 0xB800; |
| 603 | case 242: |
| 604 | return 0x3C00; |
| 605 | case 243: |
| 606 | return 0xBC00; |
| 607 | case 244: |
| 608 | return 0x4000; |
| 609 | case 245: |
| 610 | return 0xC000; |
| 611 | case 246: |
| 612 | return 0x4400; |
| 613 | case 247: |
| 614 | return 0xC400; |
| 615 | case 248: // 1 / (2 * PI) |
| 616 | return 0x3118; |
| 617 | default: |
| 618 | llvm_unreachable("invalid fp inline imm"); |
| 619 | } |
| 620 | } |
| 621 | |
| 622 | MCOperand AMDGPUDisassembler::decodeFPImmed(OpWidthTy Width, unsigned Imm) { |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 623 | assert(Imm >= AMDGPU::EncValues::INLINE_FLOATING_C_MIN |
| 624 | && Imm <= AMDGPU::EncValues::INLINE_FLOATING_C_MAX); |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 625 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 626 | // ToDo: case 248: 1/(2*PI) - is allowed only on VI |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 627 | switch (Width) { |
| 628 | case OPW32: |
| 629 | return MCOperand::createImm(getInlineImmVal32(Imm)); |
| 630 | case OPW64: |
| 631 | return MCOperand::createImm(getInlineImmVal64(Imm)); |
| 632 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 633 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 634 | return MCOperand::createImm(getInlineImmVal16(Imm)); |
| 635 | default: |
| 636 | llvm_unreachable("implement me"); |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 637 | } |
Nikolay Haustov | 161a158 | 2016-02-25 16:09:14 +0000 | [diff] [blame] | 638 | } |
| 639 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 640 | unsigned AMDGPUDisassembler::getVgprClassId(const OpWidthTy Width) const { |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 641 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 642 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 643 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 644 | switch (Width) { |
| 645 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 646 | case OPW32: |
| 647 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 648 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 649 | return VGPR_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 650 | case OPW64: return VReg_64RegClassID; |
| 651 | case OPW128: return VReg_128RegClassID; |
| 652 | } |
| 653 | } |
| 654 | |
| 655 | unsigned AMDGPUDisassembler::getSgprClassId(const OpWidthTy Width) const { |
| 656 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 657 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 658 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 659 | switch (Width) { |
| 660 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 661 | case OPW32: |
| 662 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 663 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 664 | return SGPR_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 665 | case OPW64: return SGPR_64RegClassID; |
| 666 | case OPW128: return SGPR_128RegClassID; |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 667 | case OPW256: return SGPR_256RegClassID; |
| 668 | case OPW512: return SGPR_512RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 669 | } |
| 670 | } |
| 671 | |
| 672 | unsigned AMDGPUDisassembler::getTtmpClassId(const OpWidthTy Width) const { |
| 673 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 674 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 675 | assert(OPW_FIRST_ <= Width && Width < OPW_LAST_); |
| 676 | switch (Width) { |
| 677 | default: // fall |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 678 | case OPW32: |
| 679 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 680 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 681 | return TTMP_32RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 682 | case OPW64: return TTMP_64RegClassID; |
| 683 | case OPW128: return TTMP_128RegClassID; |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 684 | case OPW256: return TTMP_256RegClassID; |
| 685 | case OPW512: return TTMP_512RegClassID; |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 686 | } |
| 687 | } |
| 688 | |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 689 | int AMDGPUDisassembler::getTTmpIdx(unsigned Val) const { |
| 690 | using namespace AMDGPU::EncValues; |
| 691 | |
| 692 | unsigned TTmpMin = isGFX9() ? TTMP_GFX9_MIN : TTMP_VI_MIN; |
| 693 | unsigned TTmpMax = isGFX9() ? TTMP_GFX9_MAX : TTMP_VI_MAX; |
| 694 | |
| 695 | return (TTmpMin <= Val && Val <= TTmpMax)? Val - TTmpMin : -1; |
| 696 | } |
| 697 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 698 | MCOperand AMDGPUDisassembler::decodeSrcOp(const OpWidthTy Width, unsigned Val) const { |
| 699 | using namespace AMDGPU::EncValues; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 700 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 701 | assert(Val < 512); // enum9 |
| 702 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 703 | if (VGPR_MIN <= Val && Val <= VGPR_MAX) { |
| 704 | return createRegOperand(getVgprClassId(Width), Val - VGPR_MIN); |
| 705 | } |
Artem Tamazov | b49c336 | 2016-05-26 15:52:16 +0000 | [diff] [blame] | 706 | if (Val <= SGPR_MAX) { |
| 707 | assert(SGPR_MIN == 0); // "SGPR_MIN <= Val" is always true and causes compilation warning. |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 708 | return createSRegOperand(getSgprClassId(Width), Val - SGPR_MIN); |
| 709 | } |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 710 | |
| 711 | int TTmpIdx = getTTmpIdx(Val); |
| 712 | if (TTmpIdx >= 0) { |
| 713 | return createSRegOperand(getTtmpClassId(Width), TTmpIdx); |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 714 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 715 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 716 | if (INLINE_INTEGER_C_MIN <= Val && Val <= INLINE_INTEGER_C_MAX) |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 717 | return decodeIntImmed(Val); |
| 718 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 719 | if (INLINE_FLOATING_C_MIN <= Val && Val <= INLINE_FLOATING_C_MAX) |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 720 | return decodeFPImmed(Width, Val); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 721 | |
Artem Tamazov | 212a251 | 2016-05-24 12:05:16 +0000 | [diff] [blame] | 722 | if (Val == LITERAL_CONST) |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 723 | return decodeLiteralConstant(); |
| 724 | |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 725 | switch (Width) { |
| 726 | case OPW32: |
| 727 | case OPW16: |
Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 728 | case OPWV216: |
Matt Arsenault | 4bd7236 | 2016-12-10 00:39:12 +0000 | [diff] [blame] | 729 | return decodeSpecialReg32(Val); |
| 730 | case OPW64: |
| 731 | return decodeSpecialReg64(Val); |
| 732 | default: |
| 733 | llvm_unreachable("unexpected immediate type"); |
| 734 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 735 | } |
| 736 | |
Dmitry Preobrazhensky | 2713495 | 2017-12-22 15:18:06 +0000 | [diff] [blame] | 737 | MCOperand AMDGPUDisassembler::decodeDstOp(const OpWidthTy Width, unsigned Val) const { |
| 738 | using namespace AMDGPU::EncValues; |
| 739 | |
| 740 | assert(Val < 128); |
| 741 | assert(Width == OPW256 || Width == OPW512); |
| 742 | |
| 743 | if (Val <= SGPR_MAX) { |
| 744 | assert(SGPR_MIN == 0); // "SGPR_MIN <= Val" is always true and causes compilation warning. |
| 745 | return createSRegOperand(getSgprClassId(Width), Val - SGPR_MIN); |
| 746 | } |
| 747 | |
| 748 | int TTmpIdx = getTTmpIdx(Val); |
| 749 | if (TTmpIdx >= 0) { |
| 750 | return createSRegOperand(getTtmpClassId(Width), TTmpIdx); |
| 751 | } |
| 752 | |
| 753 | llvm_unreachable("unknown dst register"); |
| 754 | } |
| 755 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 756 | MCOperand AMDGPUDisassembler::decodeSpecialReg32(unsigned Val) const { |
| 757 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 758 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 759 | switch (Val) { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 760 | case 102: return createRegOperand(FLAT_SCR_LO); |
| 761 | case 103: return createRegOperand(FLAT_SCR_HI); |
Dmitry Preobrazhensky | 3afbd82 | 2018-01-10 14:22:19 +0000 | [diff] [blame] | 762 | case 104: return createRegOperand(XNACK_MASK_LO); |
| 763 | case 105: return createRegOperand(XNACK_MASK_HI); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 764 | case 106: return createRegOperand(VCC_LO); |
| 765 | case 107: return createRegOperand(VCC_HI); |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 766 | case 108: assert(!isGFX9()); return createRegOperand(TBA_LO); |
| 767 | case 109: assert(!isGFX9()); return createRegOperand(TBA_HI); |
| 768 | case 110: assert(!isGFX9()); return createRegOperand(TMA_LO); |
| 769 | case 111: assert(!isGFX9()); return createRegOperand(TMA_HI); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 770 | case 124: return createRegOperand(M0); |
| 771 | case 126: return createRegOperand(EXEC_LO); |
| 772 | case 127: return createRegOperand(EXEC_HI); |
Matt Arsenault | a3b3b48 | 2017-02-18 18:41:41 +0000 | [diff] [blame] | 773 | case 235: return createRegOperand(SRC_SHARED_BASE); |
| 774 | case 236: return createRegOperand(SRC_SHARED_LIMIT); |
| 775 | case 237: return createRegOperand(SRC_PRIVATE_BASE); |
| 776 | case 238: return createRegOperand(SRC_PRIVATE_LIMIT); |
| 777 | // TODO: SRC_POPS_EXITING_WAVE_ID |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 778 | // ToDo: no support for vccz register |
| 779 | case 251: break; |
| 780 | // ToDo: no support for execz register |
| 781 | case 252: break; |
| 782 | case 253: return createRegOperand(SCC); |
| 783 | default: break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 784 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 785 | return errOperand(Val, "unknown operand encoding " + Twine(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 786 | } |
| 787 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 788 | MCOperand AMDGPUDisassembler::decodeSpecialReg64(unsigned Val) const { |
| 789 | using namespace AMDGPU; |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 790 | |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 791 | switch (Val) { |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 792 | case 102: return createRegOperand(FLAT_SCR); |
Dmitry Preobrazhensky | 3afbd82 | 2018-01-10 14:22:19 +0000 | [diff] [blame] | 793 | case 104: return createRegOperand(XNACK_MASK); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 794 | case 106: return createRegOperand(VCC); |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 795 | case 108: assert(!isGFX9()); return createRegOperand(TBA); |
| 796 | case 110: assert(!isGFX9()); return createRegOperand(TMA); |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 797 | case 126: return createRegOperand(EXEC); |
| 798 | default: break; |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 799 | } |
Nikolay Haustov | ac106ad | 2016-03-01 13:57:29 +0000 | [diff] [blame] | 800 | return errOperand(Val, "unknown operand encoding " + Twine(Val)); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 801 | } |
| 802 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 803 | MCOperand AMDGPUDisassembler::decodeSDWASrc(const OpWidthTy Width, |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 804 | const unsigned Val) const { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 805 | using namespace AMDGPU::SDWA; |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 806 | using namespace AMDGPU::EncValues; |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 807 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 808 | if (STI.getFeatureBits()[AMDGPU::FeatureGFX9]) { |
Sam Kolton | a179d25 | 2017-06-27 15:02:23 +0000 | [diff] [blame] | 809 | // XXX: static_cast<int> is needed to avoid stupid warning: |
| 810 | // compare with unsigned is always true |
| 811 | if (SDWA9EncValues::SRC_VGPR_MIN <= static_cast<int>(Val) && |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 812 | Val <= SDWA9EncValues::SRC_VGPR_MAX) { |
| 813 | return createRegOperand(getVgprClassId(Width), |
| 814 | Val - SDWA9EncValues::SRC_VGPR_MIN); |
| 815 | } |
| 816 | if (SDWA9EncValues::SRC_SGPR_MIN <= Val && |
| 817 | Val <= SDWA9EncValues::SRC_SGPR_MAX) { |
| 818 | return createSRegOperand(getSgprClassId(Width), |
| 819 | Val - SDWA9EncValues::SRC_SGPR_MIN); |
| 820 | } |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 821 | if (SDWA9EncValues::SRC_TTMP_MIN <= Val && |
| 822 | Val <= SDWA9EncValues::SRC_TTMP_MAX) { |
| 823 | return createSRegOperand(getTtmpClassId(Width), |
| 824 | Val - SDWA9EncValues::SRC_TTMP_MIN); |
| 825 | } |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 826 | |
Dmitry Preobrazhensky | 6b65f7c | 2018-01-17 14:00:48 +0000 | [diff] [blame] | 827 | const unsigned SVal = Val - SDWA9EncValues::SRC_SGPR_MIN; |
| 828 | |
| 829 | if (INLINE_INTEGER_C_MIN <= SVal && SVal <= INLINE_INTEGER_C_MAX) |
| 830 | return decodeIntImmed(SVal); |
| 831 | |
| 832 | if (INLINE_FLOATING_C_MIN <= SVal && SVal <= INLINE_FLOATING_C_MAX) |
| 833 | return decodeFPImmed(Width, SVal); |
| 834 | |
| 835 | return decodeSpecialReg32(SVal); |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 836 | } else if (STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]) { |
| 837 | return createRegOperand(getVgprClassId(Width), Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 838 | } |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 839 | llvm_unreachable("unsupported target"); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 840 | } |
| 841 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 842 | MCOperand AMDGPUDisassembler::decodeSDWASrc16(unsigned Val) const { |
| 843 | return decodeSDWASrc(OPW16, Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 844 | } |
| 845 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 846 | MCOperand AMDGPUDisassembler::decodeSDWASrc32(unsigned Val) const { |
| 847 | return decodeSDWASrc(OPW32, Val); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 848 | } |
| 849 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 850 | MCOperand AMDGPUDisassembler::decodeSDWAVopcDst(unsigned Val) const { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 851 | using namespace AMDGPU::SDWA; |
| 852 | |
Sam Kolton | 549c89d | 2017-06-21 08:53:38 +0000 | [diff] [blame] | 853 | assert(STI.getFeatureBits()[AMDGPU::FeatureGFX9] && |
| 854 | "SDWAVopcDst should be present only on GFX9"); |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 855 | if (Val & SDWA9EncValues::VOPC_DST_VCC_MASK) { |
| 856 | Val &= SDWA9EncValues::VOPC_DST_SGPR_MASK; |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 857 | |
| 858 | int TTmpIdx = getTTmpIdx(Val); |
| 859 | if (TTmpIdx >= 0) { |
| 860 | return createSRegOperand(getTtmpClassId(OPW64), TTmpIdx); |
| 861 | } else if (Val > AMDGPU::EncValues::SGPR_MAX) { |
Sam Kolton | 363f47a | 2017-05-26 15:52:00 +0000 | [diff] [blame] | 862 | return decodeSpecialReg64(Val); |
| 863 | } else { |
| 864 | return createSRegOperand(getSgprClassId(OPW64), Val); |
| 865 | } |
| 866 | } else { |
| 867 | return createRegOperand(AMDGPU::VCC); |
| 868 | } |
| 869 | } |
| 870 | |
Dmitry Preobrazhensky | ac2b026 | 2017-12-11 15:23:20 +0000 | [diff] [blame] | 871 | bool AMDGPUDisassembler::isVI() const { |
| 872 | return STI.getFeatureBits()[AMDGPU::FeatureVolcanicIslands]; |
| 873 | } |
| 874 | |
| 875 | bool AMDGPUDisassembler::isGFX9() const { |
| 876 | return STI.getFeatureBits()[AMDGPU::FeatureGFX9]; |
| 877 | } |
| 878 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 879 | //===----------------------------------------------------------------------===// |
| 880 | // AMDGPUSymbolizer |
| 881 | //===----------------------------------------------------------------------===// |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 882 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 883 | // Try to find symbol name for specified label |
| 884 | bool AMDGPUSymbolizer::tryAddingSymbolicOperand(MCInst &Inst, |
| 885 | raw_ostream &/*cStream*/, int64_t Value, |
| 886 | uint64_t /*Address*/, bool IsBranch, |
| 887 | uint64_t /*Offset*/, uint64_t /*InstSize*/) { |
Eugene Zelenko | c8fbf6f | 2017-08-10 00:46:15 +0000 | [diff] [blame] | 888 | using SymbolInfoTy = std::tuple<uint64_t, StringRef, uint8_t>; |
| 889 | using SectionSymbolsTy = std::vector<SymbolInfoTy>; |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 890 | |
| 891 | if (!IsBranch) { |
| 892 | return false; |
| 893 | } |
| 894 | |
| 895 | auto *Symbols = static_cast<SectionSymbolsTy *>(DisInfo); |
Nicolai Haehnle | b1c3b22 | 2018-04-10 15:46:43 +0000 | [diff] [blame] | 896 | if (!Symbols) |
| 897 | return false; |
| 898 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 899 | auto Result = std::find_if(Symbols->begin(), Symbols->end(), |
| 900 | [Value](const SymbolInfoTy& Val) { |
| 901 | return std::get<0>(Val) == static_cast<uint64_t>(Value) |
| 902 | && std::get<2>(Val) == ELF::STT_NOTYPE; |
| 903 | }); |
| 904 | if (Result != Symbols->end()) { |
| 905 | auto *Sym = Ctx.getOrCreateSymbol(std::get<1>(*Result)); |
| 906 | const auto *Add = MCSymbolRefExpr::create(Sym, Ctx); |
| 907 | Inst.addOperand(MCOperand::createExpr(Add)); |
| 908 | return true; |
| 909 | } |
| 910 | return false; |
| 911 | } |
| 912 | |
Matt Arsenault | 92b355b | 2016-11-15 19:34:37 +0000 | [diff] [blame] | 913 | void AMDGPUSymbolizer::tryAddingPcLoadReferenceComment(raw_ostream &cStream, |
| 914 | int64_t Value, |
| 915 | uint64_t Address) { |
| 916 | llvm_unreachable("unimplemented"); |
| 917 | } |
| 918 | |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 919 | //===----------------------------------------------------------------------===// |
| 920 | // Initialization |
| 921 | //===----------------------------------------------------------------------===// |
| 922 | |
| 923 | static MCSymbolizer *createAMDGPUSymbolizer(const Triple &/*TT*/, |
| 924 | LLVMOpInfoCallback /*GetOpInfo*/, |
| 925 | LLVMSymbolLookupCallback /*SymbolLookUp*/, |
Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 926 | void *DisInfo, |
Sam Kolton | 3381d7a | 2016-10-06 13:46:08 +0000 | [diff] [blame] | 927 | MCContext *Ctx, |
| 928 | std::unique_ptr<MCRelocationInfo> &&RelInfo) { |
| 929 | return new AMDGPUSymbolizer(*Ctx, std::move(RelInfo), DisInfo); |
| 930 | } |
| 931 | |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 932 | static MCDisassembler *createAMDGPUDisassembler(const Target &T, |
| 933 | const MCSubtargetInfo &STI, |
| 934 | MCContext &Ctx) { |
Matt Arsenault | cad7fa8 | 2017-12-13 21:07:51 +0000 | [diff] [blame] | 935 | return new AMDGPUDisassembler(STI, Ctx, T.createMCInstrInfo()); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 936 | } |
| 937 | |
| 938 | extern "C" void LLVMInitializeAMDGPUDisassembler() { |
Mehdi Amini | f42454b | 2016-10-09 23:00:34 +0000 | [diff] [blame] | 939 | TargetRegistry::RegisterMCDisassembler(getTheGCNTarget(), |
| 940 | createAMDGPUDisassembler); |
| 941 | TargetRegistry::RegisterMCSymbolizer(getTheGCNTarget(), |
| 942 | createAMDGPUSymbolizer); |
Tom Stellard | e1818af | 2016-02-18 03:42:32 +0000 | [diff] [blame] | 943 | } |