blob: dc91924c73e43891a9d629bf1f19985424a1e7ea [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===- R600MCCodeEmitter.cpp - Code Emitter for R600->Cayman GPU families -===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11///
12/// This code emitter outputs bytecode that is understood by the r600g driver
13/// in the Mesa [1] project. The bytecode is very similar to the hardware's ISA,
14/// but it still needs to be run through a finalizer in order to be executed
15/// by the GPU.
16///
17/// [1] http://www.mesa3d.org/
18//
19//===----------------------------------------------------------------------===//
20
21#include "R600Defines.h"
22#include "MCTargetDesc/AMDGPUMCTargetDesc.h"
23#include "MCTargetDesc/AMDGPUMCCodeEmitter.h"
24#include "llvm/MC/MCCodeEmitter.h"
25#include "llvm/MC/MCContext.h"
26#include "llvm/MC/MCInst.h"
27#include "llvm/MC/MCInstrInfo.h"
28#include "llvm/MC/MCRegisterInfo.h"
29#include "llvm/MC/MCSubtargetInfo.h"
30#include "llvm/Support/raw_ostream.h"
31
32#include <stdio.h>
33
34#define SRC_BYTE_COUNT 11
35#define DST_BYTE_COUNT 5
36
37using namespace llvm;
38
39namespace {
40
41class R600MCCodeEmitter : public AMDGPUMCCodeEmitter {
42 R600MCCodeEmitter(const R600MCCodeEmitter &); // DO NOT IMPLEMENT
43 void operator=(const R600MCCodeEmitter &); // DO NOT IMPLEMENT
44 const MCInstrInfo &MCII;
45 const MCRegisterInfo &MRI;
46 const MCSubtargetInfo &STI;
47 MCContext &Ctx;
48
49public:
50
51 R600MCCodeEmitter(const MCInstrInfo &mcii, const MCRegisterInfo &mri,
52 const MCSubtargetInfo &sti, MCContext &ctx)
53 : MCII(mcii), MRI(mri), STI(sti), Ctx(ctx) { }
54
55 /// \brief Encode the instruction and write it to the OS.
56 virtual void EncodeInstruction(const MCInst &MI, raw_ostream &OS,
57 SmallVectorImpl<MCFixup> &Fixups) const;
58
59 /// \returns the encoding for an MCOperand.
60 virtual uint64_t getMachineOpValue(const MCInst &MI, const MCOperand &MO,
61 SmallVectorImpl<MCFixup> &Fixups) const;
62private:
63
64 void EmitALUInstr(const MCInst &MI, SmallVectorImpl<MCFixup> &Fixups,
65 raw_ostream &OS) const;
66 void EmitSrc(const MCInst &MI, unsigned OpIdx, raw_ostream &OS) const;
67 void EmitSrcISA(const MCInst &MI, unsigned OpIdx, uint64_t &Value,
68 raw_ostream &OS) const;
69 void EmitDst(const MCInst &MI, raw_ostream &OS) const;
70 void EmitTexInstr(const MCInst &MI, SmallVectorImpl<MCFixup> &Fixups,
71 raw_ostream &OS) const;
72 void EmitFCInstr(const MCInst &MI, raw_ostream &OS) const;
73
74 void EmitNullBytes(unsigned int byteCount, raw_ostream &OS) const;
75
76 void EmitByte(unsigned int byte, raw_ostream &OS) const;
77
78 void EmitTwoBytes(uint32_t bytes, raw_ostream &OS) const;
79
80 void Emit(uint32_t value, raw_ostream &OS) const;
81 void Emit(uint64_t value, raw_ostream &OS) const;
82
83 unsigned getHWRegChan(unsigned reg) const;
84 unsigned getHWReg(unsigned regNo) const;
85
86 bool isFCOp(unsigned opcode) const;
87 bool isTexOp(unsigned opcode) const;
88 bool isFlagSet(const MCInst &MI, unsigned Operand, unsigned Flag) const;
89
90};
91
92} // End anonymous namespace
93
94enum RegElement {
95 ELEMENT_X = 0,
96 ELEMENT_Y,
97 ELEMENT_Z,
98 ELEMENT_W
99};
100
101enum InstrTypes {
102 INSTR_ALU = 0,
103 INSTR_TEX,
104 INSTR_FC,
105 INSTR_NATIVE,
106 INSTR_VTX,
107 INSTR_EXPORT
108};
109
110enum FCInstr {
111 FC_IF_PREDICATE = 0,
112 FC_ELSE,
113 FC_ENDIF,
114 FC_BGNLOOP,
115 FC_ENDLOOP,
116 FC_BREAK_PREDICATE,
117 FC_CONTINUE
118};
119
120enum TextureTypes {
121 TEXTURE_1D = 1,
122 TEXTURE_2D,
123 TEXTURE_3D,
124 TEXTURE_CUBE,
125 TEXTURE_RECT,
126 TEXTURE_SHADOW1D,
127 TEXTURE_SHADOW2D,
128 TEXTURE_SHADOWRECT,
129 TEXTURE_1D_ARRAY,
130 TEXTURE_2D_ARRAY,
131 TEXTURE_SHADOW1D_ARRAY,
132 TEXTURE_SHADOW2D_ARRAY
133};
134
135MCCodeEmitter *llvm::createR600MCCodeEmitter(const MCInstrInfo &MCII,
136 const MCRegisterInfo &MRI,
137 const MCSubtargetInfo &STI,
138 MCContext &Ctx) {
139 return new R600MCCodeEmitter(MCII, MRI, STI, Ctx);
140}
141
142void R600MCCodeEmitter::EncodeInstruction(const MCInst &MI, raw_ostream &OS,
143 SmallVectorImpl<MCFixup> &Fixups) const {
144 if (isTexOp(MI.getOpcode())) {
145 EmitTexInstr(MI, Fixups, OS);
146 } else if (isFCOp(MI.getOpcode())){
147 EmitFCInstr(MI, OS);
148 } else if (MI.getOpcode() == AMDGPU::RETURN ||
149 MI.getOpcode() == AMDGPU::BUNDLE ||
150 MI.getOpcode() == AMDGPU::KILL) {
151 return;
152 } else {
153 switch(MI.getOpcode()) {
154 case AMDGPU::RAT_WRITE_CACHELESS_32_eg:
155 case AMDGPU::RAT_WRITE_CACHELESS_128_eg: {
156 uint64_t inst = getBinaryCodeForInstr(MI, Fixups);
157 EmitByte(INSTR_NATIVE, OS);
158 Emit(inst, OS);
159 break;
160 }
161 case AMDGPU::CONSTANT_LOAD_eg:
162 case AMDGPU::VTX_READ_PARAM_8_eg:
163 case AMDGPU::VTX_READ_PARAM_16_eg:
164 case AMDGPU::VTX_READ_PARAM_32_eg:
165 case AMDGPU::VTX_READ_GLOBAL_8_eg:
166 case AMDGPU::VTX_READ_GLOBAL_32_eg:
167 case AMDGPU::VTX_READ_GLOBAL_128_eg: {
168 uint64_t InstWord01 = getBinaryCodeForInstr(MI, Fixups);
169 uint32_t InstWord2 = MI.getOperand(2).getImm(); // Offset
170
171 EmitByte(INSTR_VTX, OS);
172 Emit(InstWord01, OS);
173 Emit(InstWord2, OS);
174 break;
175 }
176 case AMDGPU::EG_ExportSwz:
177 case AMDGPU::R600_ExportSwz:
178 case AMDGPU::EG_ExportBuf:
179 case AMDGPU::R600_ExportBuf: {
180 uint64_t Inst = getBinaryCodeForInstr(MI, Fixups);
181 EmitByte(INSTR_EXPORT, OS);
182 Emit(Inst, OS);
183 break;
184 }
185
186 default:
187 EmitALUInstr(MI, Fixups, OS);
188 break;
189 }
190 }
191}
192
193void R600MCCodeEmitter::EmitALUInstr(const MCInst &MI,
194 SmallVectorImpl<MCFixup> &Fixups,
195 raw_ostream &OS) const {
196 const MCInstrDesc &MCDesc = MCII.get(MI.getOpcode());
197 unsigned NumOperands = MI.getNumOperands();
198
199 // Emit instruction type
200 EmitByte(INSTR_ALU, OS);
201
202 uint64_t InstWord01 = getBinaryCodeForInstr(MI, Fixups);
203
204 //older alu have different encoding for instructions with one or two src
205 //parameters.
206 if ((STI.getFeatureBits() & AMDGPU::FeatureR600ALUInst) &&
207 !(MCDesc.TSFlags & R600_InstFlag::OP3)) {
208 uint64_t ISAOpCode = InstWord01 & (0x3FFULL << 39);
209 InstWord01 &= ~(0x3FFULL << 39);
210 InstWord01 |= ISAOpCode << 1;
211 }
212
213 unsigned SrcIdx = 0;
214 for (unsigned int OpIdx = 1; OpIdx < NumOperands; ++OpIdx) {
215 if (MI.getOperand(OpIdx).isImm() || MI.getOperand(OpIdx).isFPImm() ||
216 OpIdx == (unsigned)MCDesc.findFirstPredOperandIdx()) {
217 continue;
218 }
219 EmitSrcISA(MI, OpIdx, InstWord01, OS);
220 SrcIdx++;
221 }
222
223 // Emit zeros for unused sources
224 for ( ; SrcIdx < 3; SrcIdx++) {
225 EmitNullBytes(SRC_BYTE_COUNT - 6, OS);
226 }
227
228 Emit(InstWord01, OS);
229 return;
230}
231
232void R600MCCodeEmitter::EmitSrc(const MCInst &MI, unsigned OpIdx,
233 raw_ostream &OS) const {
234 const MCOperand &MO = MI.getOperand(OpIdx);
235 union {
236 float f;
237 uint32_t i;
238 } Value;
239 Value.i = 0;
240 // Emit the source select (2 bytes). For GPRs, this is the register index.
241 // For other potential instruction operands, (e.g. constant registers) the
242 // value of the source select is defined in the r600isa docs.
243 if (MO.isReg()) {
244 unsigned reg = MO.getReg();
245 EmitTwoBytes(getHWReg(reg), OS);
246 if (reg == AMDGPU::ALU_LITERAL_X) {
247 unsigned ImmOpIndex = MI.getNumOperands() - 1;
248 MCOperand ImmOp = MI.getOperand(ImmOpIndex);
249 if (ImmOp.isFPImm()) {
250 Value.f = ImmOp.getFPImm();
251 } else {
252 assert(ImmOp.isImm());
253 Value.i = ImmOp.getImm();
254 }
255 }
256 } else {
257 // XXX: Handle other operand types.
258 EmitTwoBytes(0, OS);
259 }
260
261 // Emit the source channel (1 byte)
262 if (MO.isReg()) {
263 EmitByte(getHWRegChan(MO.getReg()), OS);
264 } else {
265 EmitByte(0, OS);
266 }
267
268 // XXX: Emit isNegated (1 byte)
269 if ((!(isFlagSet(MI, OpIdx, MO_FLAG_ABS)))
270 && (isFlagSet(MI, OpIdx, MO_FLAG_NEG) ||
271 (MO.isReg() &&
272 (MO.getReg() == AMDGPU::NEG_ONE || MO.getReg() == AMDGPU::NEG_HALF)))){
273 EmitByte(1, OS);
274 } else {
275 EmitByte(0, OS);
276 }
277
278 // Emit isAbsolute (1 byte)
279 if (isFlagSet(MI, OpIdx, MO_FLAG_ABS)) {
280 EmitByte(1, OS);
281 } else {
282 EmitByte(0, OS);
283 }
284
285 // XXX: Emit relative addressing mode (1 byte)
286 EmitByte(0, OS);
287
288 // Emit kc_bank, This will be adjusted later by r600_asm
289 EmitByte(0, OS);
290
291 // Emit the literal value, if applicable (4 bytes).
292 Emit(Value.i, OS);
293
294}
295
296void R600MCCodeEmitter::EmitSrcISA(const MCInst &MI, unsigned OpIdx,
297 uint64_t &Value, raw_ostream &OS) const {
298 const MCOperand &MO = MI.getOperand(OpIdx);
299 union {
300 float f;
301 uint32_t i;
302 } InlineConstant;
303 InlineConstant.i = 0;
304 // Emit the source select (2 bytes). For GPRs, this is the register index.
305 // For other potential instruction operands, (e.g. constant registers) the
306 // value of the source select is defined in the r600isa docs.
307 if (MO.isReg()) {
308 unsigned Reg = MO.getReg();
309 if (AMDGPUMCRegisterClasses[AMDGPU::R600_CReg32RegClassID].contains(Reg)) {
310 EmitByte(1, OS);
311 } else {
312 EmitByte(0, OS);
313 }
314
315 if (Reg == AMDGPU::ALU_LITERAL_X) {
316 unsigned ImmOpIndex = MI.getNumOperands() - 1;
317 MCOperand ImmOp = MI.getOperand(ImmOpIndex);
318 if (ImmOp.isFPImm()) {
319 InlineConstant.f = ImmOp.getFPImm();
320 } else {
321 assert(ImmOp.isImm());
322 InlineConstant.i = ImmOp.getImm();
323 }
324 }
325 }
326
327 // Emit the literal value, if applicable (4 bytes).
328 Emit(InlineConstant.i, OS);
329}
330
331void R600MCCodeEmitter::EmitTexInstr(const MCInst &MI,
332 SmallVectorImpl<MCFixup> &Fixups,
333 raw_ostream &OS) const {
334
335 unsigned Opcode = MI.getOpcode();
336 bool hasOffsets = (Opcode == AMDGPU::TEX_LD);
337 unsigned OpOffset = hasOffsets ? 3 : 0;
338 int64_t Resource = MI.getOperand(OpOffset + 2).getImm();
339 int64_t Sampler = MI.getOperand(OpOffset + 3).getImm();
340 int64_t TextureType = MI.getOperand(OpOffset + 4).getImm();
341 unsigned srcSelect[4] = {0, 1, 2, 3};
342
343 // Emit instruction type
344 EmitByte(1, OS);
345
346 // Emit instruction
347 EmitByte(getBinaryCodeForInstr(MI, Fixups), OS);
348
349 // Emit resource id
350 EmitByte(Resource, OS);
351
352 // Emit source register
353 EmitByte(getHWReg(MI.getOperand(1).getReg()), OS);
354
355 // XXX: Emit src isRelativeAddress
356 EmitByte(0, OS);
357
358 // Emit destination register
359 EmitByte(getHWReg(MI.getOperand(0).getReg()), OS);
360
361 // XXX: Emit dst isRealtiveAddress
362 EmitByte(0, OS);
363
364 // XXX: Emit dst select
365 EmitByte(0, OS); // X
366 EmitByte(1, OS); // Y
367 EmitByte(2, OS); // Z
368 EmitByte(3, OS); // W
369
370 // XXX: Emit lod bias
371 EmitByte(0, OS);
372
373 // XXX: Emit coord types
374 unsigned coordType[4] = {1, 1, 1, 1};
375
376 if (TextureType == TEXTURE_RECT
377 || TextureType == TEXTURE_SHADOWRECT) {
378 coordType[ELEMENT_X] = 0;
379 coordType[ELEMENT_Y] = 0;
380 }
381
382 if (TextureType == TEXTURE_1D_ARRAY
383 || TextureType == TEXTURE_SHADOW1D_ARRAY) {
384 if (Opcode == AMDGPU::TEX_SAMPLE_C_L || Opcode == AMDGPU::TEX_SAMPLE_C_LB) {
385 coordType[ELEMENT_Y] = 0;
386 } else {
387 coordType[ELEMENT_Z] = 0;
388 srcSelect[ELEMENT_Z] = ELEMENT_Y;
389 }
390 } else if (TextureType == TEXTURE_2D_ARRAY
391 || TextureType == TEXTURE_SHADOW2D_ARRAY) {
392 coordType[ELEMENT_Z] = 0;
393 }
394
395 for (unsigned i = 0; i < 4; i++) {
396 EmitByte(coordType[i], OS);
397 }
398
399 // XXX: Emit offsets
400 if (hasOffsets)
401 for (unsigned i = 2; i < 5; i++)
402 EmitByte(MI.getOperand(i).getImm()<<1, OS);
403 else
404 EmitNullBytes(3, OS);
405
406 // Emit sampler id
407 EmitByte(Sampler, OS);
408
409 // XXX:Emit source select
410 if ((TextureType == TEXTURE_SHADOW1D
411 || TextureType == TEXTURE_SHADOW2D
412 || TextureType == TEXTURE_SHADOWRECT
413 || TextureType == TEXTURE_SHADOW1D_ARRAY)
414 && Opcode != AMDGPU::TEX_SAMPLE_C_L
415 && Opcode != AMDGPU::TEX_SAMPLE_C_LB) {
416 srcSelect[ELEMENT_W] = ELEMENT_Z;
417 }
418
419 for (unsigned i = 0; i < 4; i++) {
420 EmitByte(srcSelect[i], OS);
421 }
422}
423
424void R600MCCodeEmitter::EmitFCInstr(const MCInst &MI, raw_ostream &OS) const {
425
426 // Emit instruction type
427 EmitByte(INSTR_FC, OS);
428
429 // Emit SRC
430 unsigned NumOperands = MI.getNumOperands();
431 if (NumOperands > 0) {
432 assert(NumOperands == 1);
433 EmitSrc(MI, 0, OS);
434 } else {
435 EmitNullBytes(SRC_BYTE_COUNT, OS);
436 }
437
438 // Emit FC Instruction
439 enum FCInstr instr;
440 switch (MI.getOpcode()) {
441 case AMDGPU::PREDICATED_BREAK:
442 instr = FC_BREAK_PREDICATE;
443 break;
444 case AMDGPU::CONTINUE:
445 instr = FC_CONTINUE;
446 break;
447 case AMDGPU::IF_PREDICATE_SET:
448 instr = FC_IF_PREDICATE;
449 break;
450 case AMDGPU::ELSE:
451 instr = FC_ELSE;
452 break;
453 case AMDGPU::ENDIF:
454 instr = FC_ENDIF;
455 break;
456 case AMDGPU::ENDLOOP:
457 instr = FC_ENDLOOP;
458 break;
459 case AMDGPU::WHILELOOP:
460 instr = FC_BGNLOOP;
461 break;
462 default:
463 abort();
464 break;
465 }
466 EmitByte(instr, OS);
467}
468
469void R600MCCodeEmitter::EmitNullBytes(unsigned int ByteCount,
470 raw_ostream &OS) const {
471
472 for (unsigned int i = 0; i < ByteCount; i++) {
473 EmitByte(0, OS);
474 }
475}
476
477void R600MCCodeEmitter::EmitByte(unsigned int Byte, raw_ostream &OS) const {
478 OS.write((uint8_t) Byte & 0xff);
479}
480
481void R600MCCodeEmitter::EmitTwoBytes(unsigned int Bytes,
482 raw_ostream &OS) const {
483 OS.write((uint8_t) (Bytes & 0xff));
484 OS.write((uint8_t) ((Bytes >> 8) & 0xff));
485}
486
487void R600MCCodeEmitter::Emit(uint32_t Value, raw_ostream &OS) const {
488 for (unsigned i = 0; i < 4; i++) {
489 OS.write((uint8_t) ((Value >> (8 * i)) & 0xff));
490 }
491}
492
493void R600MCCodeEmitter::Emit(uint64_t Value, raw_ostream &OS) const {
494 for (unsigned i = 0; i < 8; i++) {
495 EmitByte((Value >> (8 * i)) & 0xff, OS);
496 }
497}
498
499unsigned R600MCCodeEmitter::getHWRegChan(unsigned reg) const {
500 return MRI.getEncodingValue(reg) >> HW_CHAN_SHIFT;
501}
502
503unsigned R600MCCodeEmitter::getHWReg(unsigned RegNo) const {
504 return MRI.getEncodingValue(RegNo) & HW_REG_MASK;
505}
506
507uint64_t R600MCCodeEmitter::getMachineOpValue(const MCInst &MI,
508 const MCOperand &MO,
509 SmallVectorImpl<MCFixup> &Fixup) const {
510 if (MO.isReg()) {
511 if (HAS_NATIVE_OPERANDS(MCII.get(MI.getOpcode()).TSFlags)) {
512 return MRI.getEncodingValue(MO.getReg());
513 } else {
514 return getHWReg(MO.getReg());
515 }
516 } else if (MO.isImm()) {
517 return MO.getImm();
518 } else {
519 assert(0);
520 return 0;
521 }
522}
523
524//===----------------------------------------------------------------------===//
525// Encoding helper functions
526//===----------------------------------------------------------------------===//
527
528bool R600MCCodeEmitter::isFCOp(unsigned opcode) const {
529 switch(opcode) {
530 default: return false;
531 case AMDGPU::PREDICATED_BREAK:
532 case AMDGPU::CONTINUE:
533 case AMDGPU::IF_PREDICATE_SET:
534 case AMDGPU::ELSE:
535 case AMDGPU::ENDIF:
536 case AMDGPU::ENDLOOP:
537 case AMDGPU::WHILELOOP:
538 return true;
539 }
540}
541
542bool R600MCCodeEmitter::isTexOp(unsigned opcode) const {
543 switch(opcode) {
544 default: return false;
545 case AMDGPU::TEX_LD:
546 case AMDGPU::TEX_GET_TEXTURE_RESINFO:
547 case AMDGPU::TEX_SAMPLE:
548 case AMDGPU::TEX_SAMPLE_C:
549 case AMDGPU::TEX_SAMPLE_L:
550 case AMDGPU::TEX_SAMPLE_C_L:
551 case AMDGPU::TEX_SAMPLE_LB:
552 case AMDGPU::TEX_SAMPLE_C_LB:
553 case AMDGPU::TEX_SAMPLE_G:
554 case AMDGPU::TEX_SAMPLE_C_G:
555 case AMDGPU::TEX_GET_GRADIENTS_H:
556 case AMDGPU::TEX_GET_GRADIENTS_V:
557 case AMDGPU::TEX_SET_GRADIENTS_H:
558 case AMDGPU::TEX_SET_GRADIENTS_V:
559 return true;
560 }
561}
562
563bool R600MCCodeEmitter::isFlagSet(const MCInst &MI, unsigned Operand,
564 unsigned Flag) const {
565 const MCInstrDesc &MCDesc = MCII.get(MI.getOpcode());
566 unsigned FlagIndex = GET_FLAG_OPERAND_IDX(MCDesc.TSFlags);
567 if (FlagIndex == 0) {
568 return false;
569 }
570 assert(MI.getOperand(FlagIndex).isImm());
571 return !!((MI.getOperand(FlagIndex).getImm() >>
572 (NUM_MO_FLAGS * Operand)) & Flag);
573}
574
575#include "AMDGPUGenMCCodeEmitter.inc"