blob: 36a60b32d8f751065cd173be81e11c089ef3cbcc [file] [log] [blame]
//===-- AMDGPUInstrInfo.cpp - Base class for AMD GPU InstrInfo ------------===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
/// \file
/// \brief Implementation of the TargetInstrInfo class that is common to all
/// AMD GPUs.
//
//===----------------------------------------------------------------------===//
15
16#include "AMDGPUInstrInfo.h"
17#include "AMDGPURegisterInfo.h"
18#include "AMDGPUTargetMachine.h"
Tom Stellard75aadc22012-12-11 21:25:42 +000019#include "llvm/CodeGen/MachineFrameInfo.h"
20#include "llvm/CodeGen/MachineInstrBuilder.h"
21#include "llvm/CodeGen/MachineRegisterInfo.h"
22
Chandler Carruthd174b722014-04-22 02:03:14 +000023using namespace llvm;
24
Juergen Ributzkad12ccbd2013-11-19 00:57:56 +000025#define GET_INSTRINFO_CTOR_DTOR
Christian Konigf741fbf2013-02-26 17:52:42 +000026#define GET_INSTRMAP_INFO
Tom Stellard75aadc22012-12-11 21:25:42 +000027#include "AMDGPUGenInstrInfo.inc"
28
// Pin the vtable to this file: defining this otherwise-empty virtual method
// out-of-line gives the class a "key function", so the compiler emits the
// vtable in exactly this translation unit instead of in every user of the
// class.
void AMDGPUInstrInfo::anchor() {}
31
Matt Arsenault43e92fe2016-06-24 06:30:11 +000032AMDGPUInstrInfo::AMDGPUInstrInfo(const AMDGPUSubtarget &ST)
Matt Arsenaultb62a4eb2017-08-01 19:54:18 +000033 : AMDGPUGenInstrInfo(AMDGPU::ADJCALLSTACKUP, AMDGPU::ADJCALLSTACKDOWN),
34 ST(ST),
35 AMDGPUASI(ST.getAMDGPUAS()) {}
Tom Stellard75aadc22012-12-11 21:25:42 +000036
Matt Arsenaultd5f4de22014-08-06 00:29:49 +000037// FIXME: This behaves strangely. If, for example, you have 32 load + stores,
38// the first 16 loads will be interleaved with the stores, and the next 16 will
39// be clustered as expected. It should really split into 2 16 store batches.
40//
41// Loads are clustered until this returns false, rather than trying to schedule
42// groups of stores. This also means we have to deal with saying different
43// address space loads should be clustered, and ones which might cause bank
44// conflicts.
45//
46// This might be deprecated so it might not be worth that much effort to fix.
47bool AMDGPUInstrInfo::shouldScheduleLoadsNear(SDNode *Load0, SDNode *Load1,
48 int64_t Offset0, int64_t Offset1,
49 unsigned NumLoads) const {
50 assert(Offset1 > Offset0 &&
51 "Second offset should be larger than first offset!");
52 // If we have less than 16 loads in a row, and the offsets are within 64
53 // bytes, then schedule together.
54
55 // A cacheline is 64 bytes (for global memory).
56 return (NumLoads <= 16 && (Offset1 - Offset0) < 64);
Tom Stellard75aadc22012-12-11 21:25:42 +000057}
58
Tom Stellard682bfbc2013-10-10 17:11:24 +000059int AMDGPUInstrInfo::getMaskedMIMGOp(uint16_t Opcode, unsigned Channels) const {
60 switch (Channels) {
61 default: return Opcode;
62 case 1: return AMDGPU::getMaskedMIMGOp(Opcode, AMDGPU::Channels_1);
63 case 2: return AMDGPU::getMaskedMIMGOp(Opcode, AMDGPU::Channels_2);
64 case 3: return AMDGPU::getMaskedMIMGOp(Opcode, AMDGPU::Channels_3);
65 }
66}
Tom Stellardc721a232014-05-16 20:56:47 +000067
// This must be kept in sync with the SIEncodingFamily class in SIInstrInfo.td
// The numeric values are load-bearing: they are passed (as the Subtarget enum)
// into the tablegen'd getMCOpcodeGen via pseudoToMCOpcode below, so do not
// renumber or reorder without updating the .td side.
enum SIEncodingFamily {
  SI = 0,
  VI = 1,
  SDWA = 2,
  SDWA9 = 3
};
75
Tom Stellardc721a232014-05-16 20:56:47 +000076// Wrapper for Tablegen'd function. enum Subtarget is not defined in any
Matt Arsenault1f0227a2014-10-07 21:29:56 +000077// header files, so we need to wrap it in a function that takes unsigned
Tom Stellardc721a232014-05-16 20:56:47 +000078// instead.
79namespace llvm {
80namespace AMDGPU {
Marek Olsaka93603d2015-01-15 18:42:51 +000081static int getMCOpcode(uint16_t Opcode, unsigned Gen) {
Matt Arsenault43e92fe2016-06-24 06:30:11 +000082 return getMCOpcodeGen(Opcode, static_cast<Subtarget>(Gen));
Tom Stellardc721a232014-05-16 20:56:47 +000083}
84}
85}
Marek Olsaka93603d2015-01-15 18:42:51 +000086
Matt Arsenault43e92fe2016-06-24 06:30:11 +000087static SIEncodingFamily subtargetEncodingFamily(const AMDGPUSubtarget &ST) {
88 switch (ST.getGeneration()) {
89 case AMDGPUSubtarget::SOUTHERN_ISLANDS:
90 case AMDGPUSubtarget::SEA_ISLANDS:
91 return SIEncodingFamily::SI;
Marek Olsaka93603d2015-01-15 18:42:51 +000092 case AMDGPUSubtarget::VOLCANIC_ISLANDS:
Matt Arsenaulte823d922017-02-18 18:29:53 +000093 case AMDGPUSubtarget::GFX9:
Matt Arsenault43e92fe2016-06-24 06:30:11 +000094 return SIEncodingFamily::VI;
95
96 // FIXME: This should never be called for r600 GPUs.
97 case AMDGPUSubtarget::R600:
98 case AMDGPUSubtarget::R700:
99 case AMDGPUSubtarget::EVERGREEN:
100 case AMDGPUSubtarget::NORTHERN_ISLANDS:
101 return SIEncodingFamily::SI;
Marek Olsaka93603d2015-01-15 18:42:51 +0000102 }
Simon Pilgrim634dde32016-06-27 12:58:10 +0000103
104 llvm_unreachable("Unknown subtarget generation!");
Marek Olsaka93603d2015-01-15 18:42:51 +0000105}
106
107int AMDGPUInstrInfo::pseudoToMCOpcode(int Opcode) const {
Sam Kolton549c89d2017-06-21 08:53:38 +0000108 SIEncodingFamily Gen = subtargetEncodingFamily(ST);
109 if (get(Opcode).TSFlags & SIInstrFlags::SDWA)
110 Gen = ST.getGeneration() == AMDGPUSubtarget::GFX9 ? SIEncodingFamily::SDWA9
111 : SIEncodingFamily::SDWA;
112
113 int MCOp = AMDGPU::getMCOpcode(Opcode, Gen);
Marek Olsaka93603d2015-01-15 18:42:51 +0000114
115 // -1 means that Opcode is already a native instruction.
116 if (MCOp == -1)
117 return Opcode;
118
119 // (uint16_t)-1 means that Opcode is a pseudo instruction that has
120 // no encoding in the given subtarget generation.
121 if (MCOp == (uint16_t)-1)
122 return -1;
123
124 return MCOp;
125}