Blame - llvm/lib/Target/AMDGPU/AMDGPUTargetTransformInfo.h - toolchain/llvm-project

blob: ea4f5826f6bd93b96cf36a8060c648984c3294ed [file] [log] [blame]

Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	1	//===-- AMDGPUTargetTransformInfo.h - AMDGPU specific TTI -------- C++ --===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	/// \file
				10	/// This file a TargetTransformInfo::Concept conforming object specific to the
				11	/// AMDGPU target machine. It uses the target's detailed information to
				12	/// provide more precise answers to certain TTI queries, while letting the
				13	/// target independent and default TTI implementations handle the rest.
				14	///
				15	//===----------------------------------------------------------------------===//
				16
Matt Arsenault	6b6a2c3	2016-03-11 08:00:27 +0000	[diff] [blame]	17	#ifndef LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H
				18	#define LLVM_LIB_TARGET_AMDGPU_AMDGPUTARGETTRANSFORMINFO_H
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	19
				20	#include "AMDGPU.h"
				21	#include "AMDGPUTargetMachine.h"
				22	#include "llvm/Analysis/TargetTransformInfo.h"
				23	#include "llvm/CodeGen/BasicTTIImpl.h"
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	24
				25	namespace llvm {
Matt Arsenault	9651813	2016-03-25 01:00:32 +0000	[diff] [blame]	26	class AMDGPUTargetLowering;
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	27
Matt Arsenault	6b6a2c3	2016-03-11 08:00:27 +0000	[diff] [blame]	28	class AMDGPUTTIImpl final : public BasicTTIImplBase<AMDGPUTTIImpl> {
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	29	typedef BasicTTIImplBase<AMDGPUTTIImpl> BaseT;
				30	typedef TargetTransformInfo TTI;
Chandler Carruth	c340ca8	2015-02-01 14:01:15 +0000	[diff] [blame]	31	friend BaseT;
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	32
				33	const AMDGPUSubtarget *ST;
Chandler Carruth	c340ca8	2015-02-01 14:01:15 +0000	[diff] [blame]	34	const AMDGPUTargetLowering *TLI;
				35
Chandler Carruth	c956ab66	2015-02-01 14:22:17 +0000	[diff] [blame]	36	const AMDGPUSubtarget *getST() const { return ST; }
Chandler Carruth	c340ca8	2015-02-01 14:01:15 +0000	[diff] [blame]	37	const AMDGPUTargetLowering *getTLI() const { return TLI; }
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	38
Matt Arsenault	9651813	2016-03-25 01:00:32 +0000	[diff] [blame]	39
				40	static inline int getFullRateInstrCost() {
				41	return TargetTransformInfo::TCC_Basic;
				42	}
				43
				44	static inline int getHalfRateInstrCost() {
				45	return 2 * TargetTransformInfo::TCC_Basic;
				46	}
				47
				48	// TODO: The size is usually 8 bytes, but takes 4x as many cycles. Maybe
				49	// should be 2 or 4.
				50	static inline int getQuarterRateInstrCost() {
				51	return 3 * TargetTransformInfo::TCC_Basic;
				52	}
				53
				54	// On some parts, normal fp64 operations are half rate, and others
				55	// quarter. This also applies to some integer operations.
				56	inline int get64BitInstrCost() const {
				57	return ST->hasHalfRate64Ops() ?
				58	getHalfRateInstrCost() : getQuarterRateInstrCost();
				59	}
				60
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	61	public:
Matt Arsenault	59c0ffa	2016-06-27 20:48:03 +0000	[diff] [blame^]	62	explicit AMDGPUTTIImpl(const AMDGPUTargetMachine *TM, const Function &F)
				63	: BaseT(TM, F.getParent()->getDataLayout()),
				64	ST(TM->getSubtargetImpl(F)),
				65	TLI(ST->getTargetLowering()) {}
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	66
				67	// Provide value semantics. MSVC requires that we spell all of these out.
				68	AMDGPUTTIImpl(const AMDGPUTTIImpl &Arg)
Chandler Carruth	c956ab66	2015-02-01 14:22:17 +0000	[diff] [blame]	69	: BaseT(static_cast<const BaseT &>(Arg)), ST(Arg.ST), TLI(Arg.TLI) {}
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	70	AMDGPUTTIImpl(AMDGPUTTIImpl &&Arg)
Chandler Carruth	c956ab66	2015-02-01 14:22:17 +0000	[diff] [blame]	71	: BaseT(std::move(static_cast<BaseT &>(Arg))), ST(std::move(Arg.ST)),
				72	TLI(std::move(Arg.TLI)) {}
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	73
				74	bool hasBranchDivergence() { return true; }
				75
Chandler Carruth	ab5cb36	2015-02-01 14:31:23 +0000	[diff] [blame]	76	void getUnrollingPreferences(Loop *L, TTI::UnrollingPreferences &UP);
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	77
				78	TTI::PopcntSupportKind getPopcntSupport(unsigned TyWidth) {
				79	assert(isPowerOf2_32(TyWidth) && "Ty width must be power of 2");
Matt Arsenault	1735da4	2016-05-18 16:10:19 +0000	[diff] [blame]	80	return TTI::PSK_FastHardware;
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	81	}
				82
				83	unsigned getNumberOfRegisters(bool Vector);
				84	unsigned getRegisterBitWidth(bool Vector);
Wei Mi	062c744	2015-05-06 17:12:25 +0000	[diff] [blame]	85	unsigned getMaxInterleaveFactor(unsigned VF);
Matt Arsenault	e830f54	2015-12-01 19:08:39 +0000	[diff] [blame]	86
Matt Arsenault	9651813	2016-03-25 01:00:32 +0000	[diff] [blame]	87	int getArithmeticInstrCost(
				88	unsigned Opcode, Type *Ty,
				89	TTI::OperandValueKind Opd1Info = TTI::OK_AnyValue,
				90	TTI::OperandValueKind Opd2Info = TTI::OK_AnyValue,
				91	TTI::OperandValueProperties Opd1PropInfo = TTI::OP_None,
				92	TTI::OperandValueProperties Opd2PropInfo = TTI::OP_None);
				93
Matt Arsenault	e05ff15	2015-12-16 18:37:19 +0000	[diff] [blame]	94	unsigned getCFInstrCost(unsigned Opcode);
				95
Matt Arsenault	e830f54	2015-12-01 19:08:39 +0000	[diff] [blame]	96	int getVectorInstrCost(unsigned Opcode, Type *ValTy, unsigned Index);
Tom Stellard	dbe374b	2015-12-15 18:04:38 +0000	[diff] [blame]	97	bool isSourceOfDivergence(const Value *V) const;
Chandler Carruth	93dcdc4	2015-01-31 11:17:59 +0000	[diff] [blame]	98	};
				99
				100	} // end namespace llvm
				101
				102	#endif