Blame - llvm/lib/Target/R600/AMDGPUISelLowering.h - toolchain/llvm-project

blob: 84cb52282f87de59d061bf232a0f45786475ee54 [file] [log] [blame]

Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	1	//===-- AMDGPUISelLowering.h - AMDGPU Lowering Interface --------- C++ --===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	/// \file
				11	/// \brief Interface definition of the TargetLowering class that is common
				12	/// to all AMD GPUs.
				13	//
				14	//===----------------------------------------------------------------------===//
				15
Benjamin Kramer	a7c40ef	2014-08-13 16:26:38 +0000	[diff] [blame]	16	#ifndef LLVM_LIB_TARGET_R600_AMDGPUISELLOWERING_H
				17	#define LLVM_LIB_TARGET_R600_AMDGPUISELLOWERING_H
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	18
				19	#include "llvm/Target/TargetLowering.h"
				20
				21	namespace llvm {
				22
Tom Stellard	c026e8b	2013-06-28 15:47:08 +0000	[diff] [blame]	23	class AMDGPUMachineFunction;
Matt Arsenault	41e2f2b	2014-02-24 21:01:28 +0000	[diff] [blame]	24	class AMDGPUSubtarget;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	25	class MachineRegisterInfo;
				26
				27	class AMDGPUTargetLowering : public TargetLowering {
Matt Arsenault	41e2f2b	2014-02-24 21:01:28 +0000	[diff] [blame]	28	protected:
				29	const AMDGPUSubtarget *Subtarget;
				30
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	31	private:
Tom Stellard	04c0e98	2014-01-22 19:24:21 +0000	[diff] [blame]	32	SDValue LowerConstantInitializer(const Constant* Init, const GlobalValue *GV,
				33	const SDValue &InitPtr,
				34	SDValue Chain,
				35	SelectionDAG &DAG) const;
Tom Stellard	81d871d	2013-11-13 23:36:50 +0000	[diff] [blame]	36	SDValue LowerFrameIndex(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	d86003e	2013-08-14 23:25:00 +0000	[diff] [blame]	37	SDValue LowerEXTRACT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const;
				38	SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	39	SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	2ffc330	2013-08-26 15:05:44 +0000	[diff] [blame]	40	/// \brief Lower vector stores by merging the vector elements into an integer
				41	/// of the same bitwidth.
				42	SDValue MergeVectorStore(const SDValue &Op, SelectionDAG &DAG) const;
				43	/// \brief Split a vector store into multiple scalar stores.
Matt Arsenault	209a7b9	2014-04-18 07:40:20 +0000	[diff] [blame]	44	/// \returns The resulting chain.
Matt Arsenault	1578aa7	2014-06-15 20:08:02 +0000	[diff] [blame]	45
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	46	SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	16e3133	2014-09-10 21:44:27 +0000	[diff] [blame]	47	SDValue LowerFREM(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	4601093	2014-06-18 17:05:30 +0000	[diff] [blame]	48	SDValue LowerFCEIL(SDValue Op, SelectionDAG &DAG) const;
				49	SDValue LowerFTRUNC(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	e8208ec	2014-06-18 17:05:26 +0000	[diff] [blame]	50	SDValue LowerFRINT(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	692bd5e	2014-06-18 22:03:45 +0000	[diff] [blame]	51	SDValue LowerFNEARBYINT(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	4601093	2014-06-18 17:05:30 +0000	[diff] [blame]	52	SDValue LowerFFLOOR(SDValue Op, SelectionDAG &DAG) const;
				53
Matt Arsenault	f7c95e3	2014-10-03 23:54:41 +0000	[diff] [blame^]	54	SDValue LowerINT_TO_FP64(SDValue Op, SelectionDAG &DAG, bool Signed) const;
Tom Stellard	c947d8c	2013-10-30 17:22:05 +0000	[diff] [blame]	55	SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	f7c95e3	2014-10-03 23:54:41 +0000	[diff] [blame^]	56	SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	57
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	58	SDValue ExpandSIGN_EXTEND_INREG(SDValue Op,
				59	unsigned BitsDiff,
				60	SelectionDAG &DAG) const;
				61	SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const;
				62
Matt Arsenault	ca3976f	2014-07-15 02:06:31 +0000	[diff] [blame]	63	SDValue performStoreCombine(SDNode *N, DAGCombinerInfo &DCI) const;
Matt Arsenault	d0e0f0a	2014-06-30 17:55:48 +0000	[diff] [blame]	64	SDValue performMulCombine(SDNode *N, DAGCombinerInfo &DCI) const;
				65
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	66	protected:
Matt Arsenault	c9df794	2014-06-11 03:29:54 +0000	[diff] [blame]	67	static EVT getEquivalentMemType(LLVMContext &Context, EVT VT);
				68	static EVT getEquivalentLoadRegType(LLVMContext &Context, EVT VT);
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	69
Tom Stellard	067c815	2014-07-21 14:01:14 +0000	[diff] [blame]	70	virtual SDValue LowerGlobalAddress(AMDGPUMachineFunction *MFI, SDValue Op,
				71	SelectionDAG &DAG) const;
Matt Arsenault	83e6058	2014-07-24 17:10:35 +0000	[diff] [blame]	72
				73	/// \brief Split a vector load into a scalar load of each component.
				74	SDValue ScalarizeVectorLoad(SDValue Op, SelectionDAG &DAG) const;
				75
				76	/// \brief Split a vector load into 2 loads of half the vector.
				77	SDValue SplitVectorLoad(SDValue Op, SelectionDAG &DAG) const;
				78
				79	/// \brief Split a vector store into a scalar store of each component.
				80	SDValue ScalarizeVectorStore(SDValue Op, SelectionDAG &DAG) const;
				81
				82	/// \brief Split a vector store into 2 stores of half the vector.
Tom Stellard	af77543	2013-10-23 00:44:32 +0000	[diff] [blame]	83	SDValue SplitVectorStore(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	83e6058	2014-07-24 17:10:35 +0000	[diff] [blame]	84
Tom Stellard	e937360	2014-01-22 19:24:14 +0000	[diff] [blame]	85	SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	2ffc330	2013-08-26 15:05:44 +0000	[diff] [blame]	86	SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;
Jan Vesely	343cd6f0	2014-06-22 21:43:01 +0000	[diff] [blame]	87	SDValue LowerSDIVREM(SDValue Op, SelectionDAG &DAG) const;
Jan Vesely	e5ca27d	2014-08-12 17:31:20 +0000	[diff] [blame]	88	SDValue LowerDIVREM24(SDValue Op, SelectionDAG &DAG, bool sign) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	89	bool isHWTrueValue(SDValue Op) const;
				90	bool isHWFalseValue(SDValue Op) const;
				91
Tom Stellard	af77543	2013-10-23 00:44:32 +0000	[diff] [blame]	92	/// The SelectionDAGBuilder will automatically promote function arguments
				93	/// with illegal types. However, this does not work for the AMDGPU targets
				94	/// since the function arguments are stored in memory as these illegal types.
				95	/// In order to handle this properly we need to get the origianl types sizes
				96	/// from the LLVM IR Function and fixup the ISD:InputArg values before
				97	/// passing them to AnalyzeFormalArguments()
				98	void getOriginalFunctionArgs(SelectionDAG &DAG,
				99	const Function *F,
				100	const SmallVectorImpl<ISD::InputArg> &Ins,
				101	SmallVectorImpl<ISD::InputArg> &OrigIns) const;
Christian Konig	2c8f6d5	2013-03-07 09:03:52 +0000	[diff] [blame]	102	void AnalyzeFormalArguments(CCState &State,
				103	const SmallVectorImpl<ISD::InputArg> &Ins) const;
				104
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	105	public:
				106	AMDGPUTargetLowering(TargetMachine &TM);
				107
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	108	bool isFAbsFree(EVT VT) const override;
				109	bool isFNegFree(EVT VT) const override;
				110	bool isTruncateFree(EVT Src, EVT Dest) const override;
				111	bool isTruncateFree(Type Src, Type Dest) const override;
Matt Arsenault	b517c81	2014-03-27 17:23:31 +0000	[diff] [blame]	112
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	113	bool isZExtFree(Type Src, Type Dest) const override;
				114	bool isZExtFree(EVT Src, EVT Dest) const override;
Aaron Ballman	3c81e46	2014-06-26 13:45:47 +0000	[diff] [blame]	115	bool isZExtFree(SDValue Val, EVT VT2) const override;
Matt Arsenault	b517c81	2014-03-27 17:23:31 +0000	[diff] [blame]	116
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	117	bool isNarrowingProfitable(EVT VT1, EVT VT2) const override;
Matt Arsenault	a7f1e0c	2014-03-24 19:43:31 +0000	[diff] [blame]	118
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	119	MVT getVectorIdxTy() const override;
Matt Arsenault	1d555c4	2014-06-23 18:00:55 +0000	[diff] [blame]	120	bool isSelectSupported(SelectSupportKind) const override;
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	121
				122	bool isFPImmLegal(const APFloat &Imm, EVT VT) const override;
				123	bool ShouldShrinkFPConstant(EVT VT) const override;
				124
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	125	bool isLoadBitCastBeneficial(EVT, EVT) const override;
				126	SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv,
				127	bool isVarArg,
				128	const SmallVectorImpl<ISD::OutputArg> &Outs,
				129	const SmallVectorImpl<SDValue> &OutVals,
				130	SDLoc DL, SelectionDAG &DAG) const override;
				131	SDValue LowerCall(CallLoweringInfo &CLI,
				132	SmallVectorImpl<SDValue> &InVals) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	133
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	134	SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	135	SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	136	void ReplaceNodeResults(SDNode * N,
				137	SmallVectorImpl<SDValue> &Results,
				138	SelectionDAG &DAG) const override;
Matt Arsenault	d125d74	2014-03-27 17:23:24 +0000	[diff] [blame]	139
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	140	SDValue LowerIntrinsicIABS(SDValue Op, SelectionDAG &DAG) const;
				141	SDValue LowerIntrinsicLRP(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	afa8b53	2014-05-09 16:42:16 +0000	[diff] [blame]	142	SDValue CombineMinMax(SDNode *N, SelectionDAG &DAG) const;
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	143	const char* getTargetNodeName(unsigned Opcode) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	144
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	145	virtual SDNode PostISelFolding(MachineSDNode N,
				146	SelectionDAG &DAG) const {
Christian Konig	d910b7d	2013-02-26 17:52:16 +0000	[diff] [blame]	147	return N;
				148	}
				149
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	150	/// \brief Determine which of the bits specified in \p Mask are known to be
				151	/// either zero or one and return them in the \p KnownZero and \p KnownOne
				152	/// bitsets.
Jay Foad	a0653a3	2014-05-14 21:14:37 +0000	[diff] [blame]	153	void computeKnownBitsForTargetNode(const SDValue Op,
				154	APInt &KnownZero,
				155	APInt &KnownOne,
				156	const SelectionDAG &DAG,
				157	unsigned Depth = 0) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	158
Benjamin Kramer	8c90fd7	2014-09-03 11:41:21 +0000	[diff] [blame]	159	unsigned ComputeNumSignBitsForTargetNode(SDValue Op, const SelectionDAG &DAG,
				160	unsigned Depth = 0) const override;
Tom Stellard	b02094e	2014-07-21 15:45:01 +0000	[diff] [blame]	161
				162	/// \brief Helper function that adds Reg to the LiveIn list of the DAG's
				163	/// MachineFunction.
				164	///
				165	/// \returns a RegisterSDNode representing Reg.
				166	virtual SDValue CreateLiveInRegister(SelectionDAG &DAG,
				167	const TargetRegisterClass *RC,
				168	unsigned Reg, EVT VT) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	169	};
				170
				171	namespace AMDGPUISD {
				172
				173	enum {
				174	// AMDIL ISD Opcodes
				175	FIRST_NUMBER = ISD::BUILTIN_OP_END,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	176	CALL, // Function call based on a single integer
				177	UMUL, // 32bit unsigned multiplication
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	178	RET_FLAG,
				179	BRANCH_COND,
				180	// End AMDIL ISD Opcodes
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	181	DWORDADDR,
				182	FRACT,
Matt Arsenault	5d47d4a	2014-06-12 21:15:44 +0000	[diff] [blame]	183	CLAMP,
Matt Arsenault	8675db1	2014-08-29 16:01:14 +0000	[diff] [blame]	184	MAD, // Multiply + add with same result as the separate operations.
Matt Arsenault	a0050b0	2014-06-19 01:19:19 +0000	[diff] [blame]	185
				186	// SIN_HW, COS_HW - f32 for SI, 1 ULP max error, valid from -100 pi to 100 pi.
				187	// Denormals handled on some parts.
Vincent Lejeune	b55940c	2013-07-09 15:03:11 +0000	[diff] [blame]	188	COS_HW,
				189	SIN_HW,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	190	FMAX,
				191	SMAX,
				192	UMAX,
				193	FMIN,
				194	SMIN,
				195	UMIN,
				196	URECIP,
Matt Arsenault	a0050b0	2014-06-19 01:19:19 +0000	[diff] [blame]	197	DIV_SCALE,
				198	DIV_FMAS,
				199	DIV_FIXUP,
				200	TRIG_PREOP, // 1 ULP max error for f64
				201
				202	// RCP, RSQ - For f32, 1 ULP max error, no denormal handling.
				203	// For f64, max error 2^29 ULP, handles denormals.
				204	RCP,
				205	RSQ,
Matt Arsenault	257d48d	2014-06-24 22:13:39 +0000	[diff] [blame]	206	RSQ_LEGACY,
				207	RSQ_CLAMPED,
Matt Arsenault	2e7cc48	2014-08-15 17:30:25 +0000	[diff] [blame]	208	LDEXP,
Vincent Lejeune	519f21e	2013-05-17 16:50:32 +0000	[diff] [blame]	209	DOT4,
Matt Arsenault	fae0298	2014-03-17 18:58:11 +0000	[diff] [blame]	210	BFE_U32, // Extract range of bits with zero extension to 32-bits.
				211	BFE_I32, // Extract range of bits with sign extension to 32-bits.
Matt Arsenault	b345836	2014-03-31 18:21:13 +0000	[diff] [blame]	212	BFI, // (src0 & src1) \| (~src0 & src2)
				213	BFM, // Insert a range of bits into a 32-bit word.
Matt Arsenault	43160e7	2014-06-18 17:13:57 +0000	[diff] [blame]	214	BREV, // Reverse bits.
Tom Stellard	50122a5	2014-04-07 19:45:41 +0000	[diff] [blame]	215	MUL_U24,
				216	MUL_I24,
Matt Arsenault	eb26020	2014-05-22 18:00:15 +0000	[diff] [blame]	217	MAD_U24,
				218	MAD_I24,
Vincent Lejeune	d3eed66	2013-05-17 16:50:20 +0000	[diff] [blame]	219	TEXTURE_FETCH,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	220	EXPORT,
Tom Stellard	ff62c35	2013-01-23 02:09:03 +0000	[diff] [blame]	221	CONST_ADDRESS,
Tom Stellard	f3b2a1e	2013-02-06 17:32:29 +0000	[diff] [blame]	222	REGISTER_LOAD,
				223	REGISTER_STORE,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	224	LOAD_INPUT,
				225	SAMPLE,
				226	SAMPLEB,
				227	SAMPLED,
				228	SAMPLEL,
Matt Arsenault	364a674	2014-06-11 17:50:44 +0000	[diff] [blame]	229
				230	// These cvt_f32_ubyte* nodes need to remain consecutive and in order.
				231	CVT_F32_UBYTE0,
				232	CVT_F32_UBYTE1,
				233	CVT_F32_UBYTE2,
				234	CVT_F32_UBYTE3,
Tom Stellard	880a80a	2014-06-17 16:53:14 +0000	[diff] [blame]	235	/// This node is for VLIW targets and it is used to represent a vector
				236	/// that is stored in consecutive registers with the same channel.
				237	/// For example:
				238	/// \|X \|Y\|Z\|W\|
				239	/// T0\|v.x\| \| \| \|
				240	/// T1\|v.y\| \| \| \|
				241	/// T2\|v.z\| \| \| \|
				242	/// T3\|v.w\| \| \| \|
				243	BUILD_VERTICAL_VECTOR,
Tom Stellard	067c815	2014-07-21 14:01:14 +0000	[diff] [blame]	244	/// Pointer to the start of the shader's constant data.
				245	CONST_DATA_PTR,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	246	FIRST_MEM_OPCODE_NUMBER = ISD::FIRST_TARGET_MEMORY_OPCODE,
Tom Stellard	d3ee8c1	2013-08-16 01:12:06 +0000	[diff] [blame]	247	STORE_MSKOR,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	248	LOAD_CONSTANT,
Tom Stellard	afcf12f	2013-09-12 02:55:14 +0000	[diff] [blame]	249	TBUFFER_STORE_FORMAT,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	250	LAST_AMDGPU_ISD_NUMBER
				251	};
				252
				253
				254	} // End namespace AMDGPUISD
				255
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	256	} // End namespace llvm
				257
Benjamin Kramer	a7c40ef	2014-08-13 16:26:38 +0000	[diff] [blame]	258	#endif