Blame - llvm/lib/Target/R600/AMDGPUISelLowering.h - toolchain/llvm-project

blob: 769ea97830d01e83dd5859d0ebeb77d3bfcdafc7 [file] [log] [blame]

Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	1	//===-- AMDGPUISelLowering.h - AMDGPU Lowering Interface --------*- C++ -*-===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	/// \file
				11	/// \brief Interface definition of the TargetLowering class that is common
				12	/// to all AMD GPUs.
				13	//
				14	//===----------------------------------------------------------------------===//
				15
				16	#ifndef AMDGPUISELLOWERING_H
				17	#define AMDGPUISELLOWERING_H
				18
				19	#include "llvm/Target/TargetLowering.h"
				20
				21	namespace llvm {
				22
Tom Stellard	c026e8b	2013-06-28 15:47:08 +0000	[diff] [blame]	23	class AMDGPUMachineFunction;
Matt Arsenault	41e2f2b	2014-02-24 21:01:28 +0000	[diff] [blame]	24	class AMDGPUSubtarget;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	25	class MachineRegisterInfo;
				26
				27	class AMDGPUTargetLowering : public TargetLowering {
Matt Arsenault	41e2f2b	2014-02-24 21:01:28 +0000	[diff] [blame]	28	protected:
				29	const AMDGPUSubtarget *Subtarget;
				30
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	31	private:
Tom Stellard	04c0e98	2014-01-22 19:24:21 +0000	[diff] [blame]	32	SDValue LowerConstantInitializer(const Constant* Init, const GlobalValue *GV,
				33	const SDValue &InitPtr,
				34	SDValue Chain,
				35	SelectionDAG &DAG) const;
Tom Stellard	81d871d	2013-11-13 23:36:50 +0000	[diff] [blame]	36	SDValue LowerFrameIndex(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	d86003e	2013-08-14 23:25:00 +0000	[diff] [blame]	37	SDValue LowerEXTRACT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const;
				38	SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	39	SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	2ffc330	2013-08-26 15:05:44 +0000	[diff] [blame]	40	/// \brief Lower vector stores by merging the vector elements into an integer
				41	/// of the same bitwidth.
				42	SDValue MergeVectorStore(const SDValue &Op, SelectionDAG &DAG) const;
				43	/// \brief Split a vector store into multiple scalar stores.
Matt Arsenault	209a7b9	2014-04-18 07:40:20 +0000	[diff] [blame]	44	/// \returns The resulting chain.
Matt Arsenault	1578aa7	2014-06-15 20:08:02 +0000	[diff] [blame]	45
				46	SDValue LowerSDIV(SDValue Op, SelectionDAG &DAG) const;
				47	SDValue LowerSDIV24(SDValue Op, SelectionDAG &DAG) const;
				48	SDValue LowerSDIV32(SDValue Op, SelectionDAG &DAG) const;
				49	SDValue LowerSDIV64(SDValue Op, SelectionDAG &DAG) const;
				50	SDValue LowerSREM(SDValue Op, SelectionDAG &DAG) const;
				51	SDValue LowerSREM32(SDValue Op, SelectionDAG &DAG) const;
				52	SDValue LowerSREM64(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	53	SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	4601093	2014-06-18 17:05:30 +0000	[diff] [blame]	54	SDValue LowerFCEIL(SDValue Op, SelectionDAG &DAG) const;
				55	SDValue LowerFTRUNC(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	e8208ec	2014-06-18 17:05:26 +0000	[diff] [blame]	56	SDValue LowerFRINT(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	692bd5e	2014-06-18 22:03:45 +0000	[diff] [blame]	57	SDValue LowerFNEARBYINT(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	4601093	2014-06-18 17:05:30 +0000	[diff] [blame]	58	SDValue LowerFFLOOR(SDValue Op, SelectionDAG &DAG) const;
				59
Tom Stellard	c947d8c	2013-10-30 17:22:05 +0000	[diff] [blame]	60	SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	61
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	62	SDValue ExpandSIGN_EXTEND_INREG(SDValue Op,
				63	unsigned BitsDiff,
				64	SelectionDAG &DAG) const;
				65	SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const;
				66
Matt Arsenault	ca3976f	2014-07-15 02:06:31 +0000	[diff] [blame]	67	SDValue performStoreCombine(SDNode *N, DAGCombinerInfo &DCI) const;
Matt Arsenault	d0e0f0a	2014-06-30 17:55:48 +0000	[diff] [blame]	68	SDValue performMulCombine(SDNode *N, DAGCombinerInfo &DCI) const;
				69
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	70	protected:
Matt Arsenault	c9df794	2014-06-11 03:29:54 +0000	[diff] [blame]	71	static EVT getEquivalentMemType(LLVMContext &Context, EVT VT);
				72	static EVT getEquivalentLoadRegType(LLVMContext &Context, EVT VT);
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	73
Tom Stellard	067c815	2014-07-21 14:01:14 +0000	[diff] [blame]	74	virtual SDValue LowerGlobalAddress(AMDGPUMachineFunction *MFI, SDValue Op,
				75	SelectionDAG &DAG) const;
Matt Arsenault	83e6058	2014-07-24 17:10:35 +0000	[diff] [blame^]	76
				77	/// \brief Split a vector load into a scalar load of each component.
				78	SDValue ScalarizeVectorLoad(SDValue Op, SelectionDAG &DAG) const;
				79
				80	/// \brief Split a vector load into 2 loads of half the vector.
				81	SDValue SplitVectorLoad(SDValue Op, SelectionDAG &DAG) const;
				82
				83	/// \brief Split a vector store into a scalar store of each component.
				84	SDValue ScalarizeVectorStore(SDValue Op, SelectionDAG &DAG) const;
				85
				86	/// \brief Split a vector store into 2 stores of half the vector.
Tom Stellard	af77543	2013-10-23 00:44:32 +0000	[diff] [blame]	87	SDValue SplitVectorStore(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	83e6058	2014-07-24 17:10:35 +0000	[diff] [blame^]	88
Tom Stellard	e937360	2014-01-22 19:24:14 +0000	[diff] [blame]	89	SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	2ffc330	2013-08-26 15:05:44 +0000	[diff] [blame]	90	SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;
Jan Vesely	343cd6f0	2014-06-22 21:43:01 +0000	[diff] [blame]	91	SDValue LowerSDIVREM(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	92	bool isHWTrueValue(SDValue Op) const;
				93	bool isHWFalseValue(SDValue Op) const;
				94
Tom Stellard	af77543	2013-10-23 00:44:32 +0000	[diff] [blame]	95	/// The SelectionDAGBuilder will automatically promote function arguments
				96	/// with illegal types. However, this does not work for the AMDGPU targets
				97	/// since the function arguments are stored in memory as these illegal types.
				98	/// In order to handle this properly we need to get the origianl types sizes
				99	/// from the LLVM IR Function and fixup the ISD:InputArg values before
				100	/// passing them to AnalyzeFormalArguments()
				101	void getOriginalFunctionArgs(SelectionDAG &DAG,
				102	const Function *F,
				103	const SmallVectorImpl<ISD::InputArg> &Ins,
				104	SmallVectorImpl<ISD::InputArg> &OrigIns) const;
Christian Konig	2c8f6d5	2013-03-07 09:03:52 +0000	[diff] [blame]	105	void AnalyzeFormalArguments(CCState &State,
				106	const SmallVectorImpl<ISD::InputArg> &Ins) const;
				107
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	108	public:
				109	AMDGPUTargetLowering(TargetMachine &TM);
				110
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	111	bool isFAbsFree(EVT VT) const override;
				112	bool isFNegFree(EVT VT) const override;
				113	bool isTruncateFree(EVT Src, EVT Dest) const override;
				114	bool isTruncateFree(Type Src, Type Dest) const override;
Matt Arsenault	b517c81	2014-03-27 17:23:31 +0000	[diff] [blame]	115
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	116	bool isZExtFree(Type Src, Type Dest) const override;
				117	bool isZExtFree(EVT Src, EVT Dest) const override;
Aaron Ballman	3c81e46	2014-06-26 13:45:47 +0000	[diff] [blame]	118	bool isZExtFree(SDValue Val, EVT VT2) const override;
Matt Arsenault	b517c81	2014-03-27 17:23:31 +0000	[diff] [blame]	119
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	120	bool isNarrowingProfitable(EVT VT1, EVT VT2) const override;
Matt Arsenault	a7f1e0c	2014-03-24 19:43:31 +0000	[diff] [blame]	121
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	122	MVT getVectorIdxTy() const override;
Matt Arsenault	1d555c4	2014-06-23 18:00:55 +0000	[diff] [blame]	123	bool isSelectSupported(SelectSupportKind) const override;
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	124
				125	bool isFPImmLegal(const APFloat &Imm, EVT VT) const override;
				126	bool ShouldShrinkFPConstant(EVT VT) const override;
				127
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	128	bool isLoadBitCastBeneficial(EVT, EVT) const override;
				129	SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv,
				130	bool isVarArg,
				131	const SmallVectorImpl<ISD::OutputArg> &Outs,
				132	const SmallVectorImpl<SDValue> &OutVals,
				133	SDLoc DL, SelectionDAG &DAG) const override;
				134	SDValue LowerCall(CallLoweringInfo &CLI,
				135	SmallVectorImpl<SDValue> &InVals) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	136
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	137	SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	138	SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	139	void ReplaceNodeResults(SDNode * N,
				140	SmallVectorImpl<SDValue> &Results,
				141	SelectionDAG &DAG) const override;
Matt Arsenault	d125d74	2014-03-27 17:23:24 +0000	[diff] [blame]	142
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	143	SDValue LowerIntrinsicIABS(SDValue Op, SelectionDAG &DAG) const;
				144	SDValue LowerIntrinsicLRP(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	afa8b53	2014-05-09 16:42:16 +0000	[diff] [blame]	145	SDValue CombineMinMax(SDNode *N, SelectionDAG &DAG) const;
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	146	const char* getTargetNodeName(unsigned Opcode) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	147
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	148	virtual SDNode PostISelFolding(MachineSDNode N,
				149	SelectionDAG &DAG) const {
Christian Konig	d910b7d	2013-02-26 17:52:16 +0000	[diff] [blame]	150	return N;
				151	}
				152
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	153	/// \brief Determine which of the bits specified in \p Mask are known to be
				154	/// either zero or one and return them in the \p KnownZero and \p KnownOne
				155	/// bitsets.
Jay Foad	a0653a3	2014-05-14 21:14:37 +0000	[diff] [blame]	156	void computeKnownBitsForTargetNode(const SDValue Op,
				157	APInt &KnownZero,
				158	APInt &KnownOne,
				159	const SelectionDAG &DAG,
				160	unsigned Depth = 0) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	161
Matt Arsenault	bf8694d	2014-05-22 18:09:03 +0000	[diff] [blame]	162	virtual unsigned ComputeNumSignBitsForTargetNode(
				163	SDValue Op,
				164	const SelectionDAG &DAG,
				165	unsigned Depth = 0) const override;
Tom Stellard	b02094e	2014-07-21 15:45:01 +0000	[diff] [blame]	166
				167	/// \brief Helper function that adds Reg to the LiveIn list of the DAG's
				168	/// MachineFunction.
				169	///
				170	/// \returns a RegisterSDNode representing Reg.
				171	virtual SDValue CreateLiveInRegister(SelectionDAG &DAG,
				172	const TargetRegisterClass *RC,
				173	unsigned Reg, EVT VT) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	174	};
				175
				176	namespace AMDGPUISD {
				177
				178	enum {
				179	// AMDIL ISD Opcodes
				180	FIRST_NUMBER = ISD::BUILTIN_OP_END,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	181	CALL, // Function call based on a single integer
				182	UMUL, // 32bit unsigned multiplication
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	183	RET_FLAG,
				184	BRANCH_COND,
				185	// End AMDIL ISD Opcodes
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	186	DWORDADDR,
				187	FRACT,
Matt Arsenault	5d47d4a	2014-06-12 21:15:44 +0000	[diff] [blame]	188	CLAMP,
Matt Arsenault	a0050b0	2014-06-19 01:19:19 +0000	[diff] [blame]	189
				190	// SIN_HW, COS_HW - f32 for SI, 1 ULP max error, valid from -100 pi to 100 pi.
				191	// Denormals handled on some parts.
Vincent Lejeune	b55940c	2013-07-09 15:03:11 +0000	[diff] [blame]	192	COS_HW,
				193	SIN_HW,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	194	FMAX,
				195	SMAX,
				196	UMAX,
				197	FMIN,
				198	SMIN,
				199	UMIN,
				200	URECIP,
Matt Arsenault	a0050b0	2014-06-19 01:19:19 +0000	[diff] [blame]	201	DIV_SCALE,
				202	DIV_FMAS,
				203	DIV_FIXUP,
				204	TRIG_PREOP, // 1 ULP max error for f64
				205
				206	// RCP, RSQ - For f32, 1 ULP max error, no denormal handling.
				207	// For f64, max error 2^29 ULP, handles denormals.
				208	RCP,
				209	RSQ,
Matt Arsenault	257d48d	2014-06-24 22:13:39 +0000	[diff] [blame]	210	RSQ_LEGACY,
				211	RSQ_CLAMPED,
Vincent Lejeune	519f21e	2013-05-17 16:50:32 +0000	[diff] [blame]	212	DOT4,
Matt Arsenault	fae0298	2014-03-17 18:58:11 +0000	[diff] [blame]	213	BFE_U32, // Extract range of bits with zero extension to 32-bits.
				214	BFE_I32, // Extract range of bits with sign extension to 32-bits.
Matt Arsenault	b345836	2014-03-31 18:21:13 +0000	[diff] [blame]	215	BFI, // (src0 & src1) \| (~src0 & src2)
				216	BFM, // Insert a range of bits into a 32-bit word.
Matt Arsenault	43160e7	2014-06-18 17:13:57 +0000	[diff] [blame]	217	BREV, // Reverse bits.
Tom Stellard	50122a5	2014-04-07 19:45:41 +0000	[diff] [blame]	218	MUL_U24,
				219	MUL_I24,
Matt Arsenault	eb26020	2014-05-22 18:00:15 +0000	[diff] [blame]	220	MAD_U24,
				221	MAD_I24,
Vincent Lejeune	d3eed66	2013-05-17 16:50:20 +0000	[diff] [blame]	222	TEXTURE_FETCH,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	223	EXPORT,
Tom Stellard	ff62c35	2013-01-23 02:09:03 +0000	[diff] [blame]	224	CONST_ADDRESS,
Tom Stellard	f3b2a1e	2013-02-06 17:32:29 +0000	[diff] [blame]	225	REGISTER_LOAD,
				226	REGISTER_STORE,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	227	LOAD_INPUT,
				228	SAMPLE,
				229	SAMPLEB,
				230	SAMPLED,
				231	SAMPLEL,
Matt Arsenault	364a674	2014-06-11 17:50:44 +0000	[diff] [blame]	232
				233	// These cvt_f32_ubyte* nodes need to remain consecutive and in order.
				234	CVT_F32_UBYTE0,
				235	CVT_F32_UBYTE1,
				236	CVT_F32_UBYTE2,
				237	CVT_F32_UBYTE3,
Tom Stellard	880a80a	2014-06-17 16:53:14 +0000	[diff] [blame]	238	/// This node is for VLIW targets and it is used to represent a vector
				239	/// that is stored in consecutive registers with the same channel.
				240	/// For example:
				241	/// \|X \|Y\|Z\|W\|
				242	/// T0\|v.x\| \| \| \|
				243	/// T1\|v.y\| \| \| \|
				244	/// T2\|v.z\| \| \| \|
				245	/// T3\|v.w\| \| \| \|
				246	BUILD_VERTICAL_VECTOR,
Tom Stellard	067c815	2014-07-21 14:01:14 +0000	[diff] [blame]	247	/// Pointer to the start of the shader's constant data.
				248	CONST_DATA_PTR,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	249	FIRST_MEM_OPCODE_NUMBER = ISD::FIRST_TARGET_MEMORY_OPCODE,
Tom Stellard	d3ee8c1	2013-08-16 01:12:06 +0000	[diff] [blame]	250	STORE_MSKOR,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	251	LOAD_CONSTANT,
Tom Stellard	afcf12f	2013-09-12 02:55:14 +0000	[diff] [blame]	252	TBUFFER_STORE_FORMAT,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	253	LAST_AMDGPU_ISD_NUMBER
				254	};
				255
				256
				257	} // End namespace AMDGPUISD
				258
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	259	} // End namespace llvm
				260
				261	#endif // AMDGPUISELLOWERING_H