Blame - llvm/lib/Target/R600/AMDGPUISelLowering.h - toolchain/llvm-project

blob: 3dc703520cb9dfe0a43b6f45ed3e6f5f548ffe0b [file] [log] [blame]

Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	1	//===-- AMDGPUISelLowering.h - AMDGPU Lowering Interface --------*- C++ -*-===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	/// \file
				11	/// \brief Interface definition of the TargetLowering class that is common
				12	/// to all AMD GPUs.
				13	//
				14	//===----------------------------------------------------------------------===//
				15
Benjamin Kramer	a7c40ef	2014-08-13 16:26:38 +0000	[diff] [blame]	16	#ifndef LLVM_LIB_TARGET_R600_AMDGPUISELLOWERING_H
				17	#define LLVM_LIB_TARGET_R600_AMDGPUISELLOWERING_H
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	18
				19	#include "llvm/Target/TargetLowering.h"
				20
				21	namespace llvm {
				22
Tom Stellard	c026e8b	2013-06-28 15:47:08 +0000	[diff] [blame]	23	class AMDGPUMachineFunction;
Matt Arsenault	41e2f2b	2014-02-24 21:01:28 +0000	[diff] [blame]	24	class AMDGPUSubtarget;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	25	class MachineRegisterInfo;
				26
				27	class AMDGPUTargetLowering : public TargetLowering {
Matt Arsenault	41e2f2b	2014-02-24 21:01:28 +0000	[diff] [blame]	28	protected:
				29	const AMDGPUSubtarget *Subtarget;
				30
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	31	private:
Tom Stellard	04c0e98	2014-01-22 19:24:21 +0000	[diff] [blame]	32	SDValue LowerConstantInitializer(const Constant* Init, const GlobalValue *GV,
				33	const SDValue &InitPtr,
				34	SDValue Chain,
				35	SelectionDAG &DAG) const;
Tom Stellard	81d871d	2013-11-13 23:36:50 +0000	[diff] [blame]	36	SDValue LowerFrameIndex(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	d86003e	2013-08-14 23:25:00 +0000	[diff] [blame]	37	SDValue LowerEXTRACT_SUBVECTOR(SDValue Op, SelectionDAG &DAG) const;
				38	SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	39	SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	2ffc330	2013-08-26 15:05:44 +0000	[diff] [blame]	40	/// \brief Lower vector stores by merging the vector elements into an integer
				41	/// of the same bitwidth.
				42	SDValue MergeVectorStore(const SDValue &Op, SelectionDAG &DAG) const;
Matt Arsenault	1578aa7	2014-06-15 20:08:02 +0000	[diff] [blame]	45
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	46	SDValue LowerUDIVREM(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	4601093	2014-06-18 17:05:30 +0000	[diff] [blame]	47	SDValue LowerFCEIL(SDValue Op, SelectionDAG &DAG) const;
				48	SDValue LowerFTRUNC(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	e8208ec	2014-06-18 17:05:26 +0000	[diff] [blame]	49	SDValue LowerFRINT(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	692bd5e	2014-06-18 22:03:45 +0000	[diff] [blame]	50	SDValue LowerFNEARBYINT(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	4601093	2014-06-18 17:05:30 +0000	[diff] [blame]	51	SDValue LowerFFLOOR(SDValue Op, SelectionDAG &DAG) const;
				52
Tom Stellard	c947d8c	2013-10-30 17:22:05 +0000	[diff] [blame]	53	SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	54
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	55	SDValue ExpandSIGN_EXTEND_INREG(SDValue Op,
				56	unsigned BitsDiff,
				57	SelectionDAG &DAG) const;
				58	SDValue LowerSIGN_EXTEND_INREG(SDValue Op, SelectionDAG &DAG) const;
				59
Matt Arsenault	ca3976f	2014-07-15 02:06:31 +0000	[diff] [blame]	60	SDValue performStoreCombine(SDNode *N, DAGCombinerInfo &DCI) const;
Matt Arsenault	d0e0f0a	2014-06-30 17:55:48 +0000	[diff] [blame]	61	SDValue performMulCombine(SDNode *N, DAGCombinerInfo &DCI) const;
				62
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	63	protected:
Matt Arsenault	c9df794	2014-06-11 03:29:54 +0000	[diff] [blame]	64	static EVT getEquivalentMemType(LLVMContext &Context, EVT VT);
				65	static EVT getEquivalentLoadRegType(LLVMContext &Context, EVT VT);
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	66
Tom Stellard	067c815	2014-07-21 14:01:14 +0000	[diff] [blame]	67	virtual SDValue LowerGlobalAddress(AMDGPUMachineFunction *MFI, SDValue Op,
				68	SelectionDAG &DAG) const;
Matt Arsenault	83e6058	2014-07-24 17:10:35 +0000	[diff] [blame]	69
				70	/// \brief Split a vector load into a scalar load of each component.
				71	SDValue ScalarizeVectorLoad(SDValue Op, SelectionDAG &DAG) const;
				72
				73	/// \brief Split a vector load into 2 loads of half the vector.
				74	SDValue SplitVectorLoad(SDValue Op, SelectionDAG &DAG) const;
				75
				76	/// \brief Split a vector store into a scalar store of each component.
				77	SDValue ScalarizeVectorStore(SDValue Op, SelectionDAG &DAG) const;
				78
				79	/// \brief Split a vector store into 2 stores of half the vector.
Tom Stellard	af77543	2013-10-23 00:44:32 +0000	[diff] [blame]	80	SDValue SplitVectorStore(SDValue Op, SelectionDAG &DAG) const;
Matt Arsenault	83e6058	2014-07-24 17:10:35 +0000	[diff] [blame]	81
Tom Stellard	e937360	2014-01-22 19:24:14 +0000	[diff] [blame]	82	SDValue LowerLOAD(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	2ffc330	2013-08-26 15:05:44 +0000	[diff] [blame]	83	SDValue LowerSTORE(SDValue Op, SelectionDAG &DAG) const;
Jan Vesely	343cd6f0	2014-06-22 21:43:01 +0000	[diff] [blame]	84	SDValue LowerSDIVREM(SDValue Op, SelectionDAG &DAG) const;
Jan Vesely	e5ca27d	2014-08-12 17:31:20 +0000	[diff] [blame]	85	SDValue LowerDIVREM24(SDValue Op, SelectionDAG &DAG, bool sign) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	86	bool isHWTrueValue(SDValue Op) const;
				87	bool isHWFalseValue(SDValue Op) const;
				88
Tom Stellard	af77543	2013-10-23 00:44:32 +0000	[diff] [blame]	89	/// The SelectionDAGBuilder will automatically promote function arguments
				90	/// with illegal types. However, this does not work for the AMDGPU targets
				91	/// since the function arguments are stored in memory as these illegal types.
				92	/// In order to handle this properly we need to get the original type sizes
				93	/// from the LLVM IR Function and fixup the ISD::InputArg values before
				94	/// passing them to AnalyzeFormalArguments()
				95	void getOriginalFunctionArgs(SelectionDAG &DAG,
				96	const Function *F,
				97	const SmallVectorImpl<ISD::InputArg> &Ins,
				98	SmallVectorImpl<ISD::InputArg> &OrigIns) const;
Christian Konig	2c8f6d5	2013-03-07 09:03:52 +0000	[diff] [blame]	99	void AnalyzeFormalArguments(CCState &State,
				100	const SmallVectorImpl<ISD::InputArg> &Ins) const;
				101
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	102	public:
				103	AMDGPUTargetLowering(TargetMachine &TM);
				104
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	105	bool isFAbsFree(EVT VT) const override;
				106	bool isFNegFree(EVT VT) const override;
				107	bool isTruncateFree(EVT Src, EVT Dest) const override;
				108	bool isTruncateFree(Type *Src, Type *Dest) const override; // IR types are passed by pointer.
Matt Arsenault	b517c81	2014-03-27 17:23:31 +0000	[diff] [blame]	109
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	110	bool isZExtFree(Type *Src, Type *Dest) const override; // IR types are passed by pointer.
				111	bool isZExtFree(EVT Src, EVT Dest) const override;
Aaron Ballman	3c81e46	2014-06-26 13:45:47 +0000	[diff] [blame]	112	bool isZExtFree(SDValue Val, EVT VT2) const override;
Matt Arsenault	b517c81	2014-03-27 17:23:31 +0000	[diff] [blame]	113
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	114	bool isNarrowingProfitable(EVT VT1, EVT VT2) const override;
Matt Arsenault	a7f1e0c	2014-03-24 19:43:31 +0000	[diff] [blame]	115
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	116	MVT getVectorIdxTy() const override;
Matt Arsenault	1d555c4	2014-06-23 18:00:55 +0000	[diff] [blame]	117	bool isSelectSupported(SelectSupportKind) const override;
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	118
				119	bool isFPImmLegal(const APFloat &Imm, EVT VT) const override;
				120	bool ShouldShrinkFPConstant(EVT VT) const override;
				121
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	122	bool isLoadBitCastBeneficial(EVT, EVT) const override;
				123	SDValue LowerReturn(SDValue Chain, CallingConv::ID CallConv,
				124	bool isVarArg,
				125	const SmallVectorImpl<ISD::OutputArg> &Outs,
				126	const SmallVectorImpl<SDValue> &OutVals,
				127	SDLoc DL, SelectionDAG &DAG) const override;
				128	SDValue LowerCall(CallLoweringInfo &CLI,
				129	SmallVectorImpl<SDValue> &InVals) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	130
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	131	SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override;
Matt Arsenault	14d4645	2014-06-15 20:23:38 +0000	[diff] [blame]	132	SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const override;
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	133	void ReplaceNodeResults(SDNode * N,
				134	SmallVectorImpl<SDValue> &Results,
				135	SelectionDAG &DAG) const override;
Matt Arsenault	d125d74	2014-03-27 17:23:24 +0000	[diff] [blame]	136
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	137	SDValue LowerIntrinsicIABS(SDValue Op, SelectionDAG &DAG) const;
				138	SDValue LowerIntrinsicLRP(SDValue Op, SelectionDAG &DAG) const;
Tom Stellard	afa8b53	2014-05-09 16:42:16 +0000	[diff] [blame]	139	SDValue CombineMinMax(SDNode *N, SelectionDAG &DAG) const;
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	140	const char* getTargetNodeName(unsigned Opcode) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	141
Craig Topper	5656db4	2014-04-29 07:57:24 +0000	[diff] [blame]	142	virtual SDNode *PostISelFolding(MachineSDNode *N,
				143	SelectionDAG &DAG) const {
Christian Konig	d910b7d	2013-02-26 17:52:16 +0000	[diff] [blame]	144	return N; // Default implementation: hand the node back unchanged.
				145	}
				146
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	147	/// \brief Determine which of the bits specified in \p Mask are known to be
				148	/// either zero or one and return them in the \p KnownZero and \p KnownOne
				149	/// bitsets.
Jay Foad	a0653a3	2014-05-14 21:14:37 +0000	[diff] [blame]	150	void computeKnownBitsForTargetNode(const SDValue Op,
				151	APInt &KnownZero,
				152	APInt &KnownOne,
				153	const SelectionDAG &DAG,
				154	unsigned Depth = 0) const override;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	155
Matt Arsenault	bf8694d	2014-05-22 18:09:03 +0000	[diff] [blame]	156	unsigned ComputeNumSignBitsForTargetNode(
				157	SDValue Op,
				158	const SelectionDAG &DAG,
				159	unsigned Depth = 0) const override;
Tom Stellard	b02094e	2014-07-21 15:45:01 +0000	[diff] [blame]	160
				161	/// \brief Helper function that adds Reg to the LiveIn list of the DAG's
				162	/// MachineFunction.
				163	///
				164	/// \returns a RegisterSDNode representing Reg.
				165	virtual SDValue CreateLiveInRegister(SelectionDAG &DAG,
				166	const TargetRegisterClass *RC,
				167	unsigned Reg, EVT VT) const;
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	168	};
				169
				170	namespace AMDGPUISD {
				171
				172	enum {
				173	// AMDIL ISD Opcodes
				174	FIRST_NUMBER = ISD::BUILTIN_OP_END, // Numbering of the opcodes below starts at ISD::BUILTIN_OP_END.
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	175	CALL, // Function call based on a single integer
				176	UMUL, // 32bit unsigned multiplication
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	177	RET_FLAG,
				178	BRANCH_COND,
				179	// End AMDIL ISD Opcodes
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	180	DWORDADDR,
				181	FRACT,
Matt Arsenault	5d47d4a	2014-06-12 21:15:44 +0000	[diff] [blame]	182	CLAMP,
Matt Arsenault	8675db1	2014-08-29 16:01:14 +0000	[diff] [blame]	183	MAD, // Multiply + add with same result as the separate operations.
Matt Arsenault	a0050b0	2014-06-19 01:19:19 +0000	[diff] [blame]	184
				185	// SIN_HW, COS_HW - f32 for SI, 1 ULP max error, valid from -100 pi to 100 pi.
				186	// Denormals handled on some parts.
Vincent Lejeune	b55940c	2013-07-09 15:03:11 +0000	[diff] [blame]	187	COS_HW,
				188	SIN_HW,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	189	FMAX,
				190	SMAX,
				191	UMAX,
				192	FMIN,
				193	SMIN,
				194	UMIN,
				195	URECIP,
Matt Arsenault	a0050b0	2014-06-19 01:19:19 +0000	[diff] [blame]	196	DIV_SCALE,
				197	DIV_FMAS,
				198	DIV_FIXUP,
				199	TRIG_PREOP, // 1 ULP max error for f64
				200
				201	// RCP, RSQ - For f32, 1 ULP max error, no denormal handling.
				202	// For f64, max error 2^29 ULP, handles denormals.
				203	RCP,
				204	RSQ,
Matt Arsenault	257d48d	2014-06-24 22:13:39 +0000	[diff] [blame]	205	RSQ_LEGACY,
				206	RSQ_CLAMPED,
Matt Arsenault	2e7cc48	2014-08-15 17:30:25 +0000	[diff] [blame]	207	LDEXP,
Vincent Lejeune	519f21e	2013-05-17 16:50:32 +0000	[diff] [blame]	208	DOT4,
Matt Arsenault	fae0298	2014-03-17 18:58:11 +0000	[diff] [blame]	209	BFE_U32, // Extract range of bits with zero extension to 32-bits.
				210	BFE_I32, // Extract range of bits with sign extension to 32-bits.
Matt Arsenault	b345836	2014-03-31 18:21:13 +0000	[diff] [blame]	211	BFI, // (src0 & src1) | (~src0 & src2)
				212	BFM, // Insert a range of bits into a 32-bit word.
Matt Arsenault	43160e7	2014-06-18 17:13:57 +0000	[diff] [blame]	213	BREV, // Reverse bits.
Tom Stellard	50122a5	2014-04-07 19:45:41 +0000	[diff] [blame]	214	MUL_U24,
				215	MUL_I24,
Matt Arsenault	eb26020	2014-05-22 18:00:15 +0000	[diff] [blame]	216	MAD_U24,
				217	MAD_I24,
Vincent Lejeune	d3eed66	2013-05-17 16:50:20 +0000	[diff] [blame]	218	TEXTURE_FETCH,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	219	EXPORT,
Tom Stellard	ff62c35	2013-01-23 02:09:03 +0000	[diff] [blame]	220	CONST_ADDRESS,
Tom Stellard	f3b2a1e	2013-02-06 17:32:29 +0000	[diff] [blame]	221	REGISTER_LOAD,
				222	REGISTER_STORE,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	223	LOAD_INPUT,
				224	SAMPLE,
				225	SAMPLEB,
				226	SAMPLED,
				227	SAMPLEL,
Matt Arsenault	364a674	2014-06-11 17:50:44 +0000	[diff] [blame]	228
				229	// These cvt_f32_ubyte* nodes need to remain consecutive and in order.
				230	CVT_F32_UBYTE0,
				231	CVT_F32_UBYTE1,
				232	CVT_F32_UBYTE2,
				233	CVT_F32_UBYTE3,
Tom Stellard	880a80a	2014-06-17 16:53:14 +0000	[diff] [blame]	234	/// This node is for VLIW targets and it is used to represent a vector
				235	/// that is stored in consecutive registers with the same channel.
				236	/// For example:
				237	///   |X  |Y|Z|W|
				238	/// T0|v.x| | | |
				239	/// T1|v.y| | | |
				240	/// T2|v.z| | | |
				241	/// T3|v.w| | | |
				242	BUILD_VERTICAL_VECTOR,
Tom Stellard	067c815	2014-07-21 14:01:14 +0000	[diff] [blame]	243	/// Pointer to the start of the shader's constant data.
				244	CONST_DATA_PTR,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	245	FIRST_MEM_OPCODE_NUMBER = ISD::FIRST_TARGET_MEMORY_OPCODE, // Enumerators after this one continue counting from ISD::FIRST_TARGET_MEMORY_OPCODE.
Tom Stellard	d3ee8c1	2013-08-16 01:12:06 +0000	[diff] [blame]	246	STORE_MSKOR,
Tom Stellard	9fa1791	2013-08-14 23:24:45 +0000	[diff] [blame]	247	LOAD_CONSTANT,
Tom Stellard	afcf12f	2013-09-12 02:55:14 +0000	[diff] [blame]	248	TBUFFER_STORE_FORMAT,
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	249	LAST_AMDGPU_ISD_NUMBER
				250	};
				251
				252
				253	} // End namespace AMDGPUISD
				254
Tom Stellard	75aadc2	2012-12-11 21:25:42 +0000	[diff] [blame]	255	} // End namespace llvm
				256
Benjamin Kramer	a7c40ef	2014-08-13 16:26:38 +0000	[diff] [blame]	257	#endif