blob: b99a09be7cede1b36a2836f7ed260cfc1ae314d3 [file] [log] [blame]
Dan Gohmanf17a25c2007-07-18 16:29:46 +00001//===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner081ce942007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Dan Gohmanf17a25c2007-07-18 16:29:46 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file defines the interfaces that X86 uses to lower LLVM code into a
11// selection DAG.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef X86ISELLOWERING_H
16#define X86ISELLOWERING_H
17
18#include "X86Subtarget.h"
19#include "X86RegisterInfo.h"
Gordon Henriksen18ace102008-01-05 16:56:59 +000020#include "X86MachineFunctionInfo.h"
Dan Gohmanf17a25c2007-07-18 16:29:46 +000021#include "llvm/Target/TargetLowering.h"
22#include "llvm/CodeGen/SelectionDAG.h"
Rafael Espindoladdb88da2007-08-31 15:06:30 +000023#include "llvm/CodeGen/CallingConvLower.h"
Dan Gohmanf17a25c2007-07-18 16:29:46 +000024
25namespace llvm {
26 namespace X86ISD {
27 // X86 Specific DAG Nodes
28 enum NodeType {
29 // Start the numbering where the builtin ops leave off.
30 FIRST_NUMBER = ISD::BUILTIN_OP_END+X86::INSTRUCTION_LIST_END,
31
Evan Cheng48679f42007-12-14 02:13:44 +000032 /// BSF - Bit scan forward.
33 /// BSR - Bit scan reverse.
34 BSF,
35 BSR,
36
Dan Gohmanf17a25c2007-07-18 16:29:46 +000037 /// SHLD, SHRD - Double shift instructions. These correspond to
38 /// X86::SHLDxx and X86::SHRDxx instructions.
39 SHLD,
40 SHRD,
41
42 /// FAND - Bitwise logical AND of floating point values. This corresponds
43 /// to X86::ANDPS or X86::ANDPD.
44 FAND,
45
46 /// FOR - Bitwise logical OR of floating point values. This corresponds
47 /// to X86::ORPS or X86::ORPD.
48 FOR,
49
50 /// FXOR - Bitwise logical XOR of floating point values. This corresponds
51 /// to X86::XORPS or X86::XORPD.
52 FXOR,
53
54 /// FSRL - Bitwise logical right shift of floating point values. These
55 /// corresponds to X86::PSRLDQ.
56 FSRL,
57
58 /// FILD, FILD_FLAG - This instruction implements SINT_TO_FP with the
59 /// integer source in memory and FP reg result. This corresponds to the
60 /// X86::FILD*m instructions. It has three inputs (token chain, address,
61 /// and source type) and two outputs (FP value and token chain). FILD_FLAG
62 /// also produces a flag).
63 FILD,
64 FILD_FLAG,
65
66 /// FP_TO_INT*_IN_MEM - This instruction implements FP_TO_SINT with the
67 /// integer destination in memory and a FP reg source. This corresponds
68 /// to the X86::FIST*m instructions and the rounding mode change stuff. It
69 /// has two inputs (token chain and address) and two outputs (int value
70 /// and token chain).
71 FP_TO_INT16_IN_MEM,
72 FP_TO_INT32_IN_MEM,
73 FP_TO_INT64_IN_MEM,
74
75 /// FLD - This instruction implements an extending load to FP stack slots.
76 /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain
77 /// operand, ptr to load from, and a ValueType node indicating the type
78 /// to load to.
79 FLD,
80
81 /// FST - This instruction implements a truncating store to FP stack
82 /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a
83 /// chain operand, value to store, address, and a ValueType to store it
84 /// as.
85 FST,
86
Dan Gohmanf17a25c2007-07-18 16:29:46 +000087 /// CALL/TAILCALL - These operations represent an abstract X86 call
88 /// instruction, which includes a bunch of information. In particular the
89 /// operands of these node are:
90 ///
91 /// #0 - The incoming token chain
92 /// #1 - The callee
93 /// #2 - The number of arg bytes the caller pushes on the stack.
94 /// #3 - The number of arg bytes the callee pops off the stack.
95 /// #4 - The value to pass in AL/AX/EAX (optional)
96 /// #5 - The value to pass in DL/DX/EDX (optional)
97 ///
98 /// The result values of these nodes are:
99 ///
100 /// #0 - The outgoing token chain
101 /// #1 - The first register result value (optional)
102 /// #2 - The second register result value (optional)
103 ///
104 /// The CALL vs TAILCALL distinction boils down to whether the callee is
105 /// known not to modify the caller's stack frame, as is standard with
106 /// LLVM.
107 CALL,
108 TAILCALL,
109
110 /// RDTSC_DAG - This operation implements the lowering for
111 /// readcyclecounter
112 RDTSC_DAG,
113
114 /// X86 compare and logical compare instructions.
Evan Cheng904febe2007-09-17 17:42:53 +0000115 CMP, COMI, UCOMI,
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000116
117 /// X86 SetCC. Operand 1 is condition code, and operand 2 is the flag
118 /// operand produced by a CMP instruction.
119 SETCC,
120
121 /// X86 conditional moves. Operand 1 and operand 2 are the two values
122 /// to select from (operand 1 is a R/W operand). Operand 3 is the
123 /// condition code, and operand 4 is the flag operand produced by a CMP
124 /// or TEST instruction. It also writes a flag result.
125 CMOV,
126
127 /// X86 conditional branches. Operand 1 is the chain operand, operand 2
128 /// is the block to branch if condition is true, operand 3 is the
129 /// condition code, and operand 4 is the flag operand produced by a CMP
130 /// or TEST instruction.
131 BRCOND,
132
133 /// Return with a flag operand. Operand 1 is the chain operand, operand
134 /// 2 is the number of bytes of stack to pop.
135 RET_FLAG,
136
137 /// REP_STOS - Repeat fill, corresponds to X86::REP_STOSx.
138 REP_STOS,
139
140 /// REP_MOVS - Repeat move, corresponds to X86::REP_MOVSx.
141 REP_MOVS,
142
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000143 /// GlobalBaseReg - On Darwin, this node represents the result of the popl
144 /// at function entry, used for PIC code.
145 GlobalBaseReg,
146
147 /// Wrapper - A wrapper node for TargetConstantPool,
148 /// TargetExternalSymbol, and TargetGlobalAddress.
149 Wrapper,
150
151 /// WrapperRIP - Special wrapper used under X86-64 PIC mode for RIP
152 /// relative displacements.
153 WrapperRIP,
154
Nate Begemand77e59e2008-02-11 04:19:36 +0000155 /// PEXTRB - Extract an 8-bit value from a vector and zero extend it to
156 /// i32, corresponds to X86::PEXTRB.
157 PEXTRB,
158
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000159 /// PEXTRW - Extract a 16-bit value from a vector and zero extend it to
160 /// i32, corresponds to X86::PEXTRW.
161 PEXTRW,
162
Nate Begemand77e59e2008-02-11 04:19:36 +0000163 /// INSERTPS - Insert any element of a 4 x float vector into any element
164 /// of a destination 4 x floatvector.
165 INSERTPS,
166
167 /// PINSRB - Insert the lower 8-bits of a 32-bit value to a vector,
168 /// corresponds to X86::PINSRB.
169 PINSRB,
170
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000171 /// PINSRW - Insert the lower 16-bits of a 32-bit value to a vector,
172 /// corresponds to X86::PINSRW.
173 PINSRW,
174
175 /// FMAX, FMIN - Floating point max and min.
176 ///
177 FMAX, FMIN,
178
179 /// FRSQRT, FRCP - Floating point reciprocal-sqrt and reciprocal
180 /// approximation. Note that these typically require refinement
181 /// in order to obtain suitable precision.
182 FRSQRT, FRCP,
183
Evan Cheng40ee6e52008-05-08 00:57:18 +0000184 // TLSADDR, THREAThread - Thread Local Storage.
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000185 TLSADDR, THREAD_POINTER,
186
Evan Cheng40ee6e52008-05-08 00:57:18 +0000187 // EH_RETURN - Exception Handling helpers.
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000188 EH_RETURN,
189
Arnold Schwaighofer6fd37ac2008-03-19 16:39:45 +0000190 /// TC_RETURN - Tail call return.
191 /// operand #0 chain
192 /// operand #1 callee (register or absolute)
193 /// operand #2 stack adjustment
194 /// operand #3 optional in flag
Anton Korobeynikovfbe230e2007-11-16 01:31:51 +0000195 TC_RETURN,
196
Evan Cheng40ee6e52008-05-08 00:57:18 +0000197 // LCMPXCHG_DAG, LCMPXCHG8_DAG - Compare and swap.
Andrew Lenharth7dfe23f2008-03-01 21:52:34 +0000198 LCMPXCHG_DAG,
Andrew Lenharth81580822008-03-05 01:15:49 +0000199 LCMPXCHG8_DAG,
Andrew Lenharth7dfe23f2008-03-01 21:52:34 +0000200
Evan Cheng40ee6e52008-05-08 00:57:18 +0000201 // FNSTCW16m - Store FP control world into i16 memory.
202 FNSTCW16m,
203
Evan Chenge9b9c672008-05-09 21:53:03 +0000204 // VZEXT_MOVL - Vector move low and zero extend.
205 VZEXT_MOVL,
206
207 // VZEXT_LOAD - Load, scalar_to_vector, and zero extend.
208 VZEXT_LOAD
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000209 };
210 }
211
Evan Cheng931a8f42008-01-29 19:34:22 +0000212 /// Define some predicates that are used for node matching.
213 namespace X86 {
214 /// isPSHUFDMask - Return true if the specified VECTOR_SHUFFLE operand
215 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
216 bool isPSHUFDMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000217
Evan Cheng931a8f42008-01-29 19:34:22 +0000218 /// isPSHUFHWMask - Return true if the specified VECTOR_SHUFFLE operand
219 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
220 bool isPSHUFHWMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000221
Evan Cheng931a8f42008-01-29 19:34:22 +0000222 /// isPSHUFLWMask - Return true if the specified VECTOR_SHUFFLE operand
223 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
224 bool isPSHUFLWMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000225
Evan Cheng931a8f42008-01-29 19:34:22 +0000226 /// isSHUFPMask - Return true if the specified VECTOR_SHUFFLE operand
227 /// specifies a shuffle of elements that is suitable for input to SHUFP*.
228 bool isSHUFPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000229
Evan Cheng931a8f42008-01-29 19:34:22 +0000230 /// isMOVHLPSMask - Return true if the specified VECTOR_SHUFFLE operand
231 /// specifies a shuffle of elements that is suitable for input to MOVHLPS.
232 bool isMOVHLPSMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000233
Evan Cheng931a8f42008-01-29 19:34:22 +0000234 /// isMOVHLPS_v_undef_Mask - Special case of isMOVHLPSMask for canonical form
235 /// of vector_shuffle v, v, <2, 3, 2, 3>, i.e. vector_shuffle v, undef,
236 /// <2, 3, 2, 3>
237 bool isMOVHLPS_v_undef_Mask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000238
Evan Cheng931a8f42008-01-29 19:34:22 +0000239 /// isMOVLPMask - Return true if the specified VECTOR_SHUFFLE operand
240 /// specifies a shuffle of elements that is suitable for input to MOVLP{S|D}.
241 bool isMOVLPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000242
Evan Cheng931a8f42008-01-29 19:34:22 +0000243 /// isMOVHPMask - Return true if the specified VECTOR_SHUFFLE operand
244 /// specifies a shuffle of elements that is suitable for input to MOVHP{S|D}
245 /// as well as MOVLHPS.
246 bool isMOVHPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000247
Evan Cheng931a8f42008-01-29 19:34:22 +0000248 /// isUNPCKLMask - Return true if the specified VECTOR_SHUFFLE operand
249 /// specifies a shuffle of elements that is suitable for input to UNPCKL.
250 bool isUNPCKLMask(SDNode *N, bool V2IsSplat = false);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000251
Evan Cheng931a8f42008-01-29 19:34:22 +0000252 /// isUNPCKHMask - Return true if the specified VECTOR_SHUFFLE operand
253 /// specifies a shuffle of elements that is suitable for input to UNPCKH.
254 bool isUNPCKHMask(SDNode *N, bool V2IsSplat = false);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000255
Evan Cheng931a8f42008-01-29 19:34:22 +0000256 /// isUNPCKL_v_undef_Mask - Special case of isUNPCKLMask for canonical form
257 /// of vector_shuffle v, v, <0, 4, 1, 5>, i.e. vector_shuffle v, undef,
258 /// <0, 0, 1, 1>
259 bool isUNPCKL_v_undef_Mask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000260
Evan Cheng931a8f42008-01-29 19:34:22 +0000261 /// isUNPCKH_v_undef_Mask - Special case of isUNPCKHMask for canonical form
262 /// of vector_shuffle v, v, <2, 6, 3, 7>, i.e. vector_shuffle v, undef,
263 /// <2, 2, 3, 3>
264 bool isUNPCKH_v_undef_Mask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000265
Evan Cheng931a8f42008-01-29 19:34:22 +0000266 /// isMOVLMask - Return true if the specified VECTOR_SHUFFLE operand
267 /// specifies a shuffle of elements that is suitable for input to MOVSS,
268 /// MOVSD, and MOVD, i.e. setting the lowest element.
269 bool isMOVLMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000270
Evan Cheng931a8f42008-01-29 19:34:22 +0000271 /// isMOVSHDUPMask - Return true if the specified VECTOR_SHUFFLE operand
272 /// specifies a shuffle of elements that is suitable for input to MOVSHDUP.
273 bool isMOVSHDUPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000274
Evan Cheng931a8f42008-01-29 19:34:22 +0000275 /// isMOVSLDUPMask - Return true if the specified VECTOR_SHUFFLE operand
276 /// specifies a shuffle of elements that is suitable for input to MOVSLDUP.
277 bool isMOVSLDUPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000278
Evan Cheng931a8f42008-01-29 19:34:22 +0000279 /// isSplatMask - Return true if the specified VECTOR_SHUFFLE operand
280 /// specifies a splat of a single element.
281 bool isSplatMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000282
Evan Cheng931a8f42008-01-29 19:34:22 +0000283 /// isSplatLoMask - Return true if the specified VECTOR_SHUFFLE operand
284 /// specifies a splat of zero element.
285 bool isSplatLoMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000286
Evan Cheng931a8f42008-01-29 19:34:22 +0000287 /// getShuffleSHUFImmediate - Return the appropriate immediate to shuffle
288 /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUF* and SHUFP*
289 /// instructions.
290 unsigned getShuffleSHUFImmediate(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000291
Evan Cheng931a8f42008-01-29 19:34:22 +0000292 /// getShufflePSHUFHWImmediate - Return the appropriate immediate to shuffle
293 /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFHW
294 /// instructions.
295 unsigned getShufflePSHUFHWImmediate(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000296
Evan Cheng931a8f42008-01-29 19:34:22 +0000297 /// getShufflePSHUFKWImmediate - Return the appropriate immediate to shuffle
298 /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFLW
299 /// instructions.
300 unsigned getShufflePSHUFLWImmediate(SDNode *N);
301 }
302
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000303 //===--------------------------------------------------------------------===//
304 // X86TargetLowering - X86 Implementation of the TargetLowering interface
305 class X86TargetLowering : public TargetLowering {
306 int VarArgsFrameIndex; // FrameIndex for start of varargs area.
307 int RegSaveFrameIndex; // X86-64 vararg func register save area.
308 unsigned VarArgsGPOffset; // X86-64 vararg func int reg offset.
309 unsigned VarArgsFPOffset; // X86-64 vararg func fp reg offset.
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000310 int BytesToPopOnReturn; // Number of arg bytes ret should pop.
311 int BytesCallerReserves; // Number of arg bytes caller makes.
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000312
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000313 public:
Dan Gohmanb41dfba2008-05-14 01:58:56 +0000314 explicit X86TargetLowering(X86TargetMachine &TM);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000315
Evan Cheng6fb06762007-11-09 01:32:10 +0000316 /// getPICJumpTableRelocaBase - Returns relocation base for the given PIC
317 /// jumptable.
318 SDOperand getPICJumpTableRelocBase(SDOperand Table,
319 SelectionDAG &DAG) const;
320
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000321 // Return the number of bytes that a function should pop when it returns (in
322 // addition to the space used by the return address).
323 //
324 unsigned getBytesToPopOnReturn() const { return BytesToPopOnReturn; }
325
326 // Return the number of bytes that the caller reserves for arguments passed
327 // to this function.
328 unsigned getBytesCallerReserves() const { return BytesCallerReserves; }
329
330 /// getStackPtrReg - Return the stack pointer register we are using: either
331 /// ESP or RSP.
332 unsigned getStackPtrReg() const { return X86StackPtr; }
Evan Cheng5a67b812008-01-23 23:17:41 +0000333
334 /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
335 /// function arguments in the caller parameter area. For X86, aggregates
336 /// that contains are placed at 16-byte boundaries while the rest are at
337 /// 4-byte boundaries.
338 virtual unsigned getByValTypeAlignment(const Type *Ty) const;
Evan Cheng8c590372008-05-15 08:39:06 +0000339
340 /// getOptimalMemOpType - Returns the target specific optimal type for load
Evan Cheng2f1033e2008-05-15 22:13:02 +0000341 /// and store operations as a result of memset, memcpy, and memmove
342 /// lowering. It returns MVT::iAny if SelectionDAG should be responsible for
Evan Cheng8c590372008-05-15 08:39:06 +0000343 /// determining it.
344 virtual
345 MVT::ValueType getOptimalMemOpType(uint64_t Size, unsigned Align,
346 bool isSrcConst, bool isSrcStr) const;
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000347
348 /// LowerOperation - Provide custom lowering hooks for some operations.
349 ///
350 virtual SDOperand LowerOperation(SDOperand Op, SelectionDAG &DAG);
351
Chris Lattnerdfb947d2007-11-24 07:07:01 +0000352 /// ExpandOperation - Custom lower the specified operation, splitting the
353 /// value into two pieces.
354 ///
355 virtual SDNode *ExpandOperationResult(SDNode *N, SelectionDAG &DAG);
356
357
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000358 virtual SDOperand PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const;
359
Evan Chenge637db12008-01-30 18:18:23 +0000360 virtual MachineBasicBlock *EmitInstrWithCustomInserter(MachineInstr *MI,
361 MachineBasicBlock *MBB);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000362
Mon P Wang078a62d2008-05-05 19:05:59 +0000363
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000364 /// getTargetNodeName - This method returns the name of a target specific
365 /// DAG node.
366 virtual const char *getTargetNodeName(unsigned Opcode) const;
367
Scott Michel502151f2008-03-10 15:42:14 +0000368 /// getSetCCResultType - Return the ISD::SETCC ValueType
369 virtual MVT::ValueType getSetCCResultType(const SDOperand &) const;
370
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000371 /// computeMaskedBitsForTargetNode - Determine which of the bits specified
372 /// in Mask are known to be either zero or one and return them in the
373 /// KnownZero/KnownOne bitsets.
374 virtual void computeMaskedBitsForTargetNode(const SDOperand Op,
Dan Gohmand0dfc772008-02-13 22:28:48 +0000375 const APInt &Mask,
Dan Gohman229fa052008-02-13 00:35:47 +0000376 APInt &KnownZero,
377 APInt &KnownOne,
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000378 const SelectionDAG &DAG,
379 unsigned Depth = 0) const;
Evan Chengef7be082008-05-12 19:56:52 +0000380
381 virtual bool
382 isGAPlusOffset(SDNode *N, GlobalValue* &GA, int64_t &Offset) const;
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000383
384 SDOperand getReturnAddressFrameIndex(SelectionDAG &DAG);
385
386 ConstraintType getConstraintType(const std::string &Constraint) const;
387
388 std::vector<unsigned>
389 getRegClassForInlineAsmConstraint(const std::string &Constraint,
390 MVT::ValueType VT) const;
Chris Lattnera531abc2007-08-25 00:47:38 +0000391
Chris Lattnereca405c2008-04-26 23:02:14 +0000392 virtual const char *LowerXConstraint(MVT::ValueType ConstraintVT) const;
Dale Johannesene99fc902008-01-29 02:21:21 +0000393
Chris Lattnera531abc2007-08-25 00:47:38 +0000394 /// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
395 /// vector. If it is invalid, don't add anything to Ops.
396 virtual void LowerAsmOperandForConstraint(SDOperand Op,
397 char ConstraintLetter,
398 std::vector<SDOperand> &Ops,
Chris Lattnereca405c2008-04-26 23:02:14 +0000399 SelectionDAG &DAG) const;
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000400
401 /// getRegForInlineAsmConstraint - Given a physical register constraint
402 /// (e.g. {edx}), return the register number and the register class for the
403 /// register. This should only be used for C_Register constraints. On
404 /// error, this returns a register number of 0.
405 std::pair<unsigned, const TargetRegisterClass*>
406 getRegForInlineAsmConstraint(const std::string &Constraint,
407 MVT::ValueType VT) const;
408
409 /// isLegalAddressingMode - Return true if the addressing mode represented
410 /// by AM is legal for this target, for a load/store of the specified type.
411 virtual bool isLegalAddressingMode(const AddrMode &AM, const Type *Ty)const;
412
Evan Cheng27a820a2007-10-26 01:56:11 +0000413 /// isTruncateFree - Return true if it's free to truncate a value of
414 /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate a i32 value in
415 /// register EAX to i16 by referencing its sub-register AX.
416 virtual bool isTruncateFree(const Type *Ty1, const Type *Ty2) const;
Evan Cheng9decb332007-10-29 19:58:20 +0000417 virtual bool isTruncateFree(MVT::ValueType VT1, MVT::ValueType VT2) const;
Evan Cheng27a820a2007-10-26 01:56:11 +0000418
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000419 /// isShuffleMaskLegal - Targets can use this to indicate that they only
420 /// support *some* VECTOR_SHUFFLE operations, those with specific masks.
421 /// By default, if a target supports the VECTOR_SHUFFLE node, all mask
422 /// values are assumed to be legal.
423 virtual bool isShuffleMaskLegal(SDOperand Mask, MVT::ValueType VT) const;
424
425 /// isVectorClearMaskLegal - Similar to isShuffleMaskLegal. This is
426 /// used by Targets can use this to indicate if there is a suitable
427 /// VECTOR_SHUFFLE that can be used to replace a VAND with a constant
428 /// pool entry.
Dan Gohman48d5f062008-04-09 20:09:42 +0000429 virtual bool isVectorClearMaskLegal(const std::vector<SDOperand> &BVOps,
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000430 MVT::ValueType EVT,
431 SelectionDAG &DAG) const;
Evan Cheng35190fd2008-03-05 01:30:59 +0000432
433 /// ShouldShrinkFPConstant - If true, then instruction selection should
434 /// seek to shrink the FP constant of the specified type to a smaller type
435 /// in order to save space and / or reduce runtime.
436 virtual bool ShouldShrinkFPConstant(MVT::ValueType VT) const {
437 // Don't shrink FP constpool if SSE2 is available since cvtss2sd is more
438 // expensive than a straight movsd. On the other hand, it's important to
439 // shrink long double fp constant since fldt is very slow.
440 return !X86ScalarSSEf64 || VT == MVT::f80;
441 }
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000442
443 /// IsEligibleForTailCallOptimization - Check whether the call is eligible
444 /// for tail call optimization. Target which want to do tail call
445 /// optimization should implement this function.
446 virtual bool IsEligibleForTailCallOptimization(SDOperand Call,
447 SDOperand Ret,
448 SelectionDAG &DAG) const;
449
Dan Gohmane8b391e2008-04-12 04:36:06 +0000450 virtual const X86Subtarget* getSubtarget() {
451 return Subtarget;
Rafael Espindoladd867c72007-11-05 23:12:20 +0000452 }
453
Chris Lattnerc3d7cfa2008-01-18 06:52:41 +0000454 /// isScalarFPTypeInSSEReg - Return true if the specified scalar FP type is
455 /// computed in an SSE register, not on the X87 floating point stack.
456 bool isScalarFPTypeInSSEReg(MVT::ValueType VT) const {
457 return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 is when SSE2
458 (VT == MVT::f32 && X86ScalarSSEf32); // f32 is when SSE1
459 }
460
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000461 private:
462 /// Subtarget - Keep a pointer to the X86Subtarget around so that we can
463 /// make the right decision when generating code for different targets.
464 const X86Subtarget *Subtarget;
Dan Gohmanb41dfba2008-05-14 01:58:56 +0000465 const X86RegisterInfo *RegInfo;
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000466
467 /// X86StackPtr - X86 physical register used as stack ptr.
468 unsigned X86StackPtr;
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000469
Dale Johannesene0e0fd02007-09-23 14:52:20 +0000470 /// X86ScalarSSEf32, X86ScalarSSEf64 - Select between SSE or x87
471 /// floating point ops.
472 /// When SSE is available, use it for f32 operations.
473 /// When SSE2 is available, use it for f64 operations.
474 bool X86ScalarSSEf32;
475 bool X86ScalarSSEf64;
Evan Cheng931a8f42008-01-29 19:34:22 +0000476
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000477 SDNode *LowerCallResult(SDOperand Chain, SDOperand InFlag, SDNode*TheCall,
478 unsigned CallingConv, SelectionDAG &DAG);
Evan Cheng931a8f42008-01-29 19:34:22 +0000479
Rafael Espindola03cbeb72007-09-14 15:48:13 +0000480 SDOperand LowerMemArgument(SDOperand Op, SelectionDAG &DAG,
481 const CCValAssign &VA, MachineFrameInfo *MFI,
Arnold Schwaighofere2db0f42008-02-26 09:19:59 +0000482 unsigned CC, SDOperand Root, unsigned i);
Rafael Espindola03cbeb72007-09-14 15:48:13 +0000483
Rafael Espindoladdb88da2007-08-31 15:06:30 +0000484 SDOperand LowerMemOpCallTo(SDOperand Op, SelectionDAG &DAG,
485 const SDOperand &StackPtr,
486 const CCValAssign &VA, SDOperand Chain,
487 SDOperand Arg);
488
Gordon Henriksen18ace102008-01-05 16:56:59 +0000489 // Call lowering helpers.
490 bool IsCalleePop(SDOperand Op);
Arnold Schwaighofer87f75262008-02-26 22:21:54 +0000491 bool CallRequiresGOTPtrInReg(bool Is64Bit, bool IsTailCall);
492 bool CallRequiresFnAddressInReg(bool Is64Bit, bool IsTailCall);
Arnold Schwaighofera38df102008-04-12 18:11:06 +0000493 SDOperand EmitTailCallLoadRetAddr(SelectionDAG &DAG, SDOperand &OutRetAddr,
494 SDOperand Chain, bool IsTailCall, bool Is64Bit,
495 int FPDiff);
Arnold Schwaighofera38df102008-04-12 18:11:06 +0000496
Gordon Henriksen18ace102008-01-05 16:56:59 +0000497 CCAssignFn *CCAssignFnForNode(SDOperand Op) const;
498 NameDecorationStyle NameDecorationForFORMAL_ARGUMENTS(SDOperand Op);
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000499 unsigned GetAlignedArgumentStackSize(unsigned StackSize, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000500
Chris Lattnerdfb947d2007-11-24 07:07:01 +0000501 std::pair<SDOperand,SDOperand> FP_TO_SINTHelper(SDOperand Op,
502 SelectionDAG &DAG);
503
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000504 SDOperand LowerBUILD_VECTOR(SDOperand Op, SelectionDAG &DAG);
505 SDOperand LowerVECTOR_SHUFFLE(SDOperand Op, SelectionDAG &DAG);
506 SDOperand LowerEXTRACT_VECTOR_ELT(SDOperand Op, SelectionDAG &DAG);
Nate Begemand77e59e2008-02-11 04:19:36 +0000507 SDOperand LowerEXTRACT_VECTOR_ELT_SSE4(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000508 SDOperand LowerINSERT_VECTOR_ELT(SDOperand Op, SelectionDAG &DAG);
Nate Begemand77e59e2008-02-11 04:19:36 +0000509 SDOperand LowerINSERT_VECTOR_ELT_SSE4(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000510 SDOperand LowerSCALAR_TO_VECTOR(SDOperand Op, SelectionDAG &DAG);
511 SDOperand LowerConstantPool(SDOperand Op, SelectionDAG &DAG);
512 SDOperand LowerGlobalAddress(SDOperand Op, SelectionDAG &DAG);
513 SDOperand LowerGlobalTLSAddress(SDOperand Op, SelectionDAG &DAG);
514 SDOperand LowerExternalSymbol(SDOperand Op, SelectionDAG &DAG);
515 SDOperand LowerShift(SDOperand Op, SelectionDAG &DAG);
516 SDOperand LowerSINT_TO_FP(SDOperand Op, SelectionDAG &DAG);
517 SDOperand LowerFP_TO_SINT(SDOperand Op, SelectionDAG &DAG);
518 SDOperand LowerFABS(SDOperand Op, SelectionDAG &DAG);
519 SDOperand LowerFNEG(SDOperand Op, SelectionDAG &DAG);
520 SDOperand LowerFCOPYSIGN(SDOperand Op, SelectionDAG &DAG);
Evan Cheng621216e2007-09-29 00:00:36 +0000521 SDOperand LowerSETCC(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000522 SDOperand LowerSELECT(SDOperand Op, SelectionDAG &DAG);
523 SDOperand LowerBRCOND(SDOperand Op, SelectionDAG &DAG);
524 SDOperand LowerMEMSET(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000525 SDOperand LowerJumpTable(SDOperand Op, SelectionDAG &DAG);
526 SDOperand LowerCALL(SDOperand Op, SelectionDAG &DAG);
527 SDOperand LowerRET(SDOperand Op, SelectionDAG &DAG);
528 SDOperand LowerDYNAMIC_STACKALLOC(SDOperand Op, SelectionDAG &DAG);
529 SDOperand LowerFORMAL_ARGUMENTS(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000530 SDOperand LowerVASTART(SDOperand Op, SelectionDAG &DAG);
Dan Gohman827cb1f2008-05-10 01:26:14 +0000531 SDOperand LowerVAARG(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000532 SDOperand LowerVACOPY(SDOperand Op, SelectionDAG &DAG);
533 SDOperand LowerINTRINSIC_WO_CHAIN(SDOperand Op, SelectionDAG &DAG);
534 SDOperand LowerRETURNADDR(SDOperand Op, SelectionDAG &DAG);
535 SDOperand LowerFRAMEADDR(SDOperand Op, SelectionDAG &DAG);
536 SDOperand LowerFRAME_TO_ARGS_OFFSET(SDOperand Op, SelectionDAG &DAG);
537 SDOperand LowerEH_RETURN(SDOperand Op, SelectionDAG &DAG);
Duncan Sandsd8455ca2007-07-27 20:02:49 +0000538 SDOperand LowerTRAMPOLINE(SDOperand Op, SelectionDAG &DAG);
Dan Gohman819574c2008-01-31 00:41:03 +0000539 SDOperand LowerFLT_ROUNDS_(SDOperand Op, SelectionDAG &DAG);
Evan Cheng48679f42007-12-14 02:13:44 +0000540 SDOperand LowerCTLZ(SDOperand Op, SelectionDAG &DAG);
541 SDOperand LowerCTTZ(SDOperand Op, SelectionDAG &DAG);
Andrew Lenharth81580822008-03-05 01:15:49 +0000542 SDOperand LowerLCS(SDOperand Op, SelectionDAG &DAG);
Chris Lattnerdfb947d2007-11-24 07:07:01 +0000543 SDNode *ExpandFP_TO_SINT(SDNode *N, SelectionDAG &DAG);
544 SDNode *ExpandREADCYCLECOUNTER(SDNode *N, SelectionDAG &DAG);
Andrew Lenharth81580822008-03-05 01:15:49 +0000545 SDNode *ExpandATOMIC_LCS(SDNode *N, SelectionDAG &DAG);
Mon P Wang078a62d2008-05-05 19:05:59 +0000546 SDNode *ExpandATOMIC_LSS(SDNode *N, SelectionDAG &DAG);
547
Dan Gohmane8b391e2008-04-12 04:36:06 +0000548 SDOperand EmitTargetCodeForMemset(SelectionDAG &DAG,
549 SDOperand Chain,
550 SDOperand Dst, SDOperand Src,
551 SDOperand Size, unsigned Align,
Dan Gohman65118f42008-04-28 17:15:20 +0000552 const Value *DstSV, uint64_t DstSVOff);
Dan Gohmane8b391e2008-04-12 04:36:06 +0000553 SDOperand EmitTargetCodeForMemcpy(SelectionDAG &DAG,
554 SDOperand Chain,
555 SDOperand Dst, SDOperand Src,
556 SDOperand Size, unsigned Align,
557 bool AlwaysInline,
Dan Gohman65118f42008-04-28 17:15:20 +0000558 const Value *DstSV, uint64_t DstSVOff,
559 const Value *SrcSV, uint64_t SrcSVOff);
Mon P Wang078a62d2008-05-05 19:05:59 +0000560
561 /// Utility function to emit atomic bitwise operations (and, or, xor).
562 // It takes the bitwise instruction to expand, the associated machine basic
563 // block, and the associated X86 opcodes for reg/reg and reg/imm.
564 MachineBasicBlock *EmitAtomicBitwiseWithCustomInserter(
565 MachineInstr *BInstr,
566 MachineBasicBlock *BB,
567 unsigned regOpc,
568 unsigned immOpc);
569
570 /// Utility function to emit atomic min and max. It takes the min/max
571 // instruction to expand, the associated basic block, and the associated
572 // cmov opcode for moving the min or max value.
573 MachineBasicBlock *EmitAtomicMinMaxWithCustomInserter(MachineInstr *BInstr,
574 MachineBasicBlock *BB,
575 unsigned cmovOpc);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000576 };
577}
578
579#endif // X86ISELLOWERING_H