blob: ec3524ce3c345a8badd137a9f52374e802e0e0e1 [file] [log] [blame]
Dan Gohmanf17a25c2007-07-18 16:29:46 +00001//===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner081ce942007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Dan Gohmanf17a25c2007-07-18 16:29:46 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file defines the interfaces that X86 uses to lower LLVM code into a
11// selection DAG.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef X86ISELLOWERING_H
16#define X86ISELLOWERING_H
17
18#include "X86Subtarget.h"
19#include "X86RegisterInfo.h"
Gordon Henriksen18ace102008-01-05 16:56:59 +000020#include "X86MachineFunctionInfo.h"
Dan Gohmanf17a25c2007-07-18 16:29:46 +000021#include "llvm/Target/TargetLowering.h"
22#include "llvm/CodeGen/SelectionDAG.h"
Rafael Espindoladdb88da2007-08-31 15:06:30 +000023#include "llvm/CodeGen/CallingConvLower.h"
Dan Gohmanf17a25c2007-07-18 16:29:46 +000024
25namespace llvm {
26 namespace X86ISD {
27 // X86 Specific DAG Nodes
28 enum NodeType {
29 // Start the numbering where the builtin ops leave off.
30 FIRST_NUMBER = ISD::BUILTIN_OP_END+X86::INSTRUCTION_LIST_END,
31
Evan Cheng48679f42007-12-14 02:13:44 +000032 /// BSF - Bit scan forward.
33 /// BSR - Bit scan reverse.
34 BSF,
35 BSR,
36
Dan Gohmanf17a25c2007-07-18 16:29:46 +000037 /// SHLD, SHRD - Double shift instructions. These correspond to
38 /// X86::SHLDxx and X86::SHRDxx instructions.
39 SHLD,
40 SHRD,
41
42 /// FAND - Bitwise logical AND of floating point values. This corresponds
43 /// to X86::ANDPS or X86::ANDPD.
44 FAND,
45
46 /// FOR - Bitwise logical OR of floating point values. This corresponds
47 /// to X86::ORPS or X86::ORPD.
48 FOR,
49
50 /// FXOR - Bitwise logical XOR of floating point values. This corresponds
51 /// to X86::XORPS or X86::XORPD.
52 FXOR,
53
54 /// FSRL - Bitwise logical right shift of floating point values. These
55 /// corresponds to X86::PSRLDQ.
56 FSRL,
57
58 /// FILD, FILD_FLAG - This instruction implements SINT_TO_FP with the
59 /// integer source in memory and FP reg result. This corresponds to the
60 /// X86::FILD*m instructions. It has three inputs (token chain, address,
61 /// and source type) and two outputs (FP value and token chain). FILD_FLAG
62 /// also produces a flag).
63 FILD,
64 FILD_FLAG,
65
66 /// FP_TO_INT*_IN_MEM - This instruction implements FP_TO_SINT with the
67 /// integer destination in memory and a FP reg source. This corresponds
68 /// to the X86::FIST*m instructions and the rounding mode change stuff. It
69 /// has two inputs (token chain and address) and two outputs (int value
70 /// and token chain).
71 FP_TO_INT16_IN_MEM,
72 FP_TO_INT32_IN_MEM,
73 FP_TO_INT64_IN_MEM,
74
75 /// FLD - This instruction implements an extending load to FP stack slots.
76 /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain
77 /// operand, ptr to load from, and a ValueType node indicating the type
78 /// to load to.
79 FLD,
80
81 /// FST - This instruction implements a truncating store to FP stack
82 /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a
83 /// chain operand, value to store, address, and a ValueType to store it
84 /// as.
85 FST,
86
Chris Lattneraaef8dc2008-03-09 07:08:44 +000087 /// FP_GET_ST0_ST1 - Same as FP_GET_ST0 except it copies two values
Evan Cheng931a8f42008-01-29 19:34:22 +000088 /// ST(0) and ST(1).
Chris Lattner5d294e52008-03-09 07:05:32 +000089 FP_GET_ST0_ST1,
Evan Cheng931a8f42008-01-29 19:34:22 +000090
Dan Gohmanf17a25c2007-07-18 16:29:46 +000091 /// CALL/TAILCALL - These operations represent an abstract X86 call
92 /// instruction, which includes a bunch of information. In particular the
93 /// operands of these node are:
94 ///
95 /// #0 - The incoming token chain
96 /// #1 - The callee
97 /// #2 - The number of arg bytes the caller pushes on the stack.
98 /// #3 - The number of arg bytes the callee pops off the stack.
99 /// #4 - The value to pass in AL/AX/EAX (optional)
100 /// #5 - The value to pass in DL/DX/EDX (optional)
101 ///
102 /// The result values of these nodes are:
103 ///
104 /// #0 - The outgoing token chain
105 /// #1 - The first register result value (optional)
106 /// #2 - The second register result value (optional)
107 ///
108 /// The CALL vs TAILCALL distinction boils down to whether the callee is
109 /// known not to modify the caller's stack frame, as is standard with
110 /// LLVM.
111 CALL,
112 TAILCALL,
113
114 /// RDTSC_DAG - This operation implements the lowering for
115 /// readcyclecounter
116 RDTSC_DAG,
117
118 /// X86 compare and logical compare instructions.
Evan Cheng904febe2007-09-17 17:42:53 +0000119 CMP, COMI, UCOMI,
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000120
121 /// X86 SetCC. Operand 1 is condition code, and operand 2 is the flag
122 /// operand produced by a CMP instruction.
123 SETCC,
124
125 /// X86 conditional moves. Operand 1 and operand 2 are the two values
126 /// to select from (operand 1 is a R/W operand). Operand 3 is the
127 /// condition code, and operand 4 is the flag operand produced by a CMP
128 /// or TEST instruction. It also writes a flag result.
129 CMOV,
130
131 /// X86 conditional branches. Operand 1 is the chain operand, operand 2
132 /// is the block to branch if condition is true, operand 3 is the
133 /// condition code, and operand 4 is the flag operand produced by a CMP
134 /// or TEST instruction.
135 BRCOND,
136
137 /// Return with a flag operand. Operand 1 is the chain operand, operand
138 /// 2 is the number of bytes of stack to pop.
139 RET_FLAG,
140
141 /// REP_STOS - Repeat fill, corresponds to X86::REP_STOSx.
142 REP_STOS,
143
144 /// REP_MOVS - Repeat move, corresponds to X86::REP_MOVSx.
145 REP_MOVS,
146
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000147 /// GlobalBaseReg - On Darwin, this node represents the result of the popl
148 /// at function entry, used for PIC code.
149 GlobalBaseReg,
150
151 /// Wrapper - A wrapper node for TargetConstantPool,
152 /// TargetExternalSymbol, and TargetGlobalAddress.
153 Wrapper,
154
155 /// WrapperRIP - Special wrapper used under X86-64 PIC mode for RIP
156 /// relative displacements.
157 WrapperRIP,
158
Nate Begemand77e59e2008-02-11 04:19:36 +0000159 /// PEXTRB - Extract an 8-bit value from a vector and zero extend it to
160 /// i32, corresponds to X86::PEXTRB.
161 PEXTRB,
162
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000163 /// PEXTRW - Extract a 16-bit value from a vector and zero extend it to
164 /// i32, corresponds to X86::PEXTRW.
165 PEXTRW,
166
Nate Begemand77e59e2008-02-11 04:19:36 +0000167 /// INSERTPS - Insert any element of a 4 x float vector into any element
168 /// of a destination 4 x floatvector.
169 INSERTPS,
170
171 /// PINSRB - Insert the lower 8-bits of a 32-bit value to a vector,
172 /// corresponds to X86::PINSRB.
173 PINSRB,
174
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000175 /// PINSRW - Insert the lower 16-bits of a 32-bit value to a vector,
176 /// corresponds to X86::PINSRW.
177 PINSRW,
178
179 /// FMAX, FMIN - Floating point max and min.
180 ///
181 FMAX, FMIN,
182
183 /// FRSQRT, FRCP - Floating point reciprocal-sqrt and reciprocal
184 /// approximation. Note that these typically require refinement
185 /// in order to obtain suitable precision.
186 FRSQRT, FRCP,
187
188 // Thread Local Storage
189 TLSADDR, THREAD_POINTER,
190
191 // Exception Handling helpers
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000192 EH_RETURN,
193
Arnold Schwaighofer6fd37ac2008-03-19 16:39:45 +0000194 /// TC_RETURN - Tail call return.
195 /// operand #0 chain
196 /// operand #1 callee (register or absolute)
197 /// operand #2 stack adjustment
198 /// operand #3 optional in flag
Anton Korobeynikovfbe230e2007-11-16 01:31:51 +0000199 TC_RETURN,
200
Andrew Lenharth7dfe23f2008-03-01 21:52:34 +0000201 // compare and swap
202 LCMPXCHG_DAG,
Andrew Lenharth81580822008-03-05 01:15:49 +0000203 LCMPXCHG8_DAG,
Andrew Lenharth7dfe23f2008-03-01 21:52:34 +0000204
Anton Korobeynikovfbe230e2007-11-16 01:31:51 +0000205 // Store FP control world into i16 memory
Chris Lattner56b941f2008-01-15 21:58:22 +0000206 FNSTCW16m
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000207 };
208 }
209
Evan Cheng931a8f42008-01-29 19:34:22 +0000210 /// Define some predicates that are used for node matching.
211 namespace X86 {
212 /// isPSHUFDMask - Return true if the specified VECTOR_SHUFFLE operand
213 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
214 bool isPSHUFDMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000215
Evan Cheng931a8f42008-01-29 19:34:22 +0000216 /// isPSHUFHWMask - Return true if the specified VECTOR_SHUFFLE operand
217 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
218 bool isPSHUFHWMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000219
Evan Cheng931a8f42008-01-29 19:34:22 +0000220 /// isPSHUFLWMask - Return true if the specified VECTOR_SHUFFLE operand
221 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
222 bool isPSHUFLWMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000223
Evan Cheng931a8f42008-01-29 19:34:22 +0000224 /// isSHUFPMask - Return true if the specified VECTOR_SHUFFLE operand
225 /// specifies a shuffle of elements that is suitable for input to SHUFP*.
226 bool isSHUFPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000227
Evan Cheng931a8f42008-01-29 19:34:22 +0000228 /// isMOVHLPSMask - Return true if the specified VECTOR_SHUFFLE operand
229 /// specifies a shuffle of elements that is suitable for input to MOVHLPS.
230 bool isMOVHLPSMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000231
Evan Cheng931a8f42008-01-29 19:34:22 +0000232 /// isMOVHLPS_v_undef_Mask - Special case of isMOVHLPSMask for canonical form
233 /// of vector_shuffle v, v, <2, 3, 2, 3>, i.e. vector_shuffle v, undef,
234 /// <2, 3, 2, 3>
235 bool isMOVHLPS_v_undef_Mask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000236
Evan Cheng931a8f42008-01-29 19:34:22 +0000237 /// isMOVLPMask - Return true if the specified VECTOR_SHUFFLE operand
238 /// specifies a shuffle of elements that is suitable for input to MOVLP{S|D}.
239 bool isMOVLPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000240
Evan Cheng931a8f42008-01-29 19:34:22 +0000241 /// isMOVHPMask - Return true if the specified VECTOR_SHUFFLE operand
242 /// specifies a shuffle of elements that is suitable for input to MOVHP{S|D}
243 /// as well as MOVLHPS.
244 bool isMOVHPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000245
Evan Cheng931a8f42008-01-29 19:34:22 +0000246 /// isUNPCKLMask - Return true if the specified VECTOR_SHUFFLE operand
247 /// specifies a shuffle of elements that is suitable for input to UNPCKL.
248 bool isUNPCKLMask(SDNode *N, bool V2IsSplat = false);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000249
Evan Cheng931a8f42008-01-29 19:34:22 +0000250 /// isUNPCKHMask - Return true if the specified VECTOR_SHUFFLE operand
251 /// specifies a shuffle of elements that is suitable for input to UNPCKH.
252 bool isUNPCKHMask(SDNode *N, bool V2IsSplat = false);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000253
Evan Cheng931a8f42008-01-29 19:34:22 +0000254 /// isUNPCKL_v_undef_Mask - Special case of isUNPCKLMask for canonical form
255 /// of vector_shuffle v, v, <0, 4, 1, 5>, i.e. vector_shuffle v, undef,
256 /// <0, 0, 1, 1>
257 bool isUNPCKL_v_undef_Mask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000258
Evan Cheng931a8f42008-01-29 19:34:22 +0000259 /// isUNPCKH_v_undef_Mask - Special case of isUNPCKHMask for canonical form
260 /// of vector_shuffle v, v, <2, 6, 3, 7>, i.e. vector_shuffle v, undef,
261 /// <2, 2, 3, 3>
262 bool isUNPCKH_v_undef_Mask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000263
Evan Cheng931a8f42008-01-29 19:34:22 +0000264 /// isMOVLMask - Return true if the specified VECTOR_SHUFFLE operand
265 /// specifies a shuffle of elements that is suitable for input to MOVSS,
266 /// MOVSD, and MOVD, i.e. setting the lowest element.
267 bool isMOVLMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000268
Evan Cheng931a8f42008-01-29 19:34:22 +0000269 /// isMOVSHDUPMask - Return true if the specified VECTOR_SHUFFLE operand
270 /// specifies a shuffle of elements that is suitable for input to MOVSHDUP.
271 bool isMOVSHDUPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000272
Evan Cheng931a8f42008-01-29 19:34:22 +0000273 /// isMOVSLDUPMask - Return true if the specified VECTOR_SHUFFLE operand
274 /// specifies a shuffle of elements that is suitable for input to MOVSLDUP.
275 bool isMOVSLDUPMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000276
Evan Cheng931a8f42008-01-29 19:34:22 +0000277 /// isSplatMask - Return true if the specified VECTOR_SHUFFLE operand
278 /// specifies a splat of a single element.
279 bool isSplatMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000280
Evan Cheng931a8f42008-01-29 19:34:22 +0000281 /// isSplatLoMask - Return true if the specified VECTOR_SHUFFLE operand
282 /// specifies a splat of zero element.
283 bool isSplatLoMask(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000284
Evan Cheng931a8f42008-01-29 19:34:22 +0000285 /// getShuffleSHUFImmediate - Return the appropriate immediate to shuffle
286 /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUF* and SHUFP*
287 /// instructions.
288 unsigned getShuffleSHUFImmediate(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000289
Evan Cheng931a8f42008-01-29 19:34:22 +0000290 /// getShufflePSHUFHWImmediate - Return the appropriate immediate to shuffle
291 /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFHW
292 /// instructions.
293 unsigned getShufflePSHUFHWImmediate(SDNode *N);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000294
Evan Cheng931a8f42008-01-29 19:34:22 +0000295 /// getShufflePSHUFKWImmediate - Return the appropriate immediate to shuffle
296 /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFLW
297 /// instructions.
298 unsigned getShufflePSHUFLWImmediate(SDNode *N);
299 }
300
301 namespace X86 {
302 /// X86_64SRet - These represent different ways to implement x86_64 struct
303 /// returns call results.
304 enum X86_64SRet {
305 InMemory, // Really is sret, returns in memory.
306 InGPR64, // Returns in a pair of 64-bit integer registers.
307 InSSE, // Returns in a pair of SSE registers.
308 InX87 // Returns in a pair of f80 X87 registers.
309 };
310 }
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000311
312 //===--------------------------------------------------------------------===//
313 // X86TargetLowering - X86 Implementation of the TargetLowering interface
314 class X86TargetLowering : public TargetLowering {
315 int VarArgsFrameIndex; // FrameIndex for start of varargs area.
316 int RegSaveFrameIndex; // X86-64 vararg func register save area.
317 unsigned VarArgsGPOffset; // X86-64 vararg func int reg offset.
318 unsigned VarArgsFPOffset; // X86-64 vararg func fp reg offset.
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000319 int BytesToPopOnReturn; // Number of arg bytes ret should pop.
320 int BytesCallerReserves; // Number of arg bytes caller makes.
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000321
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000322 public:
Dan Gohman3a78bbf2007-08-02 21:21:54 +0000323 explicit X86TargetLowering(TargetMachine &TM);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000324
Evan Cheng6fb06762007-11-09 01:32:10 +0000325 /// getPICJumpTableRelocaBase - Returns relocation base for the given PIC
326 /// jumptable.
327 SDOperand getPICJumpTableRelocBase(SDOperand Table,
328 SelectionDAG &DAG) const;
329
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000330 // Return the number of bytes that a function should pop when it returns (in
331 // addition to the space used by the return address).
332 //
333 unsigned getBytesToPopOnReturn() const { return BytesToPopOnReturn; }
334
335 // Return the number of bytes that the caller reserves for arguments passed
336 // to this function.
337 unsigned getBytesCallerReserves() const { return BytesCallerReserves; }
338
339 /// getStackPtrReg - Return the stack pointer register we are using: either
340 /// ESP or RSP.
341 unsigned getStackPtrReg() const { return X86StackPtr; }
Evan Cheng5a67b812008-01-23 23:17:41 +0000342
343 /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
344 /// function arguments in the caller parameter area. For X86, aggregates
345 /// that contains are placed at 16-byte boundaries while the rest are at
346 /// 4-byte boundaries.
347 virtual unsigned getByValTypeAlignment(const Type *Ty) const;
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000348
349 /// LowerOperation - Provide custom lowering hooks for some operations.
350 ///
351 virtual SDOperand LowerOperation(SDOperand Op, SelectionDAG &DAG);
352
Chris Lattnerdfb947d2007-11-24 07:07:01 +0000353 /// ExpandOperation - Custom lower the specified operation, splitting the
354 /// value into two pieces.
355 ///
356 virtual SDNode *ExpandOperationResult(SDNode *N, SelectionDAG &DAG);
357
358
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000359 virtual SDOperand PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const;
360
Evan Chenge637db12008-01-30 18:18:23 +0000361 virtual MachineBasicBlock *EmitInstrWithCustomInserter(MachineInstr *MI,
362 MachineBasicBlock *MBB);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000363
364 /// getTargetNodeName - This method returns the name of a target specific
365 /// DAG node.
366 virtual const char *getTargetNodeName(unsigned Opcode) const;
367
Scott Michel502151f2008-03-10 15:42:14 +0000368 /// getSetCCResultType - Return the ISD::SETCC ValueType
369 virtual MVT::ValueType getSetCCResultType(const SDOperand &) const;
370
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000371 /// computeMaskedBitsForTargetNode - Determine which of the bits specified
372 /// in Mask are known to be either zero or one and return them in the
373 /// KnownZero/KnownOne bitsets.
374 virtual void computeMaskedBitsForTargetNode(const SDOperand Op,
Dan Gohmand0dfc772008-02-13 22:28:48 +0000375 const APInt &Mask,
Dan Gohman229fa052008-02-13 00:35:47 +0000376 APInt &KnownZero,
377 APInt &KnownOne,
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000378 const SelectionDAG &DAG,
379 unsigned Depth = 0) const;
380
381 SDOperand getReturnAddressFrameIndex(SelectionDAG &DAG);
382
383 ConstraintType getConstraintType(const std::string &Constraint) const;
384
385 std::vector<unsigned>
386 getRegClassForInlineAsmConstraint(const std::string &Constraint,
387 MVT::ValueType VT) const;
Chris Lattnera531abc2007-08-25 00:47:38 +0000388
Dale Johannesene99fc902008-01-29 02:21:21 +0000389 virtual void lowerXConstraint(MVT::ValueType ConstraintVT,
390 std::string&) const;
391
Chris Lattnera531abc2007-08-25 00:47:38 +0000392 /// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
393 /// vector. If it is invalid, don't add anything to Ops.
394 virtual void LowerAsmOperandForConstraint(SDOperand Op,
395 char ConstraintLetter,
396 std::vector<SDOperand> &Ops,
397 SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000398
399 /// getRegForInlineAsmConstraint - Given a physical register constraint
400 /// (e.g. {edx}), return the register number and the register class for the
401 /// register. This should only be used for C_Register constraints. On
402 /// error, this returns a register number of 0.
403 std::pair<unsigned, const TargetRegisterClass*>
404 getRegForInlineAsmConstraint(const std::string &Constraint,
405 MVT::ValueType VT) const;
406
407 /// isLegalAddressingMode - Return true if the addressing mode represented
408 /// by AM is legal for this target, for a load/store of the specified type.
409 virtual bool isLegalAddressingMode(const AddrMode &AM, const Type *Ty)const;
410
Evan Cheng27a820a2007-10-26 01:56:11 +0000411 /// isTruncateFree - Return true if it's free to truncate a value of
412 /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate a i32 value in
413 /// register EAX to i16 by referencing its sub-register AX.
414 virtual bool isTruncateFree(const Type *Ty1, const Type *Ty2) const;
Evan Cheng9decb332007-10-29 19:58:20 +0000415 virtual bool isTruncateFree(MVT::ValueType VT1, MVT::ValueType VT2) const;
Evan Cheng27a820a2007-10-26 01:56:11 +0000416
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000417 /// isShuffleMaskLegal - Targets can use this to indicate that they only
418 /// support *some* VECTOR_SHUFFLE operations, those with specific masks.
419 /// By default, if a target supports the VECTOR_SHUFFLE node, all mask
420 /// values are assumed to be legal.
421 virtual bool isShuffleMaskLegal(SDOperand Mask, MVT::ValueType VT) const;
422
423 /// isVectorClearMaskLegal - Similar to isShuffleMaskLegal. This is
424 /// used by Targets can use this to indicate if there is a suitable
425 /// VECTOR_SHUFFLE that can be used to replace a VAND with a constant
426 /// pool entry.
427 virtual bool isVectorClearMaskLegal(std::vector<SDOperand> &BVOps,
428 MVT::ValueType EVT,
429 SelectionDAG &DAG) const;
Evan Cheng35190fd2008-03-05 01:30:59 +0000430
431 /// ShouldShrinkFPConstant - If true, then instruction selection should
432 /// seek to shrink the FP constant of the specified type to a smaller type
433 /// in order to save space and / or reduce runtime.
434 virtual bool ShouldShrinkFPConstant(MVT::ValueType VT) const {
435 // Don't shrink FP constpool if SSE2 is available since cvtss2sd is more
436 // expensive than a straight movsd. On the other hand, it's important to
437 // shrink long double fp constant since fldt is very slow.
438 return !X86ScalarSSEf64 || VT == MVT::f80;
439 }
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000440
441 /// IsEligibleForTailCallOptimization - Check whether the call is eligible
442 /// for tail call optimization. Target which want to do tail call
443 /// optimization should implement this function.
444 virtual bool IsEligibleForTailCallOptimization(SDOperand Call,
445 SDOperand Ret,
446 SelectionDAG &DAG) const;
447
Rafael Espindoladd867c72007-11-05 23:12:20 +0000448 virtual const TargetSubtarget* getSubtarget() {
449 return static_cast<const TargetSubtarget*>(Subtarget);
450 }
451
Chris Lattnerc3d7cfa2008-01-18 06:52:41 +0000452 /// isScalarFPTypeInSSEReg - Return true if the specified scalar FP type is
453 /// computed in an SSE register, not on the X87 floating point stack.
454 bool isScalarFPTypeInSSEReg(MVT::ValueType VT) const {
455 return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 is when SSE2
456 (VT == MVT::f32 && X86ScalarSSEf32); // f32 is when SSE1
457 }
458
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000459 private:
460 /// Subtarget - Keep a pointer to the X86Subtarget around so that we can
461 /// make the right decision when generating code for different targets.
462 const X86Subtarget *Subtarget;
Dan Gohman1e57df32008-02-10 18:45:23 +0000463 const TargetRegisterInfo *RegInfo;
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000464
465 /// X86StackPtr - X86 physical register used as stack ptr.
466 unsigned X86StackPtr;
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000467
Dale Johannesene0e0fd02007-09-23 14:52:20 +0000468 /// X86ScalarSSEf32, X86ScalarSSEf64 - Select between SSE or x87
469 /// floating point ops.
470 /// When SSE is available, use it for f32 operations.
471 /// When SSE2 is available, use it for f64 operations.
472 bool X86ScalarSSEf32;
473 bool X86ScalarSSEf64;
Evan Cheng931a8f42008-01-29 19:34:22 +0000474
475 X86::X86_64SRet ClassifyX86_64SRetCallReturn(const Function *Fn);
476
477 void X86_64AnalyzeSRetCallOperands(SDNode*, CCAssignFn*, CCState&);
478
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000479 SDNode *LowerCallResult(SDOperand Chain, SDOperand InFlag, SDNode*TheCall,
480 unsigned CallingConv, SelectionDAG &DAG);
Evan Cheng931a8f42008-01-29 19:34:22 +0000481
482 SDNode *LowerCallResultToTwo64BitRegs(SDOperand Chain, SDOperand InFlag,
483 SDNode *TheCall, unsigned Reg1,
484 unsigned Reg2, MVT::ValueType VT,
485 SelectionDAG &DAG);
486
487 SDNode *LowerCallResultToTwoX87Regs(SDOperand Chain, SDOperand InFlag,
488 SDNode *TheCall, SelectionDAG &DAG);
Rafael Espindoladdb88da2007-08-31 15:06:30 +0000489
Rafael Espindola03cbeb72007-09-14 15:48:13 +0000490 SDOperand LowerMemArgument(SDOperand Op, SelectionDAG &DAG,
491 const CCValAssign &VA, MachineFrameInfo *MFI,
Arnold Schwaighofere2db0f42008-02-26 09:19:59 +0000492 unsigned CC, SDOperand Root, unsigned i);
Rafael Espindola03cbeb72007-09-14 15:48:13 +0000493
Rafael Espindoladdb88da2007-08-31 15:06:30 +0000494 SDOperand LowerMemOpCallTo(SDOperand Op, SelectionDAG &DAG,
495 const SDOperand &StackPtr,
496 const CCValAssign &VA, SDOperand Chain,
497 SDOperand Arg);
498
Gordon Henriksen18ace102008-01-05 16:56:59 +0000499 // Call lowering helpers.
500 bool IsCalleePop(SDOperand Op);
Arnold Schwaighofer87f75262008-02-26 22:21:54 +0000501 bool CallRequiresGOTPtrInReg(bool Is64Bit, bool IsTailCall);
502 bool CallRequiresFnAddressInReg(bool Is64Bit, bool IsTailCall);
Gordon Henriksen18ace102008-01-05 16:56:59 +0000503 CCAssignFn *CCAssignFnForNode(SDOperand Op) const;
504 NameDecorationStyle NameDecorationForFORMAL_ARGUMENTS(SDOperand Op);
Arnold Schwaighofere2d6bbb2007-10-11 19:40:01 +0000505 unsigned GetAlignedArgumentStackSize(unsigned StackSize, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000506
Chris Lattnerdfb947d2007-11-24 07:07:01 +0000507 std::pair<SDOperand,SDOperand> FP_TO_SINTHelper(SDOperand Op,
508 SelectionDAG &DAG);
509
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000510 SDOperand LowerBUILD_VECTOR(SDOperand Op, SelectionDAG &DAG);
511 SDOperand LowerVECTOR_SHUFFLE(SDOperand Op, SelectionDAG &DAG);
512 SDOperand LowerEXTRACT_VECTOR_ELT(SDOperand Op, SelectionDAG &DAG);
Nate Begemand77e59e2008-02-11 04:19:36 +0000513 SDOperand LowerEXTRACT_VECTOR_ELT_SSE4(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000514 SDOperand LowerINSERT_VECTOR_ELT(SDOperand Op, SelectionDAG &DAG);
Nate Begemand77e59e2008-02-11 04:19:36 +0000515 SDOperand LowerINSERT_VECTOR_ELT_SSE4(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000516 SDOperand LowerSCALAR_TO_VECTOR(SDOperand Op, SelectionDAG &DAG);
517 SDOperand LowerConstantPool(SDOperand Op, SelectionDAG &DAG);
518 SDOperand LowerGlobalAddress(SDOperand Op, SelectionDAG &DAG);
519 SDOperand LowerGlobalTLSAddress(SDOperand Op, SelectionDAG &DAG);
520 SDOperand LowerExternalSymbol(SDOperand Op, SelectionDAG &DAG);
521 SDOperand LowerShift(SDOperand Op, SelectionDAG &DAG);
522 SDOperand LowerSINT_TO_FP(SDOperand Op, SelectionDAG &DAG);
523 SDOperand LowerFP_TO_SINT(SDOperand Op, SelectionDAG &DAG);
524 SDOperand LowerFABS(SDOperand Op, SelectionDAG &DAG);
525 SDOperand LowerFNEG(SDOperand Op, SelectionDAG &DAG);
526 SDOperand LowerFCOPYSIGN(SDOperand Op, SelectionDAG &DAG);
Evan Cheng621216e2007-09-29 00:00:36 +0000527 SDOperand LowerSETCC(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000528 SDOperand LowerSELECT(SDOperand Op, SelectionDAG &DAG);
529 SDOperand LowerBRCOND(SDOperand Op, SelectionDAG &DAG);
530 SDOperand LowerMEMSET(SDOperand Op, SelectionDAG &DAG);
Rafael Espindolaf12f3a92007-09-28 12:53:01 +0000531 SDOperand LowerMEMCPYInline(SDOperand Dest, SDOperand Source,
532 SDOperand Chain, unsigned Size, unsigned Align,
533 SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000534 SDOperand LowerJumpTable(SDOperand Op, SelectionDAG &DAG);
535 SDOperand LowerCALL(SDOperand Op, SelectionDAG &DAG);
536 SDOperand LowerRET(SDOperand Op, SelectionDAG &DAG);
537 SDOperand LowerDYNAMIC_STACKALLOC(SDOperand Op, SelectionDAG &DAG);
538 SDOperand LowerFORMAL_ARGUMENTS(SDOperand Op, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000539 SDOperand LowerVASTART(SDOperand Op, SelectionDAG &DAG);
540 SDOperand LowerVACOPY(SDOperand Op, SelectionDAG &DAG);
541 SDOperand LowerINTRINSIC_WO_CHAIN(SDOperand Op, SelectionDAG &DAG);
542 SDOperand LowerRETURNADDR(SDOperand Op, SelectionDAG &DAG);
543 SDOperand LowerFRAMEADDR(SDOperand Op, SelectionDAG &DAG);
544 SDOperand LowerFRAME_TO_ARGS_OFFSET(SDOperand Op, SelectionDAG &DAG);
545 SDOperand LowerEH_RETURN(SDOperand Op, SelectionDAG &DAG);
Duncan Sandsd8455ca2007-07-27 20:02:49 +0000546 SDOperand LowerTRAMPOLINE(SDOperand Op, SelectionDAG &DAG);
Dan Gohman819574c2008-01-31 00:41:03 +0000547 SDOperand LowerFLT_ROUNDS_(SDOperand Op, SelectionDAG &DAG);
Evan Cheng48679f42007-12-14 02:13:44 +0000548 SDOperand LowerCTLZ(SDOperand Op, SelectionDAG &DAG);
549 SDOperand LowerCTTZ(SDOperand Op, SelectionDAG &DAG);
Andrew Lenharth81580822008-03-05 01:15:49 +0000550 SDOperand LowerLCS(SDOperand Op, SelectionDAG &DAG);
Chris Lattnerdfb947d2007-11-24 07:07:01 +0000551 SDNode *ExpandFP_TO_SINT(SDNode *N, SelectionDAG &DAG);
552 SDNode *ExpandREADCYCLECOUNTER(SDNode *N, SelectionDAG &DAG);
Andrew Lenharth81580822008-03-05 01:15:49 +0000553 SDNode *ExpandATOMIC_LCS(SDNode *N, SelectionDAG &DAG);
Dan Gohmanf17a25c2007-07-18 16:29:46 +0000554 };
555}
556
557#endif // X86ISELLOWERING_H