blob: 7cd9a157a3bbbe789700b64888e6dbbf31f8d482 [file] [log] [blame]
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +00001//===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file defines the interfaces that X86 uses to lower LLVM code into a
11// selection DAG.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef X86ISELLOWERING_H
16#define X86ISELLOWERING_H
17
Evan Cheng559806f2006-01-27 08:10:46 +000018#include "X86Subtarget.h"
Anton Korobeynikov2365f512007-07-14 14:06:15 +000019#include "X86RegisterInfo.h"
Gordon Henriksen86737662008-01-05 16:56:59 +000020#include "X86MachineFunctionInfo.h"
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000021#include "llvm/Target/TargetLowering.h"
Evan Chengddc419c2010-01-26 19:04:47 +000022#include "llvm/Target/TargetOptions.h"
Ted Kremenekb388eb82008-09-03 02:54:11 +000023#include "llvm/CodeGen/FastISel.h"
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000024#include "llvm/CodeGen/SelectionDAG.h"
Rafael Espindola1b5dcc32007-08-31 15:06:30 +000025#include "llvm/CodeGen/CallingConvLower.h"
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000026
27namespace llvm {
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000028 namespace X86ISD {
Evan Chengd9558e02006-01-06 00:43:03 +000029 // X86 Specific DAG Nodes
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000030 enum NodeType {
31 // Start the numbering where the builtin ops leave off.
Dan Gohman0ba2bcf2008-09-23 18:42:32 +000032 FIRST_NUMBER = ISD::BUILTIN_OP_END,
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000033
Evan Cheng18efe262007-12-14 02:13:44 +000034 /// BSF - Bit scan forward.
35 /// BSR - Bit scan reverse.
36 BSF,
37 BSR,
38
Evan Chenge3413162006-01-09 18:33:28 +000039 /// SHLD, SHRD - Double shift instructions. These correspond to
40 /// X86::SHLDxx and X86::SHRDxx instructions.
41 SHLD,
42 SHRD,
43
Evan Chengef6ffb12006-01-31 03:14:29 +000044 /// FAND - Bitwise logical AND of floating point values. This corresponds
45 /// to X86::ANDPS or X86::ANDPD.
46 FAND,
47
Evan Cheng68c47cb2007-01-05 07:55:56 +000048 /// FOR - Bitwise logical OR of floating point values. This corresponds
49 /// to X86::ORPS or X86::ORPD.
50 FOR,
51
Evan Cheng223547a2006-01-31 22:28:30 +000052 /// FXOR - Bitwise logical XOR of floating point values. This corresponds
53 /// to X86::XORPS or X86::XORPD.
54 FXOR,
55
Evan Cheng73d6cf12007-01-05 21:37:56 +000056 /// FSRL - Bitwise logical right shift of floating point values. This
57 /// corresponds to X86::PSRLDQ.
Evan Cheng68c47cb2007-01-05 07:55:56 +000058 FSRL,
59
Evan Chenge3de85b2006-02-04 02:20:30 +000060 /// FILD, FILD_FLAG - This instruction implements SINT_TO_FP with the
61 /// integer source in memory and FP reg result. This corresponds to the
62 /// X86::FILD*m instructions. It has three inputs (token chain, address,
63 /// and source type) and two outputs (FP value and token chain). FILD_FLAG
64 /// also produces a flag.
Evan Chenga3195e82006-01-12 22:54:21 +000065 FILD,
Evan Chenge3de85b2006-02-04 02:20:30 +000066 FILD_FLAG,
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000067
68 /// FP_TO_INT*_IN_MEM - This instruction implements FP_TO_SINT with the
69 /// integer destination in memory and a FP reg source. This corresponds
70 /// to the X86::FIST*m instructions and the rounding mode change stuff. It
Chris Lattner91897772006-10-18 18:26:48 +000071 /// has two inputs (token chain and address) and two outputs (int value
72 /// and token chain).
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000073 FP_TO_INT16_IN_MEM,
74 FP_TO_INT32_IN_MEM,
75 FP_TO_INT64_IN_MEM,
76
Evan Chengb077b842005-12-21 02:39:21 +000077 /// FLD - This instruction implements an extending load to FP stack slots.
78 /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain
Evan Cheng38bcbaf2005-12-23 07:31:11 +000079 /// operand, ptr to load from, and a ValueType node indicating the type
80 /// to load to.
Evan Chengb077b842005-12-21 02:39:21 +000081 FLD,
82
Evan Chengd90eb7f2006-01-05 00:27:02 +000083 /// FST - This instruction implements a truncating store to FP stack
84 /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a
85 /// chain operand, value to store, address, and a ValueType to store it
86 /// as.
87 FST,
88
Dan Gohman98ca4f22009-08-05 01:29:28 +000089 /// CALL - These operations represent an abstract X86 call
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +000090 /// instruction, which includes a bunch of information. In particular the
91 /// operands of these nodes are:
92 ///
93 /// #0 - The incoming token chain
94 /// #1 - The callee
95 /// #2 - The number of arg bytes the caller pushes on the stack.
96 /// #3 - The number of arg bytes the callee pops off the stack.
97 /// #4 - The value to pass in AL/AX/EAX (optional)
98 /// #5 - The value to pass in DL/DX/EDX (optional)
99 ///
100 /// The result values of these nodes are:
101 ///
102 /// #0 - The outgoing token chain
103 /// #1 - The first register result value (optional)
104 /// #2 - The second register result value (optional)
105 ///
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000106 CALL,
Dan Gohman98ca4f22009-08-05 01:29:28 +0000107
Andrew Lenharthb873ff32005-11-20 21:41:10 +0000108 /// RDTSC_DAG - This operation implements the lowering for
109 /// readcyclecounter
110 RDTSC_DAG,
Evan Cheng7df96d62005-12-17 01:21:05 +0000111
112 /// X86 compare and logical compare instructions.
Evan Cheng7d6ff3a2007-09-17 17:42:53 +0000113 CMP, COMI, UCOMI,
Evan Cheng7df96d62005-12-17 01:21:05 +0000114
Dan Gohmanc7a37d42008-12-23 22:45:23 +0000115 /// X86 bit-test instructions.
116 BT,
117
Dan Gohman2004eb62009-03-23 15:40:10 +0000118 /// X86 SetCC. Operand 0 is condition code, and operand 1 is the flag
Evan Chengd5781fc2005-12-21 20:21:51 +0000119 /// operand produced by a CMP instruction.
120 SETCC,
121
Evan Chengad9c0a32009-12-15 00:53:42 +0000122 // Same as SETCC except it's materialized with a sbb and the value is all
123 // ones or all zeros.
124 SETCC_CARRY,
125
Chris Lattner2b9f4342009-03-12 06:46:02 +0000126 /// X86 conditional moves. Operand 0 and operand 1 are the two values
127 /// to select from. Operand 2 is the condition code, and operand 3 is the
128 /// flag operand produced by a CMP or TEST instruction. It also writes a
129 /// flag result.
Evan Cheng7df96d62005-12-17 01:21:05 +0000130 CMOV,
Evan Cheng898101c2005-12-19 23:12:38 +0000131
Dan Gohman2004eb62009-03-23 15:40:10 +0000132 /// X86 conditional branches. Operand 0 is the chain operand, operand 1
133 /// is the block to branch if condition is true, operand 2 is the
134 /// condition code, and operand 3 is the flag operand produced by a CMP
Evan Chengd5781fc2005-12-21 20:21:51 +0000135 /// or TEST instruction.
Evan Cheng898101c2005-12-19 23:12:38 +0000136 BRCOND,
Evan Chengb077b842005-12-21 02:39:21 +0000137
Dan Gohman2004eb62009-03-23 15:40:10 +0000138 /// Return with a flag operand. Operand 0 is the chain operand, operand
139 /// 1 is the number of bytes of stack to pop.
Evan Chengb077b842005-12-21 02:39:21 +0000140 RET_FLAG,
Evan Cheng67f92a72006-01-11 22:15:48 +0000141
142 /// REP_STOS - Repeat fill, corresponds to X86::REP_STOSx.
143 REP_STOS,
144
145 /// REP_MOVS - Repeat move, corresponds to X86::REP_MOVSx.
146 REP_MOVS,
Evan Cheng223547a2006-01-31 22:28:30 +0000147
Evan Cheng7ccced62006-02-18 00:15:05 +0000148 /// GlobalBaseReg - On Darwin, this node represents the result of the popl
149 /// at function entry, used for PIC code.
150 GlobalBaseReg,
Evan Chenga0ea0532006-02-23 02:43:52 +0000151
Bill Wendling056292f2008-09-16 21:48:12 +0000152 /// Wrapper - A wrapper node for TargetConstantPool,
153 /// TargetExternalSymbol, and TargetGlobalAddress.
Evan Cheng020d2e82006-02-23 20:41:18 +0000154 Wrapper,
Evan Cheng48090aa2006-03-21 23:01:21 +0000155
Evan Cheng0085a282006-11-30 21:55:46 +0000156 /// WrapperRIP - Special wrapper used under X86-64 PIC mode for RIP
157 /// relative displacements.
158 WrapperRIP,
159
Mon P Wangeb38ebf2010-01-24 00:05:03 +0000160 /// MOVQ2DQ - Copies a 64-bit value from a vector to another vector.
161 /// Can be used to move a vector value from a MMX register to a XMM
162 /// register.
163 MOVQ2DQ,
164
Nate Begeman14d12ca2008-02-11 04:19:36 +0000165 /// PEXTRB - Extract an 8-bit value from a vector and zero extend it to
166 /// i32, corresponds to X86::PEXTRB.
167 PEXTRB,
168
Evan Chengb067a1e2006-03-31 19:22:53 +0000169 /// PEXTRW - Extract a 16-bit value from a vector and zero extend it to
Evan Cheng653159f2006-03-31 21:55:24 +0000170 /// i32, corresponds to X86::PEXTRW.
Evan Chengb067a1e2006-03-31 19:22:53 +0000171 PEXTRW,
Evan Cheng653159f2006-03-31 21:55:24 +0000172
Nate Begeman14d12ca2008-02-11 04:19:36 +0000173 /// INSERTPS - Insert any element of a 4 x float vector into any element
174 /// of a destination 4 x float vector.
175 INSERTPS,
176
177 /// PINSRB - Insert the lower 8-bits of a 32-bit value to a vector,
178 /// corresponds to X86::PINSRB.
179 PINSRB,
180
Evan Cheng653159f2006-03-31 21:55:24 +0000181 /// PINSRW - Insert the lower 16-bits of a 32-bit value to a vector,
182 /// corresponds to X86::PINSRW.
Chris Lattner8f2b4cc2010-02-23 02:07:48 +0000183 PINSRW, MMX_PINSRW,
Evan Cheng8ca29322006-11-10 21:43:37 +0000184
Nate Begemanb9a47b82009-02-23 08:49:38 +0000185 /// PSHUFB - Shuffle 16 8-bit values within a vector.
186 PSHUFB,
187
Evan Cheng8ca29322006-11-10 21:43:37 +0000188 /// FMAX, FMIN - Floating point max and min.
189 ///
Lauro Ramos Venanciob3a04172007-04-20 21:38:10 +0000190 FMAX, FMIN,
Dan Gohman20382522007-07-10 00:05:58 +0000191
192 /// FRSQRT, FRCP - Floating point reciprocal-sqrt and reciprocal
193 /// approximation. Note that these typically require refinement
194 /// in order to obtain suitable precision.
195 FRSQRT, FRCP,
196
Rafael Espindola094fad32009-04-08 21:14:34 +0000197 // TLSADDR - Thread Local Storage.
198 TLSADDR,
Eric Christopher30ef0e52010-06-03 04:07:48 +0000199
200 // TLSCALL - Thread Local Storage. When calling to an OS provided
201 // thunk at the address from an earlier relocation.
202 TLSCALL,
Rafael Espindola094fad32009-04-08 21:14:34 +0000203
204 // SegmentBaseAddress - The address segment:0
205 SegmentBaseAddress,
Anton Korobeynikov2365f512007-07-14 14:06:15 +0000206
Evan Cheng7e2ff772008-05-08 00:57:18 +0000207 // EH_RETURN - Exception Handling helpers.
Arnold Schwaighoferc85e1712007-10-11 19:40:01 +0000208 EH_RETURN,
209
Arnold Schwaighofer4fe30732008-03-19 16:39:45 +0000210 /// TC_RETURN - Tail call return.
211 /// operand #0 chain
212 /// operand #1 callee (register or absolute)
213 /// operand #2 stack adjustment
214 /// operand #3 optional in flag
Anton Korobeynikov45b22fa2007-11-16 01:31:51 +0000215 TC_RETURN,
216
Evan Cheng7e2ff772008-05-08 00:57:18 +0000217 // LCMPXCHG_DAG, LCMPXCHG8_DAG - Compare and swap.
Andrew Lenharth26ed8692008-03-01 21:52:34 +0000218 LCMPXCHG_DAG,
Andrew Lenharthd19189e2008-03-05 01:15:49 +0000219 LCMPXCHG8_DAG,
Andrew Lenharth26ed8692008-03-01 21:52:34 +0000220
Evan Cheng7e2ff772008-05-08 00:57:18 +0000221 // FNSTCW16m - Store FP control word into i16 memory.
222 FNSTCW16m,
223
Evan Chengd880b972008-05-09 21:53:03 +0000224 // VZEXT_MOVL - Vector move low and zero extend.
225 VZEXT_MOVL,
226
227 // VZEXT_LOAD - Load, scalar_to_vector, and zero extend.
Evan Chengf26ffe92008-05-29 08:22:04 +0000228 VZEXT_LOAD,
229
230 // VSHL, VSRL - Vector logical left / right shift.
Nate Begeman30a0de92008-07-17 16:51:19 +0000231 VSHL, VSRL,
Nate Begeman9008ca62009-04-27 18:41:29 +0000232
233 // CMPPD, CMPPS - Vector double/float comparison.
Nate Begeman30a0de92008-07-17 16:51:19 +0000234 // CMPPD, CMPPS - Vector double/float comparison.
235 CMPPD, CMPPS,
236
237 // PCMP* - Vector integer comparisons.
238 PCMPEQB, PCMPEQW, PCMPEQD, PCMPEQQ,
Bill Wendlingab55ebd2008-12-12 00:56:36 +0000239 PCMPGTB, PCMPGTW, PCMPGTD, PCMPGTQ,
240
Dan Gohman076aee32009-03-04 19:44:21 +0000241 // ADD, SUB, SMUL, UMUL, etc. - Arithmetic operations with FLAGS results.
242 ADD, SUB, SMUL, UMUL,
Dan Gohmane220c4b2009-09-18 19:59:53 +0000243 INC, DEC, OR, XOR, AND,
Evan Cheng73f24c92009-03-30 21:36:47 +0000244
245 // MUL_IMM - X86 specific multiply by immediate.
Eric Christopher71c67532009-07-29 00:28:05 +0000246 MUL_IMM,
247
248 // PTEST - Vector bitwise comparisons
Dan Gohmand6708ea2009-08-15 01:38:56 +0000249 PTEST,
250
Bruno Cardoso Lopes045573c2010-08-10 23:25:42 +0000251 // TESTP - Vector packed fp sign bitwise comparisons
252 TESTP,
253
Bruno Cardoso Lopes3157ef12010-08-20 22:55:05 +0000254 // Several flavors of instructions with vector shuffle behaviors.
255 PALIGN,
256 PSHUFD,
257 PSHUFHW,
258 PSHUFLW,
259 PSHUFHW_LD,
260 PSHUFLW_LD,
261 SHUFPD,
262 SHUFPS,
263 MOVDDUP,
264 MOVSHDUP,
265 MOVSLDUP,
266 MOVSHDUP_LD,
267 MOVSLDUP_LD,
268 MOVLHPS,
Bruno Cardoso Lopes3157ef12010-08-20 22:55:05 +0000269 MOVLHPD,
Bruno Cardoso Lopesf2db5b42010-08-31 21:15:21 +0000270 MOVHLPS,
Bruno Cardoso Lopes3157ef12010-08-20 22:55:05 +0000271 MOVHLPD,
Bruno Cardoso Lopes3157ef12010-08-20 22:55:05 +0000272 MOVSD,
273 MOVSS,
274 UNPCKLPS,
275 UNPCKLPD,
276 UNPCKHPS,
277 UNPCKHPD,
278 PUNPCKLBW,
279 PUNPCKLWD,
280 PUNPCKLDQ,
281 PUNPCKLQDQ,
282 PUNPCKHBW,
283 PUNPCKHWD,
284 PUNPCKHDQ,
285 PUNPCKHQDQ,
286
Dan Gohmand6708ea2009-08-15 01:38:56 +0000287 // VASTART_SAVE_XMM_REGS - Save xmm argument registers to the stack,
288 // according to %al. An operator is needed so that this can be expanded
289 // with control flow.
Dan Gohmanc76909a2009-09-25 20:36:54 +0000290 VASTART_SAVE_XMM_REGS,
291
Anton Korobeynikov043f3c22010-03-06 19:32:29 +0000292 // MINGW_ALLOCA - MingW's __alloca call to do stack probing.
293 MINGW_ALLOCA,
294
Dan Gohmanc76909a2009-09-25 20:36:54 +0000295 // ATOMADD64_DAG, ATOMSUB64_DAG, ATOMOR64_DAG, ATOMAND64_DAG,
296 // ATOMXOR64_DAG, ATOMNAND64_DAG, ATOMSWAP64_DAG -
297 // Atomic 64-bit binary operations.
298 ATOMADD64_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,
299 ATOMSUB64_DAG,
300 ATOMOR64_DAG,
301 ATOMXOR64_DAG,
302 ATOMAND64_DAG,
303 ATOMNAND64_DAG,
Eric Christopher9a9d2752010-07-22 02:48:34 +0000304 ATOMSWAP64_DAG,
305
306 // Memory barrier
307 MEMBARRIER,
308 MFENCE,
309 SFENCE,
310 LFENCE
Anton Korobeynikov043f3c22010-03-06 19:32:29 +0000311
312 // WARNING: Do not add anything at the end unless you want the node to
313 // have a memop! In fact, starting from ATOMADD64_DAG all opcodes will be
314 // treated as target memory ops!
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000315 };
316 }
317
Evan Cheng0d9e9762008-01-29 19:34:22 +0000318 /// Define some predicates that are used for node matching.
319 namespace X86 {
320 /// isPSHUFDMask - Return true if the specified VECTOR_SHUFFLE operand
321 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
Nate Begeman9008ca62009-04-27 18:41:29 +0000322 bool isPSHUFDMask(ShuffleVectorSDNode *N);
Evan Cheng0188ecb2006-03-22 18:59:22 +0000323
Evan Cheng0d9e9762008-01-29 19:34:22 +0000324 /// isPSHUFHWMask - Return true if the specified VECTOR_SHUFFLE operand
325 /// specifies a shuffle of elements that is suitable for input to PSHUFHW.
Nate Begeman9008ca62009-04-27 18:41:29 +0000326 bool isPSHUFHWMask(ShuffleVectorSDNode *N);
Evan Cheng506d3df2006-03-29 23:07:14 +0000327
Evan Cheng0d9e9762008-01-29 19:34:22 +0000328 /// isPSHUFLWMask - Return true if the specified VECTOR_SHUFFLE operand
329 /// specifies a shuffle of elements that is suitable for input to PSHUFLW.
Nate Begeman9008ca62009-04-27 18:41:29 +0000330 bool isPSHUFLWMask(ShuffleVectorSDNode *N);
Evan Cheng506d3df2006-03-29 23:07:14 +0000331
Evan Cheng0d9e9762008-01-29 19:34:22 +0000332 /// isSHUFPMask - Return true if the specified VECTOR_SHUFFLE operand
333 /// specifies a shuffle of elements that is suitable for input to SHUFP*.
Nate Begeman9008ca62009-04-27 18:41:29 +0000334 bool isSHUFPMask(ShuffleVectorSDNode *N);
Evan Cheng14aed5e2006-03-24 01:18:28 +0000335
Evan Cheng0d9e9762008-01-29 19:34:22 +0000336 /// isMOVHLPSMask - Return true if the specified VECTOR_SHUFFLE operand
337 /// specifies a shuffle of elements that is suitable for input to MOVHLPS.
Nate Begeman9008ca62009-04-27 18:41:29 +0000338 bool isMOVHLPSMask(ShuffleVectorSDNode *N);
Evan Cheng2c0dbd02006-03-24 02:58:06 +0000339
Evan Cheng0d9e9762008-01-29 19:34:22 +0000340 /// isMOVHLPS_v_undef_Mask - Special case of isMOVHLPSMask for canonical form
341 /// of vector_shuffle v, v, <2, 3, 2, 3>, i.e. vector_shuffle v, undef,
342 /// <2, 3, 2, 3>
Nate Begeman9008ca62009-04-27 18:41:29 +0000343 bool isMOVHLPS_v_undef_Mask(ShuffleVectorSDNode *N);
Evan Cheng6e56e2c2006-11-07 22:14:24 +0000344
Evan Cheng0d9e9762008-01-29 19:34:22 +0000345 /// isMOVLPMask - Return true if the specified VECTOR_SHUFFLE operand
Nate Begeman9008ca62009-04-27 18:41:29 +0000346 /// specifies a shuffle of elements that is suitable for MOVLP{S|D}.
347 bool isMOVLPMask(ShuffleVectorSDNode *N);
Evan Cheng5ced1d82006-04-06 23:23:56 +0000348
Evan Cheng0d9e9762008-01-29 19:34:22 +0000349 /// isMOVLHPSMask - Return true if the specified VECTOR_SHUFFLE operand
Nate Begeman9008ca62009-04-27 18:41:29 +0000350 /// specifies a shuffle of elements that is suitable for MOVHP{S|D}
Evan Cheng0d9e9762008-01-29 19:34:22 +0000351 /// as well as MOVLHPS.
Nate Begeman0b10b912009-11-07 23:17:15 +0000352 bool isMOVLHPSMask(ShuffleVectorSDNode *N);
Evan Cheng5ced1d82006-04-06 23:23:56 +0000353
Evan Cheng0d9e9762008-01-29 19:34:22 +0000354 /// isUNPCKLMask - Return true if the specified VECTOR_SHUFFLE operand
355 /// specifies a shuffle of elements that is suitable for input to UNPCKL.
Nate Begeman9008ca62009-04-27 18:41:29 +0000356 bool isUNPCKLMask(ShuffleVectorSDNode *N, bool V2IsSplat = false);
Evan Cheng0038e592006-03-28 00:39:58 +0000357
Evan Cheng0d9e9762008-01-29 19:34:22 +0000358 /// isUNPCKHMask - Return true if the specified VECTOR_SHUFFLE operand
359 /// specifies a shuffle of elements that is suitable for input to UNPCKH.
Nate Begeman9008ca62009-04-27 18:41:29 +0000360 bool isUNPCKHMask(ShuffleVectorSDNode *N, bool V2IsSplat = false);
Evan Cheng4fcb9222006-03-28 02:43:26 +0000361
Evan Cheng0d9e9762008-01-29 19:34:22 +0000362 /// isUNPCKL_v_undef_Mask - Special case of isUNPCKLMask for canonical form
363 /// of vector_shuffle v, v, <0, 4, 1, 5>, i.e. vector_shuffle v, undef,
364 /// <0, 0, 1, 1>
Nate Begeman9008ca62009-04-27 18:41:29 +0000365 bool isUNPCKL_v_undef_Mask(ShuffleVectorSDNode *N);
Evan Cheng1d5a8cc2006-04-05 07:20:06 +0000366
Evan Cheng0d9e9762008-01-29 19:34:22 +0000367 /// isUNPCKH_v_undef_Mask - Special case of isUNPCKHMask for canonical form
368 /// of vector_shuffle v, v, <2, 6, 3, 7>, i.e. vector_shuffle v, undef,
369 /// <2, 2, 3, 3>
Nate Begeman9008ca62009-04-27 18:41:29 +0000370 bool isUNPCKH_v_undef_Mask(ShuffleVectorSDNode *N);
Bill Wendling2f9bb1a2007-04-24 21:16:55 +0000371
Evan Cheng0d9e9762008-01-29 19:34:22 +0000372 /// isMOVLMask - Return true if the specified VECTOR_SHUFFLE operand
373 /// specifies a shuffle of elements that is suitable for input to MOVSS,
374 /// MOVSD, and MOVD, i.e. setting the lowest element.
Nate Begeman9008ca62009-04-27 18:41:29 +0000375 bool isMOVLMask(ShuffleVectorSDNode *N);
Evan Chengd6d1cbd2006-04-11 00:19:04 +0000376
Evan Cheng0d9e9762008-01-29 19:34:22 +0000377 /// isMOVSHDUPMask - Return true if the specified VECTOR_SHUFFLE operand
378 /// specifies a shuffle of elements that is suitable for input to MOVSHDUP.
Nate Begeman9008ca62009-04-27 18:41:29 +0000379 bool isMOVSHDUPMask(ShuffleVectorSDNode *N);
Evan Chengd9539472006-04-14 21:59:03 +0000380
Evan Cheng0d9e9762008-01-29 19:34:22 +0000381 /// isMOVSLDUPMask - Return true if the specified VECTOR_SHUFFLE operand
382 /// specifies a shuffle of elements that is suitable for input to MOVSLDUP.
Nate Begeman9008ca62009-04-27 18:41:29 +0000383 bool isMOVSLDUPMask(ShuffleVectorSDNode *N);
Evan Chengf686d9b2006-10-27 21:08:32 +0000384
Evan Cheng0b457f02008-09-25 20:50:48 +0000385 /// isMOVDDUPMask - Return true if the specified VECTOR_SHUFFLE operand
386 /// specifies a shuffle of elements that is suitable for input to MOVDDUP.
Nate Begeman9008ca62009-04-27 18:41:29 +0000387 bool isMOVDDUPMask(ShuffleVectorSDNode *N);
Evan Cheng0b457f02008-09-25 20:50:48 +0000388
Nate Begemana09008b2009-10-19 02:17:23 +0000389 /// isPALIGNRMask - Return true if the specified VECTOR_SHUFFLE operand
390 /// specifies a shuffle of elements that is suitable for input to PALIGNR.
391 bool isPALIGNRMask(ShuffleVectorSDNode *N);
392
Evan Cheng0d9e9762008-01-29 19:34:22 +0000393 /// getShuffleSHUFImmediate - Return the appropriate immediate to shuffle
394 /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUF* and SHUFP*
395 /// instructions.
396 unsigned getShuffleSHUFImmediate(SDNode *N);
Evan Cheng506d3df2006-03-29 23:07:14 +0000397
Evan Cheng0d9e9762008-01-29 19:34:22 +0000398 /// getShufflePSHUFHWImmediate - Return the appropriate immediate to shuffle
Nate Begemana09008b2009-10-19 02:17:23 +0000399 /// the specified VECTOR_SHUFFLE mask with PSHUFHW instruction.
Evan Cheng0d9e9762008-01-29 19:34:22 +0000400 unsigned getShufflePSHUFHWImmediate(SDNode *N);
Evan Cheng506d3df2006-03-29 23:07:14 +0000401
Nate Begemana09008b2009-10-19 02:17:23 +0000402 /// getShufflePSHUFLWImmediate - Return the appropriate immediate to shuffle
403 /// the specified VECTOR_SHUFFLE mask with PSHUFLW instruction.
Evan Cheng0d9e9762008-01-29 19:34:22 +0000404 unsigned getShufflePSHUFLWImmediate(SDNode *N);
Evan Cheng37b73872009-07-30 08:33:02 +0000405
Nate Begemana09008b2009-10-19 02:17:23 +0000406 /// getShufflePALIGNRImmediate - Return the appropriate immediate to shuffle
407 /// the specified VECTOR_SHUFFLE mask with the PALIGNR instruction.
408 unsigned getShufflePALIGNRImmediate(SDNode *N);
409
Evan Cheng37b73872009-07-30 08:33:02 +0000410 /// isZeroNode - Returns true if Elt is a constant zero or a floating point
411 /// constant +0.0.
412 bool isZeroNode(SDValue Elt);
Anton Korobeynikovb5e01722009-08-05 23:01:26 +0000413
414 /// isOffsetSuitableForCodeModel - Returns true if the given offset can
415 /// fit into the displacement field of the instruction.
416 bool isOffsetSuitableForCodeModel(int64_t Offset, CodeModel::Model M,
417 bool hasSymbolicDisplacement = true);
Evan Cheng0d9e9762008-01-29 19:34:22 +0000418 }
419
Chris Lattner91897772006-10-18 18:26:48 +0000420 //===--------------------------------------------------------------------===//
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000421 // X86TargetLowering - X86 Implementation of the TargetLowering interface
422 class X86TargetLowering : public TargetLowering {
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000423 public:
Dan Gohmanc9f5f3f2008-05-14 01:58:56 +0000424 explicit X86TargetLowering(X86TargetMachine &TM);
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000425
Chris Lattner589c6f62010-01-26 06:28:43 +0000426 /// getPICBaseSymbol - Return the X86-32 PIC base.
427 MCSymbol *getPICBaseSymbol(const MachineFunction *MF, MCContext &Ctx) const;
428
Chris Lattnerc64daab2010-01-26 05:02:42 +0000429 virtual unsigned getJumpTableEncoding() const;
Chris Lattner5e1df8d2010-01-25 23:38:14 +0000430
Chris Lattnerc64daab2010-01-26 05:02:42 +0000431 virtual const MCExpr *
432 LowerCustomJumpTableEntry(const MachineJumpTableInfo *MJTI,
433 const MachineBasicBlock *MBB, unsigned uid,
434 MCContext &Ctx) const;
435
Evan Chengcc415862007-11-09 01:32:10 +0000436 /// getPICJumpTableRelocBase - Returns relocation base for the given PIC
437 /// jumptable.
Chris Lattnerc64daab2010-01-26 05:02:42 +0000438 virtual SDValue getPICJumpTableRelocBase(SDValue Table,
439 SelectionDAG &DAG) const;
Chris Lattner589c6f62010-01-26 06:28:43 +0000440 virtual const MCExpr *
441 getPICJumpTableRelocBaseExpr(const MachineFunction *MF,
442 unsigned JTI, MCContext &Ctx) const;
443
Chris Lattner54e3efd2007-02-26 04:01:25 +0000444 /// getStackPtrReg - Return the stack pointer register we are using: either
445 /// ESP or RSP.
446 unsigned getStackPtrReg() const { return X86StackPtr; }
Evan Cheng29286502008-01-23 23:17:41 +0000447
448 /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
449 /// function arguments in the caller parameter area. For X86, aggregates
450 /// that contain SSE vectors are placed at 16-byte boundaries while the rest are at
451 /// 4-byte boundaries.
452 virtual unsigned getByValTypeAlignment(const Type *Ty) const;
Evan Chengf0df0312008-05-15 08:39:06 +0000453
454 /// getOptimalMemOpType - Returns the target specific optimal type for load
Evan Chengf28f8bc2010-04-02 19:36:14 +0000455 /// and store operations as a result of memset, memcpy, and memmove
456 /// lowering. If DstAlign is zero that means the destination
457 /// alignment can satisfy any constraint. Similarly if SrcAlign is zero it
458 /// means there isn't a need to check it against alignment requirement,
459 /// probably because the source does not need to be loaded. If
460 /// 'NonScalarIntSafe' is true, that means it's safe to return a
461 /// non-scalar-integer type, e.g. empty string source, constant, or loaded
Evan Chengc3b0c342010-04-08 07:37:57 +0000462 /// from memory. 'MemcpyStrSrc' indicates whether the memcpy source is
463 /// constant so it does not need to be loaded.
Dan Gohman37f32ee2010-04-16 20:11:05 +0000464 /// It returns MVT::Other if the type should be determined using generic
465 /// target-independent logic.
Evan Chengf28f8bc2010-04-02 19:36:14 +0000466 virtual EVT
Evan Chengc3b0c342010-04-08 07:37:57 +0000467 getOptimalMemOpType(uint64_t Size, unsigned DstAlign, unsigned SrcAlign,
468 bool NonScalarIntSafe, bool MemcpyStrSrc,
Dan Gohman37f32ee2010-04-16 20:11:05 +0000469 MachineFunction &MF) const;
Bill Wendlingaf566342009-08-15 21:21:19 +0000470
471 /// allowsUnalignedMemoryAccesses - Returns true if the target allows
472 /// unaligned memory accesses of the specified type.
473 virtual bool allowsUnalignedMemoryAccesses(EVT VT) const {
474 return true;
475 }
Bill Wendling20c568f2009-06-30 22:38:32 +0000476
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000477 /// LowerOperation - Provide custom lowering hooks for some operations.
478 ///
Dan Gohmand858e902010-04-17 15:26:15 +0000479 virtual SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const;
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000480
Duncan Sands1607f052008-12-01 11:39:25 +0000481 /// ReplaceNodeResults - Replace the results of node with an illegal result
482 /// type with new values built out of custom code.
Chris Lattner27a6c732007-11-24 07:07:01 +0000483 ///
Duncan Sands1607f052008-12-01 11:39:25 +0000484 virtual void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue>&Results,
Dan Gohmand858e902010-04-17 15:26:15 +0000485 SelectionDAG &DAG) const;
Chris Lattner27a6c732007-11-24 07:07:01 +0000486
487
Dan Gohman475871a2008-07-27 21:46:04 +0000488 virtual SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const;
Evan Cheng206ee9d2006-07-07 08:33:52 +0000489
Evan Chenge5b51ac2010-04-17 06:13:15 +0000490 /// isTypeDesirableForOp - Return true if the target has native support for
491 /// the specified value type and it is 'desirable' to use the type for the
492 /// given node type. e.g. On x86 i16 is legal, but undesirable since i16
493 /// instruction encodings are longer and some i16 instructions are slow.
494 virtual bool isTypeDesirableForOp(unsigned Opc, EVT VT) const;
495
496 /// IsDesirableToPromoteOp - Return true if the target has native support for the
497 /// specified value type and it is 'desirable' to use the type. e.g. On x86
498 /// i16 is legal, but undesirable since i16 instruction encodings are longer
499 /// and some i16 instructions are slow.
500 virtual bool IsDesirableToPromoteOp(SDValue Op, EVT &PVT) const;
Evan Cheng64b7bf72010-04-16 06:14:10 +0000501
Dan Gohmanaf1d8ca2010-05-01 00:01:06 +0000502 virtual MachineBasicBlock *
503 EmitInstrWithCustomInserter(MachineInstr *MI,
504 MachineBasicBlock *MBB) const;
Evan Cheng4a460802006-01-11 00:33:36 +0000505
Mon P Wang63307c32008-05-05 19:05:59 +0000506
Evan Cheng72261582005-12-20 06:22:03 +0000507 /// getTargetNodeName - This method returns the name of a target specific
508 /// DAG node.
509 virtual const char *getTargetNodeName(unsigned Opcode) const;
510
Scott Michel5b8f82e2008-03-10 15:42:14 +0000511 /// getSetCCResultType - Return the ISD::SETCC ValueType
Owen Anderson825b72b2009-08-11 20:47:22 +0000512 virtual MVT::SimpleValueType getSetCCResultType(EVT VT) const;
Scott Michel5b8f82e2008-03-10 15:42:14 +0000513
Nate Begeman368e18d2006-02-16 21:11:51 +0000514 /// computeMaskedBitsForTargetNode - Determine which of the bits specified
515 /// in Mask are known to be either zero or one and return them in the
516 /// KnownZero/KnownOne bitsets.
Dan Gohman475871a2008-07-27 21:46:04 +0000517 virtual void computeMaskedBitsForTargetNode(const SDValue Op,
Dan Gohman977a76f2008-02-13 22:28:48 +0000518 const APInt &Mask,
Dan Gohmanfd29e0e2008-02-13 00:35:47 +0000519 APInt &KnownZero,
520 APInt &KnownOne,
Dan Gohmanea859be2007-06-22 14:59:07 +0000521 const SelectionDAG &DAG,
Nate Begeman368e18d2006-02-16 21:11:51 +0000522 unsigned Depth = 0) const;
Evan Chengad4196b2008-05-12 19:56:52 +0000523
524 virtual bool
Dan Gohman46510a72010-04-15 01:51:59 +0000525 isGAPlusOffset(SDNode *N, const GlobalValue* &GA, int64_t &Offset) const;
Nate Begeman368e18d2006-02-16 21:11:51 +0000526
Dan Gohmand858e902010-04-17 15:26:15 +0000527 SDValue getReturnAddressFrameIndex(SelectionDAG &DAG) const;
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000528
Chris Lattnerb8105652009-07-20 17:51:36 +0000529 virtual bool ExpandInlineAsm(CallInst *CI) const;
530
Chris Lattner4234f572007-03-25 02:14:49 +0000531 ConstraintType getConstraintType(const std::string &Constraint) const;
Chris Lattnerf4dff842006-07-11 02:54:03 +0000532
Chris Lattner259e97c2006-01-31 19:43:35 +0000533 std::vector<unsigned>
Chris Lattner1efa40f2006-02-22 00:56:39 +0000534 getRegClassForInlineAsmConstraint(const std::string &Constraint,
Owen Andersone50ed302009-08-10 22:56:29 +0000535 EVT VT) const;
Chris Lattner48884cd2007-08-25 00:47:38 +0000536
Owen Andersone50ed302009-08-10 22:56:29 +0000537 virtual const char *LowerXConstraint(EVT ConstraintVT) const;
Dale Johannesenba2a0b92008-01-29 02:21:21 +0000538
Chris Lattner48884cd2007-08-25 00:47:38 +0000539 /// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
Evan Chengda43bcf2008-09-24 00:05:32 +0000540 /// vector. If it is invalid, don't add anything to Ops. If hasMemory is
541 /// true it means one of the asm constraints of the inline asm instruction
542 /// being processed is 'm'.
Dan Gohman475871a2008-07-27 21:46:04 +0000543 virtual void LowerAsmOperandForConstraint(SDValue Op,
Chris Lattner48884cd2007-08-25 00:47:38 +0000544 char ConstraintLetter,
Dan Gohman475871a2008-07-27 21:46:04 +0000545 std::vector<SDValue> &Ops,
Chris Lattner5e764232008-04-26 23:02:14 +0000546 SelectionDAG &DAG) const;
Chris Lattner22aaf1d2006-10-31 20:13:11 +0000547
Chris Lattner91897772006-10-18 18:26:48 +0000548 /// getRegForInlineAsmConstraint - Given a physical register constraint
549 /// (e.g. {edx}), return the register number and the register class for the
550 /// register. This should only be used for C_Register constraints. On
551 /// error, this returns a register number of 0.
Chris Lattnerf76d1802006-07-31 23:26:50 +0000552 std::pair<unsigned, const TargetRegisterClass*>
553 getRegForInlineAsmConstraint(const std::string &Constraint,
Owen Andersone50ed302009-08-10 22:56:29 +0000554 EVT VT) const;
Chris Lattnerf76d1802006-07-31 23:26:50 +0000555
Chris Lattnerc9addb72007-03-30 23:15:24 +0000556 /// isLegalAddressingMode - Return true if the addressing mode represented
557 /// by AM is legal for this target, for a load/store of the specified type.
/// AM is the addressing mode to test; Ty is the type being loaded or stored.
558 virtual bool isLegalAddressingMode(const AddrMode &AM, const Type *Ty)const;
559
Evan Cheng2bd122c2007-10-26 01:56:11 +0000560 /// isTruncateFree - Return true if it's free to truncate a value of
561 /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate an i32 value in
562 /// register EAX to i16 by referencing its sub-register AX.
/// Two overloads are declared: one taking Type pointers and one taking EVTs.
563 virtual bool isTruncateFree(const Type *Ty1, const Type *Ty2) const;
Owen Andersone50ed302009-08-10 22:56:29 +0000564 virtual bool isTruncateFree(EVT VT1, EVT VT2) const;
Dan Gohman97121ba2009-04-08 00:15:30 +0000565
566 /// isZExtFree - Return true if any actual instruction that defines a
567 /// value of type Ty1 implicitly zero-extends the value to Ty2 in the result
568 /// register. This does not necessarily include registers defined in
569 /// unknown ways, such as incoming arguments, or copies from unknown
570 /// virtual registers. Also, if isTruncateFree(Ty2, Ty1) is true, this
571 /// does not necessarily apply to truncate instructions. e.g. on x86-64,
572 /// all instructions that define 32-bit values implicitly zero-extend the
573 /// result out to 64 bits.
/// Two overloads are declared: one taking Type pointers and one taking EVTs.
574 virtual bool isZExtFree(const Type *Ty1, const Type *Ty2) const;
Owen Andersone50ed302009-08-10 22:56:29 +0000575 virtual bool isZExtFree(EVT VT1, EVT VT2) const;
Dan Gohman97121ba2009-04-08 00:15:30 +0000576
Evan Cheng8b944d32009-05-28 00:35:15 +0000577 /// isNarrowingProfitable - Return true if it's profitable to narrow
578 /// operations of type VT1 to VT2. e.g. on x86, it's profitable to narrow
579 /// from i32 to i8 but not from i32 to i16.
/// VT1 is the type being narrowed from; VT2 is the type being narrowed to.
Owen Andersone50ed302009-08-10 22:56:29 +0000580 virtual bool isNarrowingProfitable(EVT VT1, EVT VT2) const;
Evan Cheng8b944d32009-05-28 00:35:15 +0000581
Evan Chengeb2f9692009-10-27 19:56:55 +0000582 /// isFPImmLegal - Returns true if the target can instruction select the
583 /// specified FP immediate natively. If false, the legalizer will
584 /// materialize the FP immediate as a load from a constant pool.
/// Imm is the immediate being queried; VT is the value type passed with it.
Evan Chenga1eaa3c2009-10-28 01:43:28 +0000585 virtual bool isFPImmLegal(const APFloat &Imm, EVT VT) const;
Evan Chengeb2f9692009-10-27 19:56:55 +0000586
Evan Cheng0188ecb2006-03-22 18:59:22 +0000587 /// isShuffleMaskLegal - Targets can use this to indicate that they only
588 /// support *some* VECTOR_SHUFFLE operations, those with specific masks.
Chris Lattner91897772006-10-18 18:26:48 +0000589 /// By default, if a target supports the VECTOR_SHUFFLE node, all mask
590 /// values are assumed to be legal.
/// Mask is supplied as a vector of ints and VT is the value type to check.
Nate Begeman5a5ca152009-04-29 05:20:52 +0000591 virtual bool isShuffleMaskLegal(const SmallVectorImpl<int> &Mask,
Owen Andersone50ed302009-08-10 22:56:29 +0000592 EVT VT) const;
Evan Cheng39623da2006-04-20 08:58:49 +0000593
594 /// isVectorClearMaskLegal - Similar to isShuffleMaskLegal. Targets
595 /// can use this to indicate if there is a suitable
596 /// VECTOR_SHUFFLE that can be used to replace a VAND with a constant
597 /// pool entry.
Nate Begeman5a5ca152009-04-29 05:20:52 +0000598 virtual bool isVectorClearMaskLegal(const SmallVectorImpl<int> &Mask,
Owen Andersone50ed302009-08-10 22:56:29 +0000599 EVT VT) const;
Evan Cheng6fd599f2008-03-05 01:30:59 +0000600
601 /// ShouldShrinkFPConstant - If true, then instruction selection should
602 /// seek to shrink the FP constant of the specified type to a smaller type
603 /// in order to save space and / or reduce runtime.
/// Returns true when X86ScalarSSEf64 is false, or when VT is f80.
Owen Andersone50ed302009-08-10 22:56:29 +0000604 virtual bool ShouldShrinkFPConstant(EVT VT) const {
Evan Cheng6fd599f2008-03-05 01:30:59 +0000605 // Don't shrink FP constant pool entries if SSE2 is available, since cvtss2sd
606 // is more expensive than a straight movsd. On the other hand, it's important
607 // to shrink long double FP constants, since fldt is very slow.
Owen Anderson825b72b2009-08-11 20:47:22 +0000608 return !X86ScalarSSEf64 || VT == MVT::f80;
Evan Cheng6fd599f2008-03-05 01:30:59 +0000609 }
Arnold Schwaighoferc85e1712007-10-11 19:40:01 +0000610
/// getSubtarget - Return the X86Subtarget pointer stored in the Subtarget
/// member. The pointee is const.
Dan Gohman419e4f92010-05-11 16:21:03 +0000611 const X86Subtarget* getSubtarget() const {
Dan Gohman707e0182008-04-12 04:36:06 +0000612 return Subtarget;
Rafael Espindolaf1ba1ca2007-11-05 23:12:20 +0000613 }
614
Chris Lattner3d661852008-01-18 06:52:41 +0000615 /// isScalarFPTypeInSSEReg - Return true if the specified scalar FP type is
616 /// computed in an SSE register, not on the X87 floating point stack.
/// True for f64 when X86ScalarSSEf64 is set, and for f32 when
/// X86ScalarSSEf32 is set; false for every other type.
Owen Andersone50ed302009-08-10 22:56:29 +0000617 bool isScalarFPTypeInSSEReg(EVT VT) const {
Owen Anderson825b72b2009-08-11 20:47:22 +0000618 return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 uses SSE when SSE2 is available
619 (VT == MVT::f32 && X86ScalarSSEf32); // f32 uses SSE when SSE1 is available
Chris Lattner3d661852008-01-18 06:52:41 +0000620 }
Dan Gohmand9f3c482008-08-19 21:32:53 +0000621
622 /// createFastISel - This method returns a target specific FastISel object,
623 /// or null if the target does not support "fast" ISel.
/// funcInfo is the FunctionLoweringInfo passed in by non-const reference.
Dan Gohmana4160c32010-07-07 16:29:44 +0000624 virtual FastISel *createFastISel(FunctionLoweringInfo &funcInfo) const;
Bill Wendling20c568f2009-06-30 22:38:32 +0000625
Bill Wendlingb4202b82009-07-01 18:50:55 +0000626 /// getFunctionAlignment - Return the Log2 alignment of this function.
/// F is the function being queried. The result is a log2 value, not a byte
/// count.
Bill Wendling20c568f2009-06-30 22:38:32 +0000627 virtual unsigned getFunctionAlignment(const Function *F) const;
628
/// getRegPressureLimit - Return an unsigned limit for register class RC in
/// machine function MF.
/// NOTE(review): presumably a register pressure threshold; the units and the
/// consumer are not visible in this header, so confirm against the definition.
Evan Cheng70017e42010-07-24 00:39:05 +0000629 unsigned getRegPressureLimit(const TargetRegisterClass *RC,
630 MachineFunction &MF) const;
631
Eric Christopherf7a0c7b2010-07-06 05:18:56 +0000632 /// getStackCookieLocation - Return true if the target stores stack
633 /// protector cookies at a fixed offset in some non-standard address
634 /// space, and populates the address space and offset as
635 /// appropriate.
/// AddressSpace and Offset are outputs, taken by non-const reference.
636 virtual bool getStackCookieLocation(unsigned &AddressSpace, unsigned &Offset) const;
637
Evan Chengdee81012010-07-26 21:50:05 +0000638 protected:
/// findRepresentativeClass - Given a value type, return a pair of a register
/// class pointer and a uint8_t.
/// NOTE(review): the meaning of the uint8_t (presumably a cost) is not
/// visible in this header; confirm against the definition.
639 std::pair<const TargetRegisterClass*, uint8_t>
640 findRepresentativeClass(EVT VT) const;
641
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000642 private:
Evan Cheng0db9fe62006-04-25 20:13:52 +0000643 /// Subtarget - Keep a pointer to the X86Subtarget around so that we can
644 /// make the right decision when generating code for different targets.
645 const X86Subtarget *Subtarget;
/// RegInfo - Pointer to a const X86RegisterInfo.
Dan Gohmanc9f5f3f2008-05-14 01:58:56 +0000646 const X86RegisterInfo *RegInfo;
/// TD - Pointer to a const TargetData.
Anton Korobeynikovbff66b02008-09-09 18:22:57 +0000647 const TargetData *TD;
Evan Cheng0db9fe62006-04-25 20:13:52 +0000648
Evan Cheng25ab6902006-09-08 06:48:29 +0000649 /// X86StackPtr - X86 physical register used as stack ptr, held as an
/// unsigned value.
650 unsigned X86StackPtr;
Arnold Schwaighoferc85e1712007-10-11 19:40:01 +0000651
Dale Johannesenf1fc3a82007-09-23 14:52:20 +0000652 /// X86ScalarSSEf32, X86ScalarSSEf64 - Select between SSE and x87
653 /// floating point ops.
654 /// When SSE is available, use it for f32 operations (X86ScalarSSEf32).
655 /// When SSE2 is available, use it for f64 operations (X86ScalarSSEf64).
656 bool X86ScalarSSEf32;
657 bool X86ScalarSSEf64;
Evan Cheng0d9e9762008-01-29 19:34:22 +0000658
Evan Chengeb2f9692009-10-27 19:56:55 +0000659 /// LegalFPImmediates - A list of legal fp immediates, filled in through
/// addLegalFPImmediate.
660 std::vector<APFloat> LegalFPImmediates;
661
662 /// addLegalFPImmediate - Indicate that this x86 target can instruction
663 /// select the specified FP immediate natively.
/// Appends a copy of Imm to LegalFPImmediates; no duplicate check is done.
664 void addLegalFPImmediate(const APFloat& Imm) {
665 LegalFPImmediates.push_back(Imm);
666 }
667
/// LowerCallResult - Private helper returning an SDValue. It takes the chain
/// and an incoming flag value, the calling convention, the vararg flag, the
/// input-argument descriptors (Ins), a debug location and the DAG.
/// InVals is taken by non-const reference, so the helper can write to it.
/// NOTE(review): presumably this lowers the values produced by a call;
/// confirm against the definition.
Dan Gohman98ca4f22009-08-05 01:29:28 +0000668 SDValue LowerCallResult(SDValue Chain, SDValue InFlag,
Sandeep Patel65c3c8f2009-09-02 08:44:58 +0000669 CallingConv::ID CallConv, bool isVarArg,
Dan Gohman98ca4f22009-08-05 01:29:28 +0000670 const SmallVectorImpl<ISD::InputArg> &Ins,
671 DebugLoc dl, SelectionDAG &DAG,
Dan Gohmand858e902010-04-17 15:26:15 +0000672 SmallVectorImpl<SDValue> &InVals) const;
/// LowerMemArgument - Private helper returning an SDValue. It takes the
/// chain, the calling convention, the argument descriptors (ArgInfo), a debug
/// location, the DAG, a CCValAssign, a MachineFrameInfo pointer and an
/// unsigned index i.
/// NOTE(review): presumably i indexes into ArgInfo and the result is the
/// value of an argument passed in memory; confirm against the definition.
Dan Gohman98ca4f22009-08-05 01:29:28 +0000673 SDValue LowerMemArgument(SDValue Chain,
Sandeep Patel65c3c8f2009-09-02 08:44:58 +0000674 CallingConv::ID CallConv,
Dan Gohman98ca4f22009-08-05 01:29:28 +0000675 const SmallVectorImpl<ISD::InputArg> &ArgInfo,
676 DebugLoc dl, SelectionDAG &DAG,
677 const CCValAssign &VA, MachineFrameInfo *MFI,
Dan Gohmand858e902010-04-17 15:26:15 +0000678 unsigned i) const;
/// LowerMemOpCallTo - Private helper returning an SDValue. It takes the
/// chain, a stack pointer value, the argument value, a debug location, the
/// DAG, a CCValAssign and the argument flags.
/// NOTE(review): presumably this stores an outgoing call argument to its
/// stack slot; confirm against the definition.
Dan Gohman98ca4f22009-08-05 01:29:28 +0000679 SDValue LowerMemOpCallTo(SDValue Chain, SDValue StackPtr, SDValue Arg,
680 DebugLoc dl, SelectionDAG &DAG,
681 const CCValAssign &VA,
Dan Gohmand858e902010-04-17 15:26:15 +0000682 ISD::ArgFlagsTy Flags) const;
Rafael Espindola1b5dcc32007-08-31 15:06:30 +0000683
Gordon Henriksen86737662008-01-05 16:56:59 +0000684 // Call lowering helpers.
Evan Cheng0c439eb2010-01-27 00:07:07 +0000685
686 /// IsEligibleForTailCallOptimization - Check whether the call is eligible
687 /// for tail call optimization. Targets which want to do tail call
688 /// optimization should implement this function.
/// Inputs are the callee, its calling convention, the vararg flag, struct
/// return flags for both callee and caller, the outgoing argument
/// descriptors and values (Outs, OutVals), the incoming argument descriptors
/// (Ins) and the DAG.
Evan Cheng022d9e12010-02-02 23:55:14 +0000689 bool IsEligibleForTailCallOptimization(SDValue Callee,
Evan Cheng0c439eb2010-01-27 00:07:07 +0000690 CallingConv::ID CalleeCC,
691 bool isVarArg,
Evan Chenga375d472010-03-15 18:54:48 +0000692 bool isCalleeStructRet,
693 bool isCallerStructRet,
Evan Chengb1712452010-01-27 06:25:16 +0000694 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanc9403652010-07-07 15:54:55 +0000695 const SmallVectorImpl<SDValue> &OutVals,
Evan Chengb1712452010-01-27 06:25:16 +0000696 const SmallVectorImpl<ISD::InputArg> &Ins,
Evan Cheng0c439eb2010-01-27 00:07:07 +0000697 SelectionDAG& DAG) const;
/// IsCalleePop - Boolean query on a vararg flag and a calling convention.
/// NOTE(review): presumably true when the callee pops its own arguments off
/// the stack; confirm against the definition.
Dan Gohmand858e902010-04-17 15:26:15 +0000698 bool IsCalleePop(bool isVarArg, CallingConv::ID CallConv) const;
/// EmitTailCallLoadRetAddr - Private helper returning an SDValue.
/// OutRetAddr is taken by non-const reference, so the helper can write to it.
/// NOTE(review): presumably this loads the return address for a tail call and
/// FPDiff is a frame-pointer delta; confirm against the definition.
Dan Gohman475871a2008-07-27 21:46:04 +0000699 SDValue EmitTailCallLoadRetAddr(SelectionDAG &DAG, SDValue &OutRetAddr,
700 SDValue Chain, bool IsTailCall, bool Is64Bit,
Dan Gohmand858e902010-04-17 15:26:15 +0000701 int FPDiff, DebugLoc dl) const;
Arnold Schwaighofer4b5324a2008-04-12 18:11:06 +0000702
/// CCAssignFnForNode - Return a CCAssignFn pointer for the given calling
/// convention.
/// NOTE(review): how the function is selected is not visible in this header.
Sandeep Patel65c3c8f2009-09-02 08:44:58 +0000703 CCAssignFn *CCAssignFnForNode(CallingConv::ID CallConv) const;
/// GetAlignedArgumentStackSize - Take a stack size and return an unsigned
/// value.
/// NOTE(review): presumably StackSize rounded up to the required stack
/// alignment; the alignment rule is not visible in this header.
Dan Gohmand858e902010-04-17 15:26:15 +0000704 unsigned GetAlignedArgumentStackSize(unsigned StackSize,
705 SelectionDAG &DAG) const;
Evan Cheng559806f2006-01-27 08:10:46 +0000706
/// FP_TO_INTHelper - Private helper that returns a pair of SDValues for the
/// operation Op. isSigned selects between the signed and unsigned variant.
/// NOTE(review): the meaning of each pair element is not visible in this
/// header; confirm against the definition.
Eli Friedman948e95a2009-05-23 09:59:16 +0000707 std::pair<SDValue,SDValue> FP_TO_INTHelper(SDValue Op, SelectionDAG &DAG,
Dan Gohmand858e902010-04-17 15:26:15 +0000708 bool isSigned) const;
Evan Chengc3630942009-12-09 21:00:30 +0000709
/// Vector lowering helpers. Each takes the value being lowered plus the
/// SelectionDAG and returns an SDValue. LowerAsSplatVectorLoad additionally
/// takes a value type and a debug location.
/// NOTE(review): the suffixes look like ISD opcode names; the actual lowering
/// rules live in the definitions, which are not in this header.
710 SDValue LowerAsSplatVectorLoad(SDValue SrcOp, EVT VT, DebugLoc dl,
Dan Gohmand858e902010-04-17 15:26:15 +0000711 SelectionDAG &DAG) const;
712 SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const;
713 SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const;
714 SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) const;
715 SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
716 SDValue LowerEXTRACT_VECTOR_ELT_SSE4(SDValue Op, SelectionDAG &DAG) const;
717 SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
718 SDValue LowerINSERT_VECTOR_ELT_SSE4(SDValue Op, SelectionDAG &DAG) const;
719 SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) const;
/// Address lowering helpers. Each returns an SDValue. LowerGlobalAddress has
/// two overloads: one taking the node as an SDValue, and one taking the
/// GlobalValue, a debug location and an int64_t offset directly.
/// NOTE(review): names suggest one helper per kind of address node; confirm
/// against the definitions.
720 SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const;
721 SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const;
Dale Johannesen33c960f2009-02-04 20:06:27 +0000722 SDValue LowerGlobalAddress(const GlobalValue *GV, DebugLoc dl,
723 int64_t Offset, SelectionDAG &DAG) const;
Dan Gohmand858e902010-04-17 15:26:15 +0000724 SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;
725 SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const;
726 SDValue LowerExternalSymbol(SDValue Op, SelectionDAG &DAG) const;
/// LowerShift - Takes the node being lowered and the DAG, returns an SDValue.
/// NOTE(review): which shift opcodes are routed here is not visible in this
/// header.
727 SDValue LowerShift(SDValue Op, SelectionDAG &DAG) const;
/// BuildFILD - Private helper returning an SDValue. It takes an operation,
/// a source value type, a chain, a stack slot value and the DAG.
/// NOTE(review): presumably builds an x87 FILD load from StackSlot; confirm
/// against the definition.
Owen Andersone50ed302009-08-10 22:56:29 +0000728 SDValue BuildFILD(SDValue Op, EVT SrcVT, SDValue Chain, SDValue StackSlot,
Dan Gohmand858e902010-04-17 15:26:15 +0000729 SelectionDAG &DAG) const;
/// Conversion and floating point lowering helpers. Each takes the node being
/// lowered plus the SelectionDAG and returns an SDValue.
/// NOTE(review): the _i64 and _i32 variants of LowerUINT_TO_FP presumably
/// handle those source widths; confirm against the definitions.
Dale Johannesen7d07b482010-05-21 00:52:33 +0000730 SDValue LowerBIT_CONVERT(SDValue op, SelectionDAG &DAG) const;
Dan Gohmand858e902010-04-17 15:26:15 +0000731 SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
732 SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
733 SDValue LowerUINT_TO_FP_i64(SDValue Op, SelectionDAG &DAG) const;
734 SDValue LowerUINT_TO_FP_i32(SDValue Op, SelectionDAG &DAG) const;
735 SDValue LowerFP_TO_SINT(SDValue Op, SelectionDAG &DAG) const;
736 SDValue LowerFP_TO_UINT(SDValue Op, SelectionDAG &DAG) const;
737 SDValue LowerFABS(SDValue Op, SelectionDAG &DAG) const;
738 SDValue LowerFNEG(SDValue Op, SelectionDAG &DAG) const;
739 SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) const;
/// LowerToBT - Private helper returning an SDValue. It takes a value named
/// And, an ISD condition code, a debug location and the DAG.
/// NOTE(review): presumably tries to turn an AND-based test into an x86 BT
/// node; the failure result is not visible in this header.
Evan Cheng5528e7b2010-04-21 01:47:12 +0000740 SDValue LowerToBT(SDValue And, ISD::CondCode CC,
741 DebugLoc dl, SelectionDAG &DAG) const;
/// Comparison, select and branch lowering helpers. Each takes the node being
/// lowered plus the SelectionDAG and returns an SDValue.
/// NOTE(review): semantics live in the definitions, not in this header.
Dan Gohmand858e902010-04-17 15:26:15 +0000742 SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG) const;
743 SDValue LowerVSETCC(SDValue Op, SelectionDAG &DAG) const;
744 SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG) const;
745 SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
/// Memory, jump table, stack allocation and varargs lowering helpers. Each
/// takes the node being lowered plus the SelectionDAG and returns an SDValue.
/// NOTE(review): semantics live in the definitions, not in this header.
746 SDValue LowerMEMSET(SDValue Op, SelectionDAG &DAG) const;
747 SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG) const;
748 SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
749 SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const;
750 SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const;
751 SDValue LowerVACOPY(SDValue Op, SelectionDAG &DAG) const;
/// Intrinsic, frame, exception handling and trampoline lowering helpers.
/// Each takes the node being lowered plus the SelectionDAG and returns an
/// SDValue.
/// NOTE(review): semantics live in the definitions, not in this header.
752 SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
753 SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
754 SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const;
755 SDValue LowerFRAME_TO_ARGS_OFFSET(SDValue Op, SelectionDAG &DAG) const;
756 SDValue LowerEH_RETURN(SDValue Op, SelectionDAG &DAG) const;
757 SDValue LowerTRAMPOLINE(SDValue Op, SelectionDAG &DAG) const;
758 SDValue LowerFLT_ROUNDS_(SDValue Op, SelectionDAG &DAG) const;
/// Bit counting, multiply, shift and overflow arithmetic lowering helpers.
/// Each takes the node being lowered plus the SelectionDAG and returns an
/// SDValue.
/// NOTE(review): semantics live in the definitions, not in this header.
759 SDValue LowerCTLZ(SDValue Op, SelectionDAG &DAG) const;
760 SDValue LowerCTTZ(SDValue Op, SelectionDAG &DAG) const;
761 SDValue LowerMUL_V2I64(SDValue Op, SelectionDAG &DAG) const;
Nate Begemanbdcb5af2010-07-27 22:37:06 +0000762 SDValue LowerSHL(SDValue Op, SelectionDAG &DAG) const;
Dan Gohmand858e902010-04-17 15:26:15 +0000763 SDValue LowerXALUO(SDValue Op, SelectionDAG &DAG) const;
Bill Wendling41ea7e72008-11-24 19:21:46 +0000764
/// Atomic, cycle counter and memory barrier lowering helpers. Each takes the
/// node being lowered plus the SelectionDAG and returns an SDValue.
/// NOTE(review): semantics live in the definitions, not in this header.
Dan Gohmand858e902010-04-17 15:26:15 +0000765 SDValue LowerCMP_SWAP(SDValue Op, SelectionDAG &DAG) const;
766 SDValue LowerLOAD_SUB(SDValue Op, SelectionDAG &DAG) const;
767 SDValue LowerREADCYCLECOUNTER(SDValue Op, SelectionDAG &DAG) const;
Eric Christopher9a9d2752010-07-22 02:48:34 +0000768 SDValue LowerMEMBARRIER(SDValue Op, SelectionDAG &DAG) const;
Duncan Sands1607f052008-12-01 11:39:25 +0000769
Bruno Cardoso Lopesbf8154a2010-08-21 01:32:18 +0000770 // Utility functions to help LowerVECTOR_SHUFFLE.
// NOTE(review): the v8i16 suffix suggests this handles shuffles of that
// vector type; confirm against the definition.
771 SDValue LowerVECTOR_SHUFFLEv8i16(SDValue Op, SelectionDAG &DAG) const;
772
/// LowerFormalArguments - Virtual hook returning an SDValue. It takes the
/// chain, the calling convention, the vararg flag, the incoming argument
/// descriptors (Ins), a debug location and the DAG.
/// InVals is taken by non-const reference, so the hook can write to it.
/// NOTE(review): presumably overrides a TargetLowering hook; the base class
/// list is not visible in this chunk.
Dan Gohman98ca4f22009-08-05 01:29:28 +0000773 virtual SDValue
774 LowerFormalArguments(SDValue Chain,
Sandeep Patel65c3c8f2009-09-02 08:44:58 +0000775 CallingConv::ID CallConv, bool isVarArg,
Dan Gohman98ca4f22009-08-05 01:29:28 +0000776 const SmallVectorImpl<ISD::InputArg> &Ins,
777 DebugLoc dl, SelectionDAG &DAG,
Dan Gohmand858e902010-04-17 15:26:15 +0000778 SmallVectorImpl<SDValue> &InVals) const;
/// LowerCall - Virtual hook returning an SDValue. It takes the chain, the
/// callee, the calling convention, the vararg flag, the outgoing argument
/// descriptors and values (Outs, OutVals), the incoming value descriptors
/// (Ins), a debug location and the DAG.
/// isTailCall and InVals are taken by non-const reference, so the hook can
/// write to both.
/// NOTE(review): presumably isTailCall is cleared when a tail call cannot be
/// emitted; confirm against the definition.
Dan Gohman98ca4f22009-08-05 01:29:28 +0000779 virtual SDValue
Evan Cheng022d9e12010-02-02 23:55:14 +0000780 LowerCall(SDValue Chain, SDValue Callee,
Evan Cheng0c439eb2010-01-27 00:07:07 +0000781 CallingConv::ID CallConv, bool isVarArg, bool &isTailCall,
Dan Gohman98ca4f22009-08-05 01:29:28 +0000782 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanc9403652010-07-07 15:54:55 +0000783 const SmallVectorImpl<SDValue> &OutVals,
Dan Gohman98ca4f22009-08-05 01:29:28 +0000784 const SmallVectorImpl<ISD::InputArg> &Ins,
785 DebugLoc dl, SelectionDAG &DAG,
Dan Gohmand858e902010-04-17 15:26:15 +0000786 SmallVectorImpl<SDValue> &InVals) const;
Dan Gohman98ca4f22009-08-05 01:29:28 +0000787
/// LowerReturn - Virtual hook returning an SDValue. It takes the chain, the
/// calling convention, the vararg flag, the outgoing value descriptors and
/// values (Outs, OutVals), a debug location and the DAG.
/// NOTE(review): presumably lowers a function return; confirm against the
/// definition.
788 virtual SDValue
789 LowerReturn(SDValue Chain,
Sandeep Patel65c3c8f2009-09-02 08:44:58 +0000790 CallingConv::ID CallConv, bool isVarArg,
Dan Gohman98ca4f22009-08-05 01:29:28 +0000791 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanc9403652010-07-07 15:54:55 +0000792 const SmallVectorImpl<SDValue> &OutVals,
Dan Gohmand858e902010-04-17 15:26:15 +0000793 DebugLoc dl, SelectionDAG &DAG) const;
Dan Gohman98ca4f22009-08-05 01:29:28 +0000794
/// CanLowerReturn - Virtual boolean query on a calling convention, the
/// vararg flag, the outgoing value descriptors (Outs) and an LLVMContext.
/// NOTE(review): presumably true when the return values described by Outs
/// can be lowered for CallConv; confirm against the definition.
Kenneth Uildriksb4997ae2009-11-07 02:11:54 +0000795 virtual bool
796 CanLowerReturn(CallingConv::ID CallConv, bool isVarArg,
Dan Gohman84023e02010-07-10 09:00:22 +0000797 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanc9af33c2010-07-06 22:19:37 +0000798 LLVMContext &Context) const;
Kenneth Uildriksb4997ae2009-11-07 02:11:54 +0000799
/// ReplaceATOMIC_BINARY_64 - Takes a node N, a Results vector by non-const
/// reference, the DAG and an unsigned NewOp. Returns nothing, so any output
/// is delivered through Results.
/// NOTE(review): presumably replaces a 64-bit atomic binary node with one
/// using opcode NewOp; confirm against the definition.
Duncan Sands1607f052008-12-01 11:39:25 +0000800 void ReplaceATOMIC_BINARY_64(SDNode *N, SmallVectorImpl<SDValue> &Results,
Dan Gohmand858e902010-04-17 15:26:15 +0000801 SelectionDAG &DAG, unsigned NewOp) const;
Duncan Sands1607f052008-12-01 11:39:25 +0000802
Eric Christopherb120ab42009-08-18 22:50:32 +0000803 /// Utility function to emit string processing sse4.2 instructions
804 /// that return in xmm0.
Evan Cheng431f7752009-09-19 10:09:15 +0000805 /// This takes the instruction to expand, the associated machine basic
806 /// block, the number of args, and whether the second arg is
807 /// in memory.
Eric Christopherb120ab42009-08-18 22:50:32 +0000808 MachineBasicBlock *EmitPCMP(MachineInstr *BInstr, MachineBasicBlock *BB,
Mon P Wang20adc9d2010-04-04 03:10:48 +0000809 unsigned argNum, bool inMem) const;
Eric Christopherb120ab42009-08-18 22:50:32 +0000810
Mon P Wang63307c32008-05-05 19:05:59 +0000811 /// Utility function to emit atomic bitwise operations (and, or, xor).
Evan Cheng431f7752009-09-19 10:09:15 +0000812 /// It takes the bitwise instruction to expand, the associated machine basic
813 /// block, and the associated X86 opcodes for reg/reg and reg/imm.
/// It also takes load, cxchg and not opcodes, a register number (EAXreg), a
/// register class, and an invSrc flag that defaults to false.
/// NOTE(review): the exact role of each of these extra parameters is not
/// visible in this header; confirm against the definition.
Mon P Wang63307c32008-05-05 19:05:59 +0000814 MachineBasicBlock *EmitAtomicBitwiseWithCustomInserter(
815 MachineInstr *BInstr,
816 MachineBasicBlock *BB,
817 unsigned regOpc,
Andrew Lenharth507a58a2008-06-14 05:48:15 +0000818 unsigned immOpc,
Dale Johannesen140be2d2008-08-19 18:47:28 +0000819 unsigned loadOpc,
820 unsigned cxchgOpc,
Dale Johannesen140be2d2008-08-19 18:47:28 +0000821 unsigned notOpc,
822 unsigned EAXreg,
823 TargetRegisterClass *RC,
Dan Gohman1fdbc1d2009-02-07 16:15:20 +0000824 bool invSrc = false) const;
Dale Johannesen48c1bc22008-10-02 18:53:47 +0000825
/// EmitAtomicBit6432WithCustomInserter - Takes the instruction to expand,
/// its machine basic block, separate L and H opcodes for the register and
/// immediate forms, and an invSrc flag that defaults to false. Returns a
/// MachineBasicBlock pointer.
/// NOTE(review): presumably L and H are the low and high halves of a 64-bit
/// atomic operation on a 32-bit target; confirm against the definition.
826 MachineBasicBlock *EmitAtomicBit6432WithCustomInserter(
827 MachineInstr *BInstr,
828 MachineBasicBlock *BB,
829 unsigned regOpcL,
830 unsigned regOpcH,
831 unsigned immOpcL,
832 unsigned immOpcH,
Dan Gohman1fdbc1d2009-02-07 16:15:20 +0000833 bool invSrc = false) const;
Mon P Wang63307c32008-05-05 19:05:59 +0000834
835 /// Utility function to emit atomic min and max. It takes the min/max
Bill Wendlingbddc4422009-03-26 01:46:56 +0000836 /// instruction to expand, the associated basic block, and the associated
837 /// cmov opcode for moving the min or max value.
/// Returns a MachineBasicBlock pointer.
Mon P Wang63307c32008-05-05 19:05:59 +0000838 MachineBasicBlock *EmitAtomicMinMaxWithCustomInserter(MachineInstr *BInstr,
839 MachineBasicBlock *BB,
Dan Gohman1fdbc1d2009-02-07 16:15:20 +0000840 unsigned cmovOpc) const;
Dan Gohman076aee32009-03-04 19:44:21 +0000841
Dan Gohmand6708ea2009-08-15 01:38:56 +0000842 /// Utility function to emit the xmm reg save portion of va_start.
/// Takes the instruction to expand and its machine basic block, and returns
/// a MachineBasicBlock pointer.
843 MachineBasicBlock *EmitVAStartSaveXMMRegsWithCustomInserter(
844 MachineInstr *BInstr,
845 MachineBasicBlock *BB) const;
846
/// EmitLoweredSelect - Takes a machine instruction and its machine basic
/// block, and returns a MachineBasicBlock pointer.
/// NOTE(review): presumably expands a select pseudo instruction; confirm
/// against the definition.
Chris Lattner52600972009-09-02 05:57:00 +0000847 MachineBasicBlock *EmitLoweredSelect(MachineInstr *I,
Dan Gohmanaf1d8ca2010-05-01 00:01:06 +0000848 MachineBasicBlock *BB) const;
Anton Korobeynikov043f3c22010-03-06 19:32:29 +0000849
/// EmitLoweredMingwAlloca - Takes a machine instruction and its machine
/// basic block, and returns a MachineBasicBlock pointer.
/// NOTE(review): presumably expands an alloca pseudo instruction for MinGW
/// targets; confirm against the definition.
850 MachineBasicBlock *EmitLoweredMingwAlloca(MachineInstr *MI,
Dan Gohmanaf1d8ca2010-05-01 00:01:06 +0000851 MachineBasicBlock *BB) const;
Eric Christopher30ef0e52010-06-03 04:07:48 +0000852
/// EmitLoweredTLSCall - Takes a machine instruction and its machine basic
/// block, and returns a MachineBasicBlock pointer.
/// NOTE(review): presumably expands a TLS call pseudo instruction; confirm
/// against the definition.
853 MachineBasicBlock *EmitLoweredTLSCall(MachineInstr *MI,
854 MachineBasicBlock *BB) const;
Anton Korobeynikov043f3c22010-03-06 19:32:29 +0000855
Dan Gohman076aee32009-03-04 19:44:21 +0000856 /// Emit nodes that will be selected as "test Op0,Op0", or something
Dan Gohman31125812009-03-07 01:58:32 +0000857 /// equivalent, for use with the given x86 condition code.
/// Op0 is the value to test; X86CC is the condition code, passed as an
/// unsigned value.
Evan Cheng552f09a2010-04-26 19:06:11 +0000858 SDValue EmitTest(SDValue Op0, unsigned X86CC, SelectionDAG &DAG) const;
Dan Gohman076aee32009-03-04 19:44:21 +0000859
860 /// Emit nodes that will be selected as "cmp Op0,Op1", or something
Dan Gohman31125812009-03-07 01:58:32 +0000861 /// equivalent, for use with the given x86 condition code.
/// Op0 and Op1 are the values to compare; X86CC is the condition code,
/// passed as an unsigned value.
Evan Cheng552f09a2010-04-26 19:06:11 +0000862 SDValue EmitCmp(SDValue Op0, SDValue Op1, unsigned X86CC,
Dan Gohmand858e902010-04-17 15:26:15 +0000863 SelectionDAG &DAG) const;
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000864 };
Evan Chengc3f44b02008-09-03 00:03:49 +0000865
866 namespace X86 {
/// createFastISel - Free function that takes a FunctionLoweringInfo by
/// non-const reference and returns a FastISel pointer.
/// NOTE(review): ownership of the returned object is not visible in this
/// header; confirm against the definition.
Dan Gohmana4160c32010-07-07 16:29:44 +0000867 FastISel *createFastISel(FunctionLoweringInfo &funcInfo);
Evan Chengc3f44b02008-09-03 00:03:49 +0000868 }
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000869}
870
Chris Lattnerdbdbf0c2005-11-15 00:40:23 +0000871#endif // X86ISELLOWERING_H