blob: 35f63b26df60822e04324438f1ec490d7acd57ca [file] [log] [blame]
Chris Lattner76ac0682005-11-15 00:40:23 +00001//===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Chris Lattner76ac0682005-11-15 00:40:23 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file defines the interfaces that X86 uses to lower LLVM code into a
11// selection DAG.
12//
13//===----------------------------------------------------------------------===//
14
15#ifndef X86ISELLOWERING_H
16#define X86ISELLOWERING_H
17
Evan Chengcde9e302006-01-27 08:10:46 +000018#include "X86Subtarget.h"
Anton Korobeynikov383a3242007-07-14 14:06:15 +000019#include "X86RegisterInfo.h"
Gordon Henriksen92319582008-01-05 16:56:59 +000020#include "X86MachineFunctionInfo.h"
Chris Lattner76ac0682005-11-15 00:40:23 +000021#include "llvm/Target/TargetLowering.h"
Evan Cheng8703c412010-01-26 19:04:47 +000022#include "llvm/Target/TargetOptions.h"
Ted Kremenek2175b552008-09-03 02:54:11 +000023#include "llvm/CodeGen/FastISel.h"
Chris Lattner76ac0682005-11-15 00:40:23 +000024#include "llvm/CodeGen/SelectionDAG.h"
Rafael Espindolae636fc02007-08-31 15:06:30 +000025#include "llvm/CodeGen/CallingConvLower.h"
Chris Lattner76ac0682005-11-15 00:40:23 +000026
27namespace llvm {
Chris Lattner76ac0682005-11-15 00:40:23 +000028 namespace X86ISD {
Evan Cheng172fce72006-01-06 00:43:03 +000029 // X86 Specific DAG Nodes
Chris Lattner76ac0682005-11-15 00:40:23 +000030 enum NodeType {
31 // Start the numbering where the builtin ops leave off.
Dan Gohmaned1cf1a2008-09-23 18:42:32 +000032 FIRST_NUMBER = ISD::BUILTIN_OP_END,
Chris Lattner76ac0682005-11-15 00:40:23 +000033
Evan Chenge9fbc3f2007-12-14 02:13:44 +000034 /// BSF - Bit scan forward.
35 /// BSR - Bit scan reverse.
36 BSF,
37 BSR,
38
Evan Cheng9c249c32006-01-09 18:33:28 +000039 /// SHLD, SHRD - Double shift instructions. These correspond to
40 /// X86::SHLDxx and X86::SHRDxx instructions.
41 SHLD,
42 SHRD,
43
Evan Cheng2dd217b2006-01-31 03:14:29 +000044 /// FAND - Bitwise logical AND of floating point values. This corresponds
45 /// to X86::ANDPS or X86::ANDPD.
46 FAND,
47
Evan Cheng4363e882007-01-05 07:55:56 +000048 /// FOR - Bitwise logical OR of floating point values. This corresponds
49 /// to X86::ORPS or X86::ORPD.
50 FOR,
51
Evan Cheng72d5c252006-01-31 22:28:30 +000052 /// FXOR - Bitwise logical XOR of floating point values. This corresponds
53 /// to X86::XORPS or X86::XORPD.
54 FXOR,
55
Evan Cheng82241c82007-01-05 21:37:56 +000056 /// FSRL - Bitwise logical right shift of floating point values. This
57 /// corresponds to X86::PSRLDQ.
Evan Cheng4363e882007-01-05 07:55:56 +000058 FSRL,
59
Dan Gohmanf9bbcd12009-08-05 01:29:28 +000060 /// CALL - These operations represent an abstract X86 call
Chris Lattner76ac0682005-11-15 00:40:23 +000061 /// instruction, which includes a bunch of information. In particular the
62 /// operands of these nodes are:
63 ///
64 /// #0 - The incoming token chain
65 /// #1 - The callee
66 /// #2 - The number of arg bytes the caller pushes on the stack.
67 /// #3 - The number of arg bytes the callee pops off the stack.
68 /// #4 - The value to pass in AL/AX/EAX (optional)
69 /// #5 - The value to pass in DL/DX/EDX (optional)
70 ///
71 /// The result values of these nodes are:
72 ///
73 /// #0 - The outgoing token chain
74 /// #1 - The first register result value (optional)
75 /// #2 - The second register result value (optional)
76 ///
Chris Lattner76ac0682005-11-15 00:40:23 +000077 CALL,
Dan Gohmanf9bbcd12009-08-05 01:29:28 +000078
Michael J. Spencer9cafc872010-10-20 23:40:27 +000079 /// RDTSC_DAG - This operation implements the lowering for
Andrew Lenharth0bf68ae2005-11-20 21:41:10 +000080 /// readcyclecounter
81 RDTSC_DAG,
Evan Cheng225a4d02005-12-17 01:21:05 +000082
83 /// X86 compare and logical compare instructions.
Evan Cheng80700992007-09-17 17:42:53 +000084 CMP, COMI, UCOMI,
Evan Cheng225a4d02005-12-17 01:21:05 +000085
Dan Gohman25a767d2008-12-23 22:45:23 +000086 /// X86 bit-test instructions.
87 BT,
88
Dan Gohman4a683472009-03-23 15:40:10 +000089 /// X86 SetCC. Operand 0 is condition code, and operand 1 is the flag
Evan Chengc1583db2005-12-21 20:21:51 +000090 /// operand produced by a CMP instruction.
91 SETCC,
92
Evan Cheng0e8b9e32009-12-15 00:53:42 +000093 // Same as SETCC except it's materialized with a sbb and the value is all
94 // ones or all zeros.
95 SETCC_CARRY,
96
Chris Lattnera492d292009-03-12 06:46:02 +000097 /// X86 conditional moves. Operand 0 and operand 1 are the two values
98 /// to select from. Operand 2 is the condition code, and operand 3 is the
99 /// flag operand produced by a CMP or TEST instruction. It also writes a
100 /// flag result.
Evan Cheng225a4d02005-12-17 01:21:05 +0000101 CMOV,
Evan Cheng6fc31042005-12-19 23:12:38 +0000102
Dan Gohman4a683472009-03-23 15:40:10 +0000103 /// X86 conditional branches. Operand 0 is the chain operand, operand 1
104 /// is the block to branch if condition is true, operand 2 is the
105 /// condition code, and operand 3 is the flag operand produced by a CMP
Evan Chengc1583db2005-12-21 20:21:51 +0000106 /// or TEST instruction.
Evan Cheng6fc31042005-12-19 23:12:38 +0000107 BRCOND,
Evan Chenga74ce622005-12-21 02:39:21 +0000108
Dan Gohman4a683472009-03-23 15:40:10 +0000109 /// Return with a flag operand. Operand 0 is the chain operand, operand
110 /// 1 is the number of bytes of stack to pop.
Evan Chenga74ce622005-12-21 02:39:21 +0000111 RET_FLAG,
Evan Chengae986f12006-01-11 22:15:48 +0000112
113 /// REP_STOS - Repeat fill, corresponds to X86::REP_STOSx.
114 REP_STOS,
115
116 /// REP_MOVS - Repeat move, corresponds to X86::REP_MOVSx.
117 REP_MOVS,
Evan Cheng72d5c252006-01-31 22:28:30 +0000118
Evan Cheng5588de92006-02-18 00:15:05 +0000119 /// GlobalBaseReg - On Darwin, this node represents the result of the popl
120 /// at function entry, used for PIC code.
121 GlobalBaseReg,
Evan Cheng1f342c22006-02-23 02:43:52 +0000122
Bill Wendling24c79f22008-09-16 21:48:12 +0000123 /// Wrapper - A wrapper node for TargetConstantPool,
124 /// TargetExternalSymbol, and TargetGlobalAddress.
Evan Chenge0ed6ec2006-02-23 20:41:18 +0000125 Wrapper,
Evan Chengd5e905d2006-03-21 23:01:21 +0000126
Evan Chengae1cd752006-11-30 21:55:46 +0000127 /// WrapperRIP - Special wrapper used under X86-64 PIC mode for RIP
128 /// relative displacements.
129 WrapperRIP,
130
Dale Johannesendd224d22010-09-30 23:57:10 +0000131 /// MOVQ2DQ - Copies a 64-bit value from an MMX vector to the low word
132 /// of an XMM vector, with the high word zero filled.
Mon P Wang586d9972010-01-24 00:05:03 +0000133 MOVQ2DQ,
134
Dale Johannesendd224d22010-09-30 23:57:10 +0000135 /// MOVDQ2Q - Copies a 64-bit value from the low word of an XMM vector
136 /// to an MMX vector. If you think this is too close to the previous
137 /// mnemonic, so do I; blame Intel.
138 MOVDQ2Q,
139
Nate Begeman2d77e8e42008-02-11 04:19:36 +0000140 /// PEXTRB - Extract an 8-bit value from a vector and zero extend it to
141 /// i32, corresponds to X86::PEXTRB.
142 PEXTRB,
143
Evan Chengcbffa462006-03-31 19:22:53 +0000144 /// PEXTRW - Extract a 16-bit value from a vector and zero extend it to
Evan Cheng5fd7c692006-03-31 21:55:24 +0000145 /// i32, corresponds to X86::PEXTRW.
Evan Chengcbffa462006-03-31 19:22:53 +0000146 PEXTRW,
Evan Cheng5fd7c692006-03-31 21:55:24 +0000147
Nate Begeman2d77e8e42008-02-11 04:19:36 +0000148 /// INSERTPS - Insert any element of a 4 x float vector into any element
149 /// of a destination 4 x float vector.
150 INSERTPS,
151
152 /// PINSRB - Insert the lower 8-bits of a 32-bit value to a vector,
153 /// corresponds to X86::PINSRB.
154 PINSRB,
155
Evan Cheng5fd7c692006-03-31 21:55:24 +0000156 /// PINSRW - Insert the lower 16-bits of a 32-bit value to a vector,
157 /// corresponds to X86::PINSRW.
Chris Lattnera8288502010-02-23 02:07:48 +0000158 PINSRW, MMX_PINSRW,
Evan Cheng49683ba2006-11-10 21:43:37 +0000159
Nate Begemane684da32009-02-23 08:49:38 +0000160 /// PSHUFB - Shuffle 16 8-bit values within a vector.
161 PSHUFB,
162
Evan Cheng49683ba2006-11-10 21:43:37 +0000163 /// FMAX, FMIN - Floating point max and min.
164 ///
Lauro Ramos Venancio25188892007-04-20 21:38:10 +0000165 FMAX, FMIN,
Dan Gohman57111e72007-07-10 00:05:58 +0000166
167 /// FRSQRT, FRCP - Floating point reciprocal-sqrt and reciprocal
168 /// approximation. Note that these typically require refinement
169 /// in order to obtain suitable precision.
170 FRSQRT, FRCP,
171
Rafael Espindola3b2df102009-04-08 21:14:34 +0000172 // TLSADDR - Thread Local Storage.
173 TLSADDR,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000174
Eric Christopherb0e1a452010-06-03 04:07:48 +0000175 // TLSCALL - Thread Local Storage. When calling to an OS provided
176 // thunk at the address from an earlier relocation.
177 TLSCALL,
Rafael Espindola3b2df102009-04-08 21:14:34 +0000178
Evan Cheng78af38c2008-05-08 00:57:18 +0000179 // EH_RETURN - Exception Handling helpers.
Arnold Schwaighofer9ccea992007-10-11 19:40:01 +0000180 EH_RETURN,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000181
Arnold Schwaighofer7da2bce2008-03-19 16:39:45 +0000182 /// TC_RETURN - Tail call return.
183 /// operand #0 chain
184 /// operand #1 callee (register or absolute)
185 /// operand #2 stack adjustment
186 /// operand #3 optional in flag
Anton Korobeynikov91460e42007-11-16 01:31:51 +0000187 TC_RETURN,
188
Evan Cheng961339b2008-05-09 21:53:03 +0000189 // VZEXT_MOVL - Vector move low and zero extend.
190 VZEXT_MOVL,
191
Evan Cheng5e28227d2008-05-29 08:22:04 +0000192 // VSHL, VSRL - Vector logical left / right shift.
Nate Begeman55b7bec2008-07-17 16:51:19 +0000193 VSHL, VSRL,
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000194
195 // CMPPD, CMPPS - Vector double/float comparison.
Nate Begeman55b7bec2008-07-17 16:51:19 +0000196 // (CMPPD operates on doubles, CMPPS on floats.)
197 CMPPD, CMPPS,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000198
Nate Begeman55b7bec2008-07-17 16:51:19 +0000199 // PCMP* - Vector integer comparisons.
200 PCMPEQB, PCMPEQW, PCMPEQD, PCMPEQQ,
Bill Wendling1a317672008-12-12 00:56:36 +0000201 PCMPGTB, PCMPGTW, PCMPGTD, PCMPGTQ,
202
Chris Lattner364bb0a2010-12-05 07:30:36 +0000203 // ADD, SUB, SMUL, etc. - Arithmetic operations with FLAGS results.
204 ADD, SUB, SMUL,
Dan Gohman722b1ee2009-09-18 19:59:53 +0000205 INC, DEC, OR, XOR, AND,
Chris Lattner364bb0a2010-12-05 07:30:36 +0000206
207 UMUL, // LOW, HI, FLAGS = umul LHS, RHS
Evan Chenga84a3182009-03-30 21:36:47 +0000208
209 // MUL_IMM - X86 specific multiply by immediate.
Eric Christopherf7802a32009-07-29 00:28:05 +0000210 MUL_IMM,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000211
Eric Christopherf7802a32009-07-29 00:28:05 +0000212 // PTEST - Vector bitwise comparisons
Dan Gohman0700a562009-08-15 01:38:56 +0000213 PTEST,
214
Bruno Cardoso Lopes91d61df2010-08-10 23:25:42 +0000215 // TESTP - Vector packed fp sign bitwise comparisons
216 TESTP,
217
Bruno Cardoso Lopes6f3b38a2010-08-20 22:55:05 +0000218 // Several flavors of instructions with vector shuffle behaviors.
219 PALIGN,
220 PSHUFD,
221 PSHUFHW,
222 PSHUFLW,
223 PSHUFHW_LD,
224 PSHUFLW_LD,
225 SHUFPD,
226 SHUFPS,
227 MOVDDUP,
228 MOVSHDUP,
229 MOVSLDUP,
230 MOVSHDUP_LD,
231 MOVSLDUP_LD,
232 MOVLHPS,
Bruno Cardoso Lopes6f3b38a2010-08-20 22:55:05 +0000233 MOVLHPD,
Bruno Cardoso Lopes03e4c352010-08-31 21:15:21 +0000234 MOVHLPS,
Bruno Cardoso Lopes6f3b38a2010-08-20 22:55:05 +0000235 MOVHLPD,
Bruno Cardoso Lopesb3825212010-09-01 05:08:25 +0000236 MOVLPS,
237 MOVLPD,
Bruno Cardoso Lopes6f3b38a2010-08-20 22:55:05 +0000238 MOVSD,
239 MOVSS,
240 UNPCKLPS,
241 UNPCKLPD,
242 UNPCKHPS,
243 UNPCKHPD,
244 PUNPCKLBW,
245 PUNPCKLWD,
246 PUNPCKLDQ,
247 PUNPCKLQDQ,
248 PUNPCKHBW,
249 PUNPCKHWD,
250 PUNPCKHDQ,
251 PUNPCKHQDQ,
252
Dan Gohman0700a562009-08-15 01:38:56 +0000253 // VASTART_SAVE_XMM_REGS - Save xmm argument registers to the stack,
254 // according to %al. An operator is needed so that this can be expanded
255 // with control flow.
Dan Gohman48b185d2009-09-25 20:36:54 +0000256 VASTART_SAVE_XMM_REGS,
257
Michael J. Spencerf509c6c2010-10-21 01:41:01 +0000258 // WIN_ALLOCA - Windows's _chkstk call to do stack probing.
259 WIN_ALLOCA,
Anton Korobeynikovd5e3fd62010-03-06 19:32:29 +0000260
Duncan Sands7c601de2010-11-20 11:25:00 +0000261 // Memory barrier
262 MEMBARRIER,
263 MFENCE,
264 SFENCE,
265 LFENCE,
266
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000267 // ATOMADD64_DAG, ATOMSUB64_DAG, ATOMOR64_DAG, ATOMAND64_DAG,
268 // ATOMXOR64_DAG, ATOMNAND64_DAG, ATOMSWAP64_DAG -
Dan Gohman48b185d2009-09-25 20:36:54 +0000269 // Atomic 64-bit binary operations.
270 ATOMADD64_DAG = ISD::FIRST_TARGET_MEMORY_OPCODE,
271 ATOMSUB64_DAG,
272 ATOMOR64_DAG,
273 ATOMXOR64_DAG,
274 ATOMAND64_DAG,
275 ATOMNAND64_DAG,
Eric Christopher9a773822010-07-22 02:48:34 +0000276 ATOMSWAP64_DAG,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000277
Chris Lattnere479e962010-09-21 23:59:42 +0000278 // LCMPXCHG_DAG, LCMPXCHG8_DAG - Compare and swap.
279 LCMPXCHG_DAG,
Chris Lattner54e53292010-09-22 00:34:38 +0000280 LCMPXCHG8_DAG,
Anton Korobeynikovd5e3fd62010-03-06 19:32:29 +0000281
Chris Lattner54e53292010-09-22 00:34:38 +0000282 // VZEXT_LOAD - Load, scalar_to_vector, and zero extend.
Chris Lattner78f518b2010-09-22 01:05:16 +0000283 VZEXT_LOAD,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000284
Chris Lattnered85da52010-09-22 01:11:26 +0000285 // FNSTCW16m - Store FP control word into i16 memory.
286 FNSTCW16m,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000287
Chris Lattner78f518b2010-09-22 01:05:16 +0000288 /// FP_TO_INT*_IN_MEM - This instruction implements FP_TO_SINT with the
289 /// integer destination in memory and a FP reg source. This corresponds
290 /// to the X86::FIST*m instructions and the rounding mode change stuff. It
291 /// has two inputs (token chain and address) and two outputs (int value
292 /// and token chain).
293 FP_TO_INT16_IN_MEM,
294 FP_TO_INT32_IN_MEM,
Chris Lattnera5156c32010-09-22 01:28:21 +0000295 FP_TO_INT64_IN_MEM,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000296
Chris Lattnera5156c32010-09-22 01:28:21 +0000297 /// FILD, FILD_FLAG - This instruction implements SINT_TO_FP with the
298 /// integer source in memory and FP reg result. This corresponds to the
299 /// X86::FILD*m instructions. It has three inputs (token chain, address,
300 /// and source type) and two outputs (FP value and token chain). FILD_FLAG
301 /// also produces a flag.
302 FILD,
303 FILD_FLAG,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000304
Chris Lattnera5156c32010-09-22 01:28:21 +0000305 /// FLD - This instruction implements an extending load to FP stack slots.
306 /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain
307 /// operand, ptr to load from, and a ValueType node indicating the type
308 /// to load to.
309 FLD,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000310
Chris Lattnera5156c32010-09-22 01:28:21 +0000311 /// FST - This instruction implements a truncating store to FP stack
312 /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a
313 /// chain operand, value to store, address, and a ValueType to store it
314 /// as.
Dan Gohman395a8982010-10-12 18:00:49 +0000315 FST,
316
317 /// VAARG_64 - This instruction grabs the address of the next argument
318 /// from a va_list. (reads and modifies the va_list in memory)
319 VAARG_64
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000320
Anton Korobeynikovd5e3fd62010-03-06 19:32:29 +0000321 // WARNING: Do not add anything at the end unless you want the node to
322 // have memop! In fact, starting from ATOMADD64_DAG all opcodes will be
323 // treated as target memory ops!
Chris Lattner76ac0682005-11-15 00:40:23 +0000324 };
325 }
326
Evan Cheng084a1cd2008-01-29 19:34:22 +0000327 /// Define some predicates that are used for node matching.
328 namespace X86 {
329 /// isPSHUFDMask - Return true if the specified VECTOR_SHUFFLE operand
330 /// specifies a shuffle of elements that is suitable for input to PSHUFD.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000331 bool isPSHUFDMask(ShuffleVectorSDNode *N);
Evan Cheng68ad48b2006-03-22 18:59:22 +0000332
Evan Cheng084a1cd2008-01-29 19:34:22 +0000333 /// isPSHUFHWMask - Return true if the specified VECTOR_SHUFFLE operand
334 /// specifies a shuffle of elements that is suitable for input to PSHUFHW.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000335 bool isPSHUFHWMask(ShuffleVectorSDNode *N);
Evan Chengb7fedff2006-03-29 23:07:14 +0000336
Evan Cheng084a1cd2008-01-29 19:34:22 +0000337 /// isPSHUFLWMask - Return true if the specified VECTOR_SHUFFLE operand
338 /// specifies a shuffle of elements that is suitable for input to PSHUFLW.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000339 bool isPSHUFLWMask(ShuffleVectorSDNode *N);
Evan Chengb7fedff2006-03-29 23:07:14 +0000340
Evan Cheng084a1cd2008-01-29 19:34:22 +0000341 /// isSHUFPMask - Return true if the specified VECTOR_SHUFFLE operand
342 /// specifies a shuffle of elements that is suitable for input to SHUFP*.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000343 bool isSHUFPMask(ShuffleVectorSDNode *N);
Evan Chengd27fb3e2006-03-24 01:18:28 +0000344
Evan Cheng084a1cd2008-01-29 19:34:22 +0000345 /// isMOVHLPSMask - Return true if the specified VECTOR_SHUFFLE operand
346 /// specifies a shuffle of elements that is suitable for input to MOVHLPS.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000347 bool isMOVHLPSMask(ShuffleVectorSDNode *N);
Evan Cheng2595a682006-03-24 02:58:06 +0000348
Evan Cheng084a1cd2008-01-29 19:34:22 +0000349 /// isMOVHLPS_v_undef_Mask - Special case of isMOVHLPSMask for canonical form
350 /// of vector_shuffle v, v, <2, 3, 2, 3>, i.e. vector_shuffle v, undef,
351 /// <2, 3, 2, 3>
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000352 bool isMOVHLPS_v_undef_Mask(ShuffleVectorSDNode *N);
Evan Cheng922e1912006-11-07 22:14:24 +0000353
Evan Cheng084a1cd2008-01-29 19:34:22 +0000354 /// isMOVLPMask - Return true if the specified VECTOR_SHUFFLE operand
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000355 /// specifies a shuffle of elements that is suitable for MOVLP{S|D}.
356 bool isMOVLPMask(ShuffleVectorSDNode *N);
Evan Chengc995b452006-04-06 23:23:56 +0000357
Evan Cheng084a1cd2008-01-29 19:34:22 +0000358 /// isMOVLHPSMask - Return true if the specified VECTOR_SHUFFLE operand
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000359 /// specifies a shuffle of elements that is suitable for MOVHP{S|D}
Evan Cheng084a1cd2008-01-29 19:34:22 +0000360 /// as well as MOVLHPS.
Nate Begeman3a313df2009-11-07 23:17:15 +0000361 bool isMOVLHPSMask(ShuffleVectorSDNode *N);
Evan Chengc995b452006-04-06 23:23:56 +0000362
Evan Cheng084a1cd2008-01-29 19:34:22 +0000363 /// isUNPCKLMask - Return true if the specified VECTOR_SHUFFLE operand
364 /// specifies a shuffle of elements that is suitable for input to UNPCKL.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000365 bool isUNPCKLMask(ShuffleVectorSDNode *N, bool V2IsSplat = false);
Evan Cheng5df75882006-03-28 00:39:58 +0000366
Evan Cheng084a1cd2008-01-29 19:34:22 +0000367 /// isUNPCKHMask - Return true if the specified VECTOR_SHUFFLE operand
368 /// specifies a shuffle of elements that is suitable for input to UNPCKH.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000369 bool isUNPCKHMask(ShuffleVectorSDNode *N, bool V2IsSplat = false);
Evan Cheng2bc32802006-03-28 02:43:26 +0000370
Evan Cheng084a1cd2008-01-29 19:34:22 +0000371 /// isUNPCKL_v_undef_Mask - Special case of isUNPCKLMask for canonical form
372 /// of vector_shuffle v, v, <0, 4, 1, 5>, i.e. vector_shuffle v, undef,
373 /// <0, 0, 1, 1>
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000374 bool isUNPCKL_v_undef_Mask(ShuffleVectorSDNode *N);
Evan Chengf3b52c82006-04-05 07:20:06 +0000375
Evan Cheng084a1cd2008-01-29 19:34:22 +0000376 /// isUNPCKH_v_undef_Mask - Special case of isUNPCKHMask for canonical form
377 /// of vector_shuffle v, v, <2, 6, 3, 7>, i.e. vector_shuffle v, undef,
378 /// <2, 2, 3, 3>
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000379 bool isUNPCKH_v_undef_Mask(ShuffleVectorSDNode *N);
Bill Wendling591eab82007-04-24 21:16:55 +0000380
Evan Cheng084a1cd2008-01-29 19:34:22 +0000381 /// isMOVLMask - Return true if the specified VECTOR_SHUFFLE operand
382 /// specifies a shuffle of elements that is suitable for input to MOVSS,
383 /// MOVSD, and MOVD, i.e. setting the lowest element.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000384 bool isMOVLMask(ShuffleVectorSDNode *N);
Evan Cheng12ba3e22006-04-11 00:19:04 +0000385
Evan Cheng084a1cd2008-01-29 19:34:22 +0000386 /// isMOVSHDUPMask - Return true if the specified VECTOR_SHUFFLE operand
387 /// specifies a shuffle of elements that is suitable for input to MOVSHDUP.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000388 bool isMOVSHDUPMask(ShuffleVectorSDNode *N);
Evan Cheng5d247f82006-04-14 21:59:03 +0000389
Evan Cheng084a1cd2008-01-29 19:34:22 +0000390 /// isMOVSLDUPMask - Return true if the specified VECTOR_SHUFFLE operand
391 /// specifies a shuffle of elements that is suitable for input to MOVSLDUP.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000392 bool isMOVSLDUPMask(ShuffleVectorSDNode *N);
Evan Chenge056dd52006-10-27 21:08:32 +0000393
Evan Cheng74c9ed92008-09-25 20:50:48 +0000394 /// isMOVDDUPMask - Return true if the specified VECTOR_SHUFFLE operand
395 /// specifies a shuffle of elements that is suitable for input to MOVDDUP.
Nate Begeman8d6d4b92009-04-27 18:41:29 +0000396 bool isMOVDDUPMask(ShuffleVectorSDNode *N);
Evan Cheng74c9ed92008-09-25 20:50:48 +0000397
Nate Begeman18df82a2009-10-19 02:17:23 +0000398 /// isPALIGNRMask - Return true if the specified VECTOR_SHUFFLE operand
399 /// specifies a shuffle of elements that is suitable for input to PALIGNR.
400 bool isPALIGNRMask(ShuffleVectorSDNode *N);
401
Evan Cheng084a1cd2008-01-29 19:34:22 +0000402 /// getShuffleSHUFImmediate - Return the appropriate immediate to shuffle
403 /// the specified VECTOR_SHUFFLE mask with PSHUF* and SHUFP*
404 /// instructions.
405 unsigned getShuffleSHUFImmediate(SDNode *N);
Evan Chengb7fedff2006-03-29 23:07:14 +0000406
Evan Cheng084a1cd2008-01-29 19:34:22 +0000407 /// getShufflePSHUFHWImmediate - Return the appropriate immediate to shuffle
Nate Begeman18df82a2009-10-19 02:17:23 +0000408 /// the specified VECTOR_SHUFFLE mask with PSHUFHW instruction.
Evan Cheng084a1cd2008-01-29 19:34:22 +0000409 unsigned getShufflePSHUFHWImmediate(SDNode *N);
Evan Chengb7fedff2006-03-29 23:07:14 +0000410
Nate Begeman18df82a2009-10-19 02:17:23 +0000411 /// getShufflePSHUFLWImmediate - Return the appropriate immediate to shuffle
412 /// the specified VECTOR_SHUFFLE mask with PSHUFLW instruction.
Evan Cheng084a1cd2008-01-29 19:34:22 +0000413 unsigned getShufflePSHUFLWImmediate(SDNode *N);
Evan Chenge62288f2009-07-30 08:33:02 +0000414
Nate Begeman18df82a2009-10-19 02:17:23 +0000415 /// getShufflePALIGNRImmediate - Return the appropriate immediate to shuffle
416 /// the specified VECTOR_SHUFFLE mask with the PALIGNR instruction.
417 unsigned getShufflePALIGNRImmediate(SDNode *N);
418
Evan Chenge62288f2009-07-30 08:33:02 +0000419 /// isZeroNode - Returns true if Elt is a constant zero or a floating point
420 /// constant +0.0.
421 bool isZeroNode(SDValue Elt);
Anton Korobeynikov741ea0d2009-08-05 23:01:26 +0000422
423 /// isOffsetSuitableForCodeModel - Returns true if the given offset can
424 /// fit into the displacement field of the instruction.
425 bool isOffsetSuitableForCodeModel(int64_t Offset, CodeModel::Model M,
426 bool hasSymbolicDisplacement = true);
Evan Cheng084a1cd2008-01-29 19:34:22 +0000427 }
428
Chris Lattnerf4aeff02006-10-18 18:26:48 +0000429 //===--------------------------------------------------------------------===//
Chris Lattner76ac0682005-11-15 00:40:23 +0000430 // X86TargetLowering - X86 Implementation of the TargetLowering interface
431 class X86TargetLowering : public TargetLowering {
Chris Lattner76ac0682005-11-15 00:40:23 +0000432 public:
Dan Gohmaneabd6472008-05-14 01:58:56 +0000433 explicit X86TargetLowering(X86TargetMachine &TM);
Chris Lattner76ac0682005-11-15 00:40:23 +0000434
Chris Lattner4bfbe932010-01-26 05:02:42 +0000435 virtual unsigned getJumpTableEncoding() const;
Chris Lattner9c1efcd2010-01-25 23:38:14 +0000436
Chris Lattner4bfbe932010-01-26 05:02:42 +0000437 virtual const MCExpr *
438 LowerCustomJumpTableEntry(const MachineJumpTableInfo *MJTI,
439 const MachineBasicBlock *MBB, unsigned uid,
440 MCContext &Ctx) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000441
Evan Cheng797d56f2007-11-09 01:32:10 +0000442 /// getPICJumpTableRelocBase - Returns relocation base for the given PIC
443 /// jumptable.
Chris Lattner4bfbe932010-01-26 05:02:42 +0000444 virtual SDValue getPICJumpTableRelocBase(SDValue Table,
445 SelectionDAG &DAG) const;
Chris Lattner8a785d72010-01-26 06:28:43 +0000446 virtual const MCExpr *
447 getPICJumpTableRelocBaseExpr(const MachineFunction *MF,
448 unsigned JTI, MCContext &Ctx) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000449
Chris Lattner74f5bcf2007-02-26 04:01:25 +0000450 /// getStackPtrReg - Return the stack pointer register we are using: either
451 /// ESP or RSP.
452 unsigned getStackPtrReg() const { return X86StackPtr; }
Evan Cheng35abd842008-01-23 23:17:41 +0000453
454 /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
455 /// function arguments in the caller parameter area. For X86, aggregates
456 /// that contain SSE vectors are placed at 16-byte boundaries while the rest are at
457 /// 4-byte boundaries.
458 virtual unsigned getByValTypeAlignment(const Type *Ty) const;
Evan Chengef377ad2008-05-15 08:39:06 +0000459
460 /// getOptimalMemOpType - Returns the target specific optimal type for load
Evan Cheng61399372010-04-02 19:36:14 +0000461 /// and store operations as a result of memset, memcpy, and memmove
462 /// lowering. If DstAlign is zero that means the destination
463 /// alignment can satisfy any constraint. Similarly if SrcAlign is zero it
464 /// means there isn't a need to check it against alignment requirement,
465 /// probably because the source does not need to be loaded. If
466 /// 'NonScalarIntSafe' is true, that means it's safe to return a
467 /// non-scalar-integer type, e.g. empty string source, constant, or loaded
Evan Chengebe47c82010-04-08 07:37:57 +0000468 /// from memory. 'MemcpyStrSrc' indicates whether the memcpy source is
469 /// constant so it does not need to be loaded.
Dan Gohman148c69a2010-04-16 20:11:05 +0000470 /// It returns MVT::Other if the type should be determined using generic
471 /// target-independent logic.
Evan Cheng61399372010-04-02 19:36:14 +0000472 virtual EVT
Evan Chengebe47c82010-04-08 07:37:57 +0000473 getOptimalMemOpType(uint64_t Size, unsigned DstAlign, unsigned SrcAlign,
474 bool NonScalarIntSafe, bool MemcpyStrSrc,
Dan Gohman148c69a2010-04-16 20:11:05 +0000475 MachineFunction &MF) const;
Bill Wendlingbae6b2c2009-08-15 21:21:19 +0000476
477 /// allowsUnalignedMemoryAccesses - Returns true if the target allows
478 /// unaligned memory accesses of the specified type.
479 virtual bool allowsUnalignedMemoryAccesses(EVT VT) const {
480 return true;
481 }
Bill Wendling31ceb1b2009-06-30 22:38:32 +0000482
Chris Lattner76ac0682005-11-15 00:40:23 +0000483 /// LowerOperation - Provide custom lowering hooks for some operations.
484 ///
Dan Gohman21cea8a2010-04-17 15:26:15 +0000485 virtual SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const;
Chris Lattner76ac0682005-11-15 00:40:23 +0000486
Duncan Sands6ed40142008-12-01 11:39:25 +0000487 /// ReplaceNodeResults - Replace the results of node with an illegal result
488 /// type with new values built out of custom code.
Chris Lattnerf81d5882007-11-24 07:07:01 +0000489 ///
Duncan Sands6ed40142008-12-01 11:39:25 +0000490 virtual void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue>&Results,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000491 SelectionDAG &DAG) const;
Chris Lattnerf81d5882007-11-24 07:07:01 +0000492
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000493
Dan Gohman2ce6f2a2008-07-27 21:46:04 +0000494 virtual SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const;
Evan Cheng5987cfb2006-07-07 08:33:52 +0000495
Evan Chengf1bd5fc2010-04-17 06:13:15 +0000496 /// isTypeDesirableForOp - Return true if the target has native support for
497 /// the specified value type and it is 'desirable' to use the type for the
498 /// given node type. e.g. On x86 i16 is legal, but undesirable since i16
499 /// instruction encodings are longer and some i16 instructions are slow.
500 virtual bool isTypeDesirableForOp(unsigned Opc, EVT VT) const;
501
502 /// IsDesirableToPromoteOp - Return true if it is beneficial to promote the
503 /// specified node to a wider type, returning that type in PVT. e.g. On x86
504 /// i16 is legal, but undesirable since i16 instruction encodings are longer
505 /// and some i16 instructions are slow.
506 virtual bool IsDesirableToPromoteOp(SDValue Op, EVT &PVT) const;
Evan Chengaf56fac2010-04-16 06:14:10 +0000507
Dan Gohman25c16532010-05-01 00:01:06 +0000508 virtual MachineBasicBlock *
509 EmitInstrWithCustomInserter(MachineInstr *MI,
510 MachineBasicBlock *MBB) const;
Evan Cheng339edad2006-01-11 00:33:36 +0000511
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000512
Evan Cheng6af02632005-12-20 06:22:03 +0000513 /// getTargetNodeName - This method returns the name of a target specific
514 /// DAG node.
515 virtual const char *getTargetNodeName(unsigned Opcode) const;
516
Scott Michela6729e82008-03-10 15:42:14 +0000517 /// getSetCCResultType - Return the ISD::SETCC ValueType
Owen Anderson9f944592009-08-11 20:47:22 +0000518 virtual MVT::SimpleValueType getSetCCResultType(EVT VT) const;
Scott Michela6729e82008-03-10 15:42:14 +0000519
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000520 /// computeMaskedBitsForTargetNode - Determine which of the bits specified
521 /// in Mask are known to be either zero or one and return them in the
Nate Begeman8a77efe2006-02-16 21:11:51 +0000522 /// KnownZero/KnownOne bitsets.
Dan Gohman2ce6f2a2008-07-27 21:46:04 +0000523 virtual void computeMaskedBitsForTargetNode(const SDValue Op,
Dan Gohmane1d9ee62008-02-13 22:28:48 +0000524 const APInt &Mask,
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000525 APInt &KnownZero,
Dan Gohmanf990faf2008-02-13 00:35:47 +0000526 APInt &KnownOne,
Dan Gohman309d3d52007-06-22 14:59:07 +0000527 const SelectionDAG &DAG,
Nate Begeman8a77efe2006-02-16 21:11:51 +0000528 unsigned Depth = 0) const;
Evan Cheng2609d5e2008-05-12 19:56:52 +0000529
Owen Anderson5e65dfb2010-09-21 20:42:50 +0000530 // ComputeNumSignBitsForTargetNode - Determine the number of bits in the
531 // operation that are sign bits.
532 virtual unsigned ComputeNumSignBitsForTargetNode(SDValue Op,
533 unsigned Depth) const;
534
Evan Cheng2609d5e2008-05-12 19:56:52 +0000535 virtual bool
Dan Gohmanbcaf6812010-04-15 01:51:59 +0000536 isGAPlusOffset(SDNode *N, const GlobalValue* &GA, int64_t &Offset) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000537
Dan Gohman21cea8a2010-04-17 15:26:15 +0000538 SDValue getReturnAddressFrameIndex(SelectionDAG &DAG) const;
Chris Lattner76ac0682005-11-15 00:40:23 +0000539
Chris Lattner5849d222009-07-20 17:51:36 +0000540 virtual bool ExpandInlineAsm(CallInst *CI) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000541
Chris Lattnerd6855142007-03-25 02:14:49 +0000542 ConstraintType getConstraintType(const std::string &Constraint) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000543
John Thompsone8360b72010-10-29 17:29:13 +0000544 /// Examine constraint string and operand type and determine a weight value.
John Thompson1094c802010-09-13 18:15:37 +0000545 /// The operand object must already have been set up with the operand type.
John Thompsone8360b72010-10-29 17:29:13 +0000546 virtual ConstraintWeight getSingleConstraintMatchWeight(
John Thompson1094c802010-09-13 18:15:37 +0000547 AsmOperandInfo &info, const char *constraint) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000548
549 std::vector<unsigned>
Chris Lattner7ad77df2006-02-22 00:56:39 +0000550 getRegClassForInlineAsmConstraint(const std::string &Constraint,
Owen Anderson53aa7a92009-08-10 22:56:29 +0000551 EVT VT) const;
Chris Lattnerd8c9cb92007-08-25 00:47:38 +0000552
Owen Anderson53aa7a92009-08-10 22:56:29 +0000553 virtual const char *LowerXConstraint(EVT ConstraintVT) const;
Dale Johannesen2b3bc302008-01-29 02:21:21 +0000554
Chris Lattnerd8c9cb92007-08-25 00:47:38 +0000555 /// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
Evan Chenge0add202008-09-24 00:05:32 +0000556 /// vector. If it is invalid, don't add anything to Ops. NOTE: this comment
557 /// used to describe a hasMemory flag (true when one of the asm constraints
558 /// of the inline asm being processed is 'm'); no such parameter is declared.
Dan Gohman2ce6f2a2008-07-27 21:46:04 +0000559 virtual void LowerAsmOperandForConstraint(SDValue Op,
Chris Lattnerd8c9cb92007-08-25 00:47:38 +0000560 char ConstraintLetter,
Dan Gohman2ce6f2a2008-07-27 21:46:04 +0000561 std::vector<SDValue> &Ops,
Chris Lattner724539c2008-04-26 23:02:14 +0000562 SelectionDAG &DAG) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000563
Chris Lattnerf4aeff02006-10-18 18:26:48 +0000564 /// getRegForInlineAsmConstraint - Given a physical register constraint
565 /// (e.g. {edx}), return the register number and the register class for the
566 /// register. This should only be used for C_Register constraints. On
567 /// error, this returns a register number of 0.
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000568 std::pair<unsigned, const TargetRegisterClass*>
Chris Lattner524129d2006-07-31 23:26:50 +0000569 getRegForInlineAsmConstraint(const std::string &Constraint,
Owen Anderson53aa7a92009-08-10 22:56:29 +0000570 EVT VT) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000571
Chris Lattner1eb94d92007-03-30 23:15:24 +0000572 /// isLegalAddressingMode - Return true if the addressing mode represented
573 /// by AM is legal for this target, for a load/store of the specified type.
574 virtual bool isLegalAddressingMode(const AddrMode &AM, const Type *Ty)const;
575
Evan Cheng7f3d0242007-10-26 01:56:11 +0000576 /// isTruncateFree - Return true if it's free to truncate a value of
577 /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate an i32 value in
578 /// register EAX to i16 by referencing its sub-register AX.
579 virtual bool isTruncateFree(const Type *Ty1, const Type *Ty2) const;
Owen Anderson53aa7a92009-08-10 22:56:29 +0000580 virtual bool isTruncateFree(EVT VT1, EVT VT2) const;
Dan Gohmanad3e5492009-04-08 00:15:30 +0000581
582 /// isZExtFree - Return true if any actual instruction that defines a
583 /// value of type Ty1 implicitly zero-extends the value to Ty2 in the result
584 /// register. This does not necessarily include registers defined in
585 /// unknown ways, such as incoming arguments, or copies from unknown
586 /// virtual registers. Also, if isTruncateFree(Ty2, Ty1) is true, this
587 /// does not necessarily apply to truncate instructions. e.g. on x86-64,
588 /// all instructions that define 32-bit values implicitly zero-extend the
589 /// result out to 64 bits.
590 virtual bool isZExtFree(const Type *Ty1, const Type *Ty2) const;
Owen Anderson53aa7a92009-08-10 22:56:29 +0000591 virtual bool isZExtFree(EVT VT1, EVT VT2) const;
Dan Gohmanad3e5492009-04-08 00:15:30 +0000592
Evan Chenga9cda8a2009-05-28 00:35:15 +0000593 /// isNarrowingProfitable - Return true if it's profitable to narrow
594 /// operations of type VT1 to VT2. e.g. on x86, it's profitable to narrow
595 /// from i32 to i8 but not from i32 to i16.
Owen Anderson53aa7a92009-08-10 22:56:29 +0000596 virtual bool isNarrowingProfitable(EVT VT1, EVT VT2) const;
Evan Chenga9cda8a2009-05-28 00:35:15 +0000597
Evan Cheng16993aa2009-10-27 19:56:55 +0000598 /// isFPImmLegal - Returns true if the target can instruction select the
599 /// specified FP immediate natively. If false, the legalizer will
600 /// materialize the FP immediate as a load from a constant pool.
Evan Cheng83896a52009-10-28 01:43:28 +0000601 virtual bool isFPImmLegal(const APFloat &Imm, EVT VT) const;
Evan Cheng16993aa2009-10-27 19:56:55 +0000602
Evan Cheng68ad48b2006-03-22 18:59:22 +0000603 /// isShuffleMaskLegal - Targets can use this to indicate that they only
604 /// support *some* VECTOR_SHUFFLE operations, those with specific masks.
Chris Lattnerf4aeff02006-10-18 18:26:48 +0000605 /// By default, if a target supports the VECTOR_SHUFFLE node, all mask
606 /// values are assumed to be legal.
Nate Begeman5f829d82009-04-29 05:20:52 +0000607 virtual bool isShuffleMaskLegal(const SmallVectorImpl<int> &Mask,
Owen Anderson53aa7a92009-08-10 22:56:29 +0000608 EVT VT) const;
Evan Cheng60f0b892006-04-20 08:58:49 +0000609
610 /// isVectorClearMaskLegal - Similar to isShuffleMaskLegal. Targets
611 /// can use this to indicate if there is a suitable
612 /// VECTOR_SHUFFLE that can be used to replace a VAND with a constant
613 /// pool entry.
Nate Begeman5f829d82009-04-29 05:20:52 +0000614 virtual bool isVectorClearMaskLegal(const SmallVectorImpl<int> &Mask,
Owen Anderson53aa7a92009-08-10 22:56:29 +0000615 EVT VT) const;
Evan Cheng0a62cb42008-03-05 01:30:59 +0000616
617 /// ShouldShrinkFPConstant - If true, then instruction selection should
618 /// seek to shrink the FP constant of the specified type to a smaller type
619 /// in order to save space and / or reduce runtime.
Owen Anderson53aa7a92009-08-10 22:56:29 +0000620 virtual bool ShouldShrinkFPConstant(EVT VT) const {
Evan Cheng0a62cb42008-03-05 01:30:59 +0000621 // Don't shrink FP constpool if SSE2 is available since cvtss2sd is more
622 // expensive than a straight movsd. On the other hand, it's important to
623 // shrink long double fp constant since fldt is very slow.
Owen Anderson9f944592009-08-11 20:47:22 +0000624 return !X86ScalarSSEf64 || VT == MVT::f80;
Evan Cheng0a62cb42008-03-05 01:30:59 +0000625 }
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000626
Dan Gohman4df9d9c2010-05-11 16:21:03 +0000627 const X86Subtarget* getSubtarget() const {
Dan Gohman544ab2c2008-04-12 04:36:06 +0000628 return Subtarget;
Rafael Espindolafa0df552007-11-05 23:12:20 +0000629 }
630
Chris Lattner7dc00e82008-01-18 06:52:41 +0000631 /// isScalarFPTypeInSSEReg - Return true if the specified scalar FP type is
632 /// computed in an SSE register, not on the X87 floating point stack.
Owen Anderson53aa7a92009-08-10 22:56:29 +0000633 bool isScalarFPTypeInSSEReg(EVT VT) const {
Owen Anderson9f944592009-08-11 20:47:22 +0000634 return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 is when SSE2
635 (VT == MVT::f32 && X86ScalarSSEf32); // f32 is when SSE1
Chris Lattner7dc00e82008-01-18 06:52:41 +0000636 }
Dan Gohman4619e932008-08-19 21:32:53 +0000637
638 /// createFastISel - This method returns a target specific FastISel object,
639 /// or null if the target does not support "fast" ISel.
Dan Gohman87fb4e82010-07-07 16:29:44 +0000640 virtual FastISel *createFastISel(FunctionLoweringInfo &funcInfo) const;
Bill Wendling31ceb1b2009-06-30 22:38:32 +0000641
Bill Wendling512ff732009-07-01 18:50:55 +0000642 /// getFunctionAlignment - Return the Log2 alignment of this function.
Bill Wendling31ceb1b2009-06-30 22:38:32 +0000643 virtual unsigned getFunctionAlignment(const Function *F) const;
644
Evan Cheng37b740c2010-07-24 00:39:05 +0000645 unsigned getRegPressureLimit(const TargetRegisterClass *RC,
646 MachineFunction &MF) const;
647
Eric Christopher2ad0c772010-07-06 05:18:56 +0000648 /// getStackCookieLocation - Return true if the target stores stack
649 /// protector cookies at a fixed offset in some non-standard address
650 /// space, and populates the address space and offset as
651 /// appropriate.
652 virtual bool getStackCookieLocation(unsigned &AddressSpace, unsigned &Offset) const;
653
Evan Chengd4218b82010-07-26 21:50:05 +0000654 protected:
655 std::pair<const TargetRegisterClass*, uint8_t>
656 findRepresentativeClass(EVT VT) const;
657
Chris Lattner76ac0682005-11-15 00:40:23 +0000658 private:
Evan Chenga9467aa2006-04-25 20:13:52 +0000659 /// Subtarget - Keep a pointer to the X86Subtarget around so that we can
660 /// make the right decision when generating code for different targets.
661 const X86Subtarget *Subtarget;
Dan Gohmaneabd6472008-05-14 01:58:56 +0000662 const X86RegisterInfo *RegInfo;
Anton Korobeynikov6acb2212008-09-09 18:22:57 +0000663 const TargetData *TD;
Evan Chenga9467aa2006-04-25 20:13:52 +0000664
Evan Cheng11b0a5d2006-09-08 06:48:29 +0000665 /// X86StackPtr - X86 physical register used as stack ptr.
666 unsigned X86StackPtr;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000667
668 /// X86ScalarSSEf32, X86ScalarSSEf64 - Select between SSE or x87
Dale Johannesene36c4002007-09-23 14:52:20 +0000669 /// floating point ops.
670 /// When SSE is available, use it for f32 operations.
671 /// When SSE2 is available, use it for f64 operations.
672 bool X86ScalarSSEf32;
673 bool X86ScalarSSEf64;
Evan Cheng084a1cd2008-01-29 19:34:22 +0000674
Evan Cheng16993aa2009-10-27 19:56:55 +0000675 /// LegalFPImmediates - A list of legal fp immediates.
676 std::vector<APFloat> LegalFPImmediates;
677
678 /// addLegalFPImmediate - Indicate that this x86 target can instruction
679 /// select the specified FP immediate natively.
680 void addLegalFPImmediate(const APFloat& Imm) {
681 LegalFPImmediates.push_back(Imm);
682 }
683
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000684 SDValue LowerCallResult(SDValue Chain, SDValue InFlag,
Sandeep Patel68c5f472009-09-02 08:44:58 +0000685 CallingConv::ID CallConv, bool isVarArg,
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000686 const SmallVectorImpl<ISD::InputArg> &Ins,
687 DebugLoc dl, SelectionDAG &DAG,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000688 SmallVectorImpl<SDValue> &InVals) const;
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000689 SDValue LowerMemArgument(SDValue Chain,
Sandeep Patel68c5f472009-09-02 08:44:58 +0000690 CallingConv::ID CallConv,
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000691 const SmallVectorImpl<ISD::InputArg> &ArgInfo,
692 DebugLoc dl, SelectionDAG &DAG,
693 const CCValAssign &VA, MachineFrameInfo *MFI,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000694 unsigned i) const;
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000695 SDValue LowerMemOpCallTo(SDValue Chain, SDValue StackPtr, SDValue Arg,
696 DebugLoc dl, SelectionDAG &DAG,
697 const CCValAssign &VA,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000698 ISD::ArgFlagsTy Flags) const;
Rafael Espindolae636fc02007-08-31 15:06:30 +0000699
Gordon Henriksen92319582008-01-05 16:56:59 +0000700 // Call lowering helpers.
Evan Cheng67a69dd2010-01-27 00:07:07 +0000701
702 /// IsEligibleForTailCallOptimization - Check whether the call is eligible
703 /// for tail call optimization. Targets which want to do tail call
704 /// optimization should implement this function.
Evan Cheng6f36a082010-02-02 23:55:14 +0000705 bool IsEligibleForTailCallOptimization(SDValue Callee,
Evan Cheng67a69dd2010-01-27 00:07:07 +0000706 CallingConv::ID CalleeCC,
707 bool isVarArg,
Evan Chengae5edee2010-03-15 18:54:48 +0000708 bool isCalleeStructRet,
709 bool isCallerStructRet,
Evan Cheng85476f32010-01-27 06:25:16 +0000710 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanfe7532a2010-07-07 15:54:55 +0000711 const SmallVectorImpl<SDValue> &OutVals,
Evan Cheng85476f32010-01-27 06:25:16 +0000712 const SmallVectorImpl<ISD::InputArg> &Ins,
Evan Cheng67a69dd2010-01-27 00:07:07 +0000713 SelectionDAG& DAG) const;
Dan Gohman21cea8a2010-04-17 15:26:15 +0000714 bool IsCalleePop(bool isVarArg, CallingConv::ID CallConv) const;
Dan Gohman2ce6f2a2008-07-27 21:46:04 +0000715 SDValue EmitTailCallLoadRetAddr(SelectionDAG &DAG, SDValue &OutRetAddr,
716 SDValue Chain, bool IsTailCall, bool Is64Bit,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000717 int FPDiff, DebugLoc dl) const;
Arnold Schwaighofer634fc9a2008-04-12 18:11:06 +0000718
Dan Gohman21cea8a2010-04-17 15:26:15 +0000719 unsigned GetAlignedArgumentStackSize(unsigned StackSize,
720 SelectionDAG &DAG) const;
Evan Chengcde9e302006-01-27 08:10:46 +0000721
Eli Friedmandfe4f252009-05-23 09:59:16 +0000722 std::pair<SDValue,SDValue> FP_TO_INTHelper(SDValue Op, SelectionDAG &DAG,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000723 bool isSigned) const;
Evan Cheng493b8822009-12-09 21:00:30 +0000724
725 SDValue LowerAsSplatVectorLoad(SDValue SrcOp, EVT VT, DebugLoc dl,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000726 SelectionDAG &DAG) const;
727 SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) const;
728 SDValue LowerCONCAT_VECTORS(SDValue Op, SelectionDAG &DAG) const;
729 SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) const;
730 SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
731 SDValue LowerEXTRACT_VECTOR_ELT_SSE4(SDValue Op, SelectionDAG &DAG) const;
732 SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) const;
733 SDValue LowerINSERT_VECTOR_ELT_SSE4(SDValue Op, SelectionDAG &DAG) const;
734 SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) const;
735 SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) const;
736 SDValue LowerBlockAddress(SDValue Op, SelectionDAG &DAG) const;
Dale Johannesen021052a2009-02-04 20:06:27 +0000737 SDValue LowerGlobalAddress(const GlobalValue *GV, DebugLoc dl,
738 int64_t Offset, SelectionDAG &DAG) const;
Dan Gohman21cea8a2010-04-17 15:26:15 +0000739 SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG) const;
740 SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) const;
741 SDValue LowerExternalSymbol(SDValue Op, SelectionDAG &DAG) const;
742 SDValue LowerShift(SDValue Op, SelectionDAG &DAG) const;
Owen Anderson53aa7a92009-08-10 22:56:29 +0000743 SDValue BuildFILD(SDValue Op, EVT SrcVT, SDValue Chain, SDValue StackSlot,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000744 SelectionDAG &DAG) const;
Wesley Peck527da1b2010-11-23 03:31:01 +0000745 SDValue LowerBITCAST(SDValue op, SelectionDAG &DAG) const;
Dan Gohman21cea8a2010-04-17 15:26:15 +0000746 SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
747 SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG) const;
748 SDValue LowerUINT_TO_FP_i64(SDValue Op, SelectionDAG &DAG) const;
749 SDValue LowerUINT_TO_FP_i32(SDValue Op, SelectionDAG &DAG) const;
750 SDValue LowerFP_TO_SINT(SDValue Op, SelectionDAG &DAG) const;
751 SDValue LowerFP_TO_UINT(SDValue Op, SelectionDAG &DAG) const;
752 SDValue LowerFABS(SDValue Op, SelectionDAG &DAG) const;
753 SDValue LowerFNEG(SDValue Op, SelectionDAG &DAG) const;
754 SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) const;
Evan Cheng9c8cd8c2010-04-21 01:47:12 +0000755 SDValue LowerToBT(SDValue And, ISD::CondCode CC,
756 DebugLoc dl, SelectionDAG &DAG) const;
Dan Gohman21cea8a2010-04-17 15:26:15 +0000757 SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG) const;
758 SDValue LowerVSETCC(SDValue Op, SelectionDAG &DAG) const;
759 SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG) const;
760 SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG) const;
761 SDValue LowerMEMSET(SDValue Op, SelectionDAG &DAG) const;
762 SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG) const;
763 SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG) const;
764 SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG) const;
765 SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG) const;
766 SDValue LowerVACOPY(SDValue Op, SelectionDAG &DAG) const;
767 SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) const;
768 SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG) const;
769 SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) const;
770 SDValue LowerFRAME_TO_ARGS_OFFSET(SDValue Op, SelectionDAG &DAG) const;
771 SDValue LowerEH_RETURN(SDValue Op, SelectionDAG &DAG) const;
772 SDValue LowerTRAMPOLINE(SDValue Op, SelectionDAG &DAG) const;
773 SDValue LowerFLT_ROUNDS_(SDValue Op, SelectionDAG &DAG) const;
774 SDValue LowerCTLZ(SDValue Op, SelectionDAG &DAG) const;
775 SDValue LowerCTTZ(SDValue Op, SelectionDAG &DAG) const;
776 SDValue LowerMUL_V2I64(SDValue Op, SelectionDAG &DAG) const;
Nate Begeman269a6da2010-07-27 22:37:06 +0000777 SDValue LowerSHL(SDValue Op, SelectionDAG &DAG) const;
Dan Gohman21cea8a2010-04-17 15:26:15 +0000778 SDValue LowerXALUO(SDValue Op, SelectionDAG &DAG) const;
Bill Wendling66835472008-11-24 19:21:46 +0000779
Dan Gohman21cea8a2010-04-17 15:26:15 +0000780 SDValue LowerCMP_SWAP(SDValue Op, SelectionDAG &DAG) const;
781 SDValue LowerLOAD_SUB(SDValue Op, SelectionDAG &DAG) const;
782 SDValue LowerREADCYCLECOUNTER(SDValue Op, SelectionDAG &DAG) const;
Eric Christopher9a773822010-07-22 02:48:34 +0000783 SDValue LowerMEMBARRIER(SDValue Op, SelectionDAG &DAG) const;
Duncan Sands6ed40142008-12-01 11:39:25 +0000784
Bruno Cardoso Lopes9f20e7a2010-08-21 01:32:18 +0000785 // Utility functions to help LowerVECTOR_SHUFFLE
786 SDValue LowerVECTOR_SHUFFLEv8i16(SDValue Op, SelectionDAG &DAG) const;
787
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000788 virtual SDValue
789 LowerFormalArguments(SDValue Chain,
Sandeep Patel68c5f472009-09-02 08:44:58 +0000790 CallingConv::ID CallConv, bool isVarArg,
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000791 const SmallVectorImpl<ISD::InputArg> &Ins,
792 DebugLoc dl, SelectionDAG &DAG,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000793 SmallVectorImpl<SDValue> &InVals) const;
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000794 virtual SDValue
Evan Cheng6f36a082010-02-02 23:55:14 +0000795 LowerCall(SDValue Chain, SDValue Callee,
Evan Cheng67a69dd2010-01-27 00:07:07 +0000796 CallingConv::ID CallConv, bool isVarArg, bool &isTailCall,
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000797 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanfe7532a2010-07-07 15:54:55 +0000798 const SmallVectorImpl<SDValue> &OutVals,
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000799 const SmallVectorImpl<ISD::InputArg> &Ins,
800 DebugLoc dl, SelectionDAG &DAG,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000801 SmallVectorImpl<SDValue> &InVals) const;
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000802
803 virtual SDValue
804 LowerReturn(SDValue Chain,
Sandeep Patel68c5f472009-09-02 08:44:58 +0000805 CallingConv::ID CallConv, bool isVarArg,
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000806 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanfe7532a2010-07-07 15:54:55 +0000807 const SmallVectorImpl<SDValue> &OutVals,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000808 DebugLoc dl, SelectionDAG &DAG) const;
Dan Gohmanf9bbcd12009-08-05 01:29:28 +0000809
Evan Chengd4b08732010-11-30 23:55:39 +0000810 virtual bool isUsedByReturnOnly(SDNode *N) const;
811
Kenneth Uildriks07119732009-11-07 02:11:54 +0000812 virtual bool
813 CanLowerReturn(CallingConv::ID CallConv, bool isVarArg,
Dan Gohmand7b5ce32010-07-10 09:00:22 +0000814 const SmallVectorImpl<ISD::OutputArg> &Outs,
Dan Gohmanee0cb702010-07-06 22:19:37 +0000815 LLVMContext &Context) const;
Kenneth Uildriks07119732009-11-07 02:11:54 +0000816
Duncan Sands6ed40142008-12-01 11:39:25 +0000817 void ReplaceATOMIC_BINARY_64(SDNode *N, SmallVectorImpl<SDValue> &Results,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000818 SelectionDAG &DAG, unsigned NewOp) const;
Duncan Sands6ed40142008-12-01 11:39:25 +0000819
Eric Christopher9fe912d2009-08-18 22:50:32 +0000820 /// Utility function to emit string processing sse4.2 instructions
821 /// that return in xmm0.
Evan Chengb82b5512009-09-19 10:09:15 +0000822 /// This takes the instruction to expand, the associated machine basic
823 /// block, the number of args, and whether or not the second arg is
824 /// in memory.
Eric Christopher9fe912d2009-08-18 22:50:32 +0000825 MachineBasicBlock *EmitPCMP(MachineInstr *BInstr, MachineBasicBlock *BB,
Mon P Wangc576ee92010-04-04 03:10:48 +0000826 unsigned argNum, bool inMem) const;
Eric Christopher9fe912d2009-08-18 22:50:32 +0000827
Eric Christopherfa6657c2010-11-30 07:20:12 +0000828 /// Utility functions to emit monitor and mwait instructions. These
829 /// need to make sure that the arguments to the intrinsic are in the
830 /// correct registers.
Eric Christopher1a86e842010-11-30 08:10:28 +0000831 MachineBasicBlock *EmitMonitor(MachineInstr *MI,
832 MachineBasicBlock *BB) const;
Eric Christopherfa6657c2010-11-30 07:20:12 +0000833 MachineBasicBlock *EmitMwait(MachineInstr *MI, MachineBasicBlock *BB) const;
834
Mon P Wang3e583932008-05-05 19:05:59 +0000835 /// Utility function to emit atomic bitwise operations (and, or, xor).
Evan Chengb82b5512009-09-19 10:09:15 +0000836 /// It takes the bitwise instruction to expand, the associated machine basic
837 /// block, and the associated X86 opcodes for reg/reg and reg/imm.
Mon P Wang3e583932008-05-05 19:05:59 +0000838 MachineBasicBlock *EmitAtomicBitwiseWithCustomInserter(
839 MachineInstr *BInstr,
840 MachineBasicBlock *BB,
841 unsigned regOpc,
Andrew Lenharthf88d50b2008-06-14 05:48:15 +0000842 unsigned immOpc,
Dale Johannesen5afbf512008-08-19 18:47:28 +0000843 unsigned loadOpc,
844 unsigned cxchgOpc,
Dale Johannesen5afbf512008-08-19 18:47:28 +0000845 unsigned notOpc,
846 unsigned EAXreg,
847 TargetRegisterClass *RC,
Dan Gohman747e55b2009-02-07 16:15:20 +0000848 bool invSrc = false) const;
Dale Johannesen867d5492008-10-02 18:53:47 +0000849
850 MachineBasicBlock *EmitAtomicBit6432WithCustomInserter(
851 MachineInstr *BInstr,
852 MachineBasicBlock *BB,
853 unsigned regOpcL,
854 unsigned regOpcH,
855 unsigned immOpcL,
856 unsigned immOpcH,
Dan Gohman747e55b2009-02-07 16:15:20 +0000857 bool invSrc = false) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000858
Mon P Wang3e583932008-05-05 19:05:59 +0000859 /// Utility function to emit atomic min and max. It takes the min/max
Bill Wendling189d6712009-03-26 01:46:56 +0000860 /// instruction to expand, the associated basic block, and the associated
861 /// cmov opcode for moving the min or max value.
Mon P Wang3e583932008-05-05 19:05:59 +0000862 MachineBasicBlock *EmitAtomicMinMaxWithCustomInserter(MachineInstr *BInstr,
863 MachineBasicBlock *BB,
Dan Gohman747e55b2009-02-07 16:15:20 +0000864 unsigned cmovOpc) const;
Dan Gohman55d7b2a2009-03-04 19:44:21 +0000865
Dan Gohman395a8982010-10-12 18:00:49 +0000866 // Utility function to emit the low-level va_arg code for X86-64.
867 MachineBasicBlock *EmitVAARG64WithCustomInserter(
868 MachineInstr *MI,
869 MachineBasicBlock *MBB) const;
870
Dan Gohman0700a562009-08-15 01:38:56 +0000871 /// Utility function to emit the xmm reg save portion of va_start.
872 MachineBasicBlock *EmitVAStartSaveXMMRegsWithCustomInserter(
873 MachineInstr *BInstr,
874 MachineBasicBlock *BB) const;
875
Chris Lattnerd5f4fcc2009-09-02 05:57:00 +0000876 MachineBasicBlock *EmitLoweredSelect(MachineInstr *I,
Dan Gohman25c16532010-05-01 00:01:06 +0000877 MachineBasicBlock *BB) const;
Anton Korobeynikovd5e3fd62010-03-06 19:32:29 +0000878
Michael J. Spencerf509c6c2010-10-21 01:41:01 +0000879 MachineBasicBlock *EmitLoweredWinAlloca(MachineInstr *MI,
Dan Gohman25c16532010-05-01 00:01:06 +0000880 MachineBasicBlock *BB) const;
Michael J. Spencer9cafc872010-10-20 23:40:27 +0000881
Eric Christopherb0e1a452010-06-03 04:07:48 +0000882 MachineBasicBlock *EmitLoweredTLSCall(MachineInstr *MI,
883 MachineBasicBlock *BB) const;
Anton Korobeynikovd5e3fd62010-03-06 19:32:29 +0000884
Rafael Espindola5d882892010-11-27 20:43:02 +0000885 MachineBasicBlock *emitLoweredTLSAddr(MachineInstr *MI,
886 MachineBasicBlock *BB) const;
887
Dan Gohman55d7b2a2009-03-04 19:44:21 +0000888 /// Emit nodes that will be selected as "test Op0,Op0", or something
Dan Gohmanff659b52009-03-07 01:58:32 +0000889 /// equivalent, for use with the given x86 condition code.
Evan Cheng6e45f1d2010-04-26 19:06:11 +0000890 SDValue EmitTest(SDValue Op0, unsigned X86CC, SelectionDAG &DAG) const;
Dan Gohman55d7b2a2009-03-04 19:44:21 +0000891
892 /// Emit nodes that will be selected as "cmp Op0,Op1", or something
Dan Gohmanff659b52009-03-07 01:58:32 +0000893 /// equivalent, for use with the given x86 condition code.
Evan Cheng6e45f1d2010-04-26 19:06:11 +0000894 SDValue EmitCmp(SDValue Op0, SDValue Op1, unsigned X86CC,
Dan Gohman21cea8a2010-04-17 15:26:15 +0000895 SelectionDAG &DAG) const;
Chris Lattner76ac0682005-11-15 00:40:23 +0000896 };
Evan Cheng24422d42008-09-03 00:03:49 +0000897
898 namespace X86 {
/// createFastISel - Free function that takes a FunctionLoweringInfo and
/// returns a FastISel pointer.
/// NOTE(review): presumably the routine the createFastISel member of the
/// lowering class forwards to; the definition is not in this header - confirm.
Dan Gohman87fb4e82010-07-07 16:29:44 +0000899 FastISel *createFastISel(FunctionLoweringInfo &funcInfo);
Evan Cheng24422d42008-09-03 00:03:49 +0000900 }
Chris Lattner76ac0682005-11-15 00:40:23 +0000901}
902
Chris Lattner76ac0682005-11-15 00:40:23 +0000903#endif // X86ISELLOWERING_H