Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 1 | //===-- X86ISelLowering.h - X86 DAG Lowering Interface ----------*- C++ -*-===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file defines the interfaces that X86 uses to lower LLVM code into a |
| 11 | // selection DAG. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #ifndef X86ISELLOWERING_H |
| 16 | #define X86ISELLOWERING_H |
| 17 | |
Evan Cheng | 559806f | 2006-01-27 08:10:46 +0000 | [diff] [blame] | 18 | #include "X86Subtarget.h" |
Anton Korobeynikov | 2365f51 | 2007-07-14 14:06:15 +0000 | [diff] [blame] | 19 | #include "X86RegisterInfo.h" |
Gordon Henriksen | 8673766 | 2008-01-05 16:56:59 +0000 | [diff] [blame] | 20 | #include "X86MachineFunctionInfo.h" |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 21 | #include "llvm/Target/TargetLowering.h" |
Ted Kremenek | b388eb8 | 2008-09-03 02:54:11 +0000 | [diff] [blame] | 22 | #include "llvm/CodeGen/FastISel.h" |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 23 | #include "llvm/CodeGen/SelectionDAG.h" |
Rafael Espindola | 1b5dcc3 | 2007-08-31 15:06:30 +0000 | [diff] [blame] | 24 | #include "llvm/CodeGen/CallingConvLower.h" |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 25 | |
| 26 | namespace llvm { |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 27 | namespace X86ISD { |
Evan Cheng | d9558e0 | 2006-01-06 00:43:03 +0000 | [diff] [blame] | 28 | // X86 Specific DAG Nodes |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 29 | enum NodeType { |
| 30 | // Start the numbering where the builtin ops leave off. |
Dan Gohman | 0ba2bcf | 2008-09-23 18:42:32 +0000 | [diff] [blame] | 31 | FIRST_NUMBER = ISD::BUILTIN_OP_END, |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 32 | |
Evan Cheng | 18efe26 | 2007-12-14 02:13:44 +0000 | [diff] [blame] | 33 | /// BSF - Bit scan forward. |
| 34 | /// BSR - Bit scan reverse. |
| 35 | BSF, |
| 36 | BSR, |
| 37 | |
Evan Cheng | e341316 | 2006-01-09 18:33:28 +0000 | [diff] [blame] | 38 | /// SHLD, SHRD - Double shift instructions. These correspond to |
| 39 | /// X86::SHLDxx and X86::SHRDxx instructions. |
| 40 | SHLD, |
| 41 | SHRD, |
| 42 | |
Evan Cheng | ef6ffb1 | 2006-01-31 03:14:29 +0000 | [diff] [blame] | 43 | /// FAND - Bitwise logical AND of floating point values. This corresponds |
| 44 | /// to X86::ANDPS or X86::ANDPD. |
| 45 | FAND, |
| 46 | |
Evan Cheng | 68c47cb | 2007-01-05 07:55:56 +0000 | [diff] [blame] | 47 | /// FOR - Bitwise logical OR of floating point values. This corresponds |
| 48 | /// to X86::ORPS or X86::ORPD. |
| 49 | FOR, |
| 50 | |
Evan Cheng | 223547a | 2006-01-31 22:28:30 +0000 | [diff] [blame] | 51 | /// FXOR - Bitwise logical XOR of floating point values. This corresponds |
| 52 | /// to X86::XORPS or X86::XORPD. |
| 53 | FXOR, |
| 54 | |
Evan Cheng | 73d6cf1 | 2007-01-05 21:37:56 +0000 | [diff] [blame] | 55 | /// FSRL - Bitwise logical right shift of floating point values. These |
| 56 | /// corresponds to X86::PSRLDQ. |
Evan Cheng | 68c47cb | 2007-01-05 07:55:56 +0000 | [diff] [blame] | 57 | FSRL, |
| 58 | |
Evan Cheng | e3de85b | 2006-02-04 02:20:30 +0000 | [diff] [blame] | 59 | /// FILD, FILD_FLAG - This instruction implements SINT_TO_FP with the |
| 60 | /// integer source in memory and FP reg result. This corresponds to the |
| 61 | /// X86::FILD*m instructions. It has three inputs (token chain, address, |
| 62 | /// and source type) and two outputs (FP value and token chain). FILD_FLAG |
| 63 | /// also produces a flag). |
Evan Cheng | a3195e8 | 2006-01-12 22:54:21 +0000 | [diff] [blame] | 64 | FILD, |
Evan Cheng | e3de85b | 2006-02-04 02:20:30 +0000 | [diff] [blame] | 65 | FILD_FLAG, |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 66 | |
| 67 | /// FP_TO_INT*_IN_MEM - This instruction implements FP_TO_SINT with the |
| 68 | /// integer destination in memory and a FP reg source. This corresponds |
| 69 | /// to the X86::FIST*m instructions and the rounding mode change stuff. It |
Chris Lattner | 9189777 | 2006-10-18 18:26:48 +0000 | [diff] [blame] | 70 | /// has two inputs (token chain and address) and two outputs (int value |
| 71 | /// and token chain). |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 72 | FP_TO_INT16_IN_MEM, |
| 73 | FP_TO_INT32_IN_MEM, |
| 74 | FP_TO_INT64_IN_MEM, |
| 75 | |
Evan Cheng | b077b84 | 2005-12-21 02:39:21 +0000 | [diff] [blame] | 76 | /// FLD - This instruction implements an extending load to FP stack slots. |
| 77 | /// This corresponds to the X86::FLD32m / X86::FLD64m. It takes a chain |
Evan Cheng | 38bcbaf | 2005-12-23 07:31:11 +0000 | [diff] [blame] | 78 | /// operand, ptr to load from, and a ValueType node indicating the type |
| 79 | /// to load to. |
Evan Cheng | b077b84 | 2005-12-21 02:39:21 +0000 | [diff] [blame] | 80 | FLD, |
| 81 | |
Evan Cheng | d90eb7f | 2006-01-05 00:27:02 +0000 | [diff] [blame] | 82 | /// FST - This instruction implements a truncating store to FP stack |
| 83 | /// slots. This corresponds to the X86::FST32m / X86::FST64m. It takes a |
| 84 | /// chain operand, value to store, address, and a ValueType to store it |
| 85 | /// as. |
| 86 | FST, |
| 87 | |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 88 | /// CALL/TAILCALL - These operations represent an abstract X86 call |
| 89 | /// instruction, which includes a bunch of information. In particular the |
| 90 | /// operands of these node are: |
| 91 | /// |
| 92 | /// #0 - The incoming token chain |
| 93 | /// #1 - The callee |
| 94 | /// #2 - The number of arg bytes the caller pushes on the stack. |
| 95 | /// #3 - The number of arg bytes the callee pops off the stack. |
| 96 | /// #4 - The value to pass in AL/AX/EAX (optional) |
| 97 | /// #5 - The value to pass in DL/DX/EDX (optional) |
| 98 | /// |
| 99 | /// The result values of these nodes are: |
| 100 | /// |
| 101 | /// #0 - The outgoing token chain |
| 102 | /// #1 - The first register result value (optional) |
| 103 | /// #2 - The second register result value (optional) |
| 104 | /// |
| 105 | /// The CALL vs TAILCALL distinction boils down to whether the callee is |
| 106 | /// known not to modify the caller's stack frame, as is standard with |
| 107 | /// LLVM. |
| 108 | CALL, |
| 109 | TAILCALL, |
Andrew Lenharth | b873ff3 | 2005-11-20 21:41:10 +0000 | [diff] [blame] | 110 | |
| 111 | /// RDTSC_DAG - This operation implements the lowering for |
| 112 | /// readcyclecounter |
| 113 | RDTSC_DAG, |
Evan Cheng | 7df96d6 | 2005-12-17 01:21:05 +0000 | [diff] [blame] | 114 | |
| 115 | /// X86 compare and logical compare instructions. |
Evan Cheng | 7d6ff3a | 2007-09-17 17:42:53 +0000 | [diff] [blame] | 116 | CMP, COMI, UCOMI, |
Evan Cheng | 7df96d6 | 2005-12-17 01:21:05 +0000 | [diff] [blame] | 117 | |
Dan Gohman | c7a37d4 | 2008-12-23 22:45:23 +0000 | [diff] [blame] | 118 | /// X86 bit-test instructions. |
| 119 | BT, |
| 120 | |
Evan Cheng | d5781fc | 2005-12-21 20:21:51 +0000 | [diff] [blame] | 121 | /// X86 SetCC. Operand 1 is condition code, and operand 2 is the flag |
| 122 | /// operand produced by a CMP instruction. |
| 123 | SETCC, |
| 124 | |
| 125 | /// X86 conditional moves. Operand 1 and operand 2 are the two values |
Chris Lattner | 9189777 | 2006-10-18 18:26:48 +0000 | [diff] [blame] | 126 | /// to select from (operand 1 is a R/W operand). Operand 3 is the |
| 127 | /// condition code, and operand 4 is the flag operand produced by a CMP |
| 128 | /// or TEST instruction. It also writes a flag result. |
Evan Cheng | 7df96d6 | 2005-12-17 01:21:05 +0000 | [diff] [blame] | 129 | CMOV, |
Evan Cheng | 898101c | 2005-12-19 23:12:38 +0000 | [diff] [blame] | 130 | |
Evan Cheng | d5781fc | 2005-12-21 20:21:51 +0000 | [diff] [blame] | 131 | /// X86 conditional branches. Operand 1 is the chain operand, operand 2 |
| 132 | /// is the block to branch if condition is true, operand 3 is the |
| 133 | /// condition code, and operand 4 is the flag operand produced by a CMP |
| 134 | /// or TEST instruction. |
Evan Cheng | 898101c | 2005-12-19 23:12:38 +0000 | [diff] [blame] | 135 | BRCOND, |
Evan Cheng | b077b84 | 2005-12-21 02:39:21 +0000 | [diff] [blame] | 136 | |
Evan Cheng | 67f92a7 | 2006-01-11 22:15:48 +0000 | [diff] [blame] | 137 | /// Return with a flag operand. Operand 1 is the chain operand, operand |
| 138 | /// 2 is the number of bytes of stack to pop. |
Evan Cheng | b077b84 | 2005-12-21 02:39:21 +0000 | [diff] [blame] | 139 | RET_FLAG, |
Evan Cheng | 67f92a7 | 2006-01-11 22:15:48 +0000 | [diff] [blame] | 140 | |
| 141 | /// REP_STOS - Repeat fill, corresponds to X86::REP_STOSx. |
| 142 | REP_STOS, |
| 143 | |
| 144 | /// REP_MOVS - Repeat move, corresponds to X86::REP_MOVSx. |
| 145 | REP_MOVS, |
Evan Cheng | 223547a | 2006-01-31 22:28:30 +0000 | [diff] [blame] | 146 | |
Evan Cheng | 7ccced6 | 2006-02-18 00:15:05 +0000 | [diff] [blame] | 147 | /// GlobalBaseReg - On Darwin, this node represents the result of the popl |
| 148 | /// at function entry, used for PIC code. |
| 149 | GlobalBaseReg, |
Evan Cheng | a0ea053 | 2006-02-23 02:43:52 +0000 | [diff] [blame] | 150 | |
Bill Wendling | 056292f | 2008-09-16 21:48:12 +0000 | [diff] [blame] | 151 | /// Wrapper - A wrapper node for TargetConstantPool, |
| 152 | /// TargetExternalSymbol, and TargetGlobalAddress. |
Evan Cheng | 020d2e8 | 2006-02-23 20:41:18 +0000 | [diff] [blame] | 153 | Wrapper, |
Evan Cheng | 48090aa | 2006-03-21 23:01:21 +0000 | [diff] [blame] | 154 | |
Evan Cheng | 0085a28 | 2006-11-30 21:55:46 +0000 | [diff] [blame] | 155 | /// WrapperRIP - Special wrapper used under X86-64 PIC mode for RIP |
| 156 | /// relative displacements. |
| 157 | WrapperRIP, |
| 158 | |
Nate Begeman | 14d12ca | 2008-02-11 04:19:36 +0000 | [diff] [blame] | 159 | /// PEXTRB - Extract an 8-bit value from a vector and zero extend it to |
| 160 | /// i32, corresponds to X86::PEXTRB. |
| 161 | PEXTRB, |
| 162 | |
Evan Cheng | b067a1e | 2006-03-31 19:22:53 +0000 | [diff] [blame] | 163 | /// PEXTRW - Extract a 16-bit value from a vector and zero extend it to |
Evan Cheng | 653159f | 2006-03-31 21:55:24 +0000 | [diff] [blame] | 164 | /// i32, corresponds to X86::PEXTRW. |
Evan Cheng | b067a1e | 2006-03-31 19:22:53 +0000 | [diff] [blame] | 165 | PEXTRW, |
Evan Cheng | 653159f | 2006-03-31 21:55:24 +0000 | [diff] [blame] | 166 | |
Nate Begeman | 14d12ca | 2008-02-11 04:19:36 +0000 | [diff] [blame] | 167 | /// INSERTPS - Insert any element of a 4 x float vector into any element |
| 168 | /// of a destination 4 x floatvector. |
| 169 | INSERTPS, |
| 170 | |
| 171 | /// PINSRB - Insert the lower 8-bits of a 32-bit value to a vector, |
| 172 | /// corresponds to X86::PINSRB. |
| 173 | PINSRB, |
| 174 | |
Evan Cheng | 653159f | 2006-03-31 21:55:24 +0000 | [diff] [blame] | 175 | /// PINSRW - Insert the lower 16-bits of a 32-bit value to a vector, |
| 176 | /// corresponds to X86::PINSRW. |
Evan Cheng | 8ca2932 | 2006-11-10 21:43:37 +0000 | [diff] [blame] | 177 | PINSRW, |
| 178 | |
Nate Begeman | b9a47b8 | 2009-02-23 08:49:38 +0000 | [diff] [blame] | 179 | /// PSHUFB - Shuffle 16 8-bit values within a vector. |
| 180 | PSHUFB, |
| 181 | |
Evan Cheng | 8ca2932 | 2006-11-10 21:43:37 +0000 | [diff] [blame] | 182 | /// FMAX, FMIN - Floating point max and min. |
| 183 | /// |
Lauro Ramos Venancio | b3a0417 | 2007-04-20 21:38:10 +0000 | [diff] [blame] | 184 | FMAX, FMIN, |
Dan Gohman | 2038252 | 2007-07-10 00:05:58 +0000 | [diff] [blame] | 185 | |
| 186 | /// FRSQRT, FRCP - Floating point reciprocal-sqrt and reciprocal |
| 187 | /// approximation. Note that these typically require refinement |
| 188 | /// in order to obtain suitable precision. |
| 189 | FRSQRT, FRCP, |
| 190 | |
Nate Begeman | 9b99485 | 2009-01-24 22:12:48 +0000 | [diff] [blame] | 191 | // TLSADDR, THREAD_POINTER - Thread Local Storage. |
Anton Korobeynikov | 2365f51 | 2007-07-14 14:06:15 +0000 | [diff] [blame] | 192 | TLSADDR, THREAD_POINTER, |
| 193 | |
Evan Cheng | 7e2ff77 | 2008-05-08 00:57:18 +0000 | [diff] [blame] | 194 | // EH_RETURN - Exception Handling helpers. |
Arnold Schwaighofer | c85e171 | 2007-10-11 19:40:01 +0000 | [diff] [blame] | 195 | EH_RETURN, |
| 196 | |
Arnold Schwaighofer | 4fe3073 | 2008-03-19 16:39:45 +0000 | [diff] [blame] | 197 | /// TC_RETURN - Tail call return. |
| 198 | /// operand #0 chain |
| 199 | /// operand #1 callee (register or absolute) |
| 200 | /// operand #2 stack adjustment |
| 201 | /// operand #3 optional in flag |
Anton Korobeynikov | 45b22fa | 2007-11-16 01:31:51 +0000 | [diff] [blame] | 202 | TC_RETURN, |
| 203 | |
Evan Cheng | 7e2ff77 | 2008-05-08 00:57:18 +0000 | [diff] [blame] | 204 | // LCMPXCHG_DAG, LCMPXCHG8_DAG - Compare and swap. |
Andrew Lenharth | 26ed869 | 2008-03-01 21:52:34 +0000 | [diff] [blame] | 205 | LCMPXCHG_DAG, |
Andrew Lenharth | d19189e | 2008-03-05 01:15:49 +0000 | [diff] [blame] | 206 | LCMPXCHG8_DAG, |
Andrew Lenharth | 26ed869 | 2008-03-01 21:52:34 +0000 | [diff] [blame] | 207 | |
Dale Johannesen | 48c1bc2 | 2008-10-02 18:53:47 +0000 | [diff] [blame] | 208 | // ATOMADD64_DAG, ATOMSUB64_DAG, ATOMOR64_DAG, ATOMAND64_DAG, |
Dale Johannesen | 880ae36 | 2008-10-03 22:25:52 +0000 | [diff] [blame] | 209 | // ATOMXOR64_DAG, ATOMNAND64_DAG, ATOMSWAP64_DAG - |
| 210 | // Atomic 64-bit binary operations. |
Dale Johannesen | 48c1bc2 | 2008-10-02 18:53:47 +0000 | [diff] [blame] | 211 | ATOMADD64_DAG, |
| 212 | ATOMSUB64_DAG, |
| 213 | ATOMOR64_DAG, |
| 214 | ATOMXOR64_DAG, |
| 215 | ATOMAND64_DAG, |
| 216 | ATOMNAND64_DAG, |
Dale Johannesen | 880ae36 | 2008-10-03 22:25:52 +0000 | [diff] [blame] | 217 | ATOMSWAP64_DAG, |
Dale Johannesen | 48c1bc2 | 2008-10-02 18:53:47 +0000 | [diff] [blame] | 218 | |
Evan Cheng | 7e2ff77 | 2008-05-08 00:57:18 +0000 | [diff] [blame] | 219 | // FNSTCW16m - Store FP control world into i16 memory. |
| 220 | FNSTCW16m, |
| 221 | |
Evan Cheng | d880b97 | 2008-05-09 21:53:03 +0000 | [diff] [blame] | 222 | // VZEXT_MOVL - Vector move low and zero extend. |
| 223 | VZEXT_MOVL, |
| 224 | |
| 225 | // VZEXT_LOAD - Load, scalar_to_vector, and zero extend. |
Evan Cheng | f26ffe9 | 2008-05-29 08:22:04 +0000 | [diff] [blame] | 226 | VZEXT_LOAD, |
| 227 | |
| 228 | // VSHL, VSRL - Vector logical left / right shift. |
Nate Begeman | 30a0de9 | 2008-07-17 16:51:19 +0000 | [diff] [blame] | 229 | VSHL, VSRL, |
| 230 | |
| 231 | // CMPPD, CMPPS - Vector double/float comparison. |
| 232 | CMPPD, CMPPS, |
| 233 | |
| 234 | // PCMP* - Vector integer comparisons. |
| 235 | PCMPEQB, PCMPEQW, PCMPEQD, PCMPEQQ, |
Bill Wendling | ab55ebd | 2008-12-12 00:56:36 +0000 | [diff] [blame] | 236 | PCMPGTB, PCMPGTW, PCMPGTD, PCMPGTQ, |
| 237 | |
Dan Gohman | 076aee3 | 2009-03-04 19:44:21 +0000 | [diff] [blame^] | 238 | // ADD, SUB, SMUL, UMUL, etc. - Arithmetic operations with FLAGS results. |
| 239 | ADD, SUB, SMUL, UMUL, |
| 240 | INC, DEC |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 241 | }; |
| 242 | } |
| 243 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 244 | /// Define some predicates that are used for node matching. |
| 245 | namespace X86 { |
| 246 | /// isPSHUFDMask - Return true if the specified VECTOR_SHUFFLE operand |
| 247 | /// specifies a shuffle of elements that is suitable for input to PSHUFD. |
| 248 | bool isPSHUFDMask(SDNode *N); |
Evan Cheng | 0188ecb | 2006-03-22 18:59:22 +0000 | [diff] [blame] | 249 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 250 | /// isPSHUFHWMask - Return true if the specified VECTOR_SHUFFLE operand |
| 251 | /// specifies a shuffle of elements that is suitable for input to PSHUFD. |
| 252 | bool isPSHUFHWMask(SDNode *N); |
Evan Cheng | 506d3df | 2006-03-29 23:07:14 +0000 | [diff] [blame] | 253 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 254 | /// isPSHUFLWMask - Return true if the specified VECTOR_SHUFFLE operand |
| 255 | /// specifies a shuffle of elements that is suitable for input to PSHUFD. |
| 256 | bool isPSHUFLWMask(SDNode *N); |
Evan Cheng | 506d3df | 2006-03-29 23:07:14 +0000 | [diff] [blame] | 257 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 258 | /// isSHUFPMask - Return true if the specified VECTOR_SHUFFLE operand |
| 259 | /// specifies a shuffle of elements that is suitable for input to SHUFP*. |
| 260 | bool isSHUFPMask(SDNode *N); |
Evan Cheng | 14aed5e | 2006-03-24 01:18:28 +0000 | [diff] [blame] | 261 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 262 | /// isMOVHLPSMask - Return true if the specified VECTOR_SHUFFLE operand |
| 263 | /// specifies a shuffle of elements that is suitable for input to MOVHLPS. |
| 264 | bool isMOVHLPSMask(SDNode *N); |
Evan Cheng | 2c0dbd0 | 2006-03-24 02:58:06 +0000 | [diff] [blame] | 265 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 266 | /// isMOVHLPS_v_undef_Mask - Special case of isMOVHLPSMask for canonical form |
| 267 | /// of vector_shuffle v, v, <2, 3, 2, 3>, i.e. vector_shuffle v, undef, |
| 268 | /// <2, 3, 2, 3> |
| 269 | bool isMOVHLPS_v_undef_Mask(SDNode *N); |
Evan Cheng | 6e56e2c | 2006-11-07 22:14:24 +0000 | [diff] [blame] | 270 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 271 | /// isMOVLPMask - Return true if the specified VECTOR_SHUFFLE operand |
| 272 | /// specifies a shuffle of elements that is suitable for input to MOVLP{S|D}. |
| 273 | bool isMOVLPMask(SDNode *N); |
Evan Cheng | 5ced1d8 | 2006-04-06 23:23:56 +0000 | [diff] [blame] | 274 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 275 | /// isMOVHPMask - Return true if the specified VECTOR_SHUFFLE operand |
| 276 | /// specifies a shuffle of elements that is suitable for input to MOVHP{S|D} |
| 277 | /// as well as MOVLHPS. |
| 278 | bool isMOVHPMask(SDNode *N); |
Evan Cheng | 5ced1d8 | 2006-04-06 23:23:56 +0000 | [diff] [blame] | 279 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 280 | /// isUNPCKLMask - Return true if the specified VECTOR_SHUFFLE operand |
| 281 | /// specifies a shuffle of elements that is suitable for input to UNPCKL. |
| 282 | bool isUNPCKLMask(SDNode *N, bool V2IsSplat = false); |
Evan Cheng | 0038e59 | 2006-03-28 00:39:58 +0000 | [diff] [blame] | 283 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 284 | /// isUNPCKHMask - Return true if the specified VECTOR_SHUFFLE operand |
| 285 | /// specifies a shuffle of elements that is suitable for input to UNPCKH. |
| 286 | bool isUNPCKHMask(SDNode *N, bool V2IsSplat = false); |
Evan Cheng | 4fcb922 | 2006-03-28 02:43:26 +0000 | [diff] [blame] | 287 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 288 | /// isUNPCKL_v_undef_Mask - Special case of isUNPCKLMask for canonical form |
| 289 | /// of vector_shuffle v, v, <0, 4, 1, 5>, i.e. vector_shuffle v, undef, |
| 290 | /// <0, 0, 1, 1> |
| 291 | bool isUNPCKL_v_undef_Mask(SDNode *N); |
Evan Cheng | 1d5a8cc | 2006-04-05 07:20:06 +0000 | [diff] [blame] | 292 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 293 | /// isUNPCKH_v_undef_Mask - Special case of isUNPCKHMask for canonical form |
| 294 | /// of vector_shuffle v, v, <2, 6, 3, 7>, i.e. vector_shuffle v, undef, |
| 295 | /// <2, 2, 3, 3> |
| 296 | bool isUNPCKH_v_undef_Mask(SDNode *N); |
Bill Wendling | 2f9bb1a | 2007-04-24 21:16:55 +0000 | [diff] [blame] | 297 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 298 | /// isMOVLMask - Return true if the specified VECTOR_SHUFFLE operand |
| 299 | /// specifies a shuffle of elements that is suitable for input to MOVSS, |
| 300 | /// MOVSD, and MOVD, i.e. setting the lowest element. |
| 301 | bool isMOVLMask(SDNode *N); |
Evan Cheng | d6d1cbd | 2006-04-11 00:19:04 +0000 | [diff] [blame] | 302 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 303 | /// isMOVSHDUPMask - Return true if the specified VECTOR_SHUFFLE operand |
| 304 | /// specifies a shuffle of elements that is suitable for input to MOVSHDUP. |
| 305 | bool isMOVSHDUPMask(SDNode *N); |
Evan Cheng | d953947 | 2006-04-14 21:59:03 +0000 | [diff] [blame] | 306 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 307 | /// isMOVSLDUPMask - Return true if the specified VECTOR_SHUFFLE operand |
| 308 | /// specifies a shuffle of elements that is suitable for input to MOVSLDUP. |
| 309 | bool isMOVSLDUPMask(SDNode *N); |
Evan Cheng | d953947 | 2006-04-14 21:59:03 +0000 | [diff] [blame] | 310 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 311 | /// isSplatMask - Return true if the specified VECTOR_SHUFFLE operand |
| 312 | /// specifies a splat of a single element. |
| 313 | bool isSplatMask(SDNode *N); |
Evan Cheng | b9df0ca | 2006-03-22 02:53:00 +0000 | [diff] [blame] | 314 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 315 | /// isSplatLoMask - Return true if the specified VECTOR_SHUFFLE operand |
| 316 | /// specifies a splat of zero element. |
| 317 | bool isSplatLoMask(SDNode *N); |
Evan Cheng | f686d9b | 2006-10-27 21:08:32 +0000 | [diff] [blame] | 318 | |
Evan Cheng | 0b457f0 | 2008-09-25 20:50:48 +0000 | [diff] [blame] | 319 | /// isMOVDDUPMask - Return true if the specified VECTOR_SHUFFLE operand |
| 320 | /// specifies a shuffle of elements that is suitable for input to MOVDDUP. |
| 321 | bool isMOVDDUPMask(SDNode *N); |
| 322 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 323 | /// getShuffleSHUFImmediate - Return the appropriate immediate to shuffle |
| 324 | /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUF* and SHUFP* |
| 325 | /// instructions. |
| 326 | unsigned getShuffleSHUFImmediate(SDNode *N); |
Evan Cheng | 506d3df | 2006-03-29 23:07:14 +0000 | [diff] [blame] | 327 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 328 | /// getShufflePSHUFHWImmediate - Return the appropriate immediate to shuffle |
| 329 | /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFHW |
| 330 | /// instructions. |
| 331 | unsigned getShufflePSHUFHWImmediate(SDNode *N); |
Evan Cheng | 506d3df | 2006-03-29 23:07:14 +0000 | [diff] [blame] | 332 | |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 333 | /// getShufflePSHUFKWImmediate - Return the appropriate immediate to shuffle |
| 334 | /// the specified isShuffleMask VECTOR_SHUFFLE mask with PSHUFLW |
| 335 | /// instructions. |
| 336 | unsigned getShufflePSHUFLWImmediate(SDNode *N); |
| 337 | } |
| 338 | |
Chris Lattner | 9189777 | 2006-10-18 18:26:48 +0000 | [diff] [blame] | 339 | //===--------------------------------------------------------------------===// |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 340 | // X86TargetLowering - X86 Implementation of the TargetLowering interface |
| 341 | class X86TargetLowering : public TargetLowering { |
| 342 | int VarArgsFrameIndex; // FrameIndex for start of varargs area. |
Evan Cheng | 25ab690 | 2006-09-08 06:48:29 +0000 | [diff] [blame] | 343 | int RegSaveFrameIndex; // X86-64 vararg func register save area. |
| 344 | unsigned VarArgsGPOffset; // X86-64 vararg func int reg offset. |
| 345 | unsigned VarArgsFPOffset; // X86-64 vararg func fp reg offset. |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 346 | int BytesToPopOnReturn; // Number of arg bytes ret should pop. |
| 347 | int BytesCallerReserves; // Number of arg bytes caller makes. |
Arnold Schwaighofer | c85e171 | 2007-10-11 19:40:01 +0000 | [diff] [blame] | 348 | |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 349 | public: |
Dan Gohman | c9f5f3f | 2008-05-14 01:58:56 +0000 | [diff] [blame] | 350 | explicit X86TargetLowering(X86TargetMachine &TM); |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 351 | |
Evan Cheng | cc41586 | 2007-11-09 01:32:10 +0000 | [diff] [blame] | 352 | /// getPICJumpTableRelocaBase - Returns relocation base for the given PIC |
| 353 | /// jumptable. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 354 | SDValue getPICJumpTableRelocBase(SDValue Table, |
Evan Cheng | cc41586 | 2007-11-09 01:32:10 +0000 | [diff] [blame] | 355 | SelectionDAG &DAG) const; |
| 356 | |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 357 | // Return the number of bytes that a function should pop when it returns (in |
| 358 | // addition to the space used by the return address). |
| 359 | // |
| 360 | unsigned getBytesToPopOnReturn() const { return BytesToPopOnReturn; } |
| 361 | |
| 362 | // Return the number of bytes that the caller reserves for arguments passed |
| 363 | // to this function. |
| 364 | unsigned getBytesCallerReserves() const { return BytesCallerReserves; } |
| 365 | |
Chris Lattner | 54e3efd | 2007-02-26 04:01:25 +0000 | [diff] [blame] | 366 | /// getStackPtrReg - Return the stack pointer register we are using: either |
| 367 | /// ESP or RSP. |
| 368 | unsigned getStackPtrReg() const { return X86StackPtr; } |
Evan Cheng | 2928650 | 2008-01-23 23:17:41 +0000 | [diff] [blame] | 369 | |
| 370 | /// getByValTypeAlignment - Return the desired alignment for ByVal aggregate |
| 371 | /// function arguments in the caller parameter area. For X86, aggregates |
| 372 | /// that contains are placed at 16-byte boundaries while the rest are at |
| 373 | /// 4-byte boundaries. |
| 374 | virtual unsigned getByValTypeAlignment(const Type *Ty) const; |
Evan Cheng | f0df031 | 2008-05-15 08:39:06 +0000 | [diff] [blame] | 375 | |
| 376 | /// getOptimalMemOpType - Returns the target specific optimal type for load |
Evan Cheng | 0ef8de3 | 2008-05-15 22:13:02 +0000 | [diff] [blame] | 377 | /// and store operations as a result of memset, memcpy, and memmove |
| 378 | /// lowering. It returns MVT::iAny if SelectionDAG should be responsible for |
Evan Cheng | f0df031 | 2008-05-15 08:39:06 +0000 | [diff] [blame] | 379 | /// determining it. |
| 380 | virtual |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 381 | MVT getOptimalMemOpType(uint64_t Size, unsigned Align, |
| 382 | bool isSrcConst, bool isSrcStr) const; |
Chris Lattner | 54e3efd | 2007-02-26 04:01:25 +0000 | [diff] [blame] | 383 | |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 384 | /// LowerOperation - Provide custom lowering hooks for some operations. |
| 385 | /// |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 386 | virtual SDValue LowerOperation(SDValue Op, SelectionDAG &DAG); |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 387 | |
Duncan Sands | 1607f05 | 2008-12-01 11:39:25 +0000 | [diff] [blame] | 388 | /// ReplaceNodeResults - Replace the results of node with an illegal result |
| 389 | /// type with new values built out of custom code. |
Chris Lattner | 27a6c73 | 2007-11-24 07:07:01 +0000 | [diff] [blame] | 390 | /// |
Duncan Sands | 1607f05 | 2008-12-01 11:39:25 +0000 | [diff] [blame] | 391 | virtual void ReplaceNodeResults(SDNode *N, SmallVectorImpl<SDValue>&Results, |
| 392 | SelectionDAG &DAG); |
Chris Lattner | 27a6c73 | 2007-11-24 07:07:01 +0000 | [diff] [blame] | 393 | |
| 394 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 395 | virtual SDValue PerformDAGCombine(SDNode *N, DAGCombinerInfo &DCI) const; |
Evan Cheng | 206ee9d | 2006-07-07 08:33:52 +0000 | [diff] [blame] | 396 | |
Evan Cheng | ff9b373 | 2008-01-30 18:18:23 +0000 | [diff] [blame] | 397 | virtual MachineBasicBlock *EmitInstrWithCustomInserter(MachineInstr *MI, |
Dan Gohman | 1fdbc1d | 2009-02-07 16:15:20 +0000 | [diff] [blame] | 398 | MachineBasicBlock *MBB) const; |
Evan Cheng | 4a46080 | 2006-01-11 00:33:36 +0000 | [diff] [blame] | 399 | |
Mon P Wang | 63307c3 | 2008-05-05 19:05:59 +0000 | [diff] [blame] | 400 | |
Evan Cheng | 7226158 | 2005-12-20 06:22:03 +0000 | [diff] [blame] | 401 | /// getTargetNodeName - This method returns the name of a target specific |
| 402 | /// DAG node. |
| 403 | virtual const char *getTargetNodeName(unsigned Opcode) const; |
| 404 | |
Scott Michel | 5b8f82e | 2008-03-10 15:42:14 +0000 | [diff] [blame] | 405 | /// getSetCCResultType - Return the ISD::SETCC ValueType |
Duncan Sands | 5480c04 | 2009-01-01 15:52:00 +0000 | [diff] [blame] | 406 | virtual MVT getSetCCResultType(MVT VT) const; |
Scott Michel | 5b8f82e | 2008-03-10 15:42:14 +0000 | [diff] [blame] | 407 | |
Nate Begeman | 368e18d | 2006-02-16 21:11:51 +0000 | [diff] [blame] | 408 | /// computeMaskedBitsForTargetNode - Determine which of the bits specified |
| 409 | /// in Mask are known to be either zero or one and return them in the |
| 410 | /// KnownZero/KnownOne bitsets. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 411 | virtual void computeMaskedBitsForTargetNode(const SDValue Op, |
Dan Gohman | 977a76f | 2008-02-13 22:28:48 +0000 | [diff] [blame] | 412 | const APInt &Mask, |
Dan Gohman | fd29e0e | 2008-02-13 00:35:47 +0000 | [diff] [blame] | 413 | APInt &KnownZero, |
| 414 | APInt &KnownOne, |
Dan Gohman | ea859be | 2007-06-22 14:59:07 +0000 | [diff] [blame] | 415 | const SelectionDAG &DAG, |
Nate Begeman | 368e18d | 2006-02-16 21:11:51 +0000 | [diff] [blame] | 416 | unsigned Depth = 0) const; |
Evan Cheng | ad4196b | 2008-05-12 19:56:52 +0000 | [diff] [blame] | 417 | |
| 418 | virtual bool |
| 419 | isGAPlusOffset(SDNode *N, GlobalValue* &GA, int64_t &Offset) const; |
Nate Begeman | 368e18d | 2006-02-16 21:11:51 +0000 | [diff] [blame] | 420 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 421 | SDValue getReturnAddressFrameIndex(SelectionDAG &DAG); |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 422 | |
Chris Lattner | 4234f57 | 2007-03-25 02:14:49 +0000 | [diff] [blame] | 423 | ConstraintType getConstraintType(const std::string &Constraint) const; |
Chris Lattner | f4dff84 | 2006-07-11 02:54:03 +0000 | [diff] [blame] | 424 | |
Chris Lattner | 259e97c | 2006-01-31 19:43:35 +0000 | [diff] [blame] | 425 | std::vector<unsigned> |
Chris Lattner | 1efa40f | 2006-02-22 00:56:39 +0000 | [diff] [blame] | 426 | getRegClassForInlineAsmConstraint(const std::string &Constraint, |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 427 | MVT VT) const; |
Chris Lattner | 48884cd | 2007-08-25 00:47:38 +0000 | [diff] [blame] | 428 | |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 429 | virtual const char *LowerXConstraint(MVT ConstraintVT) const; |
Dale Johannesen | ba2a0b9 | 2008-01-29 02:21:21 +0000 | [diff] [blame] | 430 | |
Chris Lattner | 48884cd | 2007-08-25 00:47:38 +0000 | [diff] [blame] | 431 | /// LowerAsmOperandForConstraint - Lower the specified operand into the Ops |
Evan Cheng | da43bcf | 2008-09-24 00:05:32 +0000 | [diff] [blame] | 432 | /// vector. If it is invalid, don't add anything to Ops. If hasMemory is |
| 433 | /// true it means one of the asm constraint of the inline asm instruction |
| 434 | /// being processed is 'm'. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 435 | virtual void LowerAsmOperandForConstraint(SDValue Op, |
Chris Lattner | 48884cd | 2007-08-25 00:47:38 +0000 | [diff] [blame] | 436 | char ConstraintLetter, |
Evan Cheng | da43bcf | 2008-09-24 00:05:32 +0000 | [diff] [blame] | 437 | bool hasMemory, |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 438 | std::vector<SDValue> &Ops, |
Chris Lattner | 5e76423 | 2008-04-26 23:02:14 +0000 | [diff] [blame] | 439 | SelectionDAG &DAG) const; |
Chris Lattner | 22aaf1d | 2006-10-31 20:13:11 +0000 | [diff] [blame] | 440 | |
Chris Lattner | 9189777 | 2006-10-18 18:26:48 +0000 | [diff] [blame] | 441 | /// getRegForInlineAsmConstraint - Given a physical register constraint |
| 442 | /// (e.g. {edx}), return the register number and the register class for the |
| 443 | /// register. This should only be used for C_Register constraints. On |
| 444 | /// error, this returns a register number of 0. |
Chris Lattner | f76d180 | 2006-07-31 23:26:50 +0000 | [diff] [blame] | 445 | std::pair<unsigned, const TargetRegisterClass*> |
| 446 | getRegForInlineAsmConstraint(const std::string &Constraint, |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 447 | MVT VT) const; |
Chris Lattner | f76d180 | 2006-07-31 23:26:50 +0000 | [diff] [blame] | 448 | |
Chris Lattner | c9addb7 | 2007-03-30 23:15:24 +0000 | [diff] [blame] | 449 | /// isLegalAddressingMode - Return true if the addressing mode represented |
| 450 | /// by AM is legal for this target, for a load/store of the specified type. |
| 451 | virtual bool isLegalAddressingMode(const AddrMode &AM, const Type *Ty)const; |
| 452 | |
Evan Cheng | 2bd122c | 2007-10-26 01:56:11 +0000 | [diff] [blame] | 453 | /// isTruncateFree - Return true if it's free to truncate a value of |
| 454 | /// type Ty1 to type Ty2. e.g. On x86 it's free to truncate a i32 value in |
| 455 | /// register EAX to i16 by referencing its sub-register AX. |
| 456 | virtual bool isTruncateFree(const Type *Ty1, const Type *Ty2) const; |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 457 | virtual bool isTruncateFree(MVT VT1, MVT VT2) const; |
Evan Cheng | 2bd122c | 2007-10-26 01:56:11 +0000 | [diff] [blame] | 458 | |
Evan Cheng | 0188ecb | 2006-03-22 18:59:22 +0000 | [diff] [blame] | 459 | /// isShuffleMaskLegal - Targets can use this to indicate that they only |
| 460 | /// support *some* VECTOR_SHUFFLE operations, those with specific masks. |
Chris Lattner | 9189777 | 2006-10-18 18:26:48 +0000 | [diff] [blame] | 461 | /// By default, if a target supports the VECTOR_SHUFFLE node, all mask |
| 462 | /// values are assumed to be legal. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 463 | virtual bool isShuffleMaskLegal(SDValue Mask, MVT VT) const; |
Evan Cheng | 39623da | 2006-04-20 08:58:49 +0000 | [diff] [blame] | 464 | |
| 465 | /// isVectorClearMaskLegal - Similar to isShuffleMaskLegal. This is |
| 466 | /// used by Targets can use this to indicate if there is a suitable |
| 467 | /// VECTOR_SHUFFLE that can be used to replace a VAND with a constant |
| 468 | /// pool entry. |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 469 | virtual bool isVectorClearMaskLegal(const std::vector<SDValue> &BVOps, |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 470 | MVT EVT, SelectionDAG &DAG) const; |
Evan Cheng | 6fd599f | 2008-03-05 01:30:59 +0000 | [diff] [blame] | 471 | |
| 472 | /// ShouldShrinkFPConstant - If true, then instruction selection should |
| 473 | /// seek to shrink the FP constant of the specified type to a smaller type |
| 474 | /// in order to save space and / or reduce runtime. |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 475 | virtual bool ShouldShrinkFPConstant(MVT VT) const { |
Evan Cheng | 6fd599f | 2008-03-05 01:30:59 +0000 | [diff] [blame] | 476 | // Don't shrink FP constpool if SSE2 is available since cvtss2sd is more |
| 477 | // expensive than a straight movsd. On the other hand, it's important to |
| 478 | // shrink long double fp constant since fldt is very slow. |
| 479 | return !X86ScalarSSEf64 || VT == MVT::f80; |
| 480 | } |
Arnold Schwaighofer | c85e171 | 2007-10-11 19:40:01 +0000 | [diff] [blame] | 481 | |
| 482 | /// IsEligibleForTailCallOptimization - Check whether the call is eligible |
| 483 | /// for tail call optimization. Target which want to do tail call |
| 484 | /// optimization should implement this function. |
Dan Gohman | 095cc29 | 2008-09-13 01:54:27 +0000 | [diff] [blame] | 485 | virtual bool IsEligibleForTailCallOptimization(CallSDNode *TheCall, |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 486 | SDValue Ret, |
Arnold Schwaighofer | c85e171 | 2007-10-11 19:40:01 +0000 | [diff] [blame] | 487 | SelectionDAG &DAG) const; |
| 488 | |
Dan Gohman | 707e018 | 2008-04-12 04:36:06 +0000 | [diff] [blame] | 489 | virtual const X86Subtarget* getSubtarget() { |
| 490 | return Subtarget; |
Rafael Espindola | f1ba1ca | 2007-11-05 23:12:20 +0000 | [diff] [blame] | 491 | } |
| 492 | |
Chris Lattner | 3d66185 | 2008-01-18 06:52:41 +0000 | [diff] [blame] | 493 | /// isScalarFPTypeInSSEReg - Return true if the specified scalar FP type is |
| 494 | /// computed in an SSE register, not on the X87 floating point stack. |
Duncan Sands | 83ec4b6 | 2008-06-06 12:08:01 +0000 | [diff] [blame] | 495 | bool isScalarFPTypeInSSEReg(MVT VT) const { |
Chris Lattner | 3d66185 | 2008-01-18 06:52:41 +0000 | [diff] [blame] | 496 | return (VT == MVT::f64 && X86ScalarSSEf64) || // f64 is when SSE2 |
| 497 | (VT == MVT::f32 && X86ScalarSSEf32); // f32 is when SSE1 |
| 498 | } |
Dan Gohman | d9f3c48 | 2008-08-19 21:32:53 +0000 | [diff] [blame] | 499 | |
Mon P Wang | 0c39719 | 2008-10-30 08:01:45 +0000 | [diff] [blame] | 500 | /// getWidenVectorType: given a vector type, returns the type to widen |
| 501 | /// to (e.g., v7i8 to v8i8). If the vector type is legal, it returns itself. |
| 502 | /// If there is no vector type that we want to widen to, returns MVT::Other |
| 503 | /// When and were to widen is target dependent based on the cost of |
| 504 | /// scalarizing vs using the wider vector type. |
Dan Gohman | c13cf13 | 2009-01-15 17:34:08 +0000 | [diff] [blame] | 505 | virtual MVT getWidenVectorType(MVT VT) const; |
Mon P Wang | 0c39719 | 2008-10-30 08:01:45 +0000 | [diff] [blame] | 506 | |
Dan Gohman | d9f3c48 | 2008-08-19 21:32:53 +0000 | [diff] [blame] | 507 | /// createFastISel - This method returns a target specific FastISel object, |
| 508 | /// or null if the target does not support "fast" ISel. |
Dan Gohman | 3df24e6 | 2008-09-03 23:12:08 +0000 | [diff] [blame] | 509 | virtual FastISel * |
| 510 | createFastISel(MachineFunction &mf, |
Devang Patel | 83489bb | 2009-01-13 00:35:13 +0000 | [diff] [blame] | 511 | MachineModuleInfo *mmi, DwarfWriter *dw, |
Dan Gohman | 3df24e6 | 2008-09-03 23:12:08 +0000 | [diff] [blame] | 512 | DenseMap<const Value *, unsigned> &, |
Dan Gohman | 0586d91 | 2008-09-10 20:11:02 +0000 | [diff] [blame] | 513 | DenseMap<const BasicBlock *, MachineBasicBlock *> &, |
Dan Gohman | dd5b58a | 2008-10-14 23:54:11 +0000 | [diff] [blame] | 514 | DenseMap<const AllocaInst *, int> & |
| 515 | #ifndef NDEBUG |
| 516 | , SmallSet<Instruction*, 8> & |
| 517 | #endif |
| 518 | ); |
Chris Lattner | 3d66185 | 2008-01-18 06:52:41 +0000 | [diff] [blame] | 519 | |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 520 | private: |
Evan Cheng | 0db9fe6 | 2006-04-25 20:13:52 +0000 | [diff] [blame] | 521 | /// Subtarget - Keep a pointer to the X86Subtarget around so that we can |
| 522 | /// make the right decision when generating code for different targets. |
| 523 | const X86Subtarget *Subtarget; |
Dan Gohman | c9f5f3f | 2008-05-14 01:58:56 +0000 | [diff] [blame] | 524 | const X86RegisterInfo *RegInfo; |
Anton Korobeynikov | bff66b0 | 2008-09-09 18:22:57 +0000 | [diff] [blame] | 525 | const TargetData *TD; |
Evan Cheng | 0db9fe6 | 2006-04-25 20:13:52 +0000 | [diff] [blame] | 526 | |
Evan Cheng | 25ab690 | 2006-09-08 06:48:29 +0000 | [diff] [blame] | 527 | /// X86StackPtr - X86 physical register used as stack ptr. |
| 528 | unsigned X86StackPtr; |
Arnold Schwaighofer | c85e171 | 2007-10-11 19:40:01 +0000 | [diff] [blame] | 529 | |
Dale Johannesen | f1fc3a8 | 2007-09-23 14:52:20 +0000 | [diff] [blame] | 530 | /// X86ScalarSSEf32, X86ScalarSSEf64 - Select between SSE or x87 |
| 531 | /// floating point ops. |
| 532 | /// When SSE is available, use it for f32 operations. |
| 533 | /// When SSE2 is available, use it for f64 operations. |
| 534 | bool X86ScalarSSEf32; |
| 535 | bool X86ScalarSSEf64; |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 536 | |
Dan Gohman | 095cc29 | 2008-09-13 01:54:27 +0000 | [diff] [blame] | 537 | SDNode *LowerCallResult(SDValue Chain, SDValue InFlag, CallSDNode *TheCall, |
Chris Lattner | 3085e15 | 2007-02-25 08:59:22 +0000 | [diff] [blame] | 538 | unsigned CallingConv, SelectionDAG &DAG); |
Evan Cheng | 0d9e976 | 2008-01-29 19:34:22 +0000 | [diff] [blame] | 539 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 540 | SDValue LowerMemArgument(SDValue Op, SelectionDAG &DAG, |
Rafael Espindola | 7effac5 | 2007-09-14 15:48:13 +0000 | [diff] [blame] | 541 | const CCValAssign &VA, MachineFrameInfo *MFI, |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 542 | unsigned CC, SDValue Root, unsigned i); |
Rafael Espindola | 7effac5 | 2007-09-14 15:48:13 +0000 | [diff] [blame] | 543 | |
Dan Gohman | 095cc29 | 2008-09-13 01:54:27 +0000 | [diff] [blame] | 544 | SDValue LowerMemOpCallTo(CallSDNode *TheCall, SelectionDAG &DAG, |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 545 | const SDValue &StackPtr, |
| 546 | const CCValAssign &VA, SDValue Chain, |
Dan Gohman | 095cc29 | 2008-09-13 01:54:27 +0000 | [diff] [blame] | 547 | SDValue Arg, ISD::ArgFlagsTy Flags); |
Rafael Espindola | 1b5dcc3 | 2007-08-31 15:06:30 +0000 | [diff] [blame] | 548 | |
Gordon Henriksen | 8673766 | 2008-01-05 16:56:59 +0000 | [diff] [blame] | 549 | // Call lowering helpers. |
Dan Gohman | 095cc29 | 2008-09-13 01:54:27 +0000 | [diff] [blame] | 550 | bool IsCalleePop(bool isVarArg, unsigned CallingConv); |
Arnold Schwaighofer | 258bb1b | 2008-02-26 22:21:54 +0000 | [diff] [blame] | 551 | bool CallRequiresGOTPtrInReg(bool Is64Bit, bool IsTailCall); |
| 552 | bool CallRequiresFnAddressInReg(bool Is64Bit, bool IsTailCall); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 553 | SDValue EmitTailCallLoadRetAddr(SelectionDAG &DAG, SDValue &OutRetAddr, |
| 554 | SDValue Chain, bool IsTailCall, bool Is64Bit, |
Dale Johannesen | ace1610 | 2009-02-03 19:33:06 +0000 | [diff] [blame] | 555 | int FPDiff, DebugLoc dl); |
Arnold Schwaighofer | 4b5324a | 2008-04-12 18:11:06 +0000 | [diff] [blame] | 556 | |
Dan Gohman | 095cc29 | 2008-09-13 01:54:27 +0000 | [diff] [blame] | 557 | CCAssignFn *CCAssignFnForNode(unsigned CallingConv) const; |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 558 | NameDecorationStyle NameDecorationForFORMAL_ARGUMENTS(SDValue Op); |
Arnold Schwaighofer | c85e171 | 2007-10-11 19:40:01 +0000 | [diff] [blame] | 559 | unsigned GetAlignedArgumentStackSize(unsigned StackSize, SelectionDAG &DAG); |
Evan Cheng | 559806f | 2006-01-27 08:10:46 +0000 | [diff] [blame] | 560 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 561 | std::pair<SDValue,SDValue> FP_TO_SINTHelper(SDValue Op, |
Chris Lattner | 27a6c73 | 2007-11-24 07:07:01 +0000 | [diff] [blame] | 562 | SelectionDAG &DAG); |
| 563 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 564 | SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG); |
| 565 | SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG); |
| 566 | SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG); |
| 567 | SDValue LowerEXTRACT_VECTOR_ELT_SSE4(SDValue Op, SelectionDAG &DAG); |
| 568 | SDValue LowerINSERT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG); |
| 569 | SDValue LowerINSERT_VECTOR_ELT_SSE4(SDValue Op, SelectionDAG &DAG); |
| 570 | SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG); |
| 571 | SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG); |
Dale Johannesen | 33c960f | 2009-02-04 20:06:27 +0000 | [diff] [blame] | 572 | SDValue LowerGlobalAddress(const GlobalValue *GV, DebugLoc dl, |
| 573 | int64_t Offset, SelectionDAG &DAG) const; |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 574 | SDValue LowerGlobalAddress(SDValue Op, SelectionDAG &DAG); |
| 575 | SDValue LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG); |
| 576 | SDValue LowerExternalSymbol(SDValue Op, SelectionDAG &DAG); |
| 577 | SDValue LowerShift(SDValue Op, SelectionDAG &DAG); |
| 578 | SDValue LowerSINT_TO_FP(SDValue Op, SelectionDAG &DAG); |
Dale Johannesen | 1c15bf5 | 2008-10-21 20:50:01 +0000 | [diff] [blame] | 579 | SDValue LowerUINT_TO_FP(SDValue Op, SelectionDAG &DAG); |
Bill Wendling | 8b8a636 | 2009-01-17 03:56:04 +0000 | [diff] [blame] | 580 | SDValue LowerUINT_TO_FP_i64(SDValue Op, SelectionDAG &DAG); |
| 581 | SDValue LowerUINT_TO_FP_i32(SDValue Op, SelectionDAG &DAG); |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 582 | SDValue LowerFP_TO_SINT(SDValue Op, SelectionDAG &DAG); |
| 583 | SDValue LowerFABS(SDValue Op, SelectionDAG &DAG); |
| 584 | SDValue LowerFNEG(SDValue Op, SelectionDAG &DAG); |
| 585 | SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG); |
| 586 | SDValue LowerSETCC(SDValue Op, SelectionDAG &DAG); |
| 587 | SDValue LowerVSETCC(SDValue Op, SelectionDAG &DAG); |
| 588 | SDValue LowerSELECT(SDValue Op, SelectionDAG &DAG); |
| 589 | SDValue LowerBRCOND(SDValue Op, SelectionDAG &DAG); |
| 590 | SDValue LowerMEMSET(SDValue Op, SelectionDAG &DAG); |
| 591 | SDValue LowerJumpTable(SDValue Op, SelectionDAG &DAG); |
| 592 | SDValue LowerCALL(SDValue Op, SelectionDAG &DAG); |
| 593 | SDValue LowerRET(SDValue Op, SelectionDAG &DAG); |
| 594 | SDValue LowerDYNAMIC_STACKALLOC(SDValue Op, SelectionDAG &DAG); |
| 595 | SDValue LowerFORMAL_ARGUMENTS(SDValue Op, SelectionDAG &DAG); |
| 596 | SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG); |
| 597 | SDValue LowerVAARG(SDValue Op, SelectionDAG &DAG); |
| 598 | SDValue LowerVACOPY(SDValue Op, SelectionDAG &DAG); |
| 599 | SDValue LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG); |
| 600 | SDValue LowerRETURNADDR(SDValue Op, SelectionDAG &DAG); |
| 601 | SDValue LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG); |
| 602 | SDValue LowerFRAME_TO_ARGS_OFFSET(SDValue Op, SelectionDAG &DAG); |
| 603 | SDValue LowerEH_RETURN(SDValue Op, SelectionDAG &DAG); |
| 604 | SDValue LowerTRAMPOLINE(SDValue Op, SelectionDAG &DAG); |
| 605 | SDValue LowerFLT_ROUNDS_(SDValue Op, SelectionDAG &DAG); |
| 606 | SDValue LowerCTLZ(SDValue Op, SelectionDAG &DAG); |
| 607 | SDValue LowerCTTZ(SDValue Op, SelectionDAG &DAG); |
Mon P Wang | af9b952 | 2008-12-18 21:42:19 +0000 | [diff] [blame] | 608 | SDValue LowerMUL_V2I64(SDValue Op, SelectionDAG &DAG); |
Bill Wendling | 74c3765 | 2008-12-09 22:08:41 +0000 | [diff] [blame] | 609 | SDValue LowerXALUO(SDValue Op, SelectionDAG &DAG); |
Bill Wendling | 41ea7e7 | 2008-11-24 19:21:46 +0000 | [diff] [blame] | 610 | |
Dan Gohman | 475871a | 2008-07-27 21:46:04 +0000 | [diff] [blame] | 611 | SDValue LowerCMP_SWAP(SDValue Op, SelectionDAG &DAG); |
Dale Johannesen | 71d1bf5 | 2008-09-29 22:25:26 +0000 | [diff] [blame] | 612 | SDValue LowerLOAD_SUB(SDValue Op, SelectionDAG &DAG); |
Duncan Sands | 1607f05 | 2008-12-01 11:39:25 +0000 | [diff] [blame] | 613 | SDValue LowerREADCYCLECOUNTER(SDValue Op, SelectionDAG &DAG); |
| 614 | |
| 615 | void ReplaceATOMIC_BINARY_64(SDNode *N, SmallVectorImpl<SDValue> &Results, |
| 616 | SelectionDAG &DAG, unsigned NewOp); |
| 617 | |
Dale Johannesen | eacf2dc | 2009-02-03 22:26:34 +0000 | [diff] [blame] | 618 | SDValue EmitTargetCodeForMemset(SelectionDAG &DAG, DebugLoc dl, |
Bill Wendling | 6f287b2 | 2008-09-30 21:22:07 +0000 | [diff] [blame] | 619 | SDValue Chain, |
| 620 | SDValue Dst, SDValue Src, |
| 621 | SDValue Size, unsigned Align, |
Bill Wendling | 6158d84 | 2008-10-01 00:59:58 +0000 | [diff] [blame] | 622 | const Value *DstSV, uint64_t DstSVOff); |
Dale Johannesen | eacf2dc | 2009-02-03 22:26:34 +0000 | [diff] [blame] | 623 | SDValue EmitTargetCodeForMemcpy(SelectionDAG &DAG, DebugLoc dl, |
Bill Wendling | 6f287b2 | 2008-09-30 21:22:07 +0000 | [diff] [blame] | 624 | SDValue Chain, |
| 625 | SDValue Dst, SDValue Src, |
| 626 | SDValue Size, unsigned Align, |
| 627 | bool AlwaysInline, |
| 628 | const Value *DstSV, uint64_t DstSVOff, |
| 629 | const Value *SrcSV, uint64_t SrcSVOff); |
Mon P Wang | 63307c3 | 2008-05-05 19:05:59 +0000 | [diff] [blame] | 630 | |
| 631 | /// Utility function to emit atomic bitwise operations (and, or, xor). |
| 632 | // It takes the bitwise instruction to expand, the associated machine basic |
| 633 | // block, and the associated X86 opcodes for reg/reg and reg/imm. |
| 634 | MachineBasicBlock *EmitAtomicBitwiseWithCustomInserter( |
| 635 | MachineInstr *BInstr, |
| 636 | MachineBasicBlock *BB, |
| 637 | unsigned regOpc, |
Andrew Lenharth | 507a58a | 2008-06-14 05:48:15 +0000 | [diff] [blame] | 638 | unsigned immOpc, |
Dale Johannesen | 140be2d | 2008-08-19 18:47:28 +0000 | [diff] [blame] | 639 | unsigned loadOpc, |
| 640 | unsigned cxchgOpc, |
| 641 | unsigned copyOpc, |
| 642 | unsigned notOpc, |
| 643 | unsigned EAXreg, |
| 644 | TargetRegisterClass *RC, |
Dan Gohman | 1fdbc1d | 2009-02-07 16:15:20 +0000 | [diff] [blame] | 645 | bool invSrc = false) const; |
Dale Johannesen | 48c1bc2 | 2008-10-02 18:53:47 +0000 | [diff] [blame] | 646 | |
| 647 | MachineBasicBlock *EmitAtomicBit6432WithCustomInserter( |
| 648 | MachineInstr *BInstr, |
| 649 | MachineBasicBlock *BB, |
| 650 | unsigned regOpcL, |
| 651 | unsigned regOpcH, |
| 652 | unsigned immOpcL, |
| 653 | unsigned immOpcH, |
Dan Gohman | 1fdbc1d | 2009-02-07 16:15:20 +0000 | [diff] [blame] | 654 | bool invSrc = false) const; |
Mon P Wang | 63307c3 | 2008-05-05 19:05:59 +0000 | [diff] [blame] | 655 | |
| 656 | /// Utility function to emit atomic min and max. It takes the min/max |
| 657 | // instruction to expand, the associated basic block, and the associated |
| 658 | // cmov opcode for moving the min or max value. |
| 659 | MachineBasicBlock *EmitAtomicMinMaxWithCustomInserter(MachineInstr *BInstr, |
| 660 | MachineBasicBlock *BB, |
Dan Gohman | 1fdbc1d | 2009-02-07 16:15:20 +0000 | [diff] [blame] | 661 | unsigned cmovOpc) const; |
Dan Gohman | 076aee3 | 2009-03-04 19:44:21 +0000 | [diff] [blame^] | 662 | |
| 663 | /// Emit nodes that will be selected as "test Op0,Op0", or something |
| 664 | /// equivalent. |
| 665 | SDValue EmitTest(SDValue Op0, SelectionDAG &DAG); |
| 666 | |
| 667 | /// Emit nodes that will be selected as "cmp Op0,Op1", or something |
| 668 | /// equivalent. |
| 669 | SDValue EmitCmp(SDValue Op0, SDValue Op1, SelectionDAG &DAG); |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 670 | }; |
Evan Cheng | c3f44b0 | 2008-09-03 00:03:49 +0000 | [diff] [blame] | 671 | |
| 672 | namespace X86 { |
Dan Gohman | 3df24e6 | 2008-09-03 23:12:08 +0000 | [diff] [blame] | 673 | FastISel *createFastISel(MachineFunction &mf, |
Devang Patel | 83489bb | 2009-01-13 00:35:13 +0000 | [diff] [blame] | 674 | MachineModuleInfo *mmi, DwarfWriter *dw, |
Dan Gohman | 3df24e6 | 2008-09-03 23:12:08 +0000 | [diff] [blame] | 675 | DenseMap<const Value *, unsigned> &, |
Dan Gohman | 0586d91 | 2008-09-10 20:11:02 +0000 | [diff] [blame] | 676 | DenseMap<const BasicBlock *, MachineBasicBlock *> &, |
Dan Gohman | dd5b58a | 2008-10-14 23:54:11 +0000 | [diff] [blame] | 677 | DenseMap<const AllocaInst *, int> & |
| 678 | #ifndef NDEBUG |
| 679 | , SmallSet<Instruction*, 8> & |
| 680 | #endif |
| 681 | ); |
Evan Cheng | c3f44b0 | 2008-09-03 00:03:49 +0000 | [diff] [blame] | 682 | } |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 683 | } |
| 684 | |
Chris Lattner | dbdbf0c | 2005-11-15 00:40:23 +0000 | [diff] [blame] | 685 | #endif // X86ISELLOWERING_H |