| Bill Wendling | 2bce78e | 2010-12-04 23:57:24 +0000 | [diff] [blame] | 1 | //===-- X86Subtarget.cpp - X86 Subtarget Information ----------------------===// |
| Nate Begeman | f26625e | 2005-07-12 01:41:54 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| Chris Lattner | f3ebc3f | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| Nate Begeman | f26625e | 2005-07-12 01:41:54 +0000 | [diff] [blame] | 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| Evan Cheng | 0d639a2 | 2011-07-01 21:01:15 +0000 | [diff] [blame] | 10 | // This file implements the X86 specific subclass of TargetSubtargetInfo. |
| Nate Begeman | f26625e | 2005-07-12 01:41:54 +0000 | [diff] [blame] | 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| Quentin Colombet | 8cf805a | 2017-07-01 00:45:50 +0000 | [diff] [blame] | 14 | #include "X86.h" |
| 15 | |
| Quentin Colombet | 8cf805a | 2017-07-01 00:45:50 +0000 | [diff] [blame] | 16 | #include "X86CallLowering.h" |
| 17 | #include "X86LegalizerInfo.h" |
| 18 | #include "X86RegisterBankInfo.h" |
| Nate Begeman | f26625e | 2005-07-12 01:41:54 +0000 | [diff] [blame] | 19 | #include "X86Subtarget.h" |
| Chandler Carruth | 6bda14b | 2017-06-06 11:49:48 +0000 | [diff] [blame] | 20 | #include "MCTargetDesc/X86BaseInfo.h" |
| Eric Christopher | 4629ed7 | 2014-08-09 01:07:25 +0000 | [diff] [blame] | 21 | #include "X86TargetMachine.h" |
| Eugene Zelenko | fbd13c5 | 2017-02-02 22:55:55 +0000 | [diff] [blame] | 22 | #include "llvm/ADT/Triple.h" |
| Quentin Colombet | 8cf805a | 2017-07-01 00:45:50 +0000 | [diff] [blame] | 23 | #include "llvm/CodeGen/GlobalISel/CallLowering.h" |
| 24 | #include "llvm/CodeGen/GlobalISel/InstructionSelect.h" |
| Bill Wendling | aef9c37 | 2013-02-15 22:31:27 +0000 | [diff] [blame] | 25 | #include "llvm/IR/Attributes.h" |
| Peter Collingbourne | dc5e583 | 2017-02-02 00:32:03 +0000 | [diff] [blame] | 26 | #include "llvm/IR/ConstantRange.h" |
| Bill Wendling | aef9c37 | 2013-02-15 22:31:27 +0000 | [diff] [blame] | 27 | #include "llvm/IR/Function.h" |
| Chandler Carruth | 9fb823b | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 28 | #include "llvm/IR/GlobalValue.h" |
| Eugene Zelenko | fbd13c5 | 2017-02-02 22:55:55 +0000 | [diff] [blame] | 29 | #include "llvm/Support/Casting.h" |
| 30 | #include "llvm/Support/CodeGen.h" |
| Eric Christopher | 3470bbb | 2014-05-21 23:51:57 +0000 | [diff] [blame] | 31 | #include "llvm/Support/CommandLine.h" |
| Evan Cheng | 9a3ec1b | 2009-01-03 04:04:46 +0000 | [diff] [blame] | 32 | #include "llvm/Support/Debug.h" |
| Rafael Espindola | 6559656 | 2011-09-07 16:10:57 +0000 | [diff] [blame] | 33 | #include "llvm/Support/ErrorHandling.h" |
| Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 34 | #include "llvm/Support/raw_ostream.h" |
| Anton Korobeynikov | 430e68a1 | 2006-12-22 22:29:05 +0000 | [diff] [blame] | 35 | #include "llvm/Target/TargetMachine.h" |
| Evan Cheng | 54b68e3 | 2011-07-01 20:45:01 +0000 | [diff] [blame] | 36 | |
| Chris Lattner | 3ad60b1 | 2009-04-25 18:27:23 +0000 | [diff] [blame] | 37 | #if defined(_MSC_VER) |
| Bill Wendling | 6eecd56 | 2009-08-03 00:11:34 +0000 | [diff] [blame] | 38 | #include <intrin.h> |
| Chris Lattner | 3ad60b1 | 2009-04-25 18:27:23 +0000 | [diff] [blame] | 39 | #endif |
| 40 | |
| Chandler Carruth | 84e68b2 | 2014-04-22 02:41:26 +0000 | [diff] [blame] | 41 | using namespace llvm; |
| 42 | |
| 43 | #define DEBUG_TYPE "subtarget" |
| 44 | |
| Chandler Carruth | d174b72 | 2014-04-22 02:03:14 +0000 | [diff] [blame] | 45 | #define GET_SUBTARGETINFO_TARGET_DESC |
| 46 | #define GET_SUBTARGETINFO_CTOR |
| 47 | #include "X86GenSubtargetInfo.inc" |
| 48 | |
| Eric Christopher | 6b0fcfe | 2014-05-21 23:40:26 +0000 | [diff] [blame] | 49 | // Temporary option to control early if-conversion for x86 while adding machine |
| 50 | // models. |
| 51 | static cl::opt<bool> |
| 52 | X86EarlyIfConv("x86-early-ifcvt", cl::Hidden, |
| 53 | cl::desc("Enable early if-conversion on X86")); |
| 54 | |
| 55 | |
| Sanjay Patel | 2e75341 | 2015-08-14 15:11:42 +0000 | [diff] [blame] | 56 | /// Classify a blockaddress reference for the current subtarget according to how |
| 57 | /// we should reference it in a non-pcrel context. |
| Rafael Espindola | cb2d266 | 2016-05-19 18:34:20 +0000 | [diff] [blame] | 58 | unsigned char X86Subtarget::classifyBlockAddressReference() const { |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 59 | return classifyLocalReference(nullptr); |
| 60 | } |
| Chad Rosier | 24c19d2 | 2012-08-01 18:39:17 +0000 | [diff] [blame] | 61 | |
| Sanjay Patel | 2e75341 | 2015-08-14 15:11:42 +0000 | [diff] [blame] | 62 | /// Classify a global variable reference for the current subtarget according to |
| 63 | /// how we should reference it in a non-pcrel context. |
| Rafael Espindola | ab03eb0 | 2016-05-19 22:07:57 +0000 | [diff] [blame] | 64 | unsigned char |
| 65 | X86Subtarget::classifyGlobalReference(const GlobalValue *GV) const { |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 66 | return classifyGlobalReference(GV, *GV->getParent()); |
| 67 | } |
| Chris Lattner | dc842c0 | 2009-07-10 07:20:05 +0000 | [diff] [blame] | 68 | |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 69 | unsigned char |
| 70 | X86Subtarget::classifyLocalReference(const GlobalValue *GV) const { |
| 71 | // 64 bits can use %rip addressing for anything local. |
| 72 | if (is64Bit()) |
| Chris Lattner | dc842c0 | 2009-07-10 07:20:05 +0000 | [diff] [blame] | 73 | return X86II::MO_NO_FLAG; |
| Chad Rosier | 24c19d2 | 2012-08-01 18:39:17 +0000 | [diff] [blame] | 74 | |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 75 | // If this is for a position dependent executable, the static linker can |
| 76 | // figure it out. |
| Davide Italiano | ef5d8be | 2016-06-18 00:03:20 +0000 | [diff] [blame] | 77 | if (!isPositionIndependent()) |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 78 | return X86II::MO_NO_FLAG; |
| Sriraman Tallam | 3cb7734 | 2016-04-22 21:41:58 +0000 | [diff] [blame] | 79 | |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 80 | // The COFF dynamic linker just patches the executable sections. |
| 81 | if (isTargetCOFF()) |
| 82 | return X86II::MO_NO_FLAG; |
| Chad Rosier | 24c19d2 | 2012-08-01 18:39:17 +0000 | [diff] [blame] | 83 | |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 84 | if (isTargetDarwin()) { |
| 85 | // 32 bit macho has no relocation for a-b if a is undefined, even if |
| 86 | // b is in the section that is being relocated. |
| 87 | // This means we have to use o load even for GVs that are known to be |
| 88 | // local to the dso. |
| 89 | if (GV && (GV->isDeclarationForLinker() || GV->hasCommonLinkage())) |
| Chris Lattner | bd3e560 | 2009-07-10 20:53:38 +0000 | [diff] [blame] | 90 | return X86II::MO_DARWIN_NONLAZY_PIC_BASE; |
| Chad Rosier | 24c19d2 | 2012-08-01 18:39:17 +0000 | [diff] [blame] | 91 | |
| Chris Lattner | bd3e560 | 2009-07-10 20:53:38 +0000 | [diff] [blame] | 92 | return X86II::MO_PIC_BASE_OFFSET; |
| 93 | } |
| Chad Rosier | 24c19d2 | 2012-08-01 18:39:17 +0000 | [diff] [blame] | 94 | |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 95 | return X86II::MO_GOTOFF; |
| 96 | } |
| Chad Rosier | 24c19d2 | 2012-08-01 18:39:17 +0000 | [diff] [blame] | 97 | |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 98 | unsigned char X86Subtarget::classifyGlobalReference(const GlobalValue *GV, |
| 99 | const Module &M) const { |
| 100 | // Large model never uses stubs. |
| 101 | if (TM.getCodeModel() == CodeModel::Large) |
| Chris Lattner | bd3e560 | 2009-07-10 20:53:38 +0000 | [diff] [blame] | 102 | return X86II::MO_NO_FLAG; |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 103 | |
| Peter Collingbourne | 235c275 | 2016-12-08 19:01:00 +0000 | [diff] [blame] | 104 | // Absolute symbols can be referenced directly. |
| Peter Collingbourne | dc5e583 | 2017-02-02 00:32:03 +0000 | [diff] [blame] | 105 | if (GV) { |
| 106 | if (Optional<ConstantRange> CR = GV->getAbsoluteSymbolRange()) { |
| 107 | // See if we can use the 8-bit immediate form. Note that some instructions |
| 108 | // will sign extend the immediate operand, so to be conservative we only |
| 109 | // accept the range [0,128). |
| 110 | if (CR->getUnsignedMax().ult(128)) |
| 111 | return X86II::MO_ABS8; |
| 112 | else |
| 113 | return X86II::MO_NO_FLAG; |
| 114 | } |
| 115 | } |
| Peter Collingbourne | 235c275 | 2016-12-08 19:01:00 +0000 | [diff] [blame] | 116 | |
| Rafael Espindola | 2393c3b | 2017-10-27 21:18:48 +0000 | [diff] [blame] | 117 | if (TM.shouldAssumeDSOLocal(M, GV)) |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 118 | return classifyLocalReference(GV); |
| 119 | |
| 120 | if (isTargetCOFF()) |
| 121 | return X86II::MO_DLLIMPORT; |
| 122 | |
| 123 | if (is64Bit()) |
| 124 | return X86II::MO_GOTPCREL; |
| 125 | |
| 126 | if (isTargetDarwin()) { |
| Davide Italiano | ef5d8be | 2016-06-18 00:03:20 +0000 | [diff] [blame] | 127 | if (!isPositionIndependent()) |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 128 | return X86II::MO_DARWIN_NONLAZY; |
| 129 | return X86II::MO_DARWIN_NONLAZY_PIC_BASE; |
| Chris Lattner | dc842c0 | 2009-07-10 07:20:05 +0000 | [diff] [blame] | 130 | } |
| Chad Rosier | 24c19d2 | 2012-08-01 18:39:17 +0000 | [diff] [blame] | 131 | |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 132 | return X86II::MO_GOT; |
| Chris Lattner | dc842c0 | 2009-07-10 07:20:05 +0000 | [diff] [blame] | 133 | } |
| 134 | |
| Rafael Espindola | 46107b9 | 2016-05-19 18:49:29 +0000 | [diff] [blame] | 135 | unsigned char |
| 136 | X86Subtarget::classifyGlobalFunctionReference(const GlobalValue *GV) const { |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 137 | return classifyGlobalFunctionReference(GV, *GV->getParent()); |
| 138 | } |
| 139 | |
| 140 | unsigned char |
| 141 | X86Subtarget::classifyGlobalFunctionReference(const GlobalValue *GV, |
| 142 | const Module &M) const { |
| Rafael Espindola | 3beef8d | 2016-06-27 23:15:57 +0000 | [diff] [blame] | 143 | if (TM.shouldAssumeDSOLocal(M, GV)) |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 144 | return X86II::MO_NO_FLAG; |
| 145 | |
| Reid Kleckner | 7662d50 | 2017-08-05 00:10:43 +0000 | [diff] [blame] | 146 | if (isTargetCOFF()) { |
| 147 | assert(GV->hasDLLImportStorageClass() && |
| 148 | "shouldAssumeDSOLocal gave inconsistent answer"); |
| 149 | return X86II::MO_DLLIMPORT; |
| 150 | } |
| 151 | |
| Sriraman Tallam | 056b3fd | 2017-11-08 00:01:05 +0000 | [diff] [blame] | 152 | const Function *F = dyn_cast_or_null<Function>(GV); |
| 153 | |
| Oren Ben Simhon | 51de033 | 2017-05-04 07:22:49 +0000 | [diff] [blame] | 154 | if (isTargetELF()) { |
| 155 | if (is64Bit() && F && (CallingConv::X86_RegCall == F->getCallingConv())) |
| 156 | // According to psABI, PLT stub clobbers XMM8-XMM15. |
| 157 | // In Regcall calling convention those registers are used for passing |
| 158 | // parameters. Thus we need to prevent lazy binding in Regcall. |
| 159 | return X86II::MO_GOTPCREL; |
| Sriraman Tallam | 609f8c0 | 2018-02-23 21:32:06 +0000 | [diff] [blame] | 160 | // If PLT must be avoided then the call should be via GOTPCREL. |
| 161 | if (((F && F->hasFnAttribute(Attribute::NonLazyBind)) || |
| 162 | (!F && M.getRtLibUseGOT())) && |
| 163 | is64Bit()) |
| 164 | return X86II::MO_GOTPCREL; |
| Asaf Badouh | 89406d1 | 2016-04-20 08:32:57 +0000 | [diff] [blame] | 165 | return X86II::MO_PLT; |
| Oren Ben Simhon | 51de033 | 2017-05-04 07:22:49 +0000 | [diff] [blame] | 166 | } |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 167 | |
| 168 | if (is64Bit()) { |
| Rafael Espindola | c7e9813 | 2016-05-20 12:20:10 +0000 | [diff] [blame] | 169 | if (F && F->hasFnAttribute(Attribute::NonLazyBind)) |
| 170 | // If the function is marked as non-lazy, generate an indirect call |
| 171 | // which loads from the GOT directly. This avoids runtime overhead |
| 172 | // at the cost of eager binding (and one extra byte of encoding). |
| 173 | return X86II::MO_GOTPCREL; |
| 174 | return X86II::MO_NO_FLAG; |
| Asaf Badouh | 89406d1 | 2016-04-20 08:32:57 +0000 | [diff] [blame] | 175 | } |
| 176 | |
| 177 | return X86II::MO_NO_FLAG; |
| 178 | } |
| Anton Korobeynikov | 6dbdfe2 | 2006-11-30 22:42:55 +0000 | [diff] [blame] | 179 | |
| Sanjay Patel | 2e75341 | 2015-08-14 15:11:42 +0000 | [diff] [blame] | 180 | /// Return true if the subtarget allows calls to immediate address. |
| Rafael Espindola | 46107b9 | 2016-05-19 18:49:29 +0000 | [diff] [blame] | 181 | bool X86Subtarget::isLegalToCallImmediateAddr() const { |
| David Majnemer | 02f2188 | 2014-03-28 21:40:47 +0000 | [diff] [blame] | 182 | // FIXME: I386 PE/COFF supports PC relative calls using IMAGE_REL_I386_REL32 |
| 183 | // but WinCOFFObjectWriter::RecordRelocation cannot emit them. Once it does, |
| 184 | // the following check for Win32 should be removed. |
| 185 | if (In64BitMode || isTargetWin32()) |
| Evan Cheng | 9609833 | 2009-05-20 04:53:57 +0000 | [diff] [blame] | 186 | return false; |
| Rafael Espindola | ab03eb0 | 2016-05-19 22:07:57 +0000 | [diff] [blame] | 187 | return isTargetELF() || TM.getRelocationModel() == Reloc::Static; |
| Evan Cheng | 9609833 | 2009-05-20 04:53:57 +0000 | [diff] [blame] | 188 | } |
| 189 | |
| Eric Christopher | b68e253 | 2014-09-03 20:36:31 +0000 | [diff] [blame] | 190 | void X86Subtarget::initSubtargetFeatures(StringRef CPU, StringRef FS) { |
| Nadav Rotem | 08ab877 | 2013-02-27 05:56:20 +0000 | [diff] [blame] | 191 | std::string CPUName = CPU; |
| Jim Grosbach | 48551fb | 2014-04-12 01:34:29 +0000 | [diff] [blame] | 192 | if (CPUName.empty()) |
| 193 | CPUName = "generic"; |
| Evan Cheng | 964cb5f | 2011-07-08 21:14:14 +0000 | [diff] [blame] | 194 | |
| Jim Grosbach | 48551fb | 2014-04-12 01:34:29 +0000 | [diff] [blame] | 195 | // Make sure 64-bit features are available in 64-bit mode. (But make sure |
| 196 | // SSE2 can be turned off explicitly.) |
| 197 | std::string FullFS = FS; |
| 198 | if (In64BitMode) { |
| 199 | if (!FullFS.empty()) |
| 200 | FullFS = "+64bit,+sse2," + FullFS; |
| 201 | else |
| 202 | FullFS = "+64bit,+sse2"; |
| Evan Cheng | 11b0a5d | 2006-09-08 06:48:29 +0000 | [diff] [blame] | 203 | } |
| Evan Cheng | c5e6d2f | 2011-07-11 03:57:24 +0000 | [diff] [blame] | 204 | |
| Hans Wennborg | 5000ce8 | 2015-12-04 23:00:33 +0000 | [diff] [blame] | 205 | // LAHF/SAHF are always supported in non-64-bit mode. |
| 206 | if (!In64BitMode) { |
| 207 | if (!FullFS.empty()) |
| 208 | FullFS = "+sahf," + FullFS; |
| 209 | else |
| 210 | FullFS = "+sahf"; |
| 211 | } |
| 212 | |
| Duncan P. N. Exon Smith | bb57d73 | 2015-07-10 22:33:01 +0000 | [diff] [blame] | 213 | // Parse features string and set the CPU. |
| Jim Grosbach | 48551fb | 2014-04-12 01:34:29 +0000 | [diff] [blame] | 214 | ParseSubtargetFeatures(CPUName, FullFS); |
| 215 | |
| Sanjay Patel | deb8f82 | 2015-08-25 16:29:21 +0000 | [diff] [blame] | 216 | // All CPUs that implement SSE4.2 or SSE4A support unaligned accesses of |
| 217 | // 16-bytes and under that are reasonably fast. These features were |
| 218 | // introduced with Intel's Nehalem/Silvermont and AMD's Family10h |
| 219 | // micro-architectures respectively. |
| 220 | if (hasSSE42() || hasSSE4A()) |
| Sanjay Patel | 3014567 | 2015-09-01 20:51:51 +0000 | [diff] [blame] | 221 | IsUAMem16Slow = false; |
| Sanjay Patel | deb8f82 | 2015-08-25 16:29:21 +0000 | [diff] [blame] | 222 | |
| Andrew Trick | e0c83b1 | 2012-08-07 00:25:30 +0000 | [diff] [blame] | 223 | InstrItins = getInstrItineraryForCPU(CPUName); |
| Andrew Trick | 8523b16 | 2012-02-01 23:20:51 +0000 | [diff] [blame] | 224 | |
| Evan Cheng | c5e6d2f | 2011-07-11 03:57:24 +0000 | [diff] [blame] | 225 | // It's important to keep the MCSubtargetInfo feature bits in sync with |
| 226 | // target data structure which is shared with MC code emitter, etc. |
| 227 | if (In64BitMode) |
| 228 | ToggleFeature(X86::Mode64Bit); |
| Craig Topper | 3c80d62 | 2014-01-06 04:55:54 +0000 | [diff] [blame] | 229 | else if (In32BitMode) |
| 230 | ToggleFeature(X86::Mode32Bit); |
| 231 | else if (In16BitMode) |
| 232 | ToggleFeature(X86::Mode16Bit); |
| 233 | else |
| 234 | llvm_unreachable("Not 16-bit, 32-bit or 64-bit mode!"); |
| Evan Cheng | c5e6d2f | 2011-07-11 03:57:24 +0000 | [diff] [blame] | 235 | |
| David Greene | 0041181 | 2010-01-05 01:29:13 +0000 | [diff] [blame] | 236 | DEBUG(dbgs() << "Subtarget features: SSELevel " << X86SSELevel |
| Bill Wendling | 6eecd56 | 2009-08-03 00:11:34 +0000 | [diff] [blame] | 237 | << ", 3DNowLevel " << X863DNowLevel |
| 238 | << ", 64bit " << HasX86_64 << "\n"); |
| Evan Cheng | 13bcc6c | 2011-07-07 21:06:52 +0000 | [diff] [blame] | 239 | assert((!In64BitMode || HasX86_64) && |
| Dan Gohman | 7403751 | 2009-02-03 00:04:43 +0000 | [diff] [blame] | 240 | "64-bit code requested on a subtarget that doesn't support it!"); |
| Evan Cheng | 11b0a5d | 2006-09-08 06:48:29 +0000 | [diff] [blame] | 241 | |
| Marcin Koscielnicki | 0275fac | 2016-05-05 11:35:51 +0000 | [diff] [blame] | 242 | // Stack alignment is 16 bytes on Darwin, Linux, kFreeBSD and Solaris (both |
| Roman Divacky | e8a93fe8 | 2011-02-22 17:30:05 +0000 | [diff] [blame] | 243 | // 32 and 64 bit) and for all 64-bit targets. |
| Evan Cheng | 3a0c5e5 | 2011-06-23 17:54:54 +0000 | [diff] [blame] | 244 | if (StackAlignOverride) |
| 245 | stackAlignment = StackAlignOverride; |
| Roman Divacky | 2213567 | 2012-11-09 20:10:44 +0000 | [diff] [blame] | 246 | else if (isTargetDarwin() || isTargetLinux() || isTargetSolaris() || |
| Marcin Koscielnicki | 0275fac | 2016-05-05 11:35:51 +0000 | [diff] [blame] | 247 | isTargetKFreeBSD() || In64BitMode) |
| Nate Begeman | f26625e | 2005-07-12 01:41:54 +0000 | [diff] [blame] | 248 | stackAlignment = 16; |
| Craig Topper | 17078ff | 2017-11-19 01:11:58 +0000 | [diff] [blame] | 249 | |
| Craig Topper | ea37e20 | 2017-11-25 18:09:37 +0000 | [diff] [blame] | 250 | // Some CPUs have more overhead for gather. The specified overhead is relative |
| 251 | // to the Load operation. "2" is the number provided by Intel architects. This |
| Craig Topper | 17078ff | 2017-11-19 01:11:58 +0000 | [diff] [blame] | 252 | // parameter is used for cost estimation of Gather Op and comparison with |
| 253 | // other alternatives. |
| Craig Topper | ea37e20 | 2017-11-25 18:09:37 +0000 | [diff] [blame] | 254 | // TODO: Remove the explicit hasAVX512()?, That would mean we would only |
| 255 | // enable gather with a -march. |
| 256 | if (hasAVX512() || (hasAVX2() && hasFastGather())) |
| Mohammed Agabaria | e9aebf2 | 2017-09-13 09:00:27 +0000 | [diff] [blame] | 257 | GatherOverhead = 2; |
| 258 | if (hasAVX512()) |
| 259 | ScatterOverhead = 2; |
| Craig Topper | 0d797a3 | 2018-01-20 00:26:08 +0000 | [diff] [blame] | 260 | |
| 261 | // Consume the vector width attribute or apply any target specific limit. |
| 262 | if (PreferVectorWidthOverride) |
| 263 | PreferVectorWidth = PreferVectorWidthOverride; |
| 264 | else if (Prefer256Bit) |
| 265 | PreferVectorWidth = 256; |
| Dan Gohman | dc53f1c | 2010-05-27 18:43:40 +0000 | [diff] [blame] | 266 | } |
| Andrew Trick | 8523b16 | 2012-02-01 23:20:51 +0000 | [diff] [blame] | 267 | |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 268 | void X86Subtarget::initializeEnvironment() { |
| Eric Christopher | 11e5983 | 2015-10-08 20:10:06 +0000 | [diff] [blame] | 269 | X86SSELevel = NoSSE; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 270 | X863DNowLevel = NoThreeDNow; |
| Andrey Turetskiy | 6a3d561 | 2016-03-23 11:13:54 +0000 | [diff] [blame] | 271 | HasX87 = false; |
| Craig Topper | 505f38a | 2018-01-10 22:07:16 +0000 | [diff] [blame] | 272 | HasNOPL = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 273 | HasCMov = false; |
| 274 | HasX86_64 = false; |
| 275 | HasPOPCNT = false; |
| 276 | HasSSE4A = false; |
| 277 | HasAES = false; |
| Coby Tayree | 2a1c02f | 2017-11-21 09:11:41 +0000 | [diff] [blame] | 278 | HasVAES = false; |
| Craig Topper | 09b6598 | 2015-10-16 06:03:09 +0000 | [diff] [blame] | 279 | HasFXSR = false; |
| Amjad Aboud | 1db6d7a | 2015-10-12 11:47:46 +0000 | [diff] [blame] | 280 | HasXSAVE = false; |
| 281 | HasXSAVEOPT = false; |
| 282 | HasXSAVEC = false; |
| 283 | HasXSAVES = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 284 | HasPCLMUL = false; |
| Coby Tayree | 7ca5e587 | 2017-11-21 09:30:33 +0000 | [diff] [blame] | 285 | HasVPCLMULQDQ = false; |
| Coby Tayree | d8b17be | 2017-11-26 09:36:41 +0000 | [diff] [blame] | 286 | HasGFNI = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 287 | HasFMA = false; |
| 288 | HasFMA4 = false; |
| 289 | HasXOP = false; |
| Yunzhong Gao | dd36e93 | 2013-09-24 18:21:52 +0000 | [diff] [blame] | 290 | HasTBM = false; |
| Simon Pilgrim | 99b925b | 2017-05-03 15:51:39 +0000 | [diff] [blame] | 291 | HasLWP = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 292 | HasMOVBE = false; |
| 293 | HasRDRAND = false; |
| 294 | HasF16C = false; |
| 295 | HasFSGSBase = false; |
| 296 | HasLZCNT = false; |
| 297 | HasBMI = false; |
| 298 | HasBMI2 = false; |
| Michael Zuckerman | 97b6a692 | 2016-01-17 13:42:12 +0000 | [diff] [blame] | 299 | HasVBMI = false; |
| Coby Tayree | 71e37cc | 2017-11-21 09:48:44 +0000 | [diff] [blame] | 300 | HasVBMI2 = false; |
| Elena Demikhovsky | 29cde35 | 2016-01-24 10:41:28 +0000 | [diff] [blame] | 301 | HasIFMA = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 302 | HasRTM = false; |
| Elena Demikhovsky | 003e7d7 | 2013-07-28 08:28:38 +0000 | [diff] [blame] | 303 | HasERI = false; |
| 304 | HasCDI = false; |
| Craig Topper | 7a8cf01 | 2013-08-20 05:23:59 +0000 | [diff] [blame] | 305 | HasPFI = false; |
| Robert Khasanov | bfa0131 | 2014-07-21 14:54:21 +0000 | [diff] [blame] | 306 | HasDQI = false; |
| Oren Ben Simhon | 7bf27f0 | 2017-05-25 13:45:23 +0000 | [diff] [blame] | 307 | HasVPOPCNTDQ = false; |
| Robert Khasanov | bfa0131 | 2014-07-21 14:54:21 +0000 | [diff] [blame] | 308 | HasBWI = false; |
| 309 | HasVLX = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 310 | HasADX = false; |
| Asaf Badouh | 5acf66f | 2015-12-15 13:35:29 +0000 | [diff] [blame] | 311 | HasPKU = false; |
| Coby Tayree | 3880f2a | 2017-11-21 10:04:28 +0000 | [diff] [blame] | 312 | HasVNNI = false; |
| Coby Tayree | 5c7fe5d | 2017-11-21 10:32:42 +0000 | [diff] [blame] | 313 | HasBITALG = false; |
| Ben Langmuir | 1650175 | 2013-09-12 15:51:31 +0000 | [diff] [blame] | 314 | HasSHA = false; |
| Craig Topper | e2873a1 | 2017-12-22 03:53:14 +0000 | [diff] [blame] | 315 | HasPREFETCHWT1 = false; |
| Michael Liao | 5173ee0 | 2013-03-26 17:47:11 +0000 | [diff] [blame] | 316 | HasPRFCHW = false; |
| Michael Liao | a486a11 | 2013-03-28 23:41:26 +0000 | [diff] [blame] | 317 | HasRDSEED = false; |
| Hans Wennborg | 5000ce8 | 2015-12-04 23:00:33 +0000 | [diff] [blame] | 318 | HasLAHFSAHF = false; |
| Ashutosh Nema | 348af9c | 2016-05-18 11:59:12 +0000 | [diff] [blame] | 319 | HasMWAITX = false; |
| Craig Topper | 50f3d14 | 2017-02-09 04:27:34 +0000 | [diff] [blame] | 320 | HasCLZERO = false; |
| Elena Demikhovsky | f7e641c | 2015-06-03 10:30:57 +0000 | [diff] [blame] | 321 | HasMPX = false; |
| Oren Ben Simhon | fa582b0 | 2017-11-26 13:02:45 +0000 | [diff] [blame] | 322 | HasSHSTK = false; |
| 323 | HasIBT = false; |
| Tim Northover | 9bb6931 | 2017-05-01 17:50:15 +0000 | [diff] [blame] | 324 | HasSGX = false; |
| 325 | HasCLFLUSHOPT = false; |
| 326 | HasCLWB = false; |
| Craig Topper | 84b26b9 | 2018-01-18 23:52:31 +0000 | [diff] [blame] | 327 | HasRDPID = false; |
| Chandler Carruth | c58f216 | 2018-01-22 22:05:25 +0000 | [diff] [blame] | 328 | UseRetpoline = false; |
| 329 | UseRetpolineExternalThunk = false; |
| Zvi Rackover | 8bc7e4d | 2016-12-06 19:35:20 +0000 | [diff] [blame] | 330 | IsPMULLDSlow = false; |
| Ekaterina Romanova | d5fa554 | 2013-11-21 23:21:26 +0000 | [diff] [blame] | 331 | IsSHLDSlow = false; |
| Sanjay Patel | 3014567 | 2015-09-01 20:51:51 +0000 | [diff] [blame] | 332 | IsUAMem16Slow = false; |
| Sanjay Patel | 501890e | 2014-11-21 17:40:04 +0000 | [diff] [blame] | 333 | IsUAMem32Slow = false; |
| Sanjay Patel | ffd039b | 2015-02-03 17:13:04 +0000 | [diff] [blame] | 334 | HasSSEUnalignedMem = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 335 | HasCmpxchg16b = false; |
| 336 | UseLeaForSP = false; |
| Marina Yatsina | 77a21db | 2018-01-22 10:07:01 +0000 | [diff] [blame] | 337 | HasPOPCNTFalseDeps = false; |
| 338 | HasLZCNTFalseDeps = false; |
| Simon Pilgrim | 3feaf2a | 2017-12-19 14:34:35 +0000 | [diff] [blame] | 339 | HasFastVariableShuffle = false; |
| Amjad Aboud | 4f97751 | 2017-03-03 09:03:24 +0000 | [diff] [blame] | 340 | HasFastPartialYMMorZMMWrite = false; |
| Simon Pilgrim | 02bdac5 | 2018-01-29 21:24:31 +0000 | [diff] [blame] | 341 | HasFast11ByteNOP = false; |
| 342 | HasFast15ByteNOP = false; |
| Craig Topper | ea37e20 | 2017-11-25 18:09:37 +0000 | [diff] [blame] | 343 | HasFastGather = false; |
| Nikolai Bozhenov | f679530 | 2016-08-04 12:47:28 +0000 | [diff] [blame] | 344 | HasFastScalarFSQRT = false; |
| 345 | HasFastVectorFSQRT = false; |
| Pierre Gousseau | b6d652a | 2016-10-14 16:41:38 +0000 | [diff] [blame] | 346 | HasFastLZCNT = false; |
| Craig Topper | d88389a | 2017-02-21 06:39:13 +0000 | [diff] [blame] | 347 | HasFastSHLDRotate = false; |
| Craig Topper | 641e2af | 2017-08-30 04:34:48 +0000 | [diff] [blame] | 348 | HasMacroFusion = false; |
| Clement Courbet | 203fc17 | 2017-04-21 09:20:50 +0000 | [diff] [blame] | 349 | HasERMSB = false; |
| Alexey Volkov | fd1731d | 2014-11-21 11:19:34 +0000 | [diff] [blame] | 350 | HasSlowDivide32 = false; |
| 351 | HasSlowDivide64 = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 352 | PadShortFunctions = false; |
| Craig Topper | 62c47a2 | 2017-08-29 05:14:27 +0000 | [diff] [blame] | 353 | SlowTwoMemOps = false; |
| Preston Gurd | 8b7ab4b | 2013-04-25 20:29:37 +0000 | [diff] [blame] | 354 | LEAUsesAG = false; |
| Alexey Volkov | 6226de6 | 2014-05-20 08:55:50 +0000 | [diff] [blame] | 355 | SlowLEA = false; |
| Lama Saba | 2ea271b | 2017-05-18 08:11:50 +0000 | [diff] [blame] | 356 | Slow3OpsLEA = false; |
| Alexey Volkov | 5260dba | 2014-06-09 11:40:41 +0000 | [diff] [blame] | 357 | SlowIncDec = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 358 | stackAlignment = 4; |
| 359 | // FIXME: this is a known good value for Yonah. How about others? |
| 360 | MaxInlineSizeThreshold = 128; |
| Eric Christopher | 824f42f | 2015-05-12 01:26:05 +0000 | [diff] [blame] | 361 | UseSoftFloat = false; |
| Mohammed Agabaria | e9aebf2 | 2017-09-13 09:00:27 +0000 | [diff] [blame] | 362 | X86ProcFamily = Others; |
| 363 | GatherOverhead = 1024; |
| 364 | ScatterOverhead = 1024; |
| Craig Topper | 0d797a3 | 2018-01-20 00:26:08 +0000 | [diff] [blame] | 365 | PreferVectorWidth = UINT32_MAX; |
| 366 | Prefer256Bit = false; |
| Bill Wendling | 61375d8 | 2013-02-16 01:36:26 +0000 | [diff] [blame] | 367 | } |
| 368 | |
| Eric Christopher | 1a21203 | 2014-06-11 00:25:19 +0000 | [diff] [blame] | 369 | X86Subtarget &X86Subtarget::initializeSubtargetDependencies(StringRef CPU, |
| 370 | StringRef FS) { |
| 371 | initializeEnvironment(); |
| Eric Christopher | b68e253 | 2014-09-03 20:36:31 +0000 | [diff] [blame] | 372 | initSubtargetFeatures(CPU, FS); |
| Eric Christopher | 1a21203 | 2014-06-11 00:25:19 +0000 | [diff] [blame] | 373 | return *this; |
| 374 | } |
| 375 | |
| David Majnemer | ca29023 | 2016-05-20 18:16:06 +0000 | [diff] [blame] | 376 | X86Subtarget::X86Subtarget(const Triple &TT, StringRef CPU, StringRef FS, |
| 377 | const X86TargetMachine &TM, |
| Craig Topper | 0d797a3 | 2018-01-20 00:26:08 +0000 | [diff] [blame] | 378 | unsigned StackAlignOverride, |
| Craig Topper | 24d3b28 | 2018-02-11 08:06:27 +0000 | [diff] [blame] | 379 | unsigned PreferVectorWidthOverride, |
| 380 | unsigned RequiredVectorWidth) |
| Daniel Sanders | 50f1723 | 2015-09-15 16:17:27 +0000 | [diff] [blame] | 381 | : X86GenSubtargetInfo(TT, CPU, FS), X86ProcFamily(Others), |
| Rafael Espindola | ab03eb0 | 2016-05-19 22:07:57 +0000 | [diff] [blame] | 382 | PICStyle(PICStyles::None), TM(TM), TargetTriple(TT), |
| Eric Christopher | b8f9768 | 2014-05-07 21:05:47 +0000 | [diff] [blame] | 383 | StackAlignOverride(StackAlignOverride), |
| Craig Topper | 0d797a3 | 2018-01-20 00:26:08 +0000 | [diff] [blame] | 384 | PreferVectorWidthOverride(PreferVectorWidthOverride), |
| Craig Topper | 24d3b28 | 2018-02-11 08:06:27 +0000 | [diff] [blame] | 385 | RequiredVectorWidth(RequiredVectorWidth), |
| Eric Christopher | b8f9768 | 2014-05-07 21:05:47 +0000 | [diff] [blame] | 386 | In64BitMode(TargetTriple.getArch() == Triple::x86_64), |
| 387 | In32BitMode(TargetTriple.getArch() == Triple::x86 && |
| 388 | TargetTriple.getEnvironment() != Triple::CODE16), |
| 389 | In16BitMode(TargetTriple.getArch() == Triple::x86 && |
| Eric Christopher | a08f30b | 2014-06-09 17:08:19 +0000 | [diff] [blame] | 390 | TargetTriple.getEnvironment() == Triple::CODE16), |
| Daniel Sanders | e9fdba3 | 2017-04-29 17:30:09 +0000 | [diff] [blame] | 391 | InstrInfo(initializeSubtargetDependencies(CPU, FS)), TLInfo(TM, *this), |
| Daniel Sanders | a1b2db79 | 2017-05-19 11:08:33 +0000 | [diff] [blame] | 392 | FrameLowering(*this, getStackAlignment()) { |
| Eric Christopher | 4629ed7 | 2014-08-09 01:07:25 +0000 | [diff] [blame] | 393 | // Determine the PICStyle based on the target selected. |
| Rafael Espindola | 0d34826 | 2016-06-20 23:41:56 +0000 | [diff] [blame] | 394 | if (!isPositionIndependent()) |
| Eric Christopher | 4629ed7 | 2014-08-09 01:07:25 +0000 | [diff] [blame] | 395 | setPICStyle(PICStyles::None); |
| Rafael Espindola | 0d34826 | 2016-06-20 23:41:56 +0000 | [diff] [blame] | 396 | else if (is64Bit()) |
| Eric Christopher | 4629ed7 | 2014-08-09 01:07:25 +0000 | [diff] [blame] | 397 | setPICStyle(PICStyles::RIPRel); |
| Rafael Espindola | 0d34826 | 2016-06-20 23:41:56 +0000 | [diff] [blame] | 398 | else if (isTargetCOFF()) |
| Eric Christopher | 4629ed7 | 2014-08-09 01:07:25 +0000 | [diff] [blame] | 399 | setPICStyle(PICStyles::None); |
| Rafael Espindola | 0d34826 | 2016-06-20 23:41:56 +0000 | [diff] [blame] | 400 | else if (isTargetDarwin()) |
| 401 | setPICStyle(PICStyles::StubPIC); |
| 402 | else if (isTargetELF()) |
| Eric Christopher | 4629ed7 | 2014-08-09 01:07:25 +0000 | [diff] [blame] | 403 | setPICStyle(PICStyles::GOT); |
| Quentin Colombet | 8cf805a | 2017-07-01 00:45:50 +0000 | [diff] [blame] | 404 | |
| Quentin Colombet | 61d71a1 | 2017-08-15 22:31:51 +0000 | [diff] [blame] | 405 | CallLoweringInfo.reset(new X86CallLowering(*getTargetLowering())); |
| 406 | Legalizer.reset(new X86LegalizerInfo(*this, TM)); |
| Quentin Colombet | 8cf805a | 2017-07-01 00:45:50 +0000 | [diff] [blame] | 407 | |
| 408 | auto *RBI = new X86RegisterBankInfo(*getRegisterInfo()); |
| Quentin Colombet | 61d71a1 | 2017-08-15 22:31:51 +0000 | [diff] [blame] | 409 | RegBankInfo.reset(RBI); |
| 410 | InstSelector.reset(createX86InstructionSelector(TM, *this, *RBI)); |
| Eric Christopher | 4629ed7 | 2014-08-09 01:07:25 +0000 | [diff] [blame] | 411 | } |
| Bill Wendling | aef9c37 | 2013-02-15 22:31:27 +0000 | [diff] [blame] | 412 | |
| Zvi Rackover | 76dbf26 | 2016-11-15 06:34:33 +0000 | [diff] [blame] | 413 | const CallLowering *X86Subtarget::getCallLowering() const { |
| Quentin Colombet | 61d71a1 | 2017-08-15 22:31:51 +0000 | [diff] [blame] | 414 | return CallLoweringInfo.get(); |
| Zvi Rackover | 76dbf26 | 2016-11-15 06:34:33 +0000 | [diff] [blame] | 415 | } |
| 416 | |
| 417 | const InstructionSelector *X86Subtarget::getInstructionSelector() const { |
| Quentin Colombet | 61d71a1 | 2017-08-15 22:31:51 +0000 | [diff] [blame] | 418 | return InstSelector.get(); |
| Zvi Rackover | 76dbf26 | 2016-11-15 06:34:33 +0000 | [diff] [blame] | 419 | } |
| 420 | |
| 421 | const LegalizerInfo *X86Subtarget::getLegalizerInfo() const { |
| Quentin Colombet | 61d71a1 | 2017-08-15 22:31:51 +0000 | [diff] [blame] | 422 | return Legalizer.get(); |
| Zvi Rackover | 76dbf26 | 2016-11-15 06:34:33 +0000 | [diff] [blame] | 423 | } |
| 424 | |
| 425 | const RegisterBankInfo *X86Subtarget::getRegBankInfo() const { |
| Quentin Colombet | 61d71a1 | 2017-08-15 22:31:51 +0000 | [diff] [blame] | 426 | return RegBankInfo.get(); |
| Zvi Rackover | 76dbf26 | 2016-11-15 06:34:33 +0000 | [diff] [blame] | 427 | } |
| 428 | |
| Sanjay Patel | a2f658d | 2014-07-15 22:39:58 +0000 | [diff] [blame] | 429 | bool X86Subtarget::enableEarlyIfConversion() const { |
| Eric Christopher | 3470bbb | 2014-05-21 23:51:57 +0000 | [diff] [blame] | 430 | return hasCMov() && X86EarlyIfConv; |
| Eric Christopher | 6b0fcfe | 2014-05-21 23:40:26 +0000 | [diff] [blame] | 431 | } |