Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 1 | //===-- X86TargetMachine.cpp - Define TargetMachine for the X86 -----------===// |
Misha Brukman | 0e0a7a45 | 2005-04-21 23:38:14 +0000 | [diff] [blame] | 2 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file was developed by the LLVM research group and is distributed under |
| 6 | // the University of Illinois Open Source License. See LICENSE.TXT for details. |
Misha Brukman | 0e0a7a45 | 2005-04-21 23:38:14 +0000 | [diff] [blame] | 7 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
Misha Brukman | 0e0a7a45 | 2005-04-21 23:38:14 +0000 | [diff] [blame] | 9 | // |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 10 | // This file defines the X86 specific subclass of TargetMachine. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "X86TargetMachine.h" |
Chris Lattner | 5bcd95c | 2002-12-24 00:04:01 +0000 | [diff] [blame] | 15 | #include "X86.h" |
Chris Lattner | bb144a8 | 2003-08-24 19:49:48 +0000 | [diff] [blame] | 16 | #include "llvm/Module.h" |
Chris Lattner | 155e68f | 2003-04-23 16:24:55 +0000 | [diff] [blame] | 17 | #include "llvm/PassManager.h" |
Chris Lattner | 3048373 | 2004-06-20 07:49:54 +0000 | [diff] [blame] | 18 | #include "llvm/CodeGen/IntrinsicLowering.h" |
Chris Lattner | 3dffa79 | 2002-10-30 00:47:49 +0000 | [diff] [blame] | 19 | #include "llvm/CodeGen/MachineFunction.h" |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 20 | #include "llvm/CodeGen/Passes.h" |
Chris Lattner | 0cf0c37 | 2004-07-11 04:17:10 +0000 | [diff] [blame] | 21 | #include "llvm/Target/TargetOptions.h" |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 22 | #include "llvm/Target/TargetMachineRegistry.h" |
Chris Lattner | 155e68f | 2003-04-23 16:24:55 +0000 | [diff] [blame] | 23 | #include "llvm/Transforms/Scalar.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 24 | #include "llvm/Support/CommandLine.h" |
| 25 | #include "llvm/ADT/Statistic.h" |
Chris Lattner | 1e60a91 | 2003-12-20 01:22:19 +0000 | [diff] [blame] | 26 | using namespace llvm; |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 27 | |
Chris Lattner | 6f0161a | 2004-08-24 08:18:44 +0000 | [diff] [blame] | 28 | X86VectorEnum llvm::X86Vector = NoSSE; |
Nate Begeman | f63be7d | 2005-07-06 18:59:04 +0000 | [diff] [blame] | 29 | bool llvm::X86ScalarSSE = false; |
Chris Lattner | 6f0161a | 2004-08-24 08:18:44 +0000 | [diff] [blame] | 30 | |
/// X86TargetMachineModule - A dummy symbol that exists only so other code can
/// reference something in this library.  Some hosts cannot link in a library
/// unless there are references into it; in particular, it seems that things
/// cannot be made to work on Win32 without this.  Nothing in this file reads
/// it, but do not remove it.
extern "C" {
  int X86TargetMachineModule = 0;
}
| 37 | |
Chris Lattner | 439a27a | 2002-12-16 16:15:51 +0000 | [diff] [blame] | 38 | namespace { |
Chris Lattner | 9b52770 | 2003-12-01 05:18:30 +0000 | [diff] [blame] | 39 | cl::opt<bool> NoSSAPeephole("disable-ssa-peephole", cl::init(true), |
Chris Lattner | 4482715 | 2003-12-28 09:47:19 +0000 | [diff] [blame] | 40 | cl::desc("Disable the ssa-based peephole optimizer " |
| 41 | "(defaults to disabled)")); |
Chris Lattner | f6f263c | 2004-02-09 01:47:10 +0000 | [diff] [blame] | 42 | cl::opt<bool> DisableOutput("disable-x86-llc-output", cl::Hidden, |
| 43 | cl::desc("Disable the X86 asm printer, for use " |
| 44 | "when profiling the code generator.")); |
Nate Begeman | f63be7d | 2005-07-06 18:59:04 +0000 | [diff] [blame] | 45 | cl::opt<bool, true> EnableSSEFP("enable-sse-scalar-fp", |
| 46 | cl::desc("Perform FP math in SSE regs instead of the FP stack"), |
| 47 | cl::location(X86ScalarSSE), |
| 48 | cl::init(false)); |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 49 | |
Chris Lattner | 6f0161a | 2004-08-24 08:18:44 +0000 | [diff] [blame] | 50 | // FIXME: This should eventually be handled with target triples and |
| 51 | // subtarget support! |
| 52 | cl::opt<X86VectorEnum, true> |
| 53 | SSEArg( |
| 54 | cl::desc("Enable SSE support in the X86 target:"), |
| 55 | cl::values( |
| 56 | clEnumValN(SSE, "sse", " Enable SSE support"), |
| 57 | clEnumValN(SSE2, "sse2", " Enable SSE and SSE2 support"), |
| 58 | clEnumValN(SSE3, "sse3", " Enable SSE, SSE2, and SSE3 support"), |
| 59 | clEnumValEnd), |
| 60 | cl::location(X86Vector), cl::init(NoSSE)); |
| 61 | |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 62 | // Register the target. |
Chris Lattner | 71d24aa | 2004-07-11 03:27:42 +0000 | [diff] [blame] | 63 | RegisterTarget<X86TargetMachine> X("x86", " IA-32 (Pentium and above)"); |
Chris Lattner | 439a27a | 2002-12-16 16:15:51 +0000 | [diff] [blame] | 64 | } |
| 65 | |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 66 | unsigned X86TargetMachine::getJITMatchQuality() { |
Chris Lattner | 7d0974b | 2004-10-18 15:54:17 +0000 | [diff] [blame] | 67 | #if defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86) |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 68 | return 10; |
| 69 | #else |
| 70 | return 0; |
| 71 | #endif |
| 72 | } |
| 73 | |
| 74 | unsigned X86TargetMachine::getModuleMatchQuality(const Module &M) { |
Chris Lattner | 3ea78c4 | 2004-12-12 17:40:28 +0000 | [diff] [blame] | 75 | // We strongly match "i[3-9]86-*". |
| 76 | std::string TT = M.getTargetTriple(); |
| 77 | if (TT.size() >= 5 && TT[0] == 'i' && TT[2] == '8' && TT[3] == '6' && |
| 78 | TT[4] == '-' && TT[1] - '3' < 6) |
| 79 | return 20; |
| 80 | |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 81 | if (M.getEndianness() == Module::LittleEndian && |
| 82 | M.getPointerSize() == Module::Pointer32) |
Chris Lattner | 3ea78c4 | 2004-12-12 17:40:28 +0000 | [diff] [blame] | 83 | return 10; // Weak match |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 84 | else if (M.getEndianness() != Module::AnyEndianness || |
| 85 | M.getPointerSize() != Module::AnyPointerSize) |
| 86 | return 0; // Match for some other target |
| 87 | |
| 88 | return getJITMatchQuality()/2; |
| 89 | } |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 90 | |
| 91 | /// X86TargetMachine ctor - Create an ILP32 architecture model |
| 92 | /// |
Chris Lattner | f70e0c2 | 2003-12-28 21:23:38 +0000 | [diff] [blame] | 93 | X86TargetMachine::X86TargetMachine(const Module &M, IntrinsicLowering *IL) |
| 94 | : TargetMachine("X86", IL, true, 4, 4, 4, 4, 4), |
Nate Begeman | fb5792f | 2005-07-12 01:41:54 +0000 | [diff] [blame^] | 95 | Subtarget(M), |
| 96 | FrameInfo(TargetFrameInfo::StackGrowsDown, |
| 97 | Subtarget.getStackAlignment(), -4), |
Chris Lattner | f70e0c2 | 2003-12-28 21:23:38 +0000 | [diff] [blame] | 98 | JITInfo(*this) { |
Nate Begeman | f63be7d | 2005-07-06 18:59:04 +0000 | [diff] [blame] | 99 | // Scalar SSE FP requires at least SSE2 |
| 100 | X86ScalarSSE &= X86Vector >= SSE2; |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 101 | } |
| 102 | |
Chris Lattner | c9bbfbc | 2003-08-05 16:34:44 +0000 | [diff] [blame] | 103 | |
Chris Lattner | 0431c96 | 2005-06-25 02:48:37 +0000 | [diff] [blame] | 104 | // addPassesToEmitFile - We currently use all of the same passes as the JIT |
Chris Lattner | c9bbfbc | 2003-08-05 16:34:44 +0000 | [diff] [blame] | 105 | // does to emit statically compiled machine code. |
Chris Lattner | 0431c96 | 2005-06-25 02:48:37 +0000 | [diff] [blame] | 106 | bool X86TargetMachine::addPassesToEmitFile(PassManager &PM, std::ostream &Out, |
| 107 | CodeGenFileType FileType) { |
Chris Lattner | 07a9144 | 2005-06-27 06:30:12 +0000 | [diff] [blame] | 108 | if (FileType != TargetMachine::AssemblyFile && |
| 109 | FileType != TargetMachine::ObjectFile) return true; |
Chris Lattner | 0431c96 | 2005-06-25 02:48:37 +0000 | [diff] [blame] | 110 | |
Chris Lattner | 99c59e8 | 2004-05-23 21:23:35 +0000 | [diff] [blame] | 111 | // FIXME: Implement efficient support for garbage collection intrinsics. |
| 112 | PM.add(createLowerGCPass()); |
| 113 | |
Chris Lattner | c58c169 | 2003-10-05 19:15:47 +0000 | [diff] [blame] | 114 | // FIXME: Implement the invoke/unwind instructions! |
| 115 | PM.add(createLowerInvokePass()); |
| 116 | |
Chris Lattner | 8712442 | 2004-02-25 19:30:19 +0000 | [diff] [blame] | 117 | // FIXME: Implement the switch instruction in the instruction selector! |
| 118 | PM.add(createLowerSwitchPass()); |
| 119 | |
Chris Lattner | 9a9ca0f | 2004-07-02 05:46:41 +0000 | [diff] [blame] | 120 | // Make sure that no unreachable blocks are instruction selected. |
| 121 | PM.add(createUnreachableBlockEliminationPass()); |
| 122 | |
Chris Lattner | 6649418 | 2005-05-12 19:56:09 +0000 | [diff] [blame] | 123 | // Default to pattern ISel |
| 124 | if (PatternISelTriState == 0) |
Chris Lattner | 18ad194 | 2005-01-07 07:50:50 +0000 | [diff] [blame] | 125 | PM.add(createX86SimpleInstructionSelector(*this)); |
| 126 | else |
| 127 | PM.add(createX86PatternInstructionSelector(*this)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 128 | |
Chris Lattner | 9b52770 | 2003-12-01 05:18:30 +0000 | [diff] [blame] | 129 | // Run optional SSA-based machine code optimizations next... |
| 130 | if (!NoSSAPeephole) |
| 131 | PM.add(createX86SSAPeepholeOptimizerPass()); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 132 | |
| 133 | // Print the instruction selected machine code... |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 134 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 135 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 136 | |
| 137 | // Perform register allocation to convert to a concrete x86 representation |
Alkis Evlogimenos | 7237ece | 2003-10-02 16:57:49 +0000 | [diff] [blame] | 138 | PM.add(createRegisterAllocator()); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 139 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 140 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 141 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 142 | |
| 143 | PM.add(createX86FloatingPointStackifierPass()); |
| 144 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 145 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 146 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 147 | |
| 148 | // Insert prolog/epilog code. Eliminate abstract frame index references... |
| 149 | PM.add(createPrologEpilogCodeInserter()); |
| 150 | |
| 151 | PM.add(createX86PeepholeOptimizerPass()); |
| 152 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 153 | if (PrintMachineCode) // Print the register-allocated code |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 154 | PM.add(createX86CodePrinterPass(std::cerr, *this)); |
| 155 | |
Chris Lattner | f6f263c | 2004-02-09 01:47:10 +0000 | [diff] [blame] | 156 | if (!DisableOutput) |
Chris Lattner | 07a9144 | 2005-06-27 06:30:12 +0000 | [diff] [blame] | 157 | switch (FileType) { |
| 158 | default: |
| 159 | assert(0 && "Unexpected filetype here!"); |
| 160 | case TargetMachine::AssemblyFile: |
| 161 | PM.add(createX86CodePrinterPass(Out, *this)); |
| 162 | break; |
| 163 | case TargetMachine::ObjectFile: |
| 164 | // FIXME: We only support emission of ELF files for now, this should check |
| 165 | // the target triple and decide on the format to write (e.g. COFF on |
| 166 | // win32). |
Chris Lattner | 81b6ed7 | 2005-07-11 05:17:48 +0000 | [diff] [blame] | 167 | addX86ELFObjectWriterPass(PM, Out, *this); |
Chris Lattner | 07a9144 | 2005-06-27 06:30:12 +0000 | [diff] [blame] | 168 | break; |
| 169 | } |
Chris Lattner | 655239c | 2003-12-20 10:20:19 +0000 | [diff] [blame] | 170 | |
Alkis Evlogimenos | c81efdc | 2004-02-15 00:03:15 +0000 | [diff] [blame] | 171 | // Delete machine code for this function |
| 172 | PM.add(createMachineCodeDeleter()); |
| 173 | |
Brian Gaeke | de3aa4f | 2003-06-18 21:43:21 +0000 | [diff] [blame] | 174 | return false; // success! |
| 175 | } |
| 176 | |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 177 | /// addPassesToJITCompile - Add passes to the specified pass manager to |
| 178 | /// implement a fast dynamic compiler for this target. Return true if this is |
| 179 | /// not supported for this target. |
| 180 | /// |
Chris Lattner | 1e60a91 | 2003-12-20 01:22:19 +0000 | [diff] [blame] | 181 | void X86JITInfo::addPassesToJITCompile(FunctionPassManager &PM) { |
Chris Lattner | 99c59e8 | 2004-05-23 21:23:35 +0000 | [diff] [blame] | 182 | // FIXME: Implement efficient support for garbage collection intrinsics. |
| 183 | PM.add(createLowerGCPass()); |
Chris Lattner | 155e68f | 2003-04-23 16:24:55 +0000 | [diff] [blame] | 184 | |
Chris Lattner | c58c169 | 2003-10-05 19:15:47 +0000 | [diff] [blame] | 185 | // FIXME: Implement the invoke/unwind instructions! |
| 186 | PM.add(createLowerInvokePass()); |
| 187 | |
Chris Lattner | 8712442 | 2004-02-25 19:30:19 +0000 | [diff] [blame] | 188 | // FIXME: Implement the switch instruction in the instruction selector! |
| 189 | PM.add(createLowerSwitchPass()); |
| 190 | |
Chris Lattner | 9a9ca0f | 2004-07-02 05:46:41 +0000 | [diff] [blame] | 191 | // Make sure that no unreachable blocks are instruction selected. |
| 192 | PM.add(createUnreachableBlockEliminationPass()); |
| 193 | |
Chris Lattner | 6649418 | 2005-05-12 19:56:09 +0000 | [diff] [blame] | 194 | // Default to pattern ISel |
| 195 | if (PatternISelTriState == 0) |
Chris Lattner | 18ad194 | 2005-01-07 07:50:50 +0000 | [diff] [blame] | 196 | PM.add(createX86SimpleInstructionSelector(TM)); |
| 197 | else |
| 198 | PM.add(createX86PatternInstructionSelector(TM)); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 199 | |
Chris Lattner | 9b52770 | 2003-12-01 05:18:30 +0000 | [diff] [blame] | 200 | // Run optional SSA-based machine code optimizations next... |
| 201 | if (!NoSSAPeephole) |
| 202 | PM.add(createX86SSAPeepholeOptimizerPass()); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 203 | |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 204 | // FIXME: Add SSA based peephole optimizer here. |
| 205 | |
Chris Lattner | 3dffa79 | 2002-10-30 00:47:49 +0000 | [diff] [blame] | 206 | // Print the instruction selected machine code... |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 207 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 208 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Chris Lattner | 3dffa79 | 2002-10-30 00:47:49 +0000 | [diff] [blame] | 209 | |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 210 | // Perform register allocation to convert to a concrete x86 representation |
Alkis Evlogimenos | 7237ece | 2003-10-02 16:57:49 +0000 | [diff] [blame] | 211 | PM.add(createRegisterAllocator()); |
Chris Lattner | d282cfe | 2002-12-28 20:33:32 +0000 | [diff] [blame] | 212 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 213 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 214 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Chris Lattner | d282cfe | 2002-12-28 20:33:32 +0000 | [diff] [blame] | 215 | |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 216 | PM.add(createX86FloatingPointStackifierPass()); |
| 217 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 218 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 219 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 220 | |
Chris Lattner | d282cfe | 2002-12-28 20:33:32 +0000 | [diff] [blame] | 221 | // Insert prolog/epilog code. Eliminate abstract frame index references... |
| 222 | PM.add(createPrologEpilogCodeInserter()); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 223 | |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 224 | PM.add(createX86PeepholeOptimizerPass()); |
| 225 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 226 | if (PrintMachineCode) // Print the register-allocated code |
Chris Lattner | 1e60a91 | 2003-12-20 01:22:19 +0000 | [diff] [blame] | 227 | PM.add(createX86CodePrinterPass(std::cerr, TM)); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 228 | } |
| 229 | |
Chris Lattner | 81b6ed7 | 2005-07-11 05:17:48 +0000 | [diff] [blame] | 230 | bool X86TargetMachine::addPassesToEmitMachineCode(FunctionPassManager &PM, |
| 231 | MachineCodeEmitter &MCE) { |
| 232 | PM.add(createX86CodeEmitterPass(MCE)); |
| 233 | // Delete machine code for this function |
| 234 | PM.add(createMachineCodeDeleter()); |
| 235 | return false; |
| 236 | } |