//===-- X86TargetMachine.cpp - Define TargetMachine for the X86 -----------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file was developed by the LLVM research group and is distributed under
// the University of Illinois Open Source License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file defines the X86 specific subclass of TargetMachine.
//
//===----------------------------------------------------------------------===//
| 13 | |
| 14 | #include "X86TargetMachine.h" |
Chris Lattner | 5bcd95c | 2002-12-24 00:04:01 +0000 | [diff] [blame] | 15 | #include "X86.h" |
Chris Lattner | bb144a8 | 2003-08-24 19:49:48 +0000 | [diff] [blame] | 16 | #include "llvm/Module.h" |
Chris Lattner | 155e68f | 2003-04-23 16:24:55 +0000 | [diff] [blame] | 17 | #include "llvm/PassManager.h" |
Chris Lattner | 3048373 | 2004-06-20 07:49:54 +0000 | [diff] [blame] | 18 | #include "llvm/CodeGen/IntrinsicLowering.h" |
Chris Lattner | 3dffa79 | 2002-10-30 00:47:49 +0000 | [diff] [blame] | 19 | #include "llvm/CodeGen/MachineFunction.h" |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 20 | #include "llvm/CodeGen/Passes.h" |
Chris Lattner | 0cf0c37 | 2004-07-11 04:17:10 +0000 | [diff] [blame] | 21 | #include "llvm/Target/TargetOptions.h" |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 22 | #include "llvm/Target/TargetMachineRegistry.h" |
Chris Lattner | 155e68f | 2003-04-23 16:24:55 +0000 | [diff] [blame] | 23 | #include "llvm/Transforms/Scalar.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 24 | #include "llvm/Support/CommandLine.h" |
| 25 | #include "llvm/ADT/Statistic.h" |
Chris Lattner | 1e60a91 | 2003-12-20 01:22:19 +0000 | [diff] [blame] | 26 | using namespace llvm; |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 27 | |
Chris Lattner | 6f0161a | 2004-08-24 08:18:44 +0000 | [diff] [blame] | 28 | X86VectorEnum llvm::X86Vector = NoSSE; |
| 29 | |
/// X86TargetMachineModule - Anchor symbol for hosts that cannot link in a
/// library unless something references a symbol defined in that library.  In
/// particular, it seems that it is not possible to get things to work on Win32
/// without this.  Nothing in this file reads it; do not remove it.
extern "C" {
  int X86TargetMachineModule = 0;
}
| 36 | |
Chris Lattner | 439a27a | 2002-12-16 16:15:51 +0000 | [diff] [blame] | 37 | namespace { |
Chris Lattner | 9b52770 | 2003-12-01 05:18:30 +0000 | [diff] [blame] | 38 | cl::opt<bool> NoSSAPeephole("disable-ssa-peephole", cl::init(true), |
Chris Lattner | 4482715 | 2003-12-28 09:47:19 +0000 | [diff] [blame] | 39 | cl::desc("Disable the ssa-based peephole optimizer " |
| 40 | "(defaults to disabled)")); |
Chris Lattner | f6f263c | 2004-02-09 01:47:10 +0000 | [diff] [blame] | 41 | cl::opt<bool> DisableOutput("disable-x86-llc-output", cl::Hidden, |
| 42 | cl::desc("Disable the X86 asm printer, for use " |
| 43 | "when profiling the code generator.")); |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 44 | |
Chris Lattner | 222b86f | 2004-10-08 22:41:46 +0000 | [diff] [blame] | 45 | #if 0 |
Chris Lattner | 6f0161a | 2004-08-24 08:18:44 +0000 | [diff] [blame] | 46 | // FIXME: This should eventually be handled with target triples and |
| 47 | // subtarget support! |
| 48 | cl::opt<X86VectorEnum, true> |
| 49 | SSEArg( |
| 50 | cl::desc("Enable SSE support in the X86 target:"), |
| 51 | cl::values( |
| 52 | clEnumValN(SSE, "sse", " Enable SSE support"), |
| 53 | clEnumValN(SSE2, "sse2", " Enable SSE and SSE2 support"), |
| 54 | clEnumValN(SSE3, "sse3", " Enable SSE, SSE2, and SSE3 support"), |
| 55 | clEnumValEnd), |
| 56 | cl::location(X86Vector), cl::init(NoSSE)); |
Chris Lattner | 222b86f | 2004-10-08 22:41:46 +0000 | [diff] [blame] | 57 | #endif |
Chris Lattner | 6f0161a | 2004-08-24 08:18:44 +0000 | [diff] [blame] | 58 | |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 59 | // Register the target. |
Chris Lattner | 71d24aa | 2004-07-11 03:27:42 +0000 | [diff] [blame] | 60 | RegisterTarget<X86TargetMachine> X("x86", " IA-32 (Pentium and above)"); |
Chris Lattner | 439a27a | 2002-12-16 16:15:51 +0000 | [diff] [blame] | 61 | } |
| 62 | |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 63 | unsigned X86TargetMachine::getJITMatchQuality() { |
Chris Lattner | 7d0974b | 2004-10-18 15:54:17 +0000 | [diff] [blame] | 64 | #if defined(i386) || defined(__i386__) || defined(__x86__) || defined(_M_IX86) |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 65 | return 10; |
| 66 | #else |
| 67 | return 0; |
| 68 | #endif |
| 69 | } |
| 70 | |
| 71 | unsigned X86TargetMachine::getModuleMatchQuality(const Module &M) { |
Chris Lattner | 3ea78c4 | 2004-12-12 17:40:28 +0000 | [diff] [blame] | 72 | // We strongly match "i[3-9]86-*". |
| 73 | std::string TT = M.getTargetTriple(); |
| 74 | if (TT.size() >= 5 && TT[0] == 'i' && TT[2] == '8' && TT[3] == '6' && |
| 75 | TT[4] == '-' && TT[1] - '3' < 6) |
| 76 | return 20; |
| 77 | |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 78 | if (M.getEndianness() == Module::LittleEndian && |
| 79 | M.getPointerSize() == Module::Pointer32) |
Chris Lattner | 3ea78c4 | 2004-12-12 17:40:28 +0000 | [diff] [blame] | 80 | return 10; // Weak match |
Chris Lattner | d36c970 | 2004-07-11 02:48:49 +0000 | [diff] [blame] | 81 | else if (M.getEndianness() != Module::AnyEndianness || |
| 82 | M.getPointerSize() != Module::AnyPointerSize) |
| 83 | return 0; // Match for some other target |
| 84 | |
| 85 | return getJITMatchQuality()/2; |
| 86 | } |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 87 | |
| 88 | /// X86TargetMachine ctor - Create an ILP32 architecture model |
| 89 | /// |
Chris Lattner | f70e0c2 | 2003-12-28 21:23:38 +0000 | [diff] [blame] | 90 | X86TargetMachine::X86TargetMachine(const Module &M, IntrinsicLowering *IL) |
| 91 | : TargetMachine("X86", IL, true, 4, 4, 4, 4, 4), |
Chris Lattner | 222b86f | 2004-10-08 22:41:46 +0000 | [diff] [blame] | 92 | FrameInfo(TargetFrameInfo::StackGrowsDown, 8, -4), |
Chris Lattner | f70e0c2 | 2003-12-28 21:23:38 +0000 | [diff] [blame] | 93 | JITInfo(*this) { |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 94 | } |
| 95 | |
Chris Lattner | c9bbfbc | 2003-08-05 16:34:44 +0000 | [diff] [blame] | 96 | |
| 97 | // addPassesToEmitAssembly - We currently use all of the same passes as the JIT |
| 98 | // does to emit statically compiled machine code. |
Brian Gaeke | de3aa4f | 2003-06-18 21:43:21 +0000 | [diff] [blame] | 99 | bool X86TargetMachine::addPassesToEmitAssembly(PassManager &PM, |
| 100 | std::ostream &Out) { |
Chris Lattner | 99c59e8 | 2004-05-23 21:23:35 +0000 | [diff] [blame] | 101 | // FIXME: Implement efficient support for garbage collection intrinsics. |
| 102 | PM.add(createLowerGCPass()); |
| 103 | |
Chris Lattner | c58c169 | 2003-10-05 19:15:47 +0000 | [diff] [blame] | 104 | // FIXME: Implement the invoke/unwind instructions! |
| 105 | PM.add(createLowerInvokePass()); |
| 106 | |
Chris Lattner | 8712442 | 2004-02-25 19:30:19 +0000 | [diff] [blame] | 107 | // FIXME: Implement the switch instruction in the instruction selector! |
| 108 | PM.add(createLowerSwitchPass()); |
| 109 | |
Chris Lattner | 9a9ca0f | 2004-07-02 05:46:41 +0000 | [diff] [blame] | 110 | // Make sure that no unreachable blocks are instruction selected. |
| 111 | PM.add(createUnreachableBlockEliminationPass()); |
| 112 | |
Nate Begeman | f8b0294 | 2005-04-15 22:12:16 +0000 | [diff] [blame] | 113 | // Default to simple ISel |
| 114 | if (PatternISelTriState != 1) |
Chris Lattner | 18ad194 | 2005-01-07 07:50:50 +0000 | [diff] [blame] | 115 | PM.add(createX86SimpleInstructionSelector(*this)); |
| 116 | else |
| 117 | PM.add(createX86PatternInstructionSelector(*this)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 118 | |
Chris Lattner | 9b52770 | 2003-12-01 05:18:30 +0000 | [diff] [blame] | 119 | // Run optional SSA-based machine code optimizations next... |
| 120 | if (!NoSSAPeephole) |
| 121 | PM.add(createX86SSAPeepholeOptimizerPass()); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 122 | |
| 123 | // Print the instruction selected machine code... |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 124 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 125 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 126 | |
| 127 | // Perform register allocation to convert to a concrete x86 representation |
Alkis Evlogimenos | 7237ece | 2003-10-02 16:57:49 +0000 | [diff] [blame] | 128 | PM.add(createRegisterAllocator()); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 129 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 130 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 131 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 132 | |
| 133 | PM.add(createX86FloatingPointStackifierPass()); |
| 134 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 135 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 136 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 137 | |
| 138 | // Insert prolog/epilog code. Eliminate abstract frame index references... |
| 139 | PM.add(createPrologEpilogCodeInserter()); |
| 140 | |
| 141 | PM.add(createX86PeepholeOptimizerPass()); |
| 142 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 143 | if (PrintMachineCode) // Print the register-allocated code |
Brian Gaeke | b428654 | 2003-08-13 18:15:52 +0000 | [diff] [blame] | 144 | PM.add(createX86CodePrinterPass(std::cerr, *this)); |
| 145 | |
Chris Lattner | f6f263c | 2004-02-09 01:47:10 +0000 | [diff] [blame] | 146 | if (!DisableOutput) |
| 147 | PM.add(createX86CodePrinterPass(Out, *this)); |
Chris Lattner | 655239c | 2003-12-20 10:20:19 +0000 | [diff] [blame] | 148 | |
Alkis Evlogimenos | c81efdc | 2004-02-15 00:03:15 +0000 | [diff] [blame] | 149 | // Delete machine code for this function |
| 150 | PM.add(createMachineCodeDeleter()); |
| 151 | |
Brian Gaeke | de3aa4f | 2003-06-18 21:43:21 +0000 | [diff] [blame] | 152 | return false; // success! |
| 153 | } |
| 154 | |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 155 | /// addPassesToJITCompile - Add passes to the specified pass manager to |
| 156 | /// implement a fast dynamic compiler for this target. Return true if this is |
| 157 | /// not supported for this target. |
| 158 | /// |
Chris Lattner | 1e60a91 | 2003-12-20 01:22:19 +0000 | [diff] [blame] | 159 | void X86JITInfo::addPassesToJITCompile(FunctionPassManager &PM) { |
Chris Lattner | 99c59e8 | 2004-05-23 21:23:35 +0000 | [diff] [blame] | 160 | // FIXME: Implement efficient support for garbage collection intrinsics. |
| 161 | PM.add(createLowerGCPass()); |
Chris Lattner | 155e68f | 2003-04-23 16:24:55 +0000 | [diff] [blame] | 162 | |
Chris Lattner | c58c169 | 2003-10-05 19:15:47 +0000 | [diff] [blame] | 163 | // FIXME: Implement the invoke/unwind instructions! |
| 164 | PM.add(createLowerInvokePass()); |
| 165 | |
Chris Lattner | 8712442 | 2004-02-25 19:30:19 +0000 | [diff] [blame] | 166 | // FIXME: Implement the switch instruction in the instruction selector! |
| 167 | PM.add(createLowerSwitchPass()); |
| 168 | |
Chris Lattner | 9a9ca0f | 2004-07-02 05:46:41 +0000 | [diff] [blame] | 169 | // Make sure that no unreachable blocks are instruction selected. |
| 170 | PM.add(createUnreachableBlockEliminationPass()); |
| 171 | |
Nate Begeman | f8b0294 | 2005-04-15 22:12:16 +0000 | [diff] [blame] | 172 | // Default to simple ISel |
| 173 | if (PatternISelTriState != 1) |
Chris Lattner | 18ad194 | 2005-01-07 07:50:50 +0000 | [diff] [blame] | 174 | PM.add(createX86SimpleInstructionSelector(TM)); |
| 175 | else |
| 176 | PM.add(createX86PatternInstructionSelector(TM)); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 177 | |
Chris Lattner | 9b52770 | 2003-12-01 05:18:30 +0000 | [diff] [blame] | 178 | // Run optional SSA-based machine code optimizations next... |
| 179 | if (!NoSSAPeephole) |
| 180 | PM.add(createX86SSAPeepholeOptimizerPass()); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 181 | |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 182 | // FIXME: Add SSA based peephole optimizer here. |
| 183 | |
Chris Lattner | 3dffa79 | 2002-10-30 00:47:49 +0000 | [diff] [blame] | 184 | // Print the instruction selected machine code... |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 185 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 186 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Chris Lattner | 3dffa79 | 2002-10-30 00:47:49 +0000 | [diff] [blame] | 187 | |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 188 | // Perform register allocation to convert to a concrete x86 representation |
Alkis Evlogimenos | 7237ece | 2003-10-02 16:57:49 +0000 | [diff] [blame] | 189 | PM.add(createRegisterAllocator()); |
Chris Lattner | d282cfe | 2002-12-28 20:33:32 +0000 | [diff] [blame] | 190 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 191 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 192 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Chris Lattner | d282cfe | 2002-12-28 20:33:32 +0000 | [diff] [blame] | 193 | |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 194 | PM.add(createX86FloatingPointStackifierPass()); |
| 195 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 196 | if (PrintMachineCode) |
Brian Gaeke | 74ceb29 | 2004-02-04 21:41:01 +0000 | [diff] [blame] | 197 | PM.add(createMachineFunctionPrinterPass(&std::cerr)); |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 198 | |
Chris Lattner | d282cfe | 2002-12-28 20:33:32 +0000 | [diff] [blame] | 199 | // Insert prolog/epilog code. Eliminate abstract frame index references... |
| 200 | PM.add(createPrologEpilogCodeInserter()); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 201 | |
Chris Lattner | d91d86f | 2003-01-13 00:51:23 +0000 | [diff] [blame] | 202 | PM.add(createX86PeepholeOptimizerPass()); |
| 203 | |
Brian Gaeke | 323819e | 2004-03-04 19:16:23 +0000 | [diff] [blame] | 204 | if (PrintMachineCode) // Print the register-allocated code |
Chris Lattner | 1e60a91 | 2003-12-20 01:22:19 +0000 | [diff] [blame] | 205 | PM.add(createX86CodePrinterPass(std::cerr, TM)); |
Chris Lattner | b4f68ed | 2002-10-29 22:37:54 +0000 | [diff] [blame] | 206 | } |
| 207 | |