Misha Brukman | cd60313 | 2003-06-02 03:28:00 +0000 | [diff] [blame] | 1 | //===-- X86/X86CodeEmitter.cpp - Convert X86 code to machine code ---------===// |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 2 | // |
| 3 | // This file contains the pass that transforms the X86 machine instructions into |
| 4 | // actual executable machine code. |
| 5 | // |
| 6 | //===----------------------------------------------------------------------===// |
| 7 | |
Chris Lattner | cb53358 | 2003-08-03 21:14:38 +0000 | [diff] [blame] | 8 | #define DEBUG_TYPE "jit" |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 9 | #include "X86TargetMachine.h" |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 10 | #include "X86.h" |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 11 | #include "llvm/PassManager.h" |
| 12 | #include "llvm/CodeGen/MachineCodeEmitter.h" |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 13 | #include "llvm/CodeGen/MachineFunctionPass.h" |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 14 | #include "llvm/CodeGen/MachineInstr.h" |
Chris Lattner | c01d123 | 2003-10-20 03:42:58 +0000 | [diff] [blame^] | 15 | #include "llvm/Function.h" |
Chris Lattner | a11136b | 2003-08-01 22:21:34 +0000 | [diff] [blame] | 16 | #include "Support/Debug.h" |
Chris Lattner | 302de59 | 2003-06-06 04:00:05 +0000 | [diff] [blame] | 17 | #include "Support/Statistic.h" |
John Criswell | 7a73b80 | 2003-06-30 21:59:07 +0000 | [diff] [blame] | 18 | #include "Config/alloca.h" |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 19 | |
| 20 | namespace { |
Chris Lattner | 302de59 | 2003-06-06 04:00:05 +0000 | [diff] [blame] | 21 | Statistic<> |
| 22 | NumEmitted("x86-emitter", "Number of machine instructions emitted"); |
| 23 | |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 24 | class JITResolver { |
| 25 | MachineCodeEmitter &MCE; |
| 26 | |
| 27 | // LazyCodeGenMap - Keep track of call sites for functions that are to be |
| 28 | // lazily resolved. |
| 29 | std::map<unsigned, Function*> LazyCodeGenMap; |
| 30 | |
| 31 | // LazyResolverMap - Keep track of the lazy resolver created for a |
| 32 | // particular function so that we can reuse them if necessary. |
| 33 | std::map<Function*, unsigned> LazyResolverMap; |
| 34 | public: |
| 35 | JITResolver(MachineCodeEmitter &mce) : MCE(mce) {} |
| 36 | unsigned getLazyResolver(Function *F); |
| 37 | unsigned addFunctionReference(unsigned Address, Function *F); |
| 38 | |
| 39 | private: |
| 40 | unsigned emitStubForFunction(Function *F); |
| 41 | static void CompilationCallback(); |
| 42 | unsigned resolveFunctionReference(unsigned RetAddr); |
| 43 | }; |
| 44 | |
| 45 | JITResolver *TheJITResolver; |
| 46 | } |
| 47 | |
| 48 | |
| 49 | /// addFunctionReference - This method is called when we need to emit the |
| 50 | /// address of a function that has not yet been emitted, so we don't know the |
| 51 | /// address. Instead, we emit a call to the CompilationCallback method, and |
| 52 | /// keep track of where we are. |
| 53 | /// |
| 54 | unsigned JITResolver::addFunctionReference(unsigned Address, Function *F) { |
| 55 | LazyCodeGenMap[Address] = F; |
| 56 | return (intptr_t)&JITResolver::CompilationCallback; |
| 57 | } |
| 58 | |
| 59 | unsigned JITResolver::resolveFunctionReference(unsigned RetAddr) { |
| 60 | std::map<unsigned, Function*>::iterator I = LazyCodeGenMap.find(RetAddr); |
| 61 | assert(I != LazyCodeGenMap.end() && "Not in map!"); |
| 62 | Function *F = I->second; |
| 63 | LazyCodeGenMap.erase(I); |
| 64 | return MCE.forceCompilationOf(F); |
| 65 | } |
| 66 | |
| 67 | unsigned JITResolver::getLazyResolver(Function *F) { |
| 68 | std::map<Function*, unsigned>::iterator I = LazyResolverMap.lower_bound(F); |
| 69 | if (I != LazyResolverMap.end() && I->first == F) return I->second; |
| 70 | |
| 71 | //std::cerr << "Getting lazy resolver for : " << ((Value*)F)->getName() << "\n"; |
| 72 | |
| 73 | unsigned Stub = emitStubForFunction(F); |
| 74 | LazyResolverMap.insert(I, std::make_pair(F, Stub)); |
| 75 | return Stub; |
| 76 | } |
| 77 | |
| 78 | void JITResolver::CompilationCallback() { |
| 79 | unsigned *StackPtr = (unsigned*)__builtin_frame_address(0); |
Misha Brukman | bc80b22 | 2003-06-02 04:13:58 +0000 | [diff] [blame] | 80 | unsigned RetAddr = (unsigned)(intptr_t)__builtin_return_address(0); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 81 | assert(StackPtr[1] == RetAddr && |
| 82 | "Could not find return address on the stack!"); |
Chris Lattner | 30d002b | 2003-06-06 18:25:33 +0000 | [diff] [blame] | 83 | |
| 84 | // It's a stub if there is an interrupt marker after the call... |
| 85 | bool isStub = ((unsigned char*)(intptr_t)RetAddr)[0] == 0xCD; |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 86 | |
Chris Lattner | 302de59 | 2003-06-06 04:00:05 +0000 | [diff] [blame] | 87 | // FIXME FIXME FIXME FIXME: __builtin_frame_address doesn't work if frame |
| 88 | // pointer elimination has been performed. Having a variable sized alloca |
| 89 | // disables frame pointer elimination currently, even if it's dead. This is a |
| 90 | // gross hack. |
| 91 | alloca(10+isStub); |
| 92 | // FIXME FIXME FIXME FIXME |
| 93 | |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 94 | // The call instruction should have pushed the return value onto the stack... |
| 95 | RetAddr -= 4; // Backtrack to the reference itself... |
| 96 | |
| 97 | #if 0 |
| 98 | DEBUG(std::cerr << "In callback! Addr=0x" << std::hex << RetAddr |
| 99 | << " ESP=0x" << (unsigned)StackPtr << std::dec |
| 100 | << ": Resolving call to function: " |
| 101 | << TheVM->getFunctionReferencedName((void*)RetAddr) << "\n"); |
| 102 | #endif |
| 103 | |
| 104 | // Sanity check to make sure this really is a call instruction... |
Chris Lattner | 30d002b | 2003-06-06 18:25:33 +0000 | [diff] [blame] | 105 | assert(((unsigned char*)(intptr_t)RetAddr)[-1] == 0xE8 &&"Not a call instr!"); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 106 | |
| 107 | unsigned NewVal = TheJITResolver->resolveFunctionReference(RetAddr); |
| 108 | |
| 109 | // Rewrite the call target... so that we don't fault every time we execute |
| 110 | // the call. |
Chris Lattner | 30d002b | 2003-06-06 18:25:33 +0000 | [diff] [blame] | 111 | *(unsigned*)(intptr_t)RetAddr = NewVal-RetAddr-4; |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 112 | |
| 113 | if (isStub) { |
| 114 | // If this is a stub, rewrite the call into an unconditional branch |
| 115 | // instruction so that two return addresses are not pushed onto the stack |
| 116 | // when the requested function finally gets called. This also makes the |
| 117 | // 0xCD byte (interrupt) dead, so the marker doesn't effect anything. |
Chris Lattner | 30d002b | 2003-06-06 18:25:33 +0000 | [diff] [blame] | 118 | ((unsigned char*)(intptr_t)RetAddr)[-1] = 0xE9; |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 119 | } |
| 120 | |
| 121 | // Change the return address to reexecute the call instruction... |
| 122 | StackPtr[1] -= 5; |
| 123 | } |
| 124 | |
| 125 | /// emitStubForFunction - This method is used by the JIT when it needs to emit |
| 126 | /// the address of a function for a function whose code has not yet been |
| 127 | /// generated. In order to do this, it generates a stub which jumps to the lazy |
| 128 | /// function compiler, which will eventually get fixed to call the function |
| 129 | /// directly. |
| 130 | /// |
| 131 | unsigned JITResolver::emitStubForFunction(Function *F) { |
| 132 | MCE.startFunctionStub(*F, 6); |
| 133 | MCE.emitByte(0xE8); // Call with 32 bit pc-rel destination... |
| 134 | |
| 135 | unsigned Address = addFunctionReference(MCE.getCurrentPCValue(), F); |
| 136 | MCE.emitWord(Address-MCE.getCurrentPCValue()-4); |
| 137 | |
| 138 | MCE.emitByte(0xCD); // Interrupt - Just a marker identifying the stub! |
| 139 | return (intptr_t)MCE.finishFunctionStub(*F); |
| 140 | } |
| 141 | |
| 142 | |
| 143 | |
| 144 | namespace { |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 145 | class Emitter : public MachineFunctionPass { |
| 146 | const X86InstrInfo *II; |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 147 | MachineCodeEmitter &MCE; |
Chris Lattner | dee1263 | 2003-07-26 23:06:00 +0000 | [diff] [blame] | 148 | std::map<const BasicBlock*, unsigned> BasicBlockAddrs; |
| 149 | std::vector<std::pair<const BasicBlock*, unsigned> > BBRefs; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 150 | public: |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 151 | Emitter(MachineCodeEmitter &mce) : II(0), MCE(mce) {} |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 152 | |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 153 | bool runOnMachineFunction(MachineFunction &MF); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 154 | |
Chris Lattner | f0eb7be | 2002-12-15 21:13:40 +0000 | [diff] [blame] | 155 | virtual const char *getPassName() const { |
| 156 | return "X86 Machine Code Emitter"; |
| 157 | } |
| 158 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 159 | private: |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 160 | void emitBasicBlock(MachineBasicBlock &MBB); |
| 161 | void emitInstruction(MachineInstr &MI); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 162 | |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 163 | void emitPCRelativeBlockAddress(BasicBlock *BB); |
| 164 | void emitMaybePCRelativeValue(unsigned Address, bool isPCRelative); |
| 165 | void emitGlobalAddressForCall(GlobalValue *GV); |
| 166 | void emitGlobalAddressForPtr(GlobalValue *GV); |
| 167 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 168 | void emitRegModRMByte(unsigned ModRMReg, unsigned RegOpcodeField); |
| 169 | void emitSIBByte(unsigned SS, unsigned Index, unsigned Base); |
| 170 | void emitConstant(unsigned Val, unsigned Size); |
| 171 | |
| 172 | void emitMemModRMByte(const MachineInstr &MI, |
| 173 | unsigned Op, unsigned RegOpcodeField); |
| 174 | |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 175 | }; |
| 176 | } |
| 177 | |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 178 | /// addPassesToEmitMachineCode - Add passes to the specified pass manager to get |
Brian Gaeke | 45f0b6d | 2003-10-16 23:45:05 +0000 | [diff] [blame] | 179 | /// machine code emitted. This uses a MachineCodeEmitter object to handle |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 180 | /// actually outputting the machine code and resolving things like the address |
| 181 | /// of functions. This method should returns true if machine code emission is |
| 182 | /// not supported. |
| 183 | /// |
Brian Gaeke | 8844a0b | 2003-08-13 18:17:27 +0000 | [diff] [blame] | 184 | bool X86TargetMachine::addPassesToEmitMachineCode(FunctionPassManager &PM, |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 185 | MachineCodeEmitter &MCE) { |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 186 | PM.add(new Emitter(MCE)); |
Chris Lattner | 40ead95 | 2002-12-02 21:24:12 +0000 | [diff] [blame] | 187 | return false; |
| 188 | } |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 189 | |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 190 | bool Emitter::runOnMachineFunction(MachineFunction &MF) { |
| 191 | II = &((X86TargetMachine&)MF.getTarget()).getInstrInfo(); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 192 | |
| 193 | MCE.startFunction(MF); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 194 | MCE.emitConstantPool(MF.getConstantPool()); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 195 | for (MachineFunction::iterator I = MF.begin(), E = MF.end(); I != E; ++I) |
| 196 | emitBasicBlock(*I); |
| 197 | MCE.finishFunction(MF); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 198 | |
| 199 | // Resolve all forward branches now... |
| 200 | for (unsigned i = 0, e = BBRefs.size(); i != e; ++i) { |
| 201 | unsigned Location = BasicBlockAddrs[BBRefs[i].first]; |
| 202 | unsigned Ref = BBRefs[i].second; |
Chris Lattner | 30d002b | 2003-06-06 18:25:33 +0000 | [diff] [blame] | 203 | *(unsigned*)(intptr_t)Ref = Location-Ref-4; |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 204 | } |
| 205 | BBRefs.clear(); |
| 206 | BasicBlockAddrs.clear(); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 207 | return false; |
| 208 | } |
| 209 | |
| 210 | void Emitter::emitBasicBlock(MachineBasicBlock &MBB) { |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 211 | if (uint64_t Addr = MCE.getCurrentPCValue()) |
| 212 | BasicBlockAddrs[MBB.getBasicBlock()] = Addr; |
| 213 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 214 | for (MachineBasicBlock::iterator I = MBB.begin(), E = MBB.end(); I != E; ++I) |
| 215 | emitInstruction(**I); |
| 216 | } |
| 217 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 218 | |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 219 | /// emitPCRelativeBlockAddress - This method emits the PC relative address of |
| 220 | /// the specified basic block, or if the basic block hasn't been emitted yet |
| 221 | /// (because this is a forward branch), it keeps track of the information |
| 222 | /// necessary to resolve this address later (and emits a dummy value). |
| 223 | /// |
| 224 | void Emitter::emitPCRelativeBlockAddress(BasicBlock *BB) { |
| 225 | // FIXME: Emit backward branches directly |
| 226 | BBRefs.push_back(std::make_pair(BB, MCE.getCurrentPCValue())); |
| 227 | MCE.emitWord(0); // Emit a dummy value |
| 228 | } |
| 229 | |
| 230 | /// emitMaybePCRelativeValue - Emit a 32-bit address which may be PC relative. |
| 231 | /// |
| 232 | void Emitter::emitMaybePCRelativeValue(unsigned Address, bool isPCRelative) { |
| 233 | if (isPCRelative) |
| 234 | MCE.emitWord(Address-MCE.getCurrentPCValue()-4); |
| 235 | else |
| 236 | MCE.emitWord(Address); |
| 237 | } |
| 238 | |
| 239 | /// emitGlobalAddressForCall - Emit the specified address to the code stream |
| 240 | /// assuming this is part of a function call, which is PC relative. |
| 241 | /// |
| 242 | void Emitter::emitGlobalAddressForCall(GlobalValue *GV) { |
| 243 | // Get the address from the backend... |
| 244 | unsigned Address = MCE.getGlobalValueAddress(GV); |
| 245 | |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 246 | if (Address == 0) { |
| 247 | // FIXME: this is JIT specific! |
| 248 | if (TheJITResolver == 0) |
| 249 | TheJITResolver = new JITResolver(MCE); |
| 250 | Address = TheJITResolver->addFunctionReference(MCE.getCurrentPCValue(), |
Chris Lattner | c01d123 | 2003-10-20 03:42:58 +0000 | [diff] [blame^] | 251 | cast<Function>(GV)); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 252 | } |
| 253 | emitMaybePCRelativeValue(Address, true); |
| 254 | } |
| 255 | |
| 256 | /// emitGlobalAddress - Emit the specified address to the code stream assuming |
| 257 | /// this is part of a "take the address of a global" instruction, which is not |
| 258 | /// PC relative. |
| 259 | /// |
| 260 | void Emitter::emitGlobalAddressForPtr(GlobalValue *GV) { |
| 261 | // Get the address from the backend... |
| 262 | unsigned Address = MCE.getGlobalValueAddress(GV); |
| 263 | |
| 264 | // If the machine code emitter doesn't know what the address IS yet, we have |
| 265 | // to take special measures. |
| 266 | // |
| 267 | if (Address == 0) { |
| 268 | // FIXME: this is JIT specific! |
| 269 | if (TheJITResolver == 0) |
| 270 | TheJITResolver = new JITResolver(MCE); |
| 271 | Address = TheJITResolver->getLazyResolver((Function*)GV); |
| 272 | } |
| 273 | |
| 274 | emitMaybePCRelativeValue(Address, false); |
| 275 | } |
| 276 | |
| 277 | |
| 278 | |
Chris Lattner | ff3261a | 2003-06-03 15:31:23 +0000 | [diff] [blame] | 279 | /// N86 namespace - Native X86 Register numbers... used by X86 backend. |
| 280 | /// |
| 281 | namespace N86 { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 282 | enum { |
| 283 | EAX = 0, ECX = 1, EDX = 2, EBX = 3, ESP = 4, EBP = 5, ESI = 6, EDI = 7 |
| 284 | }; |
| 285 | } |
| 286 | |
| 287 | |
| 288 | // getX86RegNum - This function maps LLVM register identifiers to their X86 |
| 289 | // specific numbering, which is used in various places encoding instructions. |
| 290 | // |
| 291 | static unsigned getX86RegNum(unsigned RegNo) { |
| 292 | switch(RegNo) { |
| 293 | case X86::EAX: case X86::AX: case X86::AL: return N86::EAX; |
| 294 | case X86::ECX: case X86::CX: case X86::CL: return N86::ECX; |
| 295 | case X86::EDX: case X86::DX: case X86::DL: return N86::EDX; |
| 296 | case X86::EBX: case X86::BX: case X86::BL: return N86::EBX; |
| 297 | case X86::ESP: case X86::SP: case X86::AH: return N86::ESP; |
| 298 | case X86::EBP: case X86::BP: case X86::CH: return N86::EBP; |
| 299 | case X86::ESI: case X86::SI: case X86::DH: return N86::ESI; |
| 300 | case X86::EDI: case X86::DI: case X86::BH: return N86::EDI; |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 301 | |
| 302 | case X86::ST0: case X86::ST1: case X86::ST2: case X86::ST3: |
| 303 | case X86::ST4: case X86::ST5: case X86::ST6: case X86::ST7: |
| 304 | return RegNo-X86::ST0; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 305 | default: |
| 306 | assert(RegNo >= MRegisterInfo::FirstVirtualRegister && |
| 307 | "Unknown physical register!"); |
| 308 | assert(0 && "Register allocator hasn't allocated reg correctly yet!"); |
| 309 | return 0; |
| 310 | } |
| 311 | } |
| 312 | |
| 313 | inline static unsigned char ModRMByte(unsigned Mod, unsigned RegOpcode, |
| 314 | unsigned RM) { |
| 315 | assert(Mod < 4 && RegOpcode < 8 && RM < 8 && "ModRM Fields out of range!"); |
| 316 | return RM | (RegOpcode << 3) | (Mod << 6); |
| 317 | } |
| 318 | |
| 319 | void Emitter::emitRegModRMByte(unsigned ModRMReg, unsigned RegOpcodeFld){ |
| 320 | MCE.emitByte(ModRMByte(3, RegOpcodeFld, getX86RegNum(ModRMReg))); |
| 321 | } |
| 322 | |
| 323 | void Emitter::emitSIBByte(unsigned SS, unsigned Index, unsigned Base) { |
| 324 | // SIB byte is in the same format as the ModRMByte... |
| 325 | MCE.emitByte(ModRMByte(SS, Index, Base)); |
| 326 | } |
| 327 | |
| 328 | void Emitter::emitConstant(unsigned Val, unsigned Size) { |
| 329 | // Output the constant in little endian byte order... |
| 330 | for (unsigned i = 0; i != Size; ++i) { |
| 331 | MCE.emitByte(Val & 255); |
| 332 | Val >>= 8; |
| 333 | } |
| 334 | } |
| 335 | |
| 336 | static bool isDisp8(int Value) { |
| 337 | return Value == (signed char)Value; |
| 338 | } |
| 339 | |
| 340 | void Emitter::emitMemModRMByte(const MachineInstr &MI, |
| 341 | unsigned Op, unsigned RegOpcodeField) { |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 342 | const MachineOperand &Disp = MI.getOperand(Op+3); |
| 343 | if (MI.getOperand(Op).isConstantPoolIndex()) { |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 344 | // Emit a direct address reference [disp32] where the displacement of the |
| 345 | // constant pool entry is controlled by the MCE. |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 346 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 5)); |
| 347 | unsigned Index = MI.getOperand(Op).getConstantPoolIndex(); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 348 | unsigned Address = MCE.getConstantPoolEntryAddress(Index); |
| 349 | MCE.emitWord(Address+Disp.getImmedValue()); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 350 | return; |
| 351 | } |
| 352 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 353 | const MachineOperand &BaseReg = MI.getOperand(Op); |
| 354 | const MachineOperand &Scale = MI.getOperand(Op+1); |
| 355 | const MachineOperand &IndexReg = MI.getOperand(Op+2); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 356 | |
| 357 | // Is a SIB byte needed? |
| 358 | if (IndexReg.getReg() == 0 && BaseReg.getReg() != X86::ESP) { |
| 359 | if (BaseReg.getReg() == 0) { // Just a displacement? |
| 360 | // Emit special case [disp32] encoding |
| 361 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 5)); |
| 362 | emitConstant(Disp.getImmedValue(), 4); |
| 363 | } else { |
| 364 | unsigned BaseRegNo = getX86RegNum(BaseReg.getReg()); |
| 365 | if (Disp.getImmedValue() == 0 && BaseRegNo != N86::EBP) { |
| 366 | // Emit simple indirect register encoding... [EAX] f.e. |
| 367 | MCE.emitByte(ModRMByte(0, RegOpcodeField, BaseRegNo)); |
| 368 | } else if (isDisp8(Disp.getImmedValue())) { |
| 369 | // Emit the disp8 encoding... [REG+disp8] |
| 370 | MCE.emitByte(ModRMByte(1, RegOpcodeField, BaseRegNo)); |
| 371 | emitConstant(Disp.getImmedValue(), 1); |
| 372 | } else { |
| 373 | // Emit the most general non-SIB encoding: [REG+disp32] |
Chris Lattner | 2067184 | 2002-12-13 05:05:05 +0000 | [diff] [blame] | 374 | MCE.emitByte(ModRMByte(2, RegOpcodeField, BaseRegNo)); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 375 | emitConstant(Disp.getImmedValue(), 4); |
| 376 | } |
| 377 | } |
| 378 | |
| 379 | } else { // We need a SIB byte, so start by outputting the ModR/M byte first |
| 380 | assert(IndexReg.getReg() != X86::ESP && "Cannot use ESP as index reg!"); |
| 381 | |
| 382 | bool ForceDisp32 = false; |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 383 | bool ForceDisp8 = false; |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 384 | if (BaseReg.getReg() == 0) { |
| 385 | // If there is no base register, we emit the special case SIB byte with |
| 386 | // MOD=0, BASE=5, to JUST get the index, scale, and displacement. |
| 387 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 4)); |
| 388 | ForceDisp32 = true; |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 389 | } else if (Disp.getImmedValue() == 0 && BaseReg.getReg() != X86::EBP) { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 390 | // Emit no displacement ModR/M byte |
| 391 | MCE.emitByte(ModRMByte(0, RegOpcodeField, 4)); |
| 392 | } else if (isDisp8(Disp.getImmedValue())) { |
| 393 | // Emit the disp8 encoding... |
| 394 | MCE.emitByte(ModRMByte(1, RegOpcodeField, 4)); |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 395 | ForceDisp8 = true; // Make sure to force 8 bit disp if Base=EBP |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 396 | } else { |
| 397 | // Emit the normal disp32 encoding... |
| 398 | MCE.emitByte(ModRMByte(2, RegOpcodeField, 4)); |
| 399 | } |
| 400 | |
| 401 | // Calculate what the SS field value should be... |
| 402 | static const unsigned SSTable[] = { ~0, 0, 1, ~0, 2, ~0, ~0, ~0, 3 }; |
| 403 | unsigned SS = SSTable[Scale.getImmedValue()]; |
| 404 | |
| 405 | if (BaseReg.getReg() == 0) { |
| 406 | // Handle the SIB byte for the case where there is no base. The |
| 407 | // displacement has already been output. |
| 408 | assert(IndexReg.getReg() && "Index register must be specified!"); |
| 409 | emitSIBByte(SS, getX86RegNum(IndexReg.getReg()), 5); |
| 410 | } else { |
| 411 | unsigned BaseRegNo = getX86RegNum(BaseReg.getReg()); |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 412 | unsigned IndexRegNo; |
| 413 | if (IndexReg.getReg()) |
| 414 | IndexRegNo = getX86RegNum(IndexReg.getReg()); |
| 415 | else |
| 416 | IndexRegNo = 4; // For example [ESP+1*<noreg>+4] |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 417 | emitSIBByte(SS, IndexRegNo, BaseRegNo); |
| 418 | } |
| 419 | |
| 420 | // Do we need to output a displacement? |
Brian Gaeke | 95780cc | 2002-12-13 07:56:18 +0000 | [diff] [blame] | 421 | if (Disp.getImmedValue() != 0 || ForceDisp32 || ForceDisp8) { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 422 | if (!ForceDisp32 && isDisp8(Disp.getImmedValue())) |
| 423 | emitConstant(Disp.getImmedValue(), 1); |
| 424 | else |
| 425 | emitConstant(Disp.getImmedValue(), 4); |
| 426 | } |
| 427 | } |
| 428 | } |
| 429 | |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 430 | static unsigned sizeOfPtr(const TargetInstrDescriptor &Desc) { |
Chris Lattner | a0f38c8 | 2002-12-13 03:51:55 +0000 | [diff] [blame] | 431 | switch (Desc.TSFlags & X86II::ArgMask) { |
| 432 | case X86II::Arg8: return 1; |
| 433 | case X86II::Arg16: return 2; |
| 434 | case X86II::Arg32: return 4; |
Chris Lattner | 5ada8df | 2002-12-25 05:09:21 +0000 | [diff] [blame] | 435 | case X86II::ArgF32: return 4; |
| 436 | case X86II::ArgF64: return 8; |
| 437 | case X86II::ArgF80: return 10; |
Chris Lattner | a6a382c | 2002-12-13 03:50:13 +0000 | [diff] [blame] | 438 | default: assert(0 && "Memory size not set!"); |
Chris Lattner | df642e1 | 2002-12-20 04:12:48 +0000 | [diff] [blame] | 439 | return 0; |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 440 | } |
| 441 | } |
| 442 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 443 | void Emitter::emitInstruction(MachineInstr &MI) { |
Chris Lattner | 302de59 | 2003-06-06 04:00:05 +0000 | [diff] [blame] | 444 | NumEmitted++; // Keep track of the # of mi's emitted |
| 445 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 446 | unsigned Opcode = MI.getOpcode(); |
Chris Lattner | 3501fea | 2003-01-14 22:00:31 +0000 | [diff] [blame] | 447 | const TargetInstrDescriptor &Desc = II->get(Opcode); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 448 | |
Misha Brukman | 5560c9d | 2003-08-18 14:43:39 +0000 | [diff] [blame] | 449 | // Emit instruction prefixes if necessary |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 450 | if (Desc.TSFlags & X86II::OpSize) MCE.emitByte(0x66);// Operand size... |
Chris Lattner | 5ada8df | 2002-12-25 05:09:21 +0000 | [diff] [blame] | 451 | |
| 452 | switch (Desc.TSFlags & X86II::Op0Mask) { |
| 453 | case X86II::TB: |
| 454 | MCE.emitByte(0x0F); // Two-byte opcode prefix |
| 455 | break; |
| 456 | case X86II::D8: case X86II::D9: case X86II::DA: case X86II::DB: |
| 457 | case X86II::DC: case X86II::DD: case X86II::DE: case X86II::DF: |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 458 | MCE.emitByte(0xD8+ |
| 459 | (((Desc.TSFlags & X86II::Op0Mask)-X86II::D8) |
| 460 | >> X86II::Op0Shift)); |
Chris Lattner | 5ada8df | 2002-12-25 05:09:21 +0000 | [diff] [blame] | 461 | break; // Two-byte opcode prefix |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 462 | default: assert(0 && "Invalid prefix!"); |
| 463 | case 0: break; // No prefix! |
Chris Lattner | 5ada8df | 2002-12-25 05:09:21 +0000 | [diff] [blame] | 464 | } |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 465 | |
Chris Lattner | 5ae99fe | 2002-12-28 20:24:48 +0000 | [diff] [blame] | 466 | unsigned char BaseOpcode = II->getBaseOpcodeFor(Opcode); |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 467 | switch (Desc.TSFlags & X86II::FormMask) { |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 468 | default: assert(0 && "Unknown FormMask value in X86 MachineCodeEmitter!"); |
Chris Lattner | 5ada8df | 2002-12-25 05:09:21 +0000 | [diff] [blame] | 469 | case X86II::Pseudo: |
Chris Lattner | 02beda1 | 2003-08-05 00:48:47 +0000 | [diff] [blame] | 470 | if (Opcode != X86::IMPLICIT_USE && Opcode != X86::IMPLICIT_DEF) |
Chris Lattner | 9dedbcc | 2003-05-06 21:31:47 +0000 | [diff] [blame] | 471 | std::cerr << "X86 Machine Code Emitter: No 'form', not emitting: " << MI; |
Chris Lattner | 5ada8df | 2002-12-25 05:09:21 +0000 | [diff] [blame] | 472 | break; |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 473 | |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 474 | case X86II::RawFrm: |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 475 | MCE.emitByte(BaseOpcode); |
Chris Lattner | 8f04b09 | 2002-12-02 21:56:18 +0000 | [diff] [blame] | 476 | if (MI.getNumOperands() == 1) { |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 477 | MachineOperand &MO = MI.getOperand(0); |
| 478 | if (MO.isPCRelativeDisp()) { |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 479 | // Conditional branch... FIXME: this should use an MBB destination! |
| 480 | emitPCRelativeBlockAddress(cast<BasicBlock>(MO.getVRegValue())); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 481 | } else if (MO.isGlobalAddress()) { |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 482 | assert(MO.isPCRelative() && "Call target is not PC Relative?"); |
| 483 | emitGlobalAddressForCall(MO.getGlobal()); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 484 | } else if (MO.isExternalSymbol()) { |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 485 | unsigned Address = MCE.getGlobalValueAddress(MO.getSymbolName()); |
| 486 | assert(Address && "Unknown external symbol!"); |
| 487 | emitMaybePCRelativeValue(Address, MO.isPCRelative()); |
Chris Lattner | dbf30f7 | 2002-12-04 06:45:19 +0000 | [diff] [blame] | 488 | } else { |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 489 | assert(0 && "Unknown RawFrm operand!"); |
Chris Lattner | dbf30f7 | 2002-12-04 06:45:19 +0000 | [diff] [blame] | 490 | } |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 491 | } |
| 492 | break; |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 493 | |
| 494 | case X86II::AddRegFrm: |
| 495 | MCE.emitByte(BaseOpcode + getX86RegNum(MI.getOperand(0).getReg())); |
| 496 | if (MI.getNumOperands() == 2) { |
| 497 | MachineOperand &MO1 = MI.getOperand(1); |
| 498 | if (MO1.isImmediate() || MO1.getVRegValueOrNull() || |
| 499 | MO1.isGlobalAddress() || MO1.isExternalSymbol()) { |
| 500 | unsigned Size = sizeOfPtr(Desc); |
| 501 | if (Value *V = MO1.getVRegValueOrNull()) { |
| 502 | assert(Size == 4 && "Don't know how to emit non-pointer values!"); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 503 | emitGlobalAddressForPtr(cast<GlobalValue>(V)); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 504 | } else if (MO1.isGlobalAddress()) { |
| 505 | assert(Size == 4 && "Don't know how to emit non-pointer values!"); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 506 | assert(!MO1.isPCRelative() && "Function pointer ref is PC relative?"); |
| 507 | emitGlobalAddressForPtr(MO1.getGlobal()); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 508 | } else if (MO1.isExternalSymbol()) { |
| 509 | assert(Size == 4 && "Don't know how to emit non-pointer values!"); |
Chris Lattner | 04b0b30 | 2003-06-01 23:23:50 +0000 | [diff] [blame] | 510 | |
| 511 | unsigned Address = MCE.getGlobalValueAddress(MO1.getSymbolName()); |
| 512 | assert(Address && "Unknown external symbol!"); |
| 513 | emitMaybePCRelativeValue(Address, MO1.isPCRelative()); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 514 | } else { |
| 515 | emitConstant(MO1.getImmedValue(), Size); |
| 516 | } |
| 517 | } |
| 518 | } |
| 519 | break; |
| 520 | |
| 521 | case X86II::MRMDestReg: { |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 522 | MCE.emitByte(BaseOpcode); |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 523 | MachineOperand &SrcOp = MI.getOperand(1+II->isTwoAddrInstr(Opcode)); |
| 524 | emitRegModRMByte(MI.getOperand(0).getReg(), getX86RegNum(SrcOp.getReg())); |
| 525 | if (MI.getNumOperands() == 4) |
| 526 | emitConstant(MI.getOperand(3).getImmedValue(), sizeOfPtr(Desc)); |
Chris Lattner | 9dedbcc | 2003-05-06 21:31:47 +0000 | [diff] [blame] | 527 | break; |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 528 | } |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 529 | case X86II::MRMDestMem: |
| 530 | MCE.emitByte(BaseOpcode); |
| 531 | emitMemModRMByte(MI, 0, getX86RegNum(MI.getOperand(4).getReg())); |
| 532 | break; |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 533 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 534 | case X86II::MRMSrcReg: |
| 535 | MCE.emitByte(BaseOpcode); |
Chris Lattner | c01d123 | 2003-10-20 03:42:58 +0000 | [diff] [blame^] | 536 | |
| 537 | if (MI.getNumOperands() == 2) { |
| 538 | emitRegModRMByte(MI.getOperand(MI.getNumOperands()-1).getReg(), |
| 539 | getX86RegNum(MI.getOperand(0).getReg())); |
| 540 | } else if (MI.getOperand(2).isImmediate()) { |
| 541 | emitRegModRMByte(MI.getOperand(1).getReg(), |
| 542 | getX86RegNum(MI.getOperand(0).getReg())); |
| 543 | |
| 544 | emitConstant(MI.getOperand(2).getImmedValue(), sizeOfPtr(Desc)); |
| 545 | } else { |
| 546 | emitRegModRMByte(MI.getOperand(2).getReg(), |
| 547 | getX86RegNum(MI.getOperand(0).getReg())); |
| 548 | } |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 549 | break; |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 550 | |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 551 | case X86II::MRMSrcMem: |
| 552 | MCE.emitByte(BaseOpcode); |
| 553 | emitMemModRMByte(MI, MI.getNumOperands()-4, |
| 554 | getX86RegNum(MI.getOperand(0).getReg())); |
| 555 | break; |
| 556 | |
| 557 | case X86II::MRMS0r: case X86II::MRMS1r: |
| 558 | case X86II::MRMS2r: case X86II::MRMS3r: |
| 559 | case X86II::MRMS4r: case X86II::MRMS5r: |
| 560 | case X86II::MRMS6r: case X86II::MRMS7r: |
| 561 | MCE.emitByte(BaseOpcode); |
| 562 | emitRegModRMByte(MI.getOperand(0).getReg(), |
| 563 | (Desc.TSFlags & X86II::FormMask)-X86II::MRMS0r); |
| 564 | |
Chris Lattner | d909683 | 2002-12-15 08:01:39 +0000 | [diff] [blame] | 565 | if (MI.getOperand(MI.getNumOperands()-1).isImmediate()) { |
Misha Brukman | 5000e43 | 2002-12-13 02:13:15 +0000 | [diff] [blame] | 566 | unsigned Size = sizeOfPtr(Desc); |
Chris Lattner | ea1ddab | 2002-12-03 06:34:06 +0000 | [diff] [blame] | 567 | emitConstant(MI.getOperand(MI.getNumOperands()-1).getImmedValue(), Size); |
| 568 | } |
| 569 | break; |
Chris Lattner | e831b6b | 2003-01-13 00:33:59 +0000 | [diff] [blame] | 570 | |
| 571 | case X86II::MRMS0m: case X86II::MRMS1m: |
| 572 | case X86II::MRMS2m: case X86II::MRMS3m: |
| 573 | case X86II::MRMS4m: case X86II::MRMS5m: |
| 574 | case X86II::MRMS6m: case X86II::MRMS7m: |
| 575 | MCE.emitByte(BaseOpcode); |
| 576 | emitMemModRMByte(MI, 0, (Desc.TSFlags & X86II::FormMask)-X86II::MRMS0m); |
| 577 | |
| 578 | if (MI.getNumOperands() == 5) { |
| 579 | unsigned Size = sizeOfPtr(Desc); |
| 580 | emitConstant(MI.getOperand(4).getImmedValue(), Size); |
| 581 | } |
| 582 | break; |
Chris Lattner | 76041ce | 2002-12-02 21:44:34 +0000 | [diff] [blame] | 583 | } |
| 584 | } |