| //===-- X86JITInfo.cpp - Implement the JIT interfaces for the X86 target --===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file was developed by the LLVM research group and is distributed under |
| // the University of Illinois Open Source License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // This file implements the JIT interfaces for the X86 target. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #define DEBUG_TYPE "jit" |
| #include "X86JITInfo.h" |
| #include "X86Relocations.h" |
| #include "llvm/CodeGen/MachineCodeEmitter.h" |
| #include "llvm/Config/alloca.h" |
| #include <cstdlib> |
| #include <iostream> |
| using namespace llvm; |
| |
| #ifdef _MSC_VER |
| extern "C" void *_AddressOfReturnAddress(void); |
| #pragma intrinsic(_AddressOfReturnAddress) |
| #endif |
| |
| void X86JITInfo::replaceMachineCodeForFunction(void *Old, void *New) { |
| unsigned char *OldByte = (unsigned char *)Old; |
| *OldByte++ = 0xE9; // Emit JMP opcode. |
| unsigned *OldWord = (unsigned *)OldByte; |
| unsigned NewAddr = (intptr_t)New; |
| unsigned OldAddr = (intptr_t)OldWord; |
| *OldWord = NewAddr - OldAddr - 4; // Emit PC-relative addr of New code. |
| } |
| |
| |
| /// JITCompilerFunction - This contains the address of the JIT function used to |
| /// compile a function lazily. |
| static TargetJITInfo::JITCompilerFn JITCompilerFunction; |
| |
| // Provide a wrapper for X86CompilationCallback2 that saves non-traditional |
| // callee saved registers, for the fastcc calling convention. |
| extern "C" { |
| #if defined(__i386__) || defined(i386) || defined(_M_IX86) |
| #ifndef _MSC_VER |
| void X86CompilationCallback(void); |
| asm( |
| ".text\n" |
| ".align 8\n" |
| #if defined(__CYGWIN__) || defined(__APPLE__) |
| ".globl _X86CompilationCallback\n" |
| "_X86CompilationCallback:\n" |
| #else |
| ".globl X86CompilationCallback\n" |
| "X86CompilationCallback:\n" |
| #endif |
| "pushl %ebp\n" |
| "movl %esp, %ebp\n" // Standard prologue |
| "pushl %eax\n" |
| "pushl %edx\n" // save EAX/EDX |
| #if defined(__CYGWIN__) || defined(__APPLE__) |
| "call _X86CompilationCallback2\n" |
| #else |
| "call X86CompilationCallback2\n" |
| #endif |
| "popl %edx\n" |
| "popl %eax\n" |
| "popl %ebp\n" |
| "ret\n"); |
| #else |
| void X86CompilationCallback2(void); |
| |
| _declspec(naked) void X86CompilationCallback(void) { |
| __asm { |
| push eax |
| push edx |
| call X86CompilationCallback2 |
| pop edx |
| pop eax |
| ret |
| } |
| } |
| #endif // _MSC_VER |
| |
| #else // Not an i386 host |
| void X86CompilationCallback() { |
| std::cerr << "Cannot call X86CompilationCallback() on a non-x86 arch!\n"; |
| abort(); |
| } |
| #endif |
| } |
| |
| /// X86CompilationCallback - This is the target-specific function invoked by the |
| /// function stub when we did not know the real target of a call. This function |
| /// must locate the start of the stub or call site and pass it into the JIT |
| /// compiler function. |
| extern "C" void X86CompilationCallback2() { |
| #ifdef _MSC_VER |
| assert(sizeof(size_t) == 4); // FIXME: handle Win64 |
| unsigned *RetAddrLoc = (unsigned *)_AddressOfReturnAddress(); |
| RetAddrLoc += 3; // skip over ret addr, edx, eax |
| unsigned RetAddr = *RetAddrLoc; |
| #else |
| unsigned *StackPtr = (unsigned*)__builtin_frame_address(1); |
| unsigned RetAddr = (unsigned)(intptr_t)__builtin_return_address(1); |
| unsigned *RetAddrLoc = &StackPtr[1]; |
| |
| // NOTE: __builtin_frame_address doesn't work if frame pointer elimination has |
| // been performed. Having a variable sized alloca disables frame pointer |
| // elimination currently, even if it's dead. This is a gross hack. |
| alloca(10+(RetAddr >> 31)); |
| |
| #endif |
| assert(*RetAddrLoc == RetAddr && |
| "Could not find return address on the stack!"); |
| |
| // It's a stub if there is an interrupt marker after the call. |
| bool isStub = ((unsigned char*)(intptr_t)RetAddr)[0] == 0xCD; |
| |
| // The call instruction should have pushed the return value onto the stack... |
| RetAddr -= 4; // Backtrack to the reference itself... |
| |
| #if 0 |
| DEBUG(std::cerr << "In callback! Addr=" << (void*)RetAddr |
| << " ESP=" << (void*)StackPtr |
| << ": Resolving call to function: " |
| << TheVM->getFunctionReferencedName((void*)RetAddr) << "\n"); |
| #endif |
| |
| // Sanity check to make sure this really is a call instruction. |
| assert(((unsigned char*)(intptr_t)RetAddr)[-1] == 0xE8 &&"Not a call instr!"); |
| |
| unsigned NewVal = (intptr_t)JITCompilerFunction((void*)(intptr_t)RetAddr); |
| |
| // Rewrite the call target... so that we don't end up here every time we |
| // execute the call. |
| *(unsigned*)(intptr_t)RetAddr = NewVal-RetAddr-4; |
| |
| if (isStub) { |
| // If this is a stub, rewrite the call into an unconditional branch |
| // instruction so that two return addresses are not pushed onto the stack |
| // when the requested function finally gets called. This also makes the |
| // 0xCD byte (interrupt) dead, so the marker doesn't effect anything. |
| ((unsigned char*)(intptr_t)RetAddr)[-1] = 0xE9; |
| } |
| |
| // Change the return address to reexecute the call instruction... |
| *RetAddrLoc -= 5; |
| } |
| |
| TargetJITInfo::LazyResolverFn |
| X86JITInfo::getLazyResolverFunction(JITCompilerFn F) { |
| JITCompilerFunction = F; |
| return X86CompilationCallback; |
| } |
| |
| void *X86JITInfo::emitFunctionStub(void *Fn, MachineCodeEmitter &MCE) { |
| if (Fn != X86CompilationCallback) { |
| MCE.startFunctionStub(5); |
| MCE.emitByte(0xE9); |
| MCE.emitWord((intptr_t)Fn-MCE.getCurrentPCValue()-4); |
| return MCE.finishFunctionStub(0); |
| } |
| |
| MCE.startFunctionStub(6); |
| MCE.emitByte(0xE8); // Call with 32 bit pc-rel destination... |
| |
| MCE.emitWord((intptr_t)Fn-MCE.getCurrentPCValue()-4); |
| |
| MCE.emitByte(0xCD); // Interrupt - Just a marker identifying the stub! |
| return MCE.finishFunctionStub(0); |
| } |
| |
| /// relocate - Before the JIT can run a block of code that has been emitted, |
| /// it must rewrite the code to contain the actual addresses of any |
| /// referenced global symbols. |
| void X86JITInfo::relocate(void *Function, MachineRelocation *MR, |
| unsigned NumRelocs, unsigned char* GOTBase) { |
| for (unsigned i = 0; i != NumRelocs; ++i, ++MR) { |
| void *RelocPos = (char*)Function + MR->getMachineCodeOffset(); |
| intptr_t ResultPtr = (intptr_t)MR->getResultPointer(); |
| switch ((X86::RelocationType)MR->getRelocationType()) { |
| case X86::reloc_pcrel_word: |
| // PC relative relocation, add the relocated value to the value already in |
| // memory, after we adjust it for where the PC is. |
| ResultPtr = ResultPtr-(intptr_t)RelocPos-4; |
| *((intptr_t*)RelocPos) += ResultPtr; |
| break; |
| case X86::reloc_absolute_word: |
| // Absolute relocation, just add the relocated value to the value already |
| // in memory. |
| *((intptr_t*)RelocPos) += ResultPtr; |
| break; |
| } |
| } |
| } |