Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 1 | #include "llvm/ADT/Triple.h" |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 2 | #include "llvm/ExecutionEngine/Orc/OrcTargetSupport.h" |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 3 | #include <array> |
| 4 | |
Lang Hames | e738061 | 2015-02-21 20:44:36 +0000 | [diff] [blame] | 5 | using namespace llvm::orc; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 6 | |
| 7 | namespace { |
| 8 | |
Lang Hames | 8389b55 | 2015-03-25 02:45:50 +0000 | [diff] [blame] | 9 | uint64_t executeCompileCallback(JITCompileCallbackManagerBase *JCBM, |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 10 | TargetAddress CallbackID) { |
| 11 | return JCBM->executeCompileCallback(CallbackID); |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 12 | } |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 13 | |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 14 | } |
| 15 | |
| 16 | namespace llvm { |
Lang Hames | e738061 | 2015-02-21 20:44:36 +0000 | [diff] [blame] | 17 | namespace orc { |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 18 | |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 19 | const char* OrcX86_64::ResolverBlockName = "orc_resolver_block"; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 20 | |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 21 | void OrcX86_64::insertResolverBlock( |
Lang Hames | 8389b55 | 2015-03-25 02:45:50 +0000 | [diff] [blame] | 22 | Module &M, JITCompileCallbackManagerBase &JCBM) { |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 23 | |
| 24 | // Trampoline code-sequence length, used to get trampoline address from return |
| 25 | // address. |
Lang Hames | cd118e7 | 2015-03-24 04:27:02 +0000 | [diff] [blame] | 26 | const unsigned X86_64_TrampolineLength = 6; |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 27 | |
Lang Hames | ed96cb7 | 2015-04-07 06:12:21 +0000 | [diff] [blame^] | 28 | // List of x86-64 GPRs to save. Note - RBP saved separately below. |
| 29 | std::array<const char *, 14> GPRs = {{ |
| 30 | "rax", "rbx", "rcx", "rdx", |
| 31 | "rsi", "rdi", "r8", "r9", |
| 32 | "r10", "r11", "r12", "r13", |
| 33 | "r14", "r15" |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 34 | }}; |
| 35 | |
| 36 | // Address of the executeCompileCallback function. |
NAKAMURA Takumi | cd5a367 | 2015-02-17 12:53:16 +0000 | [diff] [blame] | 37 | uint64_t CallbackAddr = |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 38 | static_cast<uint64_t>( |
| 39 | reinterpret_cast<uintptr_t>(executeCompileCallback)); |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 40 | |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 41 | std::ostringstream AsmStream; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 42 | Triple TT(M.getTargetTriple()); |
| 43 | |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 44 | // Switch to text section. |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 45 | if (TT.getOS() == Triple::Darwin) |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 46 | AsmStream << ".section __TEXT,__text,regular,pure_instructions\n" |
| 47 | << ".align 4, 0x90\n"; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 48 | else |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 49 | AsmStream << ".text\n" |
| 50 | << ".align 16, 0x90\n"; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 51 | |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 52 | // Bake in a pointer to the callback manager immediately before the |
| 53 | // start of the resolver function. |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 54 | AsmStream << "jit_callback_manager_addr:\n" |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 55 | << " .quad " << &JCBM << "\n"; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 56 | |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 57 | // Start the resolver function. |
| 58 | AsmStream << ResolverBlockName << ":\n" |
| 59 | << " pushq %rbp\n" |
| 60 | << " movq %rsp, %rbp\n"; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 61 | |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 62 | // Store the GPRs. |
| 63 | for (const auto &GPR : GPRs) |
| 64 | AsmStream << " pushq %" << GPR << "\n"; |
| 65 | |
| 66 | // Store floating-point state with FXSAVE. |
Lang Hames | ed96cb7 | 2015-04-07 06:12:21 +0000 | [diff] [blame^] | 67 | // Note: We need to keep the stack 16-byte aligned, so if we've emitted an odd |
| 68 | // number of 64-bit pushes so far (GPRs.size() plus 1 for RBP) then add |
| 69 | // an extra 64 bits of padding to the FXSave area. |
| 70 | unsigned Padding = (GPRs.size() + 1) % 2 ? 8 : 0; |
| 71 | unsigned FXSaveSize = 512 + Padding; |
| 72 | AsmStream << " subq $" << FXSaveSize << ", %rsp\n" |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 73 | << " fxsave (%rsp)\n" |
| 74 | |
| 75 | // Load callback manager address, compute trampoline address, call JIT. |
| 76 | << " lea jit_callback_manager_addr(%rip), %rdi\n" |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 77 | << " movq (%rdi), %rdi\n" |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 78 | << " movq 0x8(%rbp), %rsi\n" |
Lang Hames | cd118e7 | 2015-03-24 04:27:02 +0000 | [diff] [blame] | 79 | << " subq $" << X86_64_TrampolineLength << ", %rsi\n" |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 80 | << " movabsq $" << CallbackAddr << ", %rax\n" |
| 81 | << " callq *%rax\n" |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 82 | |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 83 | // Replace the return to the trampoline with the return address of the |
| 84 | // compiled function body. |
| 85 | << " movq %rax, 0x8(%rbp)\n" |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 86 | |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 87 | // Restore the floating point state. |
| 88 | << " fxrstor (%rsp)\n" |
Lang Hames | ed96cb7 | 2015-04-07 06:12:21 +0000 | [diff] [blame^] | 89 | << " addq $" << FXSaveSize << ", %rsp\n"; |
Lang Hames | e51ab6e | 2015-04-06 03:01:29 +0000 | [diff] [blame] | 90 | |
| 91 | for (const auto &GPR : make_range(GPRs.rbegin(), GPRs.rend())) |
| 92 | AsmStream << " popq %" << GPR << "\n"; |
| 93 | |
| 94 | // Restore original RBP and return to compiled function body. |
| 95 | AsmStream << " popq %rbp\n" |
| 96 | << " retq\n"; |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 97 | |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 98 | M.appendModuleInlineAsm(AsmStream.str()); |
Lang Hames | 93de2a1 | 2015-01-23 21:25:00 +0000 | [diff] [blame] | 99 | } |
Lang Hames | 2754714 | 2015-02-17 01:18:38 +0000 | [diff] [blame] | 100 | |
| 101 | OrcX86_64::LabelNameFtor |
| 102 | OrcX86_64::insertCompileCallbackTrampolines(Module &M, |
| 103 | TargetAddress ResolverBlockAddr, |
| 104 | unsigned NumCalls, |
| 105 | unsigned StartIndex) { |
| 106 | const char *ResolverBlockPtrName = "Lorc_resolve_block_addr"; |
| 107 | |
| 108 | std::ostringstream AsmStream; |
| 109 | Triple TT(M.getTargetTriple()); |
| 110 | |
| 111 | if (TT.getOS() == Triple::Darwin) |
| 112 | AsmStream << ".section __TEXT,__text,regular,pure_instructions\n" |
| 113 | << ".align 4, 0x90\n"; |
| 114 | else |
| 115 | AsmStream << ".text\n" |
| 116 | << ".align 16, 0x90\n"; |
| 117 | |
| 118 | AsmStream << ResolverBlockPtrName << ":\n" |
| 119 | << " .quad " << ResolverBlockAddr << "\n"; |
| 120 | |
| 121 | auto GetLabelName = |
| 122 | [=](unsigned I) { |
| 123 | std::ostringstream LabelStream; |
| 124 | LabelStream << "orc_jcc_" << (StartIndex + I); |
| 125 | return LabelStream.str(); |
| 126 | }; |
| 127 | |
| 128 | for (unsigned I = 0; I < NumCalls; ++I) |
| 129 | AsmStream << GetLabelName(I) << ":\n" |
| 130 | << " callq *" << ResolverBlockPtrName << "(%rip)\n"; |
| 131 | |
| 132 | M.appendModuleInlineAsm(AsmStream.str()); |
| 133 | |
| 134 | return GetLabelName; |
| 135 | } |
| 136 | |
Lang Hames | e738061 | 2015-02-21 20:44:36 +0000 | [diff] [blame] | 137 | } // End namespace orc. |
| 138 | } // End namespace llvm. |