[Orc] Move delta-handling for trampoline sizes into the resolver block.
[oota-llvm.git] / lib / ExecutionEngine / Orc / OrcTargetSupport.cpp
1 #include "llvm/ADT/Triple.h"
2 #include "llvm/ExecutionEngine/Orc/OrcTargetSupport.h"
3 #include <array>
4
5 using namespace llvm::orc;
6
7 namespace {
8
// Names of the general-purpose registers that saveX86Regs pushes (in this
// order) and restoreX86Regs pops (in reverse order). The table is read-only,
// so it is declared const.
const std::array<const char *, 12> X86GPRsToSave = {{
    "rbp", "rbx", "r12", "r13", "r14", "r15", // Callee saved.
    "rdi", "rsi", "rdx", "rcx", "r8", "r9",   // Int args.
}};

// Names of the XMM registers that saveX86Regs spills to the stack and
// restoreX86Regs reloads. Each register is given a 16-byte stack slot.
const std::array<const char *, 8> X86XMMsToSave = {{
    "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7" // FP args
}};
17
18 template <typename OStream> unsigned saveX86Regs(OStream &OS) {
19   for (const auto &GPR : X86GPRsToSave)
20     OS << "  pushq   %" << GPR << "\n";
21
22   OS << "  subq    $" << (16 * X86XMMsToSave.size()) << ", %rsp\n";
23
24   for (unsigned i = 0; i < X86XMMsToSave.size(); ++i)
25     OS << "  movdqu  %" << X86XMMsToSave[i] << ", "
26        << (16 * (X86XMMsToSave.size() - i - 1)) << "(%rsp)\n";
27
28   return (8 * X86GPRsToSave.size()) + (16 * X86XMMsToSave.size());
29 }
30
31 template <typename OStream> void restoreX86Regs(OStream &OS) {
32   for (unsigned i = 0; i < X86XMMsToSave.size(); ++i)
33     OS << "  movdqu  " << (16 * i) << "(%rsp), %"
34        << X86XMMsToSave[(X86XMMsToSave.size() - i - 1)] << "\n";
35   OS << "  addq    $" << (16 * X86XMMsToSave.size()) << ", %rsp\n";
36
37   for (unsigned i = 0; i < X86GPRsToSave.size(); ++i)
38     OS << "  popq    %" << X86GPRsToSave[X86GPRsToSave.size() - i - 1] << "\n";
39 }
40
41 template <typename TargetT>
42 uint64_t executeCompileCallback(JITCompileCallbackManagerBase<TargetT> *JCBM,
43                                 TargetAddress CallbackID) {
44   return JCBM->executeCompileCallback(CallbackID);
45 }
46
47 }
48
49 namespace llvm {
50 namespace orc {
51
52 const char* OrcX86_64::ResolverBlockName = "orc_resolver_block";
53
54 void OrcX86_64::insertResolverBlock(
55     Module &M, JITCompileCallbackManagerBase<OrcX86_64> &JCBM) {
56   const unsigned X86_64_TrampolineLength = 6;
57   auto CallbackPtr = executeCompileCallback<OrcX86_64>;
58   uint64_t CallbackAddr =
59       static_cast<uint64_t>(reinterpret_cast<uintptr_t>(CallbackPtr));
60
61   std::ostringstream AsmStream;
62   Triple TT(M.getTargetTriple());
63
64   if (TT.getOS() == Triple::Darwin)
65     AsmStream << ".section __TEXT,__text,regular,pure_instructions\n"
66               << ".align 4, 0x90\n";
67   else
68     AsmStream << ".text\n"
69               << ".align 16, 0x90\n";
70
71   AsmStream << "jit_callback_manager_addr:\n"
72             << "  .quad " << &JCBM << "\n"
73             << ResolverBlockName << ":\n";
74
75   uint64_t ReturnAddrOffset = saveX86Regs(AsmStream);
76
77   // Compute index, load object address, and call JIT.
78   AsmStream << "  leaq    jit_callback_manager_addr(%rip), %rdi\n"
79             << "  movq    (%rdi), %rdi\n"
80             << "  movq    " << ReturnAddrOffset << "(%rsp), %rsi\n"
81             << "  subq    $" << X86_64_TrampolineLength << ", %rsi\n"
82             << "  movabsq $" << CallbackAddr << ", %rax\n"
83             << "  callq   *%rax\n"
84             << "  movq    %rax, " << ReturnAddrOffset << "(%rsp)\n";
85
86   restoreX86Regs(AsmStream);
87
88   AsmStream << "  retq\n";
89
90   M.appendModuleInlineAsm(AsmStream.str());
91 }
92
93 OrcX86_64::LabelNameFtor
94 OrcX86_64::insertCompileCallbackTrampolines(Module &M,
95                                             TargetAddress ResolverBlockAddr,
96                                             unsigned NumCalls,
97                                             unsigned StartIndex) {
98   const char *ResolverBlockPtrName = "Lorc_resolve_block_addr";
99
100   std::ostringstream AsmStream;
101   Triple TT(M.getTargetTriple());
102
103   if (TT.getOS() == Triple::Darwin)
104     AsmStream << ".section __TEXT,__text,regular,pure_instructions\n"
105               << ".align 4, 0x90\n";
106   else
107     AsmStream << ".text\n"
108               << ".align 16, 0x90\n";
109
110   AsmStream << ResolverBlockPtrName << ":\n"
111             << "  .quad " << ResolverBlockAddr << "\n";
112
113   auto GetLabelName =
114     [=](unsigned I) {
115       std::ostringstream LabelStream;
116       LabelStream << "orc_jcc_" << (StartIndex + I);
117       return LabelStream.str();
118   };
119
120   for (unsigned I = 0; I < NumCalls; ++I)
121     AsmStream << GetLabelName(I) << ":\n"
122               << "  callq *" << ResolverBlockPtrName << "(%rip)\n";
123
124   M.appendModuleInlineAsm(AsmStream.str());
125
126   return GetLabelName;
127 }
128
129 } // End namespace orc.
130 } // End namespace llvm.