1 //===-- llvm-rtdyld.cpp - MCJIT Testing Tool ------------------------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This is a testing tool for use with the MC-JIT LLVM components.
12 //===----------------------------------------------------------------------===//
14 #include "llvm/ADT/StringMap.h"
15 #include "llvm/DebugInfo/DIContext.h"
16 #include "llvm/DebugInfo/DWARF/DWARFContext.h"
17 #include "llvm/ExecutionEngine/RTDyldMemoryManager.h"
18 #include "llvm/ExecutionEngine/RuntimeDyld.h"
19 #include "llvm/ExecutionEngine/RuntimeDyldChecker.h"
20 #include "llvm/MC/MCAsmInfo.h"
21 #include "llvm/MC/MCContext.h"
22 #include "llvm/MC/MCDisassembler.h"
23 #include "llvm/MC/MCInstPrinter.h"
24 #include "llvm/MC/MCInstrInfo.h"
25 #include "llvm/MC/MCRegisterInfo.h"
26 #include "llvm/MC/MCSubtargetInfo.h"
27 #include "llvm/Object/MachO.h"
28 #include "llvm/Support/CommandLine.h"
29 #include "llvm/Support/DynamicLibrary.h"
30 #include "llvm/Support/ManagedStatic.h"
31 #include "llvm/Support/Memory.h"
32 #include "llvm/Support/MemoryBuffer.h"
33 #include "llvm/Support/PrettyStackTrace.h"
34 #include "llvm/Support/Signals.h"
35 #include "llvm/Support/TargetRegistry.h"
36 #include "llvm/Support/TargetSelect.h"
37 #include "llvm/Support/raw_ostream.h"
39 #include <system_error>
42 using namespace llvm::object;
// Command-line options, declared with the llvm::cl facilities.
// NOTE(review): the original line numbers embedded at the start of each line
// skip values in this run (for example 46 -> 50 and 71 -> 73), so several
// declarations are only partly visible here; confirm against the complete
// file before changing any of them.

// Positional list of input files; cl::ZeroOrMore allows it to be empty.
44 static cl::list<std::string>
45 InputFileList(cl::Positional, cl::ZeroOrMore,
46 cl::desc("<input file>"));
// Two of the action enumerators; the enum header and the remaining
// enumerators are not visible in this view.
50 AC_PrintObjectLineInfo,
52 AC_PrintDebugLineInfo,
// Selects the action to perform. Each clEnumValN entry ties an enumerator to
// its flag name and its help text.
56 static cl::opt<ActionType>
57 Action(cl::desc("Action to perform:"),
59 cl::values(clEnumValN(AC_Execute, "execute",
60 "Load, link, and execute the inputs."),
61 clEnumValN(AC_PrintLineInfo, "printline",
62 "Load, link, and print line information for each function."),
63 clEnumValN(AC_PrintDebugLineInfo, "printdebugline",
64 "Load, link, and print line information for each function using the debug object"),
// NOTE(review): the help text below refers to -printlineinfo, while the flag
// registered for AC_PrintLineInfo above is printline; confirm which spelling
// is intended.
65 clEnumValN(AC_PrintObjectLineInfo, "printobjline",
66 "Like -printlineinfo but does not load the object first"),
67 clEnumValN(AC_Verify, "verify",
68 "Load, link and verify the resulting memory image."),
// String option described as the function to call as the entry point. The
// line naming the option is not visible here; executeInput reads a variable
// called EntryPoint, presumably this one.
71 static cl::opt<std::string>
73 cl::desc("Function to call as entry point."),
// List option described as adding a library. The naming line is not visible;
// presumably this is the Dylibs list iterated by loadDylibs.
76 static cl::list<std::string>
78 cl::desc("Add library."),
// Target triple string; linkAndVerify requires it to be non-empty.
81 static cl::opt<std::string>
82 TripleName("triple", cl::desc("Target triple for disassembler"));
// List option naming files that contain RuntimeDyld verifier checks. The
// naming line is not visible; presumably this is the CheckFiles list read by
// checkAllExpressions.
84 static cl::list<std::string>
86 cl::desc("File containing RuntimeDyld verifier checks."),
// First address of the phony target address range used by remapSections.
89 static cl::opt<uint64_t>
90 TargetAddrStart("target-addr-start",
91 cl::desc("For -verify only: start of phony target address "
93 cl::init(4096), // Start at "page 1" - no allocating at "null".
// Last address of the phony target address range. remapSections overrides the
// default for 16-bit and 32-bit triples when the flag was not passed.
96 static cl::opt<uint64_t>
97 TargetAddrEnd("target-addr-end",
98 cl::desc("For -verify only: end of phony target address range."),
// Gap that remapSections leaves between consecutive sections.
102 static cl::opt<uint64_t>
103 TargetSectionSep("target-section-sep",
104 cl::desc("For -verify only: Separation between sections in "
105 "phony target address space."),
// Explicit section-to-address mappings, parsed by
// applySpecificSectionMappings.
109 static cl::list<std::string>
110 SpecificSectionMappings("map-section",
111 cl::desc("Map a section to a specific address."),
116 // A trivial memory manager that doesn't do anything fancy, just uses the
117 // support library allocation routines directly.
// NOTE(review): the embedded line numbers skip 119, 122, 124, 129 and
// 132-134, so the access specifier, one parameter line and the body of
// getPointerToNamedFunction are not visible in this view.
118 class TrivialMemoryManager : public RTDyldMemoryManager {
// Blocks handed out by allocateCodeSection, in allocation order.
120 SmallVector<sys::MemoryBlock, 16> FunctionMemory;
// Blocks handed out by allocateDataSection, in allocation order.
121 SmallVector<sys::MemoryBlock, 16> DataMemory;
// Section allocation overrides; both are defined out of line below the class.
123 uint8_t *allocateCodeSection(uintptr_t Size, unsigned Alignment,
125 StringRef SectionName) override;
126 uint8_t *allocateDataSection(uintptr_t Size, unsigned Alignment,
127 unsigned SectionID, StringRef SectionName,
128 bool IsReadOnly) override;
// Symbol lookup override; its body lines are not visible here.
130 void *getPointerToNamedFunction(const std::string &Name,
131 bool AbortOnFailure = true) override {
// Performs no work and always returns false; ErrMsg is never written.
135 bool finalizeMemory(std::string *ErrMsg) override { return false; }
137 // Invalidate instruction cache for sections with execute permissions.
138 // Some platforms with separate data cache and instruction cache require
139 // explicit cache flush, otherwise JIT code manipulations (like resolved
140 // relocations) will get to the data cache but not to the instruction cache.
141 virtual void invalidateInstructionCache();
// Allocates a block of Size bytes with sys::Memory::AllocateRWX, records it in
// FunctionMemory and returns the block's base address.
// NOTE(review): SectionName is not referenced by the visible body, and the
// block returned by AllocateRWX is used without any visible failure check
// (the error-string argument is passed as nullptr). The parameter lines
// between Size and SectionName are missing from this view.
144 uint8_t *TrivialMemoryManager::allocateCodeSection(uintptr_t Size,
147 StringRef SectionName) {
148 sys::MemoryBlock MB = sys::Memory::AllocateRWX(Size, nullptr, nullptr);
149 FunctionMemory.push_back(MB);
150 return (uint8_t*)MB.base();
// Allocates a block of Size bytes with sys::Memory::AllocateRWX, records it in
// DataMemory and returns the block's base address.
// NOTE(review): data sections are allocated with the same RWX call as code
// sections; SectionName is not referenced by the visible body and the
// allocation result is used without any visible failure check. Some parameter
// lines of this definition are missing from this view.
153 uint8_t *TrivialMemoryManager::allocateDataSection(uintptr_t Size,
156 StringRef SectionName,
158 sys::MemoryBlock MB = sys::Memory::AllocateRWX(Size, nullptr, nullptr);
159 DataMemory.push_back(MB);
160 return (uint8_t*)MB.base();
163 void TrivialMemoryManager::invalidateInstructionCache() {
164 for (int i = 0, e = FunctionMemory.size(); i != e; ++i)
165 sys::Memory::InvalidateInstructionCache(FunctionMemory[i].base(),
166 FunctionMemory[i].size());
168 for (int i = 0, e = DataMemory.size(); i != e; ++i)
169 sys::Memory::InvalidateInstructionCache(DataMemory[i].base(),
170 DataMemory[i].size());
// Name the tool was invoked as: main assigns argv[0] to it, and Message
// prefixes every diagnostic with it.
173 static const char *ProgramName;
175 static void Message(const char *Type, const Twine &Msg) {
176 errs() << ProgramName << ": " << Type << ": " << Msg << "\n";
// Reports Msg through Message with the type string error.
// NOTE(review): the return statement is not visible in this view (the
// embedded numbering stops at 180). Callers return the result of Error
// directly from int functions, so it is presumably a failure exit status;
// confirm the value.
179 static int Error(const Twine &Msg) {
180 Message("error", Msg);
// Loads every library named in Dylibs into the process with
// sys::DynamicLibrary::LoadLibraryPermanently. Failures are reported on the
// error stream; no visible line aborts the run or returns a status.
// NOTE(review): the declaration of ErrMsg, the tail of the load-failure
// message and the branch keyword introducing the not-found message are on
// lines missing from this view (187, 190, 191).
184 static void loadDylibs() {
185 for (const std::string &Dylib : Dylibs) {
// Only paths that name a regular file are handed to the loader.
186 if (sys::fs::is_regular_file(Dylib)) {
188 if (sys::DynamicLibrary::LoadLibraryPermanently(Dylib.c_str(), &ErrMsg))
189 llvm::errs() << "Error loading '" << Dylib << "': "
192 llvm::errs() << "Dylib not found: '" << Dylib << "'.\n";
// Prints, for every function symbol of every input object, the function's
// name, size and address followed by the line-table entries that cover it.
//
// LoadObjects: asserted to be true whenever UseDebugObj is true; also read
//              when deciding whether to rebase symbol addresses.
// UseDebugObj: when false (and LoadObjects is true) symbol addresses are
//              rebased onto section load addresses before the DWARF query.
// Returns the result of Error on the visible failure paths; the success
// return is not visible in this view.
//
// NOTE(review): many lines are missing from this view (the embedded numbering
// has gaps), including the conditions guarding the load / resolve /
// debug-object steps, the early-continue statements after failed symbol
// queries, and several local declarations (Addr, Name, Size, SecName).
// Confirm against the complete file before relying on control-flow details.
198 static int printLineInfoForInput(bool LoadObjects, bool UseDebugObj) {
199 assert(LoadObjects || !UseDebugObj);
201 // Load any dylibs requested on the command line.
204 // If we don't have any input files, read from stdin.
205 if (!InputFileList.size())
206 InputFileList.push_back("-");
// Each input gets its own memory manager and dynamic linker instance.
207 for(unsigned i = 0, e = InputFileList.size(); i != e; ++i) {
208 // Instantiate a dynamic linker.
209 TrivialMemoryManager MemMgr;
210 RuntimeDyld Dyld(MemMgr, MemMgr);
212 // Load the input memory buffer.
214 ErrorOr<std::unique_ptr<MemoryBuffer>> InputBuffer =
215 MemoryBuffer::getFileOrSTDIN(InputFileList[i]);
216 if (std::error_code EC = InputBuffer.getError())
217 return Error("unable to read input: '" + EC.message() + "'");
// Parse the buffer as an object file.
219 ErrorOr<std::unique_ptr<ObjectFile>> MaybeObj(
220 ObjectFile::createObjectFile((*InputBuffer)->getMemBufferRef()));
222 if (std::error_code EC = MaybeObj.getError())
223 return Error("unable to create object file: '" + EC.message() + "'");
225 ObjectFile &Obj = **MaybeObj;
// SymbolObj starts out as the input object and is redirected to the debug
// object further down.
227 OwningBinary<ObjectFile> DebugObj;
228 std::unique_ptr<RuntimeDyld::LoadedObjectInfo> LoadedObjInfo = nullptr;
229 ObjectFile *SymbolObj = &Obj;
231 // Load the object file
233 Dyld.loadObject(Obj);
236 return Error(Dyld.getErrorString());
238 // Resolve all the relocations we can.
239 Dyld.resolveRelocations();
// Switch symbol iteration over to the object produced for debugging.
242 DebugObj = LoadedObjInfo->getObjectForDebug(Obj);
243 SymbolObj = DebugObj.getBinary();
// DWARF context used for the line-table queries below.
247 std::unique_ptr<DIContext> Context(
248 new DWARFContextInMemory(*SymbolObj,LoadedObjInfo.get()));
250 // FIXME: This is generally useful. Figure out a place in lib/Object to
251 // put utility functions.
// For non-ELF objects, collect per section the addresses of its function
// symbols together with the section's end address. After sorting, the entry
// following a function's address is used below to compute the function size.
252 std::map<object::SectionRef, std::vector<uint64_t>> FuncAddresses;
253 if (!isa<ELFObjectFileBase>(SymbolObj)) {
254 for (object::SymbolRef Sym : SymbolObj->symbols()) {
255 object::SymbolRef::Type SymType;
256 if (Sym.getType(SymType))
258 if (SymType != object::SymbolRef::ST_Function)
261 if (Sym.getAddress(Addr))
263 object::section_iterator Sec = SymbolObj->section_end();
264 if (Sym.getSection(Sec))
266 std::vector<uint64_t> &Addrs = FuncAddresses[*Sec];
// Section end address (address + size); the condition guarding this push is
// not visible here.
268 uint64_t SecAddr = Sec->getAddress();
269 uint64_t SecSize = Sec->getSize();
270 Addrs.push_back(SecAddr + SecSize);
272 Addrs.push_back(Addr);
274 for (auto &Pair : FuncAddresses) {
275 std::vector<uint64_t> &Addrs = Pair.second;
276 array_pod_sort(Addrs.begin(), Addrs.end());
280 // Use symbol info to iterate functions in the object.
281 for (object::SymbolRef Sym : SymbolObj->symbols()) {
282 object::SymbolRef::Type SymType;
283 if (Sym.getType(SymType))
285 if (SymType == object::SymbolRef::ST_Function) {
288 if (Sym.getName(Name))
290 if (Sym.getAddress(Addr))
// ELF symbols report their own size; for other formats the size is the
// distance to the next recorded address in the same section.
294 if (isa<ELFObjectFileBase>(SymbolObj)) {
295 Size = Sym.getSize();
297 object::section_iterator Sec = SymbolObj->section_end();
298 if (Sym.getSection(Sec))
300 const std::vector<uint64_t> &Addrs = FuncAddresses[*Sec];
301 auto AddrI = std::find(Addrs.begin(), Addrs.end(), Addr);
302 assert(AddrI != Addrs.end() && (AddrI + 1) != Addrs.end());
303 assert(*AddrI == Addr);
304 Size = *(AddrI + 1) - Addr;
307 // If we're not using the debug object, compute the address of the
308 // symbol in memory (rather than that in the unrelocated object file)
309 // and use that to query the DWARFContext.
310 if (!UseDebugObj && LoadObjects) {
311 object::section_iterator Sec(SymbolObj->section_end());
314 Sec->getName(SecName);
// A load address of 0 leaves Addr unchanged.
315 uint64_t SectionLoadAddress =
316 LoadedObjInfo->getSectionLoadAddress(SecName);
317 if (SectionLoadAddress != 0)
318 Addr += SectionLoadAddress - Sec->getAddress();
321 outs() << "Function: " << Name << ", Size = " << Size << ", Addr = " << Addr << "\n";
// Each table entry is printed with its offset from the function start
// (entry address minus Addr), then file name and line.
323 DILineInfoTable Lines = Context->getLineInfoForAddressRange(Addr, Size);
324 DILineInfoTable::iterator Begin = Lines.begin();
325 DILineInfoTable::iterator End = Lines.end();
326 for (DILineInfoTable::iterator It = Begin; It != End; ++It) {
327 outs() << " Line info @ " << It->first - Addr << ": "
328 << It->second.FileName << ", line:" << It->second.Line << "\n";
// Loads all input objects into a single RuntimeDyld instance, resolves
// relocations, marks the code blocks executable and calls the EntryPoint
// symbol with an argc of 1.
// Returns the value returned by the called function, or the result of Error
// on the visible failure paths.
//
// NOTE(review): some lines are missing from this view (the embedded numbering
// has gaps), including the condition that guards the
// 'no definition for' error and whatever is stored in Argv[1].
337 static int executeInput() {
338 // Load any dylibs requested on the command line.
341 // Instantiate a dynamic linker.
342 TrivialMemoryManager MemMgr;
343 RuntimeDyld Dyld(MemMgr, MemMgr);
345 // FIXME: Preserve buffers until resolveRelocations time to work around a bug
346 // in RuntimeDyldELF.
347 // This fixme should be fixed ASAP. This is a very brittle workaround.
348 std::vector<std::unique_ptr<MemoryBuffer>> InputBuffers;
350 // If we don't have any input files, read from stdin.
351 if (!InputFileList.size())
352 InputFileList.push_back("-");
353 for(unsigned i = 0, e = InputFileList.size(); i != e; ++i) {
354 // Load the input memory buffer.
355 ErrorOr<std::unique_ptr<MemoryBuffer>> InputBuffer =
356 MemoryBuffer::getFileOrSTDIN(InputFileList[i]);
357 if (std::error_code EC = InputBuffer.getError())
358 return Error("unable to read input: '" + EC.message() + "'");
359 ErrorOr<std::unique_ptr<ObjectFile>> MaybeObj(
360 ObjectFile::createObjectFile((*InputBuffer)->getMemBufferRef()));
362 if (std::error_code EC = MaybeObj.getError())
363 return Error("unable to create object file: '" + EC.message() + "'");
// The buffer is moved into InputBuffers so that it outlives this iteration.
365 ObjectFile &Obj = **MaybeObj;
366 InputBuffers.push_back(std::move(*InputBuffer));
368 // Load the object file
369 Dyld.loadObject(Obj);
370 if (Dyld.hasError()) {
371 return Error(Dyld.getErrorString());
375 // Resolve all the relocations we can.
376 Dyld.resolveRelocations();
377 // Clear instruction cache before code will be executed.
378 MemMgr.invalidateInstructionCache();
380 // FIXME: Error out if there are unresolved relocations.
382 // Get the address of the entry point (_main by default).
383 void *MainAddress = Dyld.getSymbolLocalAddress(EntryPoint);
385 return Error("no definition for '" + EntryPoint + "'");
// NOTE(review): the instruction cache of each code block is invalidated again
// in this loop, after the invalidateInstructionCache call above.
387 // Invalidate the instruction cache for each loaded function.
388 for (unsigned i = 0, e = MemMgr.FunctionMemory.size(); i != e; ++i) {
389 sys::MemoryBlock &Data = MemMgr.FunctionMemory[i];
390 // Make sure the memory is executable.
391 std::string ErrorStr;
392 sys::Memory::InvalidateInstructionCache(Data.base(), Data.size());
393 if (!sys::Memory::setExecutable(Data, &ErrorStr))
394 return Error("unable to mark function executable: '" + ErrorStr + "'");
397 // Dispatch to _main().
398 errs() << "loaded '" << EntryPoint << "' at: " << (void*)MainAddress << "\n";
// The address is converted through uintptr_t to a pointer to a function
// taking (int, const char**) and returning int.
400 int (*Main)(int, const char**) =
401 (int(*)(int,const char**)) uintptr_t(MainAddress);
// NOTE(review): Argv is allocated with new[] and no matching delete[] is
// visible in this block.
402 const char **Argv = new const char*[2];
403 // Use the name of the first input object module as argv[0] for the target.
404 Argv[0] = InputFileList[0].c_str();
406 return Main(1, Argv);
// Runs the rules found in every file listed in CheckFiles through Checker.
// Each file is read with MemoryBuffer::getFileOrSTDIN and passed to
// checkAllRulesInBuffer together with the rule prefix string. Returns the
// result of Error as soon as a file cannot be read or a check fails.
// NOTE(review): the tail of the read-error message and the return taken when
// every file passes are on lines missing from this view (415, 420-422).
409 static int checkAllExpressions(RuntimeDyldChecker &Checker) {
410 for (const auto& CheckerFileName : CheckFiles) {
411 ErrorOr<std::unique_ptr<MemoryBuffer>> CheckerFileBuf =
412 MemoryBuffer::getFileOrSTDIN(CheckerFileName);
413 if (std::error_code EC = CheckerFileBuf.getError())
414 return Error("unable to read input '" + CheckerFileName + "': " +
417 if (!Checker.checkAllRulesInBuffer("# rtdyld-check:",
418 CheckerFileBuf.get().get()))
419 return Error("some checks in '" + CheckerFileName + "' failed");
// Applies the section mappings given in SpecificSectionMappings. Each entry
// has the form <file name>,<section name>=<addr>. For every entry the
// section's current address is looked up through Checker, the section is
// remapped to the requested address, and the pair is recorded.
// Returns a map from the old (local) section address to the new address.
// NOTE(review): what happens after each diagnostic on the error paths is on
// lines missing from this view; the declarations of OldAddrInt and NewAddr
// are missing as well.
424 static std::map<void *, uint64_t>
425 applySpecificSectionMappings(RuntimeDyldChecker &Checker) {
427 std::map<void*, uint64_t> SpecificMappings;
429 for (StringRef Mapping : SpecificSectionMappings) {
// Everything before the first = is the section identifier.
// NOTE(review): ComaIdx is computed on the whole Mapping but used below as an
// index into SectionIDStr; the two agree only when the comma comes before the
// = sign. Confirm this is intended.
431 size_t EqualsIdx = Mapping.find_first_of("=");
432 StringRef SectionIDStr = Mapping.substr(0, EqualsIdx);
433 size_t ComaIdx = Mapping.find_first_of(",");
435 if (ComaIdx == StringRef::npos) {
436 errs() << "Invalid section specification '" << Mapping
437 << "'. Should be '<file name>,<section name>=<addr>'\n";
441 StringRef FileName = SectionIDStr.substr(0, ComaIdx);
442 StringRef SectionName = SectionIDStr.substr(ComaIdx + 1);
// getSectionAddr yields an (address, error message) pair; a non-empty
// message signals failure.
445 std::string ErrorMsg;
446 std::tie(OldAddrInt, ErrorMsg) =
447 Checker.getSectionAddr(FileName, SectionName, true);
449 if (ErrorMsg != "") {
454 void* OldAddr = reinterpret_cast<void*>(static_cast<uintptr_t>(OldAddrInt));
// Everything after the = is the new address; getAsInteger returning true is
// treated as a parse failure here.
456 StringRef NewAddrStr = Mapping.substr(EqualsIdx + 1);
459 if (NewAddrStr.getAsInteger(0, NewAddr)) {
460 errs() << "Invalid section address in mapping: " << Mapping << "\n";
464 Checker.getRTDyld().mapSectionAddress(OldAddr, NewAddr);
465 SpecificMappings[OldAddr] = NewAddr;
468 return SpecificMappings;
471 // Scatter sections in all directions!
472 // Remaps section addresses for -verify mode. The following command line options
473 // can be used to customize the layout of the memory within the phony target's
475 // -target-addr-start <s> -- Specify where the phony target address range starts.
476 // -target-addr-end <e> -- Specify where the phony target address range ends.
477 // -target-section-sep <d> -- Specify how big a gap should be left between the
478 // end of one section and the start of the next.
479 // Defaults to zero. Set to something big
480 // (e.g. 1 << 32) to stress-test stubs, GOTs, etc.
// Assigns a target address to every section allocated through MemMgr and
// registers it with the RuntimeDyld owned by Checker.
//
// TargetTriple: used only to pick a default for TargetAddrEnd when that flag
//               was not passed on the command line.
// MemMgr:       source of the (base, size) pairs for code and data sections.
// Checker:      provides the RuntimeDyld on which mapSectionAddress is called.
//
// NOTE(review): some loop-control lines are missing from this view (the
// embedded numbering has gaps), including the declaration of Worklist, the
// iterator advance / removal in the first loop and the branch keywords inside
// the placement scan.
482 static void remapSections(const llvm::Triple &TargetTriple,
483 const TrivialMemoryManager &MemMgr,
484 RuntimeDyldChecker &Checker) {
486 // Set up a work list (section addr/size pairs).
487 typedef std::list<std::pair<void*, uint64_t>> WorklistT;
490 for (const auto& CodeSection : MemMgr.FunctionMemory)
491 Worklist.push_back(std::make_pair(CodeSection.base(), CodeSection.size()));
492 for (const auto& DataSection : MemMgr.DataMemory)
493 Worklist.push_back(std::make_pair(DataSection.base(), DataSection.size()));
495 // Apply any section-specific mappings that were requested on the command
497 typedef std::map<void*, uint64_t> AppliedMappingsT;
498 AppliedMappingsT AppliedMappings = applySpecificSectionMappings(Checker);
500 // Keep an "already allocated" mapping of section target addresses to sizes.
501 // Sections whose address mappings aren't specified on the command line will
502 // be allocated around the explicitly mapped sections while maintaining the
503 // minimum separation.
504 std::map<uint64_t, uint64_t> AlreadyAllocated;
506 // Move the previously applied mappings into the already-allocated map.
507 for (WorklistT::iterator I = Worklist.begin(), E = Worklist.end();
509 WorklistT::iterator Tmp = I;
// Worklist entries are matched to applied mappings by their local base
// address.
511 AppliedMappingsT::iterator AI = AppliedMappings.find(Tmp->first);
513 if (AI != AppliedMappings.end()) {
514 AlreadyAllocated[AI->second] = Tmp->second;
519 // If the -target-addr-end option wasn't explicitly passed, then set it to a
520 // sensible default based on the target triple.
521 if (TargetAddrEnd.getNumOccurrences() == 0) {
522 if (TargetTriple.isArch16Bit())
523 TargetAddrEnd = (1ULL << 16) - 1;
524 else if (TargetTriple.isArch32Bit())
525 TargetAddrEnd = (1ULL << 32) - 1;
526 // TargetAddrEnd already has a sensible default for 64-bit systems, so
527 // there's nothing to do in the 64-bit case.
530 // Process any elements remaining in the worklist.
531 while (!Worklist.empty()) {
532 std::pair<void*, uint64_t> CurEntry = Worklist.front();
533 Worklist.pop_front();
// Scan the existing allocations in ascending address order (std::map
// iteration order), starting from TargetAddrStart. The candidate address
// either fits in front of the current allocation (section size plus
// TargetSectionSep) or is moved past that allocation plus the separation.
// NOTE(review): no visible line in this block compares the chosen address
// against TargetAddrEnd; confirm whether the end of the range is enforced.
535 uint64_t NextSectionAddr = TargetAddrStart;
537 for (const auto &Alloc : AlreadyAllocated)
538 if (NextSectionAddr + CurEntry.second + TargetSectionSep <= Alloc.first)
541 NextSectionAddr = Alloc.first + Alloc.second + TargetSectionSep;
543 AlreadyAllocated[NextSectionAddr] = CurEntry.second;
544 Checker.getRTDyld().mapSectionAddress(CurEntry.first, NextSectionAddr);
549 // Load and link the objects specified on the command line, but do not execute
550 // anything. Instead, attach a RuntimeDyldChecker instance and call it to
551 // verify the correctness of the linked memory.
// Implements the verify action: builds the MC components needed for
// disassembly from TripleName, loads every input object into one RuntimeDyld
// instance, remaps sections into the phony target address space, resolves
// relocations, registers EH frames and runs the checker rules.
//
// NOTE(review): several lines are missing from this view (the embedded
// numbering has gaps), including the returns after the triple / target
// diagnostics, the condition testing TheTarget, the final arguments of the
// RuntimeDyldChecker constructor and the function's final return.
552 static int linkAndVerify() {
554 // Check for missing triple.
555 if (TripleName == "") {
556 llvm::errs() << "Error: -triple required when running in -verify mode.\n";
560 // Look up the target and build the disassembler.
561 Triple TheTriple(Triple::normalize(TripleName));
562 std::string ErrorStr;
563 const Target *TheTarget =
564 TargetRegistry::lookupTarget("", TheTriple, ErrorStr);
566 llvm::errs() << "Error accessing target '" << TripleName << "': "
// TripleName is overwritten with the triple string held by TheTriple after
// the lookup.
570 TripleName = TheTriple.getTriple();
// The MC objects below are created through TheTarget; creation failures are
// caught only by assert, and MII / InstPrinter have no visible check.
572 std::unique_ptr<MCSubtargetInfo> STI(
573 TheTarget->createMCSubtargetInfo(TripleName, "", ""));
574 assert(STI && "Unable to create subtarget info!");
576 std::unique_ptr<MCRegisterInfo> MRI(TheTarget->createMCRegInfo(TripleName));
577 assert(MRI && "Unable to create target register info!");
579 std::unique_ptr<MCAsmInfo> MAI(TheTarget->createMCAsmInfo(*MRI, TripleName));
580 assert(MAI && "Unable to create target asm info!");
582 MCContext Ctx(MAI.get(), MRI.get(), nullptr);
584 std::unique_ptr<MCDisassembler> Disassembler(
585 TheTarget->createMCDisassembler(*STI, Ctx));
586 assert(Disassembler && "Unable to create disassembler!");
588 std::unique_ptr<MCInstrInfo> MII(TheTarget->createMCInstrInfo());
590 std::unique_ptr<MCInstPrinter> InstPrinter(
591 TheTarget->createMCInstPrinter(Triple(TripleName), 0, *MAI, *MII, *MRI));
593 // Load any dylibs requested on the command line.
596 // Instantiate a dynamic linker.
597 TrivialMemoryManager MemMgr;
598 RuntimeDyld Dyld(MemMgr, MemMgr);
599 Dyld.setProcessAllSections(true);
600 RuntimeDyldChecker Checker(Dyld, Disassembler.get(), InstPrinter.get(),
603 // FIXME: Preserve buffers until resolveRelocations time to work around a bug
604 // in RuntimeDyldELF.
605 // This fixme should be fixed ASAP. This is a very brittle workaround.
606 std::vector<std::unique_ptr<MemoryBuffer>> InputBuffers;
608 // If we don't have any input files, read from stdin.
609 if (!InputFileList.size())
610 InputFileList.push_back("-");
611 for(unsigned i = 0, e = InputFileList.size(); i != e; ++i) {
612 // Load the input memory buffer.
613 ErrorOr<std::unique_ptr<MemoryBuffer>> InputBuffer =
614 MemoryBuffer::getFileOrSTDIN(InputFileList[i]);
616 if (std::error_code EC = InputBuffer.getError())
617 return Error("unable to read input: '" + EC.message() + "'");
619 ErrorOr<std::unique_ptr<ObjectFile>> MaybeObj(
620 ObjectFile::createObjectFile((*InputBuffer)->getMemBufferRef()));
622 if (std::error_code EC = MaybeObj.getError())
623 return Error("unable to create object file: '" + EC.message() + "'");
// The buffer is moved into InputBuffers so that it outlives this iteration.
625 ObjectFile &Obj = **MaybeObj;
626 InputBuffers.push_back(std::move(*InputBuffer));
628 // Load the object file
629 Dyld.loadObject(Obj);
630 if (Dyld.hasError()) {
631 return Error(Dyld.getErrorString());
635 // Re-map the section addresses into the phony target address space.
636 remapSections(TheTriple, MemMgr, Checker);
638 // Resolve all the relocations we can.
639 Dyld.resolveRelocations();
641 // Register EH frames.
642 Dyld.registerEHFrames();
// The checker result is captured first; a RuntimeDyld error is then reported
// separately on the error stream.
644 int ErrorCode = checkAllExpressions(Checker);
645 if (Dyld.hasError()) {
646 errs() << "RTDyld reported an error applying relocations:\n "
647 << Dyld.getErrorString() << "\n";
// Tool entry point: installs the crash handlers, records the program name,
// initializes all target infos, target MCs and disassemblers, parses the
// command line and dispatches to the handler for the selected action.
// NOTE(review): the switch header and the case labels in front of the
// executeInput and linkAndVerify calls are on lines missing from this view;
// presumably the switch is on Action and those cases are AC_Execute and
// AC_Verify.
654 int main(int argc, char **argv) {
655 sys::PrintStackTraceOnErrorSignal();
656 PrettyStackTraceProgram X(argc, argv);
// ProgramName is what Message prefixes to every diagnostic.
658 ProgramName = argv[0];
659 llvm_shutdown_obj Y; // Call llvm_shutdown() on exit.
661 llvm::InitializeAllTargetInfos();
662 llvm::InitializeAllTargetMCs();
663 llvm::InitializeAllDisassemblers();
665 cl::ParseCommandLineOptions(argc, argv, "llvm MC-JIT tool\n");
669 return executeInput();
// The three line-info actions share one implementation and differ only in
// the two flags passed.
670 case AC_PrintDebugLineInfo:
671 return printLineInfoForInput(/* LoadObjects */ true,/* UseDebugObj */ true);
672 case AC_PrintLineInfo:
673 return printLineInfoForInput(/* LoadObjects */ true,/* UseDebugObj */false);
674 case AC_PrintObjectLineInfo:
675 return printLineInfoForInput(/* LoadObjects */false,/* UseDebugObj */false);
677 return linkAndVerify();