1f12b8282SRafael Espindola //===- IRObjectFile.cpp - IR object file implementation ---------*- C++ -*-===// 2f12b8282SRafael Espindola // 3f12b8282SRafael Espindola // The LLVM Compiler Infrastructure 4f12b8282SRafael Espindola // 5f12b8282SRafael Espindola // This file is distributed under the University of Illinois Open Source 6f12b8282SRafael Espindola // License. See LICENSE.TXT for details. 7f12b8282SRafael Espindola // 8f12b8282SRafael Espindola //===----------------------------------------------------------------------===// 9f12b8282SRafael Espindola // 10f12b8282SRafael Espindola // Part of the IRObjectFile class implementation. 11f12b8282SRafael Espindola // 12f12b8282SRafael Espindola //===----------------------------------------------------------------------===// 13f12b8282SRafael Espindola 14ba79dba8SRafael Espindola #include "llvm/Object/IRObjectFile.h" 15ba79dba8SRafael Espindola #include "RecordStreamer.h" 160a446fd5SBenjamin Kramer #include "llvm/ADT/STLExtras.h" 17f12b8282SRafael Espindola #include "llvm/Bitcode/ReaderWriter.h" 18c3f9b5a5SRafael Espindola #include "llvm/IR/GVMaterializer.h" 19d9903888SChandler Carruth #include "llvm/IR/LLVMContext.h" 20a51f0f83SRafael Espindola #include "llvm/IR/Mangler.h" 21f12b8282SRafael Espindola #include "llvm/IR/Module.h" 2213b69d63SRafael Espindola #include "llvm/MC/MCAsmInfo.h" 2313b69d63SRafael Espindola #include "llvm/MC/MCContext.h" 2413b69d63SRafael Espindola #include "llvm/MC/MCInstrInfo.h" 2513b69d63SRafael Espindola #include "llvm/MC/MCObjectFileInfo.h" 2613b69d63SRafael Espindola #include "llvm/MC/MCParser/MCAsmParser.h" 27b3e8a6d2SBenjamin Kramer #include "llvm/MC/MCParser/MCTargetAsmParser.h" 28d9903888SChandler Carruth #include "llvm/MC/MCRegisterInfo.h" 2981902a3aSPete Cooper #include "llvm/MC/MCSubtargetInfo.h" 3010039c02SPeter Collingbourne #include "llvm/Object/ObjectFile.h" 312e60ca96SRafael Espindola #include "llvm/Support/MemoryBuffer.h" 3213b69d63SRafael Espindola #include "llvm/Support/SourceMgr.h" 3313b69d63SRafael Espindola #include "llvm/Support/TargetRegistry.h" 3423f04061SRafael Espindola #include "llvm/Support/raw_ostream.h" 35f12b8282SRafael Espindola using namespace llvm; 36f12b8282SRafael Espindola using namespace object; 37f12b8282SRafael Espindola 3848af1c2aSRafael Espindola IRObjectFile::IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> Mod) 3948af1c2aSRafael Espindola : SymbolicFile(Binary::ID_IR, Object), M(std::move(Mod)) { 40c233f74eSRafael Espindola Mang.reset(new Mangler()); 419ff43e40SMehdi Amini CollectAsmUndefinedRefs( 42*a0cb890fSMehdi Amini Triple(M->getTargetTriple()), M->getModuleInlineAsm(), 43*a0cb890fSMehdi Amini [this](StringRef Name, BasicSymbolRef::Flags Flags) { 449ff43e40SMehdi Amini AsmSymbols.push_back( 459ff43e40SMehdi Amini std::make_pair<std::string, uint32_t>(Name, std::move(Flags))); 46e9cffafdSMehdi Amini }); 47e9cffafdSMehdi Amini } 4813b69d63SRafael Espindola 49e9cffafdSMehdi Amini // Parse inline ASM and collect the list of symbols that are not defined in 50e9cffafdSMehdi Amini // the current module. This is inspired from IRObjectFile. 51e9cffafdSMehdi Amini void IRObjectFile::CollectAsmUndefinedRefs( 52*a0cb890fSMehdi Amini const Triple &TT, StringRef InlineAsm, 53e9cffafdSMehdi Amini const std::function<void(StringRef, BasicSymbolRef::Flags)> & 54e9cffafdSMehdi Amini AsmUndefinedRefs) { 5513b69d63SRafael Espindola if (InlineAsm.empty()) 5613b69d63SRafael Espindola return; 5713b69d63SRafael Espindola 5813b69d63SRafael Espindola std::string Err; 598d8b13dcSDaniel Sanders const Target *T = TargetRegistry::lookupTarget(TT.str(), Err); 6013b69d63SRafael Espindola if (!T) 6113b69d63SRafael Espindola return; 6213b69d63SRafael Espindola 638d8b13dcSDaniel Sanders std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str())); 6413b69d63SRafael Espindola if (!MRI) 6513b69d63SRafael Espindola return; 6613b69d63SRafael Espindola 678d8b13dcSDaniel Sanders std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str())); 6813b69d63SRafael Espindola if (!MAI) 6913b69d63SRafael Espindola return; 7013b69d63SRafael Espindola 7113b69d63SRafael Espindola std::unique_ptr<MCSubtargetInfo> STI( 728d8b13dcSDaniel Sanders T->createMCSubtargetInfo(TT.str(), "", "")); 7313b69d63SRafael Espindola if (!STI) 7413b69d63SRafael Espindola return; 7513b69d63SRafael Espindola 7613b69d63SRafael Espindola std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo()); 7713b69d63SRafael Espindola if (!MCII) 7813b69d63SRafael Espindola return; 7913b69d63SRafael Espindola 8013b69d63SRafael Espindola MCObjectFileInfo MOFI; 8113b69d63SRafael Espindola MCContext MCCtx(MAI.get(), MRI.get(), &MOFI); 828d8b13dcSDaniel Sanders MOFI.InitMCObjectFileInfo(TT, Reloc::Default, CodeModel::Default, MCCtx); 8313b69d63SRafael Espindola std::unique_ptr<RecordStreamer> Streamer(new RecordStreamer(MCCtx)); 8420c7259cSPeter Collingbourne T->createNullTargetStreamer(*Streamer); 8513b69d63SRafael Espindola 8613b69d63SRafael Espindola std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm)); 8713b69d63SRafael Espindola SourceMgr SrcMgr; 881961f14cSDavid Blaikie SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc()); 8913b69d63SRafael Espindola std::unique_ptr<MCAsmParser> Parser( 9013b69d63SRafael Espindola createMCAsmParser(SrcMgr, MCCtx, *Streamer, *MAI)); 9113b69d63SRafael Espindola 9213b69d63SRafael Espindola MCTargetOptions MCOptions; 9313b69d63SRafael Espindola std::unique_ptr<MCTargetAsmParser> TAP( 9413b69d63SRafael Espindola T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions)); 9513b69d63SRafael Espindola if (!TAP) 9613b69d63SRafael Espindola return; 9713b69d63SRafael Espindola 9813b69d63SRafael Espindola Parser->setTargetParser(*TAP); 9913b69d63SRafael Espindola if (Parser->Run(false)) 10013b69d63SRafael Espindola return; 10113b69d63SRafael Espindola 10213b69d63SRafael Espindola for (auto &KV : *Streamer) { 10313b69d63SRafael Espindola StringRef Key = KV.first(); 10413b69d63SRafael Espindola RecordStreamer::State Value = KV.second; 10513b69d63SRafael Espindola uint32_t Res = BasicSymbolRef::SF_None; 10613b69d63SRafael Espindola switch (Value) { 10713b69d63SRafael Espindola case RecordStreamer::NeverSeen: 10813b69d63SRafael Espindola llvm_unreachable("foo"); 10913b69d63SRafael Espindola case RecordStreamer::DefinedGlobal: 11013b69d63SRafael Espindola Res |= BasicSymbolRef::SF_Global; 11113b69d63SRafael Espindola break; 11213b69d63SRafael Espindola case RecordStreamer::Defined: 11313b69d63SRafael Espindola break; 11413b69d63SRafael Espindola case RecordStreamer::Global: 11513b69d63SRafael Espindola case RecordStreamer::Used: 11613b69d63SRafael Espindola Res |= BasicSymbolRef::SF_Undefined; 11713b69d63SRafael Espindola Res |= BasicSymbolRef::SF_Global; 11813b69d63SRafael Espindola break; 11913b69d63SRafael Espindola } 120e9cffafdSMehdi Amini AsmUndefinedRefs(Key, BasicSymbolRef::Flags(Res)); 12113b69d63SRafael Espindola } 122f12b8282SRafael Espindola } 123f12b8282SRafael Espindola 124dddd1fd9SRafael Espindola IRObjectFile::~IRObjectFile() { 125dddd1fd9SRafael Espindola } 126c3f9b5a5SRafael Espindola 127527e846eSRafael Espindola static GlobalValue *getGV(DataRefImpl &Symb) { 12813b69d63SRafael Espindola if ((Symb.p & 3) == 3) 12913b69d63SRafael Espindola return nullptr; 13013b69d63SRafael Espindola 13113b69d63SRafael Espindola return reinterpret_cast<GlobalValue*>(Symb.p & ~uintptr_t(3)); 132f12b8282SRafael Espindola } 133f12b8282SRafael Espindola 134f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_alias_iterator I, const Module &M) { 135f12b8282SRafael Espindola if (I == M.alias_end()) 136f12b8282SRafael Espindola return 3; 137f12b8282SRafael Espindola const GlobalValue *GV = &*I; 138f12b8282SRafael Espindola return reinterpret_cast<uintptr_t>(GV) | 2; 139f12b8282SRafael Espindola } 140f12b8282SRafael Espindola 141f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_global_iterator I, const Module &M) { 142f12b8282SRafael Espindola if (I == M.global_end()) 143f12b8282SRafael Espindola return skipEmpty(M.alias_begin(), M); 144f12b8282SRafael Espindola const GlobalValue *GV = &*I; 145f12b8282SRafael Espindola return reinterpret_cast<uintptr_t>(GV) | 1; 146f12b8282SRafael Espindola } 147f12b8282SRafael Espindola 148f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_iterator I, const Module &M) { 149f12b8282SRafael Espindola if (I == M.end()) 150f12b8282SRafael Espindola return skipEmpty(M.global_begin(), M); 151f12b8282SRafael Espindola const GlobalValue *GV = &*I; 152f12b8282SRafael Espindola return reinterpret_cast<uintptr_t>(GV) | 0; 153f12b8282SRafael Espindola } 154f12b8282SRafael Espindola 15513b69d63SRafael Espindola static unsigned getAsmSymIndex(DataRefImpl Symb) { 15613b69d63SRafael Espindola assert((Symb.p & uintptr_t(3)) == 3); 15713b69d63SRafael Espindola uintptr_t Index = Symb.p & ~uintptr_t(3); 15813b69d63SRafael Espindola Index >>= 2; 15913b69d63SRafael Espindola return Index; 16013b69d63SRafael Espindola } 16113b69d63SRafael Espindola 162f12b8282SRafael Espindola void IRObjectFile::moveSymbolNext(DataRefImpl &Symb) const { 16313b69d63SRafael Espindola const GlobalValue *GV = getGV(Symb); 164f12b8282SRafael Espindola uintptr_t Res; 16513b69d63SRafael Espindola 166f12b8282SRafael Espindola switch (Symb.p & 3) { 167f12b8282SRafael Espindola case 0: { 168f12b8282SRafael Espindola Module::const_iterator Iter(static_cast<const Function*>(GV)); 169f12b8282SRafael Espindola ++Iter; 17013b69d63SRafael Espindola Res = skipEmpty(Iter, *M); 171f12b8282SRafael Espindola break; 172f12b8282SRafael Espindola } 173f12b8282SRafael Espindola case 1: { 174f12b8282SRafael Espindola Module::const_global_iterator Iter(static_cast<const GlobalVariable*>(GV)); 175f12b8282SRafael Espindola ++Iter; 17613b69d63SRafael Espindola Res = skipEmpty(Iter, *M); 177f12b8282SRafael Espindola break; 178f12b8282SRafael Espindola } 179f12b8282SRafael Espindola case 2: { 180f12b8282SRafael Espindola Module::const_alias_iterator Iter(static_cast<const GlobalAlias*>(GV)); 181f12b8282SRafael Espindola ++Iter; 18213b69d63SRafael Espindola Res = skipEmpty(Iter, *M); 183f12b8282SRafael Espindola break; 184f12b8282SRafael Espindola } 18513b69d63SRafael Espindola case 3: { 18613b69d63SRafael Espindola unsigned Index = getAsmSymIndex(Symb); 18713b69d63SRafael Espindola assert(Index < AsmSymbols.size()); 18813b69d63SRafael Espindola ++Index; 18913b69d63SRafael Espindola Res = (Index << 2) | 3; 19013b69d63SRafael Espindola break; 19113b69d63SRafael Espindola } 192addddc44SMichael Ilseman default: 193addddc44SMichael Ilseman llvm_unreachable("unreachable case"); 194f12b8282SRafael Espindola } 195f12b8282SRafael Espindola 196f12b8282SRafael Espindola Symb.p = Res; 197f12b8282SRafael Espindola } 198f12b8282SRafael Espindola 199db4ed0bdSRafael Espindola std::error_code IRObjectFile::printSymbolName(raw_ostream &OS, 200f12b8282SRafael Espindola DataRefImpl Symb) const { 20113b69d63SRafael Espindola const GlobalValue *GV = getGV(Symb); 20213b69d63SRafael Espindola if (!GV) { 20313b69d63SRafael Espindola unsigned Index = getAsmSymIndex(Symb); 20413b69d63SRafael Espindola assert(Index <= AsmSymbols.size()); 20513b69d63SRafael Espindola OS << AsmSymbols[Index].first; 2067d099195SRui Ueyama return std::error_code(); 20713b69d63SRafael Espindola } 208a51f0f83SRafael Espindola 20982e657b5SPeter Collingbourne if (GV->hasDLLImportStorageClass()) 21082e657b5SPeter Collingbourne OS << "__imp_"; 21182e657b5SPeter Collingbourne 212a51f0f83SRafael Espindola if (Mang) 21313b69d63SRafael Espindola Mang->getNameWithPrefix(OS, GV, false); 214a51f0f83SRafael Espindola else 21513b69d63SRafael Espindola OS << GV->getName(); 216a51f0f83SRafael Espindola 2177d099195SRui Ueyama return std::error_code(); 218f12b8282SRafael Espindola } 219f12b8282SRafael Espindola 220f12b8282SRafael Espindola uint32_t IRObjectFile::getSymbolFlags(DataRefImpl Symb) const { 22113b69d63SRafael Espindola const GlobalValue *GV = getGV(Symb); 22213b69d63SRafael Espindola 22313b69d63SRafael Espindola if (!GV) { 22413b69d63SRafael Espindola unsigned Index = getAsmSymIndex(Symb); 22513b69d63SRafael Espindola assert(Index <= AsmSymbols.size()); 22613b69d63SRafael Espindola return AsmSymbols[Index].second; 22713b69d63SRafael Espindola } 228f12b8282SRafael Espindola 229f12b8282SRafael Espindola uint32_t Res = BasicSymbolRef::SF_None; 230d4bcefc7SRafael Espindola if (GV->isDeclarationForLinker()) 231f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Undefined; 232dc0dbe1fSKevin Enderby else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage()) 233dc0dbe1fSKevin Enderby Res |= BasicSymbolRef::SF_Hidden; 234dc0dbe1fSKevin Enderby if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) { 235dc0dbe1fSKevin Enderby if (GVar->isConstant()) 236dc0dbe1fSKevin Enderby Res |= BasicSymbolRef::SF_Const; 237dc0dbe1fSKevin Enderby } 23813b69d63SRafael Espindola if (GV->hasPrivateLinkage()) 239f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_FormatSpecific; 24013b69d63SRafael Espindola if (!GV->hasLocalLinkage()) 241f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Global; 24213b69d63SRafael Espindola if (GV->hasCommonLinkage()) 243f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Common; 2448d6fbc3aSRafael Espindola if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() || 2458d6fbc3aSRafael Espindola GV->hasExternalWeakLinkage()) 246f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Weak; 247f12b8282SRafael Espindola 2482dc0d9bdSRafael Espindola if (GV->getName().startswith("llvm.")) 249b674c17dSRafael Espindola Res |= BasicSymbolRef::SF_FormatSpecific; 2502dc0d9bdSRafael Espindola else if (auto *Var = dyn_cast<GlobalVariable>(GV)) { 2512dc0d9bdSRafael Espindola if (Var->getSection() == StringRef("llvm.metadata")) 2523885090bSRafael Espindola Res |= BasicSymbolRef::SF_FormatSpecific; 2533885090bSRafael Espindola } 2543885090bSRafael Espindola 255f12b8282SRafael Espindola return Res; 256f12b8282SRafael Espindola } 257f12b8282SRafael Espindola 258527e846eSRafael Espindola GlobalValue *IRObjectFile::getSymbolGV(DataRefImpl Symb) { return getGV(Symb); } 259f12b8282SRafael Espindola 26025a7e0a8SRafael Espindola std::unique_ptr<Module> IRObjectFile::takeModule() { return std::move(M); } 26125a7e0a8SRafael Espindola 262f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_begin_impl() const { 263f12b8282SRafael Espindola Module::const_iterator I = M->begin(); 264f12b8282SRafael Espindola DataRefImpl Ret; 265f12b8282SRafael Espindola Ret.p = skipEmpty(I, *M); 266f12b8282SRafael Espindola return basic_symbol_iterator(BasicSymbolRef(Ret, this)); 267f12b8282SRafael Espindola } 268f12b8282SRafael Espindola 269f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_end_impl() const { 270f12b8282SRafael Espindola DataRefImpl Ret; 27113b69d63SRafael Espindola uint64_t NumAsm = AsmSymbols.size(); 27213b69d63SRafael Espindola NumAsm <<= 2; 27313b69d63SRafael Espindola Ret.p = 3 | NumAsm; 274f12b8282SRafael Espindola return basic_symbol_iterator(BasicSymbolRef(Ret, this)); 275f12b8282SRafael Espindola } 276f12b8282SRafael Espindola 27710039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInObject(const ObjectFile &Obj) { 27810039c02SPeter Collingbourne for (const SectionRef &Sec : Obj.sections()) { 279f2fe0141SSteven Wu if (Sec.isBitcode()) { 28010039c02SPeter Collingbourne StringRef SecContents; 28110039c02SPeter Collingbourne if (std::error_code EC = Sec.getContents(SecContents)) 28210039c02SPeter Collingbourne return EC; 28310039c02SPeter Collingbourne return MemoryBufferRef(SecContents, Obj.getFileName()); 28410039c02SPeter Collingbourne } 28510039c02SPeter Collingbourne } 28610039c02SPeter Collingbourne 28710039c02SPeter Collingbourne return object_error::bitcode_section_not_found; 28810039c02SPeter Collingbourne } 28910039c02SPeter Collingbourne 29010039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInMemBuffer(MemoryBufferRef Object) { 29110039c02SPeter Collingbourne sys::fs::file_magic Type = sys::fs::identify_magic(Object.getBuffer()); 29210039c02SPeter Collingbourne switch (Type) { 29310039c02SPeter Collingbourne case sys::fs::file_magic::bitcode: 29410039c02SPeter Collingbourne return Object; 29510039c02SPeter Collingbourne case sys::fs::file_magic::elf_relocatable: 29610039c02SPeter Collingbourne case sys::fs::file_magic::macho_object: 29710039c02SPeter Collingbourne case sys::fs::file_magic::coff_object: { 2983fcdf6aeSKevin Enderby Expected<std::unique_ptr<ObjectFile>> ObjFile = 29910039c02SPeter Collingbourne ObjectFile::createObjectFile(Object, Type); 30010039c02SPeter Collingbourne if (!ObjFile) 3013fcdf6aeSKevin Enderby return errorToErrorCode(ObjFile.takeError()); 30210039c02SPeter Collingbourne return findBitcodeInObject(*ObjFile->get()); 30310039c02SPeter Collingbourne } 30410039c02SPeter Collingbourne default: 30510039c02SPeter Collingbourne return object_error::invalid_file_type; 30610039c02SPeter Collingbourne } 30710039c02SPeter Collingbourne } 30810039c02SPeter Collingbourne 30910a27df8SDavid Blaikie ErrorOr<std::unique_ptr<IRObjectFile>> 3105dec7eaaSRafael Espindola llvm::object::IRObjectFile::create(MemoryBufferRef Object, 31148af1c2aSRafael Espindola LLVMContext &Context) { 31210039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> BCOrErr = findBitcodeInMemBuffer(Object); 31310039c02SPeter Collingbourne if (!BCOrErr) 31410039c02SPeter Collingbourne return BCOrErr.getError(); 31548af1c2aSRafael Espindola 316cf981625SRafael Espindola std::unique_ptr<MemoryBuffer> Buff = 317cf981625SRafael Espindola MemoryBuffer::getMemBuffer(BCOrErr.get(), false); 31848af1c2aSRafael Espindola 319dcd1dca2SRafael Espindola ErrorOr<std::unique_ptr<Module>> MOrErr = 3209d2bfc48SRafael Espindola getLazyBitcodeModule(std::move(Buff), Context, 321cba833a0SRafael Espindola /*ShouldLazyLoadMetadata*/ true); 322dddd1fd9SRafael Espindola if (std::error_code EC = MOrErr.getError()) 323f12b8282SRafael Espindola return EC; 324dddd1fd9SRafael Espindola 325dcd1dca2SRafael Espindola std::unique_ptr<Module> &M = MOrErr.get(); 32610a27df8SDavid Blaikie return llvm::make_unique<IRObjectFile>(Object, std::move(M)); 327f12b8282SRafael Espindola } 328