1f12b8282SRafael Espindola //===- IRObjectFile.cpp - IR object file implementation ---------*- C++ -*-===// 2f12b8282SRafael Espindola // 3f12b8282SRafael Espindola // The LLVM Compiler Infrastructure 4f12b8282SRafael Espindola // 5f12b8282SRafael Espindola // This file is distributed under the University of Illinois Open Source 6f12b8282SRafael Espindola // License. See LICENSE.TXT for details. 7f12b8282SRafael Espindola // 8f12b8282SRafael Espindola //===----------------------------------------------------------------------===// 9f12b8282SRafael Espindola // 10f12b8282SRafael Espindola // Part of the IRObjectFile class implementation. 11f12b8282SRafael Espindola // 12f12b8282SRafael Espindola //===----------------------------------------------------------------------===// 13f12b8282SRafael Espindola 14ba79dba8SRafael Espindola #include "llvm/Object/IRObjectFile.h" 15ba79dba8SRafael Espindola #include "RecordStreamer.h" 160a446fd5SBenjamin Kramer #include "llvm/ADT/STLExtras.h" 17f12b8282SRafael Espindola #include "llvm/Bitcode/ReaderWriter.h" 18c3f9b5a5SRafael Espindola #include "llvm/IR/GVMaterializer.h" 19d9903888SChandler Carruth #include "llvm/IR/LLVMContext.h" 20a51f0f83SRafael Espindola #include "llvm/IR/Mangler.h" 21f12b8282SRafael Espindola #include "llvm/IR/Module.h" 2213b69d63SRafael Espindola #include "llvm/MC/MCAsmInfo.h" 2313b69d63SRafael Espindola #include "llvm/MC/MCContext.h" 2413b69d63SRafael Espindola #include "llvm/MC/MCInstrInfo.h" 2513b69d63SRafael Espindola #include "llvm/MC/MCObjectFileInfo.h" 2613b69d63SRafael Espindola #include "llvm/MC/MCParser/MCAsmParser.h" 27b3e8a6d2SBenjamin Kramer #include "llvm/MC/MCParser/MCTargetAsmParser.h" 28d9903888SChandler Carruth #include "llvm/MC/MCRegisterInfo.h" 2981902a3aSPete Cooper #include "llvm/MC/MCSubtargetInfo.h" 3010039c02SPeter Collingbourne #include "llvm/Object/ObjectFile.h" 312e60ca96SRafael Espindola #include "llvm/Support/MemoryBuffer.h" 3213b69d63SRafael Espindola #include "llvm/Support/SourceMgr.h" 3313b69d63SRafael Espindola #include "llvm/Support/TargetRegistry.h" 3423f04061SRafael Espindola #include "llvm/Support/raw_ostream.h" 35f12b8282SRafael Espindola using namespace llvm; 36f12b8282SRafael Espindola using namespace object; 37f12b8282SRafael Espindola 3848af1c2aSRafael Espindola IRObjectFile::IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> Mod) 3948af1c2aSRafael Espindola : SymbolicFile(Binary::ID_IR, Object), M(std::move(Mod)) { 40c233f74eSRafael Espindola Mang.reset(new Mangler()); 41*9ff43e40SMehdi Amini CollectAsmUndefinedRefs( 42*9ff43e40SMehdi Amini *M, [this](StringRef Name, BasicSymbolRef::Flags Flags) { 43*9ff43e40SMehdi Amini AsmSymbols.push_back( 44*9ff43e40SMehdi Amini std::make_pair<std::string, uint32_t>(Name, std::move(Flags))); 45e9cffafdSMehdi Amini }); 46e9cffafdSMehdi Amini } 4713b69d63SRafael Espindola 48e9cffafdSMehdi Amini // Parse inline ASM and collect the list of symbols that are not defined in 49e9cffafdSMehdi Amini // the current module. This is inspired from IRObjectFile. 50e9cffafdSMehdi Amini void IRObjectFile::CollectAsmUndefinedRefs( 51e9cffafdSMehdi Amini Module &TheModule, 52e9cffafdSMehdi Amini const std::function<void(StringRef, BasicSymbolRef::Flags)> & 53e9cffafdSMehdi Amini AsmUndefinedRefs) { 54e9cffafdSMehdi Amini 55e9cffafdSMehdi Amini const std::string &InlineAsm = TheModule.getModuleInlineAsm(); 5613b69d63SRafael Espindola if (InlineAsm.empty()) 5713b69d63SRafael Espindola return; 5813b69d63SRafael Espindola 59e9cffafdSMehdi Amini Triple TT(TheModule.getTargetTriple()); 6013b69d63SRafael Espindola std::string Err; 618d8b13dcSDaniel Sanders const Target *T = TargetRegistry::lookupTarget(TT.str(), Err); 6213b69d63SRafael Espindola if (!T) 6313b69d63SRafael Espindola return; 6413b69d63SRafael Espindola 658d8b13dcSDaniel Sanders std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str())); 6613b69d63SRafael Espindola if (!MRI) 6713b69d63SRafael Espindola return; 6813b69d63SRafael Espindola 698d8b13dcSDaniel Sanders std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str())); 7013b69d63SRafael Espindola if (!MAI) 7113b69d63SRafael Espindola return; 7213b69d63SRafael Espindola 7313b69d63SRafael Espindola std::unique_ptr<MCSubtargetInfo> STI( 748d8b13dcSDaniel Sanders T->createMCSubtargetInfo(TT.str(), "", "")); 7513b69d63SRafael Espindola if (!STI) 7613b69d63SRafael Espindola return; 7713b69d63SRafael Espindola 7813b69d63SRafael Espindola std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo()); 7913b69d63SRafael Espindola if (!MCII) 8013b69d63SRafael Espindola return; 8113b69d63SRafael Espindola 8213b69d63SRafael Espindola MCObjectFileInfo MOFI; 8313b69d63SRafael Espindola MCContext MCCtx(MAI.get(), MRI.get(), &MOFI); 848d8b13dcSDaniel Sanders MOFI.InitMCObjectFileInfo(TT, Reloc::Default, CodeModel::Default, MCCtx); 8513b69d63SRafael Espindola std::unique_ptr<RecordStreamer> Streamer(new RecordStreamer(MCCtx)); 8620c7259cSPeter Collingbourne T->createNullTargetStreamer(*Streamer); 8713b69d63SRafael Espindola 8813b69d63SRafael Espindola std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm)); 8913b69d63SRafael Espindola SourceMgr SrcMgr; 901961f14cSDavid Blaikie SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc()); 9113b69d63SRafael Espindola std::unique_ptr<MCAsmParser> Parser( 9213b69d63SRafael Espindola createMCAsmParser(SrcMgr, MCCtx, *Streamer, *MAI)); 9313b69d63SRafael Espindola 9413b69d63SRafael Espindola MCTargetOptions MCOptions; 9513b69d63SRafael Espindola std::unique_ptr<MCTargetAsmParser> TAP( 9613b69d63SRafael Espindola T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions)); 9713b69d63SRafael Espindola if (!TAP) 9813b69d63SRafael Espindola return; 9913b69d63SRafael Espindola 10013b69d63SRafael Espindola Parser->setTargetParser(*TAP); 10113b69d63SRafael Espindola if (Parser->Run(false)) 10213b69d63SRafael Espindola return; 10313b69d63SRafael Espindola 10413b69d63SRafael Espindola for (auto &KV : *Streamer) { 10513b69d63SRafael Espindola StringRef Key = KV.first(); 10613b69d63SRafael Espindola RecordStreamer::State Value = KV.second; 10713b69d63SRafael Espindola uint32_t Res = BasicSymbolRef::SF_None; 10813b69d63SRafael Espindola switch (Value) { 10913b69d63SRafael Espindola case RecordStreamer::NeverSeen: 11013b69d63SRafael Espindola llvm_unreachable("foo"); 11113b69d63SRafael Espindola case RecordStreamer::DefinedGlobal: 11213b69d63SRafael Espindola Res |= BasicSymbolRef::SF_Global; 11313b69d63SRafael Espindola break; 11413b69d63SRafael Espindola case RecordStreamer::Defined: 11513b69d63SRafael Espindola break; 11613b69d63SRafael Espindola case RecordStreamer::Global: 11713b69d63SRafael Espindola case RecordStreamer::Used: 11813b69d63SRafael Espindola Res |= BasicSymbolRef::SF_Undefined; 11913b69d63SRafael Espindola Res |= BasicSymbolRef::SF_Global; 12013b69d63SRafael Espindola break; 12113b69d63SRafael Espindola } 122e9cffafdSMehdi Amini AsmUndefinedRefs(Key, BasicSymbolRef::Flags(Res)); 12313b69d63SRafael Espindola } 124f12b8282SRafael Espindola } 125f12b8282SRafael Espindola 126dddd1fd9SRafael Espindola IRObjectFile::~IRObjectFile() { 127dddd1fd9SRafael Espindola } 128c3f9b5a5SRafael Espindola 129527e846eSRafael Espindola static GlobalValue *getGV(DataRefImpl &Symb) { 13013b69d63SRafael Espindola if ((Symb.p & 3) == 3) 13113b69d63SRafael Espindola return nullptr; 13213b69d63SRafael Espindola 13313b69d63SRafael Espindola return reinterpret_cast<GlobalValue*>(Symb.p & ~uintptr_t(3)); 134f12b8282SRafael Espindola } 135f12b8282SRafael Espindola 136f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_alias_iterator I, const Module &M) { 137f12b8282SRafael Espindola if (I == M.alias_end()) 138f12b8282SRafael Espindola return 3; 139f12b8282SRafael Espindola const GlobalValue *GV = &*I; 140f12b8282SRafael Espindola return reinterpret_cast<uintptr_t>(GV) | 2; 141f12b8282SRafael Espindola } 142f12b8282SRafael Espindola 143f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_global_iterator I, const Module &M) { 144f12b8282SRafael Espindola if (I == M.global_end()) 145f12b8282SRafael Espindola return skipEmpty(M.alias_begin(), M); 146f12b8282SRafael Espindola const GlobalValue *GV = &*I; 147f12b8282SRafael Espindola return reinterpret_cast<uintptr_t>(GV) | 1; 148f12b8282SRafael Espindola } 149f12b8282SRafael Espindola 150f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_iterator I, const Module &M) { 151f12b8282SRafael Espindola if (I == M.end()) 152f12b8282SRafael Espindola return skipEmpty(M.global_begin(), M); 153f12b8282SRafael Espindola const GlobalValue *GV = &*I; 154f12b8282SRafael Espindola return reinterpret_cast<uintptr_t>(GV) | 0; 155f12b8282SRafael Espindola } 156f12b8282SRafael Espindola 15713b69d63SRafael Espindola static unsigned getAsmSymIndex(DataRefImpl Symb) { 15813b69d63SRafael Espindola assert((Symb.p & uintptr_t(3)) == 3); 15913b69d63SRafael Espindola uintptr_t Index = Symb.p & ~uintptr_t(3); 16013b69d63SRafael Espindola Index >>= 2; 16113b69d63SRafael Espindola return Index; 16213b69d63SRafael Espindola } 16313b69d63SRafael Espindola 164f12b8282SRafael Espindola void IRObjectFile::moveSymbolNext(DataRefImpl &Symb) const { 16513b69d63SRafael Espindola const GlobalValue *GV = getGV(Symb); 166f12b8282SRafael Espindola uintptr_t Res; 16713b69d63SRafael Espindola 168f12b8282SRafael Espindola switch (Symb.p & 3) { 169f12b8282SRafael Espindola case 0: { 170f12b8282SRafael Espindola Module::const_iterator Iter(static_cast<const Function*>(GV)); 171f12b8282SRafael Espindola ++Iter; 17213b69d63SRafael Espindola Res = skipEmpty(Iter, *M); 173f12b8282SRafael Espindola break; 174f12b8282SRafael Espindola } 175f12b8282SRafael Espindola case 1: { 176f12b8282SRafael Espindola Module::const_global_iterator Iter(static_cast<const GlobalVariable*>(GV)); 177f12b8282SRafael Espindola ++Iter; 17813b69d63SRafael Espindola Res = skipEmpty(Iter, *M); 179f12b8282SRafael Espindola break; 180f12b8282SRafael Espindola } 181f12b8282SRafael Espindola case 2: { 182f12b8282SRafael Espindola Module::const_alias_iterator Iter(static_cast<const GlobalAlias*>(GV)); 183f12b8282SRafael Espindola ++Iter; 18413b69d63SRafael Espindola Res = skipEmpty(Iter, *M); 185f12b8282SRafael Espindola break; 186f12b8282SRafael Espindola } 18713b69d63SRafael Espindola case 3: { 18813b69d63SRafael Espindola unsigned Index = getAsmSymIndex(Symb); 18913b69d63SRafael Espindola assert(Index < AsmSymbols.size()); 19013b69d63SRafael Espindola ++Index; 19113b69d63SRafael Espindola Res = (Index << 2) | 3; 19213b69d63SRafael Espindola break; 19313b69d63SRafael Espindola } 194addddc44SMichael Ilseman default: 195addddc44SMichael Ilseman llvm_unreachable("unreachable case"); 196f12b8282SRafael Espindola } 197f12b8282SRafael Espindola 198f12b8282SRafael Espindola Symb.p = Res; 199f12b8282SRafael Espindola } 200f12b8282SRafael Espindola 201db4ed0bdSRafael Espindola std::error_code IRObjectFile::printSymbolName(raw_ostream &OS, 202f12b8282SRafael Espindola DataRefImpl Symb) const { 20313b69d63SRafael Espindola const GlobalValue *GV = getGV(Symb); 20413b69d63SRafael Espindola if (!GV) { 20513b69d63SRafael Espindola unsigned Index = getAsmSymIndex(Symb); 20613b69d63SRafael Espindola assert(Index <= AsmSymbols.size()); 20713b69d63SRafael Espindola OS << AsmSymbols[Index].first; 2087d099195SRui Ueyama return std::error_code(); 20913b69d63SRafael Espindola } 210a51f0f83SRafael Espindola 21182e657b5SPeter Collingbourne if (GV->hasDLLImportStorageClass()) 21282e657b5SPeter Collingbourne OS << "__imp_"; 21382e657b5SPeter Collingbourne 214a51f0f83SRafael Espindola if (Mang) 21513b69d63SRafael Espindola Mang->getNameWithPrefix(OS, GV, false); 216a51f0f83SRafael Espindola else 21713b69d63SRafael Espindola OS << GV->getName(); 218a51f0f83SRafael Espindola 2197d099195SRui Ueyama return std::error_code(); 220f12b8282SRafael Espindola } 221f12b8282SRafael Espindola 222f12b8282SRafael Espindola uint32_t IRObjectFile::getSymbolFlags(DataRefImpl Symb) const { 22313b69d63SRafael Espindola const GlobalValue *GV = getGV(Symb); 22413b69d63SRafael Espindola 22513b69d63SRafael Espindola if (!GV) { 22613b69d63SRafael Espindola unsigned Index = getAsmSymIndex(Symb); 22713b69d63SRafael Espindola assert(Index <= AsmSymbols.size()); 22813b69d63SRafael Espindola return AsmSymbols[Index].second; 22913b69d63SRafael Espindola } 230f12b8282SRafael Espindola 231f12b8282SRafael Espindola uint32_t Res = BasicSymbolRef::SF_None; 232d4bcefc7SRafael Espindola if (GV->isDeclarationForLinker()) 233f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Undefined; 234dc0dbe1fSKevin Enderby else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage()) 235dc0dbe1fSKevin Enderby Res |= BasicSymbolRef::SF_Hidden; 236dc0dbe1fSKevin Enderby if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) { 237dc0dbe1fSKevin Enderby if (GVar->isConstant()) 238dc0dbe1fSKevin Enderby Res |= BasicSymbolRef::SF_Const; 239dc0dbe1fSKevin Enderby } 24013b69d63SRafael Espindola if (GV->hasPrivateLinkage()) 241f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_FormatSpecific; 24213b69d63SRafael Espindola if (!GV->hasLocalLinkage()) 243f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Global; 24413b69d63SRafael Espindola if (GV->hasCommonLinkage()) 245f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Common; 2468d6fbc3aSRafael Espindola if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() || 2478d6fbc3aSRafael Espindola GV->hasExternalWeakLinkage()) 248f12b8282SRafael Espindola Res |= BasicSymbolRef::SF_Weak; 249f12b8282SRafael Espindola 2502dc0d9bdSRafael Espindola if (GV->getName().startswith("llvm.")) 251b674c17dSRafael Espindola Res |= BasicSymbolRef::SF_FormatSpecific; 2522dc0d9bdSRafael Espindola else if (auto *Var = dyn_cast<GlobalVariable>(GV)) { 2532dc0d9bdSRafael Espindola if (Var->getSection() == StringRef("llvm.metadata")) 2543885090bSRafael Espindola Res |= BasicSymbolRef::SF_FormatSpecific; 2553885090bSRafael Espindola } 2563885090bSRafael Espindola 257f12b8282SRafael Espindola return Res; 258f12b8282SRafael Espindola } 259f12b8282SRafael Espindola 260527e846eSRafael Espindola GlobalValue *IRObjectFile::getSymbolGV(DataRefImpl Symb) { return getGV(Symb); } 261f12b8282SRafael Espindola 26225a7e0a8SRafael Espindola std::unique_ptr<Module> IRObjectFile::takeModule() { return std::move(M); } 26325a7e0a8SRafael Espindola 264f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_begin_impl() const { 265f12b8282SRafael Espindola Module::const_iterator I = M->begin(); 266f12b8282SRafael Espindola DataRefImpl Ret; 267f12b8282SRafael Espindola Ret.p = skipEmpty(I, *M); 268f12b8282SRafael Espindola return basic_symbol_iterator(BasicSymbolRef(Ret, this)); 269f12b8282SRafael Espindola } 270f12b8282SRafael Espindola 271f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_end_impl() const { 272f12b8282SRafael Espindola DataRefImpl Ret; 27313b69d63SRafael Espindola uint64_t NumAsm = AsmSymbols.size(); 27413b69d63SRafael Espindola NumAsm <<= 2; 27513b69d63SRafael Espindola Ret.p = 3 | NumAsm; 276f12b8282SRafael Espindola return basic_symbol_iterator(BasicSymbolRef(Ret, this)); 277f12b8282SRafael Espindola } 278f12b8282SRafael Espindola 27910039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInObject(const ObjectFile &Obj) { 28010039c02SPeter Collingbourne for (const SectionRef &Sec : Obj.sections()) { 281f2fe0141SSteven Wu if (Sec.isBitcode()) { 28210039c02SPeter Collingbourne StringRef SecContents; 28310039c02SPeter Collingbourne if (std::error_code EC = Sec.getContents(SecContents)) 28410039c02SPeter Collingbourne return EC; 28510039c02SPeter Collingbourne return MemoryBufferRef(SecContents, Obj.getFileName()); 28610039c02SPeter Collingbourne } 28710039c02SPeter Collingbourne } 28810039c02SPeter Collingbourne 28910039c02SPeter Collingbourne return object_error::bitcode_section_not_found; 29010039c02SPeter Collingbourne } 29110039c02SPeter Collingbourne 29210039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInMemBuffer(MemoryBufferRef Object) { 29310039c02SPeter Collingbourne sys::fs::file_magic Type = sys::fs::identify_magic(Object.getBuffer()); 29410039c02SPeter Collingbourne switch (Type) { 29510039c02SPeter Collingbourne case sys::fs::file_magic::bitcode: 29610039c02SPeter Collingbourne return Object; 29710039c02SPeter Collingbourne case sys::fs::file_magic::elf_relocatable: 29810039c02SPeter Collingbourne case sys::fs::file_magic::macho_object: 29910039c02SPeter Collingbourne case sys::fs::file_magic::coff_object: { 3003fcdf6aeSKevin Enderby Expected<std::unique_ptr<ObjectFile>> ObjFile = 30110039c02SPeter Collingbourne ObjectFile::createObjectFile(Object, Type); 30210039c02SPeter Collingbourne if (!ObjFile) 3033fcdf6aeSKevin Enderby return errorToErrorCode(ObjFile.takeError()); 30410039c02SPeter Collingbourne return findBitcodeInObject(*ObjFile->get()); 30510039c02SPeter Collingbourne } 30610039c02SPeter Collingbourne default: 30710039c02SPeter Collingbourne return object_error::invalid_file_type; 30810039c02SPeter Collingbourne } 30910039c02SPeter Collingbourne } 31010039c02SPeter Collingbourne 31110a27df8SDavid Blaikie ErrorOr<std::unique_ptr<IRObjectFile>> 3125dec7eaaSRafael Espindola llvm::object::IRObjectFile::create(MemoryBufferRef Object, 31348af1c2aSRafael Espindola LLVMContext &Context) { 31410039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> BCOrErr = findBitcodeInMemBuffer(Object); 31510039c02SPeter Collingbourne if (!BCOrErr) 31610039c02SPeter Collingbourne return BCOrErr.getError(); 31748af1c2aSRafael Espindola 318cf981625SRafael Espindola std::unique_ptr<MemoryBuffer> Buff = 319cf981625SRafael Espindola MemoryBuffer::getMemBuffer(BCOrErr.get(), false); 32048af1c2aSRafael Espindola 321dcd1dca2SRafael Espindola ErrorOr<std::unique_ptr<Module>> MOrErr = 3229d2bfc48SRafael Espindola getLazyBitcodeModule(std::move(Buff), Context, 323cba833a0SRafael Espindola /*ShouldLazyLoadMetadata*/ true); 324dddd1fd9SRafael Espindola if (std::error_code EC = MOrErr.getError()) 325f12b8282SRafael Espindola return EC; 326dddd1fd9SRafael Espindola 327dcd1dca2SRafael Espindola std::unique_ptr<Module> &M = MOrErr.get(); 32810a27df8SDavid Blaikie return llvm::make_unique<IRObjectFile>(Object, std::move(M)); 329f12b8282SRafael Espindola } 330