1f12b8282SRafael Espindola //===- IRObjectFile.cpp - IR object file implementation ---------*- C++ -*-===//
2f12b8282SRafael Espindola //
3f12b8282SRafael Espindola //                     The LLVM Compiler Infrastructure
4f12b8282SRafael Espindola //
5f12b8282SRafael Espindola // This file is distributed under the University of Illinois Open Source
6f12b8282SRafael Espindola // License. See LICENSE.TXT for details.
7f12b8282SRafael Espindola //
8f12b8282SRafael Espindola //===----------------------------------------------------------------------===//
9f12b8282SRafael Espindola //
10f12b8282SRafael Espindola // Part of the IRObjectFile class implementation.
11f12b8282SRafael Espindola //
12f12b8282SRafael Espindola //===----------------------------------------------------------------------===//
13f12b8282SRafael Espindola 
14ba79dba8SRafael Espindola #include "llvm/Object/IRObjectFile.h"
15ba79dba8SRafael Espindola #include "RecordStreamer.h"
160a446fd5SBenjamin Kramer #include "llvm/ADT/STLExtras.h"
17f12b8282SRafael Espindola #include "llvm/Bitcode/ReaderWriter.h"
18c3f9b5a5SRafael Espindola #include "llvm/IR/GVMaterializer.h"
19d9903888SChandler Carruth #include "llvm/IR/LLVMContext.h"
20a51f0f83SRafael Espindola #include "llvm/IR/Mangler.h"
21f12b8282SRafael Espindola #include "llvm/IR/Module.h"
2213b69d63SRafael Espindola #include "llvm/MC/MCAsmInfo.h"
2313b69d63SRafael Espindola #include "llvm/MC/MCContext.h"
2413b69d63SRafael Espindola #include "llvm/MC/MCInstrInfo.h"
2513b69d63SRafael Espindola #include "llvm/MC/MCObjectFileInfo.h"
2613b69d63SRafael Espindola #include "llvm/MC/MCParser/MCAsmParser.h"
27b3e8a6d2SBenjamin Kramer #include "llvm/MC/MCParser/MCTargetAsmParser.h"
28d9903888SChandler Carruth #include "llvm/MC/MCRegisterInfo.h"
2981902a3aSPete Cooper #include "llvm/MC/MCSubtargetInfo.h"
3010039c02SPeter Collingbourne #include "llvm/Object/ObjectFile.h"
312e60ca96SRafael Espindola #include "llvm/Support/MemoryBuffer.h"
3213b69d63SRafael Espindola #include "llvm/Support/SourceMgr.h"
3313b69d63SRafael Espindola #include "llvm/Support/TargetRegistry.h"
3423f04061SRafael Espindola #include "llvm/Support/raw_ostream.h"
35f12b8282SRafael Espindola using namespace llvm;
36f12b8282SRafael Espindola using namespace object;
37f12b8282SRafael Espindola 
3848af1c2aSRafael Espindola IRObjectFile::IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> Mod)
3948af1c2aSRafael Espindola     : SymbolicFile(Binary::ID_IR, Object), M(std::move(Mod)) {
40c233f74eSRafael Espindola   Mang.reset(new Mangler());
419ff43e40SMehdi Amini   CollectAsmUndefinedRefs(
42*a0cb890fSMehdi Amini       Triple(M->getTargetTriple()), M->getModuleInlineAsm(),
43*a0cb890fSMehdi Amini       [this](StringRef Name, BasicSymbolRef::Flags Flags) {
449ff43e40SMehdi Amini         AsmSymbols.push_back(
459ff43e40SMehdi Amini             std::make_pair<std::string, uint32_t>(Name, std::move(Flags)));
46e9cffafdSMehdi Amini       });
47e9cffafdSMehdi Amini }
4813b69d63SRafael Espindola 
49e9cffafdSMehdi Amini // Parse inline ASM and collect the list of symbols that are not defined in
50e9cffafdSMehdi Amini // the current module. This is inspired from IRObjectFile.
51e9cffafdSMehdi Amini void IRObjectFile::CollectAsmUndefinedRefs(
52*a0cb890fSMehdi Amini     const Triple &TT, StringRef InlineAsm,
53e9cffafdSMehdi Amini     const std::function<void(StringRef, BasicSymbolRef::Flags)> &
54e9cffafdSMehdi Amini         AsmUndefinedRefs) {
5513b69d63SRafael Espindola   if (InlineAsm.empty())
5613b69d63SRafael Espindola     return;
5713b69d63SRafael Espindola 
5813b69d63SRafael Espindola   std::string Err;
598d8b13dcSDaniel Sanders   const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
6013b69d63SRafael Espindola   if (!T)
6113b69d63SRafael Espindola     return;
6213b69d63SRafael Espindola 
638d8b13dcSDaniel Sanders   std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
6413b69d63SRafael Espindola   if (!MRI)
6513b69d63SRafael Espindola     return;
6613b69d63SRafael Espindola 
678d8b13dcSDaniel Sanders   std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str()));
6813b69d63SRafael Espindola   if (!MAI)
6913b69d63SRafael Espindola     return;
7013b69d63SRafael Espindola 
7113b69d63SRafael Espindola   std::unique_ptr<MCSubtargetInfo> STI(
728d8b13dcSDaniel Sanders       T->createMCSubtargetInfo(TT.str(), "", ""));
7313b69d63SRafael Espindola   if (!STI)
7413b69d63SRafael Espindola     return;
7513b69d63SRafael Espindola 
7613b69d63SRafael Espindola   std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
7713b69d63SRafael Espindola   if (!MCII)
7813b69d63SRafael Espindola     return;
7913b69d63SRafael Espindola 
8013b69d63SRafael Espindola   MCObjectFileInfo MOFI;
8113b69d63SRafael Espindola   MCContext MCCtx(MAI.get(), MRI.get(), &MOFI);
828d8b13dcSDaniel Sanders   MOFI.InitMCObjectFileInfo(TT, Reloc::Default, CodeModel::Default, MCCtx);
8313b69d63SRafael Espindola   std::unique_ptr<RecordStreamer> Streamer(new RecordStreamer(MCCtx));
8420c7259cSPeter Collingbourne   T->createNullTargetStreamer(*Streamer);
8513b69d63SRafael Espindola 
8613b69d63SRafael Espindola   std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
8713b69d63SRafael Espindola   SourceMgr SrcMgr;
881961f14cSDavid Blaikie   SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
8913b69d63SRafael Espindola   std::unique_ptr<MCAsmParser> Parser(
9013b69d63SRafael Espindola       createMCAsmParser(SrcMgr, MCCtx, *Streamer, *MAI));
9113b69d63SRafael Espindola 
9213b69d63SRafael Espindola   MCTargetOptions MCOptions;
9313b69d63SRafael Espindola   std::unique_ptr<MCTargetAsmParser> TAP(
9413b69d63SRafael Espindola       T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
9513b69d63SRafael Espindola   if (!TAP)
9613b69d63SRafael Espindola     return;
9713b69d63SRafael Espindola 
9813b69d63SRafael Espindola   Parser->setTargetParser(*TAP);
9913b69d63SRafael Espindola   if (Parser->Run(false))
10013b69d63SRafael Espindola     return;
10113b69d63SRafael Espindola 
10213b69d63SRafael Espindola   for (auto &KV : *Streamer) {
10313b69d63SRafael Espindola     StringRef Key = KV.first();
10413b69d63SRafael Espindola     RecordStreamer::State Value = KV.second;
10513b69d63SRafael Espindola     uint32_t Res = BasicSymbolRef::SF_None;
10613b69d63SRafael Espindola     switch (Value) {
10713b69d63SRafael Espindola     case RecordStreamer::NeverSeen:
10813b69d63SRafael Espindola       llvm_unreachable("foo");
10913b69d63SRafael Espindola     case RecordStreamer::DefinedGlobal:
11013b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Global;
11113b69d63SRafael Espindola       break;
11213b69d63SRafael Espindola     case RecordStreamer::Defined:
11313b69d63SRafael Espindola       break;
11413b69d63SRafael Espindola     case RecordStreamer::Global:
11513b69d63SRafael Espindola     case RecordStreamer::Used:
11613b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Undefined;
11713b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Global;
11813b69d63SRafael Espindola       break;
11913b69d63SRafael Espindola     }
120e9cffafdSMehdi Amini     AsmUndefinedRefs(Key, BasicSymbolRef::Flags(Res));
12113b69d63SRafael Espindola   }
122f12b8282SRafael Espindola }
123f12b8282SRafael Espindola 
124dddd1fd9SRafael Espindola IRObjectFile::~IRObjectFile() {
125dddd1fd9SRafael Espindola  }
126c3f9b5a5SRafael Espindola 
127527e846eSRafael Espindola static GlobalValue *getGV(DataRefImpl &Symb) {
12813b69d63SRafael Espindola   if ((Symb.p & 3) == 3)
12913b69d63SRafael Espindola     return nullptr;
13013b69d63SRafael Espindola 
13113b69d63SRafael Espindola   return reinterpret_cast<GlobalValue*>(Symb.p & ~uintptr_t(3));
132f12b8282SRafael Espindola }
133f12b8282SRafael Espindola 
134f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_alias_iterator I, const Module &M) {
135f12b8282SRafael Espindola   if (I == M.alias_end())
136f12b8282SRafael Espindola     return 3;
137f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
138f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 2;
139f12b8282SRafael Espindola }
140f12b8282SRafael Espindola 
141f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_global_iterator I, const Module &M) {
142f12b8282SRafael Espindola   if (I == M.global_end())
143f12b8282SRafael Espindola     return skipEmpty(M.alias_begin(), M);
144f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
145f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 1;
146f12b8282SRafael Espindola }
147f12b8282SRafael Espindola 
148f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_iterator I, const Module &M) {
149f12b8282SRafael Espindola   if (I == M.end())
150f12b8282SRafael Espindola     return skipEmpty(M.global_begin(), M);
151f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
152f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 0;
153f12b8282SRafael Espindola }
154f12b8282SRafael Espindola 
15513b69d63SRafael Espindola static unsigned getAsmSymIndex(DataRefImpl Symb) {
15613b69d63SRafael Espindola   assert((Symb.p & uintptr_t(3)) == 3);
15713b69d63SRafael Espindola   uintptr_t Index = Symb.p & ~uintptr_t(3);
15813b69d63SRafael Espindola   Index >>= 2;
15913b69d63SRafael Espindola   return Index;
16013b69d63SRafael Espindola }
16113b69d63SRafael Espindola 
162f12b8282SRafael Espindola void IRObjectFile::moveSymbolNext(DataRefImpl &Symb) const {
16313b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
164f12b8282SRafael Espindola   uintptr_t Res;
16513b69d63SRafael Espindola 
166f12b8282SRafael Espindola   switch (Symb.p & 3) {
167f12b8282SRafael Espindola   case 0: {
168f12b8282SRafael Espindola     Module::const_iterator Iter(static_cast<const Function*>(GV));
169f12b8282SRafael Espindola     ++Iter;
17013b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
171f12b8282SRafael Espindola     break;
172f12b8282SRafael Espindola   }
173f12b8282SRafael Espindola   case 1: {
174f12b8282SRafael Espindola     Module::const_global_iterator Iter(static_cast<const GlobalVariable*>(GV));
175f12b8282SRafael Espindola     ++Iter;
17613b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
177f12b8282SRafael Espindola     break;
178f12b8282SRafael Espindola   }
179f12b8282SRafael Espindola   case 2: {
180f12b8282SRafael Espindola     Module::const_alias_iterator Iter(static_cast<const GlobalAlias*>(GV));
181f12b8282SRafael Espindola     ++Iter;
18213b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
183f12b8282SRafael Espindola     break;
184f12b8282SRafael Espindola   }
18513b69d63SRafael Espindola   case 3: {
18613b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
18713b69d63SRafael Espindola     assert(Index < AsmSymbols.size());
18813b69d63SRafael Espindola     ++Index;
18913b69d63SRafael Espindola     Res = (Index << 2) | 3;
19013b69d63SRafael Espindola     break;
19113b69d63SRafael Espindola   }
192addddc44SMichael Ilseman   default:
193addddc44SMichael Ilseman     llvm_unreachable("unreachable case");
194f12b8282SRafael Espindola   }
195f12b8282SRafael Espindola 
196f12b8282SRafael Espindola   Symb.p = Res;
197f12b8282SRafael Espindola }
198f12b8282SRafael Espindola 
199db4ed0bdSRafael Espindola std::error_code IRObjectFile::printSymbolName(raw_ostream &OS,
200f12b8282SRafael Espindola                                               DataRefImpl Symb) const {
20113b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
20213b69d63SRafael Espindola   if (!GV) {
20313b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
20413b69d63SRafael Espindola     assert(Index <= AsmSymbols.size());
20513b69d63SRafael Espindola     OS << AsmSymbols[Index].first;
2067d099195SRui Ueyama     return std::error_code();
20713b69d63SRafael Espindola   }
208a51f0f83SRafael Espindola 
20982e657b5SPeter Collingbourne   if (GV->hasDLLImportStorageClass())
21082e657b5SPeter Collingbourne     OS << "__imp_";
21182e657b5SPeter Collingbourne 
212a51f0f83SRafael Espindola   if (Mang)
21313b69d63SRafael Espindola     Mang->getNameWithPrefix(OS, GV, false);
214a51f0f83SRafael Espindola   else
21513b69d63SRafael Espindola     OS << GV->getName();
216a51f0f83SRafael Espindola 
2177d099195SRui Ueyama   return std::error_code();
218f12b8282SRafael Espindola }
219f12b8282SRafael Espindola 
220f12b8282SRafael Espindola uint32_t IRObjectFile::getSymbolFlags(DataRefImpl Symb) const {
22113b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
22213b69d63SRafael Espindola 
22313b69d63SRafael Espindola   if (!GV) {
22413b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
22513b69d63SRafael Espindola     assert(Index <= AsmSymbols.size());
22613b69d63SRafael Espindola     return AsmSymbols[Index].second;
22713b69d63SRafael Espindola   }
228f12b8282SRafael Espindola 
229f12b8282SRafael Espindola   uint32_t Res = BasicSymbolRef::SF_None;
230d4bcefc7SRafael Espindola   if (GV->isDeclarationForLinker())
231f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Undefined;
232dc0dbe1fSKevin Enderby   else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
233dc0dbe1fSKevin Enderby     Res |= BasicSymbolRef::SF_Hidden;
234dc0dbe1fSKevin Enderby   if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
235dc0dbe1fSKevin Enderby     if (GVar->isConstant())
236dc0dbe1fSKevin Enderby       Res |= BasicSymbolRef::SF_Const;
237dc0dbe1fSKevin Enderby   }
23813b69d63SRafael Espindola   if (GV->hasPrivateLinkage())
239f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_FormatSpecific;
24013b69d63SRafael Espindola   if (!GV->hasLocalLinkage())
241f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Global;
24213b69d63SRafael Espindola   if (GV->hasCommonLinkage())
243f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Common;
2448d6fbc3aSRafael Espindola   if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
2458d6fbc3aSRafael Espindola       GV->hasExternalWeakLinkage())
246f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Weak;
247f12b8282SRafael Espindola 
2482dc0d9bdSRafael Espindola   if (GV->getName().startswith("llvm."))
249b674c17dSRafael Espindola     Res |= BasicSymbolRef::SF_FormatSpecific;
2502dc0d9bdSRafael Espindola   else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
2512dc0d9bdSRafael Espindola     if (Var->getSection() == StringRef("llvm.metadata"))
2523885090bSRafael Espindola       Res |= BasicSymbolRef::SF_FormatSpecific;
2533885090bSRafael Espindola   }
2543885090bSRafael Espindola 
255f12b8282SRafael Espindola   return Res;
256f12b8282SRafael Espindola }
257f12b8282SRafael Espindola 
258527e846eSRafael Espindola GlobalValue *IRObjectFile::getSymbolGV(DataRefImpl Symb) { return getGV(Symb); }
259f12b8282SRafael Espindola 
26025a7e0a8SRafael Espindola std::unique_ptr<Module> IRObjectFile::takeModule() { return std::move(M); }
26125a7e0a8SRafael Espindola 
262f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_begin_impl() const {
263f12b8282SRafael Espindola   Module::const_iterator I = M->begin();
264f12b8282SRafael Espindola   DataRefImpl Ret;
265f12b8282SRafael Espindola   Ret.p = skipEmpty(I, *M);
266f12b8282SRafael Espindola   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
267f12b8282SRafael Espindola }
268f12b8282SRafael Espindola 
269f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_end_impl() const {
270f12b8282SRafael Espindola   DataRefImpl Ret;
27113b69d63SRafael Espindola   uint64_t NumAsm = AsmSymbols.size();
27213b69d63SRafael Espindola   NumAsm <<= 2;
27313b69d63SRafael Espindola   Ret.p = 3 | NumAsm;
274f12b8282SRafael Espindola   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
275f12b8282SRafael Espindola }
276f12b8282SRafael Espindola 
27710039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInObject(const ObjectFile &Obj) {
27810039c02SPeter Collingbourne   for (const SectionRef &Sec : Obj.sections()) {
279f2fe0141SSteven Wu     if (Sec.isBitcode()) {
28010039c02SPeter Collingbourne       StringRef SecContents;
28110039c02SPeter Collingbourne       if (std::error_code EC = Sec.getContents(SecContents))
28210039c02SPeter Collingbourne         return EC;
28310039c02SPeter Collingbourne       return MemoryBufferRef(SecContents, Obj.getFileName());
28410039c02SPeter Collingbourne     }
28510039c02SPeter Collingbourne   }
28610039c02SPeter Collingbourne 
28710039c02SPeter Collingbourne   return object_error::bitcode_section_not_found;
28810039c02SPeter Collingbourne }
28910039c02SPeter Collingbourne 
29010039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInMemBuffer(MemoryBufferRef Object) {
29110039c02SPeter Collingbourne   sys::fs::file_magic Type = sys::fs::identify_magic(Object.getBuffer());
29210039c02SPeter Collingbourne   switch (Type) {
29310039c02SPeter Collingbourne   case sys::fs::file_magic::bitcode:
29410039c02SPeter Collingbourne     return Object;
29510039c02SPeter Collingbourne   case sys::fs::file_magic::elf_relocatable:
29610039c02SPeter Collingbourne   case sys::fs::file_magic::macho_object:
29710039c02SPeter Collingbourne   case sys::fs::file_magic::coff_object: {
2983fcdf6aeSKevin Enderby     Expected<std::unique_ptr<ObjectFile>> ObjFile =
29910039c02SPeter Collingbourne         ObjectFile::createObjectFile(Object, Type);
30010039c02SPeter Collingbourne     if (!ObjFile)
3013fcdf6aeSKevin Enderby       return errorToErrorCode(ObjFile.takeError());
30210039c02SPeter Collingbourne     return findBitcodeInObject(*ObjFile->get());
30310039c02SPeter Collingbourne   }
30410039c02SPeter Collingbourne   default:
30510039c02SPeter Collingbourne     return object_error::invalid_file_type;
30610039c02SPeter Collingbourne   }
30710039c02SPeter Collingbourne }
30810039c02SPeter Collingbourne 
30910a27df8SDavid Blaikie ErrorOr<std::unique_ptr<IRObjectFile>>
3105dec7eaaSRafael Espindola llvm::object::IRObjectFile::create(MemoryBufferRef Object,
31148af1c2aSRafael Espindola                                    LLVMContext &Context) {
31210039c02SPeter Collingbourne   ErrorOr<MemoryBufferRef> BCOrErr = findBitcodeInMemBuffer(Object);
31310039c02SPeter Collingbourne   if (!BCOrErr)
31410039c02SPeter Collingbourne     return BCOrErr.getError();
31548af1c2aSRafael Espindola 
316cf981625SRafael Espindola   std::unique_ptr<MemoryBuffer> Buff =
317cf981625SRafael Espindola       MemoryBuffer::getMemBuffer(BCOrErr.get(), false);
31848af1c2aSRafael Espindola 
319dcd1dca2SRafael Espindola   ErrorOr<std::unique_ptr<Module>> MOrErr =
3209d2bfc48SRafael Espindola       getLazyBitcodeModule(std::move(Buff), Context,
321cba833a0SRafael Espindola                            /*ShouldLazyLoadMetadata*/ true);
322dddd1fd9SRafael Espindola   if (std::error_code EC = MOrErr.getError())
323f12b8282SRafael Espindola     return EC;
324dddd1fd9SRafael Espindola 
325dcd1dca2SRafael Espindola   std::unique_ptr<Module> &M = MOrErr.get();
32610a27df8SDavid Blaikie   return llvm::make_unique<IRObjectFile>(Object, std::move(M));
327f12b8282SRafael Espindola }
328