1f12b8282SRafael Espindola //===- IRObjectFile.cpp - IR object file implementation ---------*- C++ -*-===//
2f12b8282SRafael Espindola //
3f12b8282SRafael Espindola //                     The LLVM Compiler Infrastructure
4f12b8282SRafael Espindola //
5f12b8282SRafael Espindola // This file is distributed under the University of Illinois Open Source
6f12b8282SRafael Espindola // License. See LICENSE.TXT for details.
7f12b8282SRafael Espindola //
8f12b8282SRafael Espindola //===----------------------------------------------------------------------===//
9f12b8282SRafael Espindola //
10f12b8282SRafael Espindola // Part of the IRObjectFile class implementation.
11f12b8282SRafael Espindola //
12f12b8282SRafael Espindola //===----------------------------------------------------------------------===//
13f12b8282SRafael Espindola 
14ba79dba8SRafael Espindola #include "llvm/Object/IRObjectFile.h"
15ba79dba8SRafael Espindola #include "RecordStreamer.h"
160a446fd5SBenjamin Kramer #include "llvm/ADT/STLExtras.h"
17f12b8282SRafael Espindola #include "llvm/Bitcode/ReaderWriter.h"
18c3f9b5a5SRafael Espindola #include "llvm/IR/GVMaterializer.h"
19d9903888SChandler Carruth #include "llvm/IR/LLVMContext.h"
20a51f0f83SRafael Espindola #include "llvm/IR/Mangler.h"
21f12b8282SRafael Espindola #include "llvm/IR/Module.h"
2213b69d63SRafael Espindola #include "llvm/MC/MCAsmInfo.h"
2313b69d63SRafael Espindola #include "llvm/MC/MCContext.h"
2413b69d63SRafael Espindola #include "llvm/MC/MCInstrInfo.h"
2513b69d63SRafael Espindola #include "llvm/MC/MCObjectFileInfo.h"
2613b69d63SRafael Espindola #include "llvm/MC/MCParser/MCAsmParser.h"
27b3e8a6d2SBenjamin Kramer #include "llvm/MC/MCParser/MCTargetAsmParser.h"
28d9903888SChandler Carruth #include "llvm/MC/MCRegisterInfo.h"
2981902a3aSPete Cooper #include "llvm/MC/MCSubtargetInfo.h"
3010039c02SPeter Collingbourne #include "llvm/Object/ObjectFile.h"
312e60ca96SRafael Espindola #include "llvm/Support/MemoryBuffer.h"
3213b69d63SRafael Espindola #include "llvm/Support/SourceMgr.h"
3313b69d63SRafael Espindola #include "llvm/Support/TargetRegistry.h"
3423f04061SRafael Espindola #include "llvm/Support/raw_ostream.h"
35f12b8282SRafael Espindola using namespace llvm;
36f12b8282SRafael Espindola using namespace object;
37f12b8282SRafael Espindola 
3848af1c2aSRafael Espindola IRObjectFile::IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> Mod)
3948af1c2aSRafael Espindola     : SymbolicFile(Binary::ID_IR, Object), M(std::move(Mod)) {
40c233f74eSRafael Espindola   Mang.reset(new Mangler());
41*e9cffafdSMehdi Amini   CollectAsmUndefinedRefs(*M, [this](StringRef Name,
42*e9cffafdSMehdi Amini                                      BasicSymbolRef::Flags Flags) {
43*e9cffafdSMehdi Amini     AsmSymbols.push_back(std::make_pair<std::string, uint32_t>(Name, Flags));
44*e9cffafdSMehdi Amini   });
45*e9cffafdSMehdi Amini }
4613b69d63SRafael Espindola 
47*e9cffafdSMehdi Amini // Parse inline ASM and collect the list of symbols that are not defined in
48*e9cffafdSMehdi Amini // the current module. This is inspired from IRObjectFile.
49*e9cffafdSMehdi Amini void IRObjectFile::CollectAsmUndefinedRefs(
50*e9cffafdSMehdi Amini     Module &TheModule,
51*e9cffafdSMehdi Amini     const std::function<void(StringRef, BasicSymbolRef::Flags)> &
52*e9cffafdSMehdi Amini         AsmUndefinedRefs) {
53*e9cffafdSMehdi Amini 
54*e9cffafdSMehdi Amini   const std::string &InlineAsm = TheModule.getModuleInlineAsm();
5513b69d63SRafael Espindola   if (InlineAsm.empty())
5613b69d63SRafael Espindola     return;
5713b69d63SRafael Espindola 
58*e9cffafdSMehdi Amini   Triple TT(TheModule.getTargetTriple());
5913b69d63SRafael Espindola   std::string Err;
608d8b13dcSDaniel Sanders   const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
6113b69d63SRafael Espindola   if (!T)
6213b69d63SRafael Espindola     return;
6313b69d63SRafael Espindola 
648d8b13dcSDaniel Sanders   std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
6513b69d63SRafael Espindola   if (!MRI)
6613b69d63SRafael Espindola     return;
6713b69d63SRafael Espindola 
688d8b13dcSDaniel Sanders   std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str()));
6913b69d63SRafael Espindola   if (!MAI)
7013b69d63SRafael Espindola     return;
7113b69d63SRafael Espindola 
7213b69d63SRafael Espindola   std::unique_ptr<MCSubtargetInfo> STI(
738d8b13dcSDaniel Sanders       T->createMCSubtargetInfo(TT.str(), "", ""));
7413b69d63SRafael Espindola   if (!STI)
7513b69d63SRafael Espindola     return;
7613b69d63SRafael Espindola 
7713b69d63SRafael Espindola   std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
7813b69d63SRafael Espindola   if (!MCII)
7913b69d63SRafael Espindola     return;
8013b69d63SRafael Espindola 
8113b69d63SRafael Espindola   MCObjectFileInfo MOFI;
8213b69d63SRafael Espindola   MCContext MCCtx(MAI.get(), MRI.get(), &MOFI);
838d8b13dcSDaniel Sanders   MOFI.InitMCObjectFileInfo(TT, Reloc::Default, CodeModel::Default, MCCtx);
8413b69d63SRafael Espindola   std::unique_ptr<RecordStreamer> Streamer(new RecordStreamer(MCCtx));
8520c7259cSPeter Collingbourne   T->createNullTargetStreamer(*Streamer);
8613b69d63SRafael Espindola 
8713b69d63SRafael Espindola   std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
8813b69d63SRafael Espindola   SourceMgr SrcMgr;
891961f14cSDavid Blaikie   SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
9013b69d63SRafael Espindola   std::unique_ptr<MCAsmParser> Parser(
9113b69d63SRafael Espindola       createMCAsmParser(SrcMgr, MCCtx, *Streamer, *MAI));
9213b69d63SRafael Espindola 
9313b69d63SRafael Espindola   MCTargetOptions MCOptions;
9413b69d63SRafael Espindola   std::unique_ptr<MCTargetAsmParser> TAP(
9513b69d63SRafael Espindola       T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
9613b69d63SRafael Espindola   if (!TAP)
9713b69d63SRafael Espindola     return;
9813b69d63SRafael Espindola 
9913b69d63SRafael Espindola   Parser->setTargetParser(*TAP);
10013b69d63SRafael Espindola   if (Parser->Run(false))
10113b69d63SRafael Espindola     return;
10213b69d63SRafael Espindola 
10313b69d63SRafael Espindola   for (auto &KV : *Streamer) {
10413b69d63SRafael Espindola     StringRef Key = KV.first();
10513b69d63SRafael Espindola     RecordStreamer::State Value = KV.second;
10613b69d63SRafael Espindola     uint32_t Res = BasicSymbolRef::SF_None;
10713b69d63SRafael Espindola     switch (Value) {
10813b69d63SRafael Espindola     case RecordStreamer::NeverSeen:
10913b69d63SRafael Espindola       llvm_unreachable("foo");
11013b69d63SRafael Espindola     case RecordStreamer::DefinedGlobal:
11113b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Global;
11213b69d63SRafael Espindola       break;
11313b69d63SRafael Espindola     case RecordStreamer::Defined:
11413b69d63SRafael Espindola       break;
11513b69d63SRafael Espindola     case RecordStreamer::Global:
11613b69d63SRafael Espindola     case RecordStreamer::Used:
11713b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Undefined;
11813b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Global;
11913b69d63SRafael Espindola       break;
12013b69d63SRafael Espindola     }
121*e9cffafdSMehdi Amini     AsmUndefinedRefs(Key, BasicSymbolRef::Flags(Res));
12213b69d63SRafael Espindola   }
123f12b8282SRafael Espindola }
124f12b8282SRafael Espindola 
125dddd1fd9SRafael Espindola IRObjectFile::~IRObjectFile() {
126dddd1fd9SRafael Espindola  }
127c3f9b5a5SRafael Espindola 
128527e846eSRafael Espindola static GlobalValue *getGV(DataRefImpl &Symb) {
12913b69d63SRafael Espindola   if ((Symb.p & 3) == 3)
13013b69d63SRafael Espindola     return nullptr;
13113b69d63SRafael Espindola 
13213b69d63SRafael Espindola   return reinterpret_cast<GlobalValue*>(Symb.p & ~uintptr_t(3));
133f12b8282SRafael Espindola }
134f12b8282SRafael Espindola 
135f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_alias_iterator I, const Module &M) {
136f12b8282SRafael Espindola   if (I == M.alias_end())
137f12b8282SRafael Espindola     return 3;
138f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
139f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 2;
140f12b8282SRafael Espindola }
141f12b8282SRafael Espindola 
142f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_global_iterator I, const Module &M) {
143f12b8282SRafael Espindola   if (I == M.global_end())
144f12b8282SRafael Espindola     return skipEmpty(M.alias_begin(), M);
145f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
146f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 1;
147f12b8282SRafael Espindola }
148f12b8282SRafael Espindola 
149f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_iterator I, const Module &M) {
150f12b8282SRafael Espindola   if (I == M.end())
151f12b8282SRafael Espindola     return skipEmpty(M.global_begin(), M);
152f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
153f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 0;
154f12b8282SRafael Espindola }
155f12b8282SRafael Espindola 
15613b69d63SRafael Espindola static unsigned getAsmSymIndex(DataRefImpl Symb) {
15713b69d63SRafael Espindola   assert((Symb.p & uintptr_t(3)) == 3);
15813b69d63SRafael Espindola   uintptr_t Index = Symb.p & ~uintptr_t(3);
15913b69d63SRafael Espindola   Index >>= 2;
16013b69d63SRafael Espindola   return Index;
16113b69d63SRafael Espindola }
16213b69d63SRafael Espindola 
163f12b8282SRafael Espindola void IRObjectFile::moveSymbolNext(DataRefImpl &Symb) const {
16413b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
165f12b8282SRafael Espindola   uintptr_t Res;
16613b69d63SRafael Espindola 
167f12b8282SRafael Espindola   switch (Symb.p & 3) {
168f12b8282SRafael Espindola   case 0: {
169f12b8282SRafael Espindola     Module::const_iterator Iter(static_cast<const Function*>(GV));
170f12b8282SRafael Espindola     ++Iter;
17113b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
172f12b8282SRafael Espindola     break;
173f12b8282SRafael Espindola   }
174f12b8282SRafael Espindola   case 1: {
175f12b8282SRafael Espindola     Module::const_global_iterator Iter(static_cast<const GlobalVariable*>(GV));
176f12b8282SRafael Espindola     ++Iter;
17713b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
178f12b8282SRafael Espindola     break;
179f12b8282SRafael Espindola   }
180f12b8282SRafael Espindola   case 2: {
181f12b8282SRafael Espindola     Module::const_alias_iterator Iter(static_cast<const GlobalAlias*>(GV));
182f12b8282SRafael Espindola     ++Iter;
18313b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
184f12b8282SRafael Espindola     break;
185f12b8282SRafael Espindola   }
18613b69d63SRafael Espindola   case 3: {
18713b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
18813b69d63SRafael Espindola     assert(Index < AsmSymbols.size());
18913b69d63SRafael Espindola     ++Index;
19013b69d63SRafael Espindola     Res = (Index << 2) | 3;
19113b69d63SRafael Espindola     break;
19213b69d63SRafael Espindola   }
193addddc44SMichael Ilseman   default:
194addddc44SMichael Ilseman     llvm_unreachable("unreachable case");
195f12b8282SRafael Espindola   }
196f12b8282SRafael Espindola 
197f12b8282SRafael Espindola   Symb.p = Res;
198f12b8282SRafael Espindola }
199f12b8282SRafael Espindola 
200db4ed0bdSRafael Espindola std::error_code IRObjectFile::printSymbolName(raw_ostream &OS,
201f12b8282SRafael Espindola                                               DataRefImpl Symb) const {
20213b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
20313b69d63SRafael Espindola   if (!GV) {
20413b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
20513b69d63SRafael Espindola     assert(Index <= AsmSymbols.size());
20613b69d63SRafael Espindola     OS << AsmSymbols[Index].first;
2077d099195SRui Ueyama     return std::error_code();
20813b69d63SRafael Espindola   }
209a51f0f83SRafael Espindola 
21082e657b5SPeter Collingbourne   if (GV->hasDLLImportStorageClass())
21182e657b5SPeter Collingbourne     OS << "__imp_";
21282e657b5SPeter Collingbourne 
213a51f0f83SRafael Espindola   if (Mang)
21413b69d63SRafael Espindola     Mang->getNameWithPrefix(OS, GV, false);
215a51f0f83SRafael Espindola   else
21613b69d63SRafael Espindola     OS << GV->getName();
217a51f0f83SRafael Espindola 
2187d099195SRui Ueyama   return std::error_code();
219f12b8282SRafael Espindola }
220f12b8282SRafael Espindola 
221f12b8282SRafael Espindola uint32_t IRObjectFile::getSymbolFlags(DataRefImpl Symb) const {
22213b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
22313b69d63SRafael Espindola 
22413b69d63SRafael Espindola   if (!GV) {
22513b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
22613b69d63SRafael Espindola     assert(Index <= AsmSymbols.size());
22713b69d63SRafael Espindola     return AsmSymbols[Index].second;
22813b69d63SRafael Espindola   }
229f12b8282SRafael Espindola 
230f12b8282SRafael Espindola   uint32_t Res = BasicSymbolRef::SF_None;
231d4bcefc7SRafael Espindola   if (GV->isDeclarationForLinker())
232f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Undefined;
233dc0dbe1fSKevin Enderby   else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
234dc0dbe1fSKevin Enderby     Res |= BasicSymbolRef::SF_Hidden;
235dc0dbe1fSKevin Enderby   if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
236dc0dbe1fSKevin Enderby     if (GVar->isConstant())
237dc0dbe1fSKevin Enderby       Res |= BasicSymbolRef::SF_Const;
238dc0dbe1fSKevin Enderby   }
23913b69d63SRafael Espindola   if (GV->hasPrivateLinkage())
240f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_FormatSpecific;
24113b69d63SRafael Espindola   if (!GV->hasLocalLinkage())
242f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Global;
24313b69d63SRafael Espindola   if (GV->hasCommonLinkage())
244f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Common;
2458d6fbc3aSRafael Espindola   if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
2468d6fbc3aSRafael Espindola       GV->hasExternalWeakLinkage())
247f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Weak;
248f12b8282SRafael Espindola 
2492dc0d9bdSRafael Espindola   if (GV->getName().startswith("llvm."))
250b674c17dSRafael Espindola     Res |= BasicSymbolRef::SF_FormatSpecific;
2512dc0d9bdSRafael Espindola   else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
2522dc0d9bdSRafael Espindola     if (Var->getSection() == StringRef("llvm.metadata"))
2533885090bSRafael Espindola       Res |= BasicSymbolRef::SF_FormatSpecific;
2543885090bSRafael Espindola   }
2553885090bSRafael Espindola 
256f12b8282SRafael Espindola   return Res;
257f12b8282SRafael Espindola }
258f12b8282SRafael Espindola 
259527e846eSRafael Espindola GlobalValue *IRObjectFile::getSymbolGV(DataRefImpl Symb) { return getGV(Symb); }
260f12b8282SRafael Espindola 
26125a7e0a8SRafael Espindola std::unique_ptr<Module> IRObjectFile::takeModule() { return std::move(M); }
26225a7e0a8SRafael Espindola 
263f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_begin_impl() const {
264f12b8282SRafael Espindola   Module::const_iterator I = M->begin();
265f12b8282SRafael Espindola   DataRefImpl Ret;
266f12b8282SRafael Espindola   Ret.p = skipEmpty(I, *M);
267f12b8282SRafael Espindola   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
268f12b8282SRafael Espindola }
269f12b8282SRafael Espindola 
270f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_end_impl() const {
271f12b8282SRafael Espindola   DataRefImpl Ret;
27213b69d63SRafael Espindola   uint64_t NumAsm = AsmSymbols.size();
27313b69d63SRafael Espindola   NumAsm <<= 2;
27413b69d63SRafael Espindola   Ret.p = 3 | NumAsm;
275f12b8282SRafael Espindola   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
276f12b8282SRafael Espindola }
277f12b8282SRafael Espindola 
27810039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInObject(const ObjectFile &Obj) {
27910039c02SPeter Collingbourne   for (const SectionRef &Sec : Obj.sections()) {
280f2fe0141SSteven Wu     if (Sec.isBitcode()) {
28110039c02SPeter Collingbourne       StringRef SecContents;
28210039c02SPeter Collingbourne       if (std::error_code EC = Sec.getContents(SecContents))
28310039c02SPeter Collingbourne         return EC;
28410039c02SPeter Collingbourne       return MemoryBufferRef(SecContents, Obj.getFileName());
28510039c02SPeter Collingbourne     }
28610039c02SPeter Collingbourne   }
28710039c02SPeter Collingbourne 
28810039c02SPeter Collingbourne   return object_error::bitcode_section_not_found;
28910039c02SPeter Collingbourne }
29010039c02SPeter Collingbourne 
29110039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInMemBuffer(MemoryBufferRef Object) {
29210039c02SPeter Collingbourne   sys::fs::file_magic Type = sys::fs::identify_magic(Object.getBuffer());
29310039c02SPeter Collingbourne   switch (Type) {
29410039c02SPeter Collingbourne   case sys::fs::file_magic::bitcode:
29510039c02SPeter Collingbourne     return Object;
29610039c02SPeter Collingbourne   case sys::fs::file_magic::elf_relocatable:
29710039c02SPeter Collingbourne   case sys::fs::file_magic::macho_object:
29810039c02SPeter Collingbourne   case sys::fs::file_magic::coff_object: {
2993fcdf6aeSKevin Enderby     Expected<std::unique_ptr<ObjectFile>> ObjFile =
30010039c02SPeter Collingbourne         ObjectFile::createObjectFile(Object, Type);
30110039c02SPeter Collingbourne     if (!ObjFile)
3023fcdf6aeSKevin Enderby       return errorToErrorCode(ObjFile.takeError());
30310039c02SPeter Collingbourne     return findBitcodeInObject(*ObjFile->get());
30410039c02SPeter Collingbourne   }
30510039c02SPeter Collingbourne   default:
30610039c02SPeter Collingbourne     return object_error::invalid_file_type;
30710039c02SPeter Collingbourne   }
30810039c02SPeter Collingbourne }
30910039c02SPeter Collingbourne 
31010a27df8SDavid Blaikie ErrorOr<std::unique_ptr<IRObjectFile>>
3115dec7eaaSRafael Espindola llvm::object::IRObjectFile::create(MemoryBufferRef Object,
31248af1c2aSRafael Espindola                                    LLVMContext &Context) {
31310039c02SPeter Collingbourne   ErrorOr<MemoryBufferRef> BCOrErr = findBitcodeInMemBuffer(Object);
31410039c02SPeter Collingbourne   if (!BCOrErr)
31510039c02SPeter Collingbourne     return BCOrErr.getError();
31648af1c2aSRafael Espindola 
317cf981625SRafael Espindola   std::unique_ptr<MemoryBuffer> Buff =
318cf981625SRafael Espindola       MemoryBuffer::getMemBuffer(BCOrErr.get(), false);
31948af1c2aSRafael Espindola 
320dcd1dca2SRafael Espindola   ErrorOr<std::unique_ptr<Module>> MOrErr =
3219d2bfc48SRafael Espindola       getLazyBitcodeModule(std::move(Buff), Context,
322cba833a0SRafael Espindola                            /*ShouldLazyLoadMetadata*/ true);
323dddd1fd9SRafael Espindola   if (std::error_code EC = MOrErr.getError())
324f12b8282SRafael Espindola     return EC;
325dddd1fd9SRafael Espindola 
326dcd1dca2SRafael Espindola   std::unique_ptr<Module> &M = MOrErr.get();
32710a27df8SDavid Blaikie   return llvm::make_unique<IRObjectFile>(Object, std::move(M));
328f12b8282SRafael Espindola }
329