1f12b8282SRafael Espindola //===- IRObjectFile.cpp - IR object file implementation ---------*- C++ -*-===//
2f12b8282SRafael Espindola //
3f12b8282SRafael Espindola //                     The LLVM Compiler Infrastructure
4f12b8282SRafael Espindola //
5f12b8282SRafael Espindola // This file is distributed under the University of Illinois Open Source
6f12b8282SRafael Espindola // License. See LICENSE.TXT for details.
7f12b8282SRafael Espindola //
8f12b8282SRafael Espindola //===----------------------------------------------------------------------===//
9f12b8282SRafael Espindola //
10f12b8282SRafael Espindola // Part of the IRObjectFile class implementation.
11f12b8282SRafael Espindola //
12f12b8282SRafael Espindola //===----------------------------------------------------------------------===//
13f12b8282SRafael Espindola 
14ba79dba8SRafael Espindola #include "llvm/Object/IRObjectFile.h"
15ba79dba8SRafael Espindola #include "RecordStreamer.h"
160a446fd5SBenjamin Kramer #include "llvm/ADT/STLExtras.h"
17f12b8282SRafael Espindola #include "llvm/Bitcode/ReaderWriter.h"
18c3f9b5a5SRafael Espindola #include "llvm/IR/GVMaterializer.h"
19d9903888SChandler Carruth #include "llvm/IR/LLVMContext.h"
20a51f0f83SRafael Espindola #include "llvm/IR/Mangler.h"
21f12b8282SRafael Espindola #include "llvm/IR/Module.h"
2213b69d63SRafael Espindola #include "llvm/MC/MCAsmInfo.h"
2313b69d63SRafael Espindola #include "llvm/MC/MCContext.h"
2413b69d63SRafael Espindola #include "llvm/MC/MCInstrInfo.h"
2513b69d63SRafael Espindola #include "llvm/MC/MCObjectFileInfo.h"
2613b69d63SRafael Espindola #include "llvm/MC/MCParser/MCAsmParser.h"
27b3e8a6d2SBenjamin Kramer #include "llvm/MC/MCParser/MCTargetAsmParser.h"
28d9903888SChandler Carruth #include "llvm/MC/MCRegisterInfo.h"
2981902a3aSPete Cooper #include "llvm/MC/MCSubtargetInfo.h"
3010039c02SPeter Collingbourne #include "llvm/Object/ObjectFile.h"
312e60ca96SRafael Espindola #include "llvm/Support/MemoryBuffer.h"
3213b69d63SRafael Espindola #include "llvm/Support/SourceMgr.h"
3313b69d63SRafael Espindola #include "llvm/Support/TargetRegistry.h"
3423f04061SRafael Espindola #include "llvm/Support/raw_ostream.h"
35f12b8282SRafael Espindola using namespace llvm;
36f12b8282SRafael Espindola using namespace object;
37f12b8282SRafael Espindola 
3848af1c2aSRafael Espindola IRObjectFile::IRObjectFile(MemoryBufferRef Object, std::unique_ptr<Module> Mod)
3948af1c2aSRafael Espindola     : SymbolicFile(Binary::ID_IR, Object), M(std::move(Mod)) {
40c233f74eSRafael Espindola   Mang.reset(new Mangler());
41*9ff43e40SMehdi Amini   CollectAsmUndefinedRefs(
42*9ff43e40SMehdi Amini       *M, [this](StringRef Name, BasicSymbolRef::Flags Flags) {
43*9ff43e40SMehdi Amini         AsmSymbols.push_back(
44*9ff43e40SMehdi Amini             std::make_pair<std::string, uint32_t>(Name, std::move(Flags)));
45e9cffafdSMehdi Amini       });
46e9cffafdSMehdi Amini }
4713b69d63SRafael Espindola 
48e9cffafdSMehdi Amini // Parse inline ASM and collect the list of symbols that are not defined in
49e9cffafdSMehdi Amini // the current module. This is inspired from IRObjectFile.
50e9cffafdSMehdi Amini void IRObjectFile::CollectAsmUndefinedRefs(
51e9cffafdSMehdi Amini     Module &TheModule,
52e9cffafdSMehdi Amini     const std::function<void(StringRef, BasicSymbolRef::Flags)> &
53e9cffafdSMehdi Amini         AsmUndefinedRefs) {
54e9cffafdSMehdi Amini 
55e9cffafdSMehdi Amini   const std::string &InlineAsm = TheModule.getModuleInlineAsm();
5613b69d63SRafael Espindola   if (InlineAsm.empty())
5713b69d63SRafael Espindola     return;
5813b69d63SRafael Espindola 
59e9cffafdSMehdi Amini   Triple TT(TheModule.getTargetTriple());
6013b69d63SRafael Espindola   std::string Err;
618d8b13dcSDaniel Sanders   const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
6213b69d63SRafael Espindola   if (!T)
6313b69d63SRafael Espindola     return;
6413b69d63SRafael Espindola 
658d8b13dcSDaniel Sanders   std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
6613b69d63SRafael Espindola   if (!MRI)
6713b69d63SRafael Espindola     return;
6813b69d63SRafael Espindola 
698d8b13dcSDaniel Sanders   std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str()));
7013b69d63SRafael Espindola   if (!MAI)
7113b69d63SRafael Espindola     return;
7213b69d63SRafael Espindola 
7313b69d63SRafael Espindola   std::unique_ptr<MCSubtargetInfo> STI(
748d8b13dcSDaniel Sanders       T->createMCSubtargetInfo(TT.str(), "", ""));
7513b69d63SRafael Espindola   if (!STI)
7613b69d63SRafael Espindola     return;
7713b69d63SRafael Espindola 
7813b69d63SRafael Espindola   std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
7913b69d63SRafael Espindola   if (!MCII)
8013b69d63SRafael Espindola     return;
8113b69d63SRafael Espindola 
8213b69d63SRafael Espindola   MCObjectFileInfo MOFI;
8313b69d63SRafael Espindola   MCContext MCCtx(MAI.get(), MRI.get(), &MOFI);
848d8b13dcSDaniel Sanders   MOFI.InitMCObjectFileInfo(TT, Reloc::Default, CodeModel::Default, MCCtx);
8513b69d63SRafael Espindola   std::unique_ptr<RecordStreamer> Streamer(new RecordStreamer(MCCtx));
8620c7259cSPeter Collingbourne   T->createNullTargetStreamer(*Streamer);
8713b69d63SRafael Espindola 
8813b69d63SRafael Espindola   std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
8913b69d63SRafael Espindola   SourceMgr SrcMgr;
901961f14cSDavid Blaikie   SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
9113b69d63SRafael Espindola   std::unique_ptr<MCAsmParser> Parser(
9213b69d63SRafael Espindola       createMCAsmParser(SrcMgr, MCCtx, *Streamer, *MAI));
9313b69d63SRafael Espindola 
9413b69d63SRafael Espindola   MCTargetOptions MCOptions;
9513b69d63SRafael Espindola   std::unique_ptr<MCTargetAsmParser> TAP(
9613b69d63SRafael Espindola       T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
9713b69d63SRafael Espindola   if (!TAP)
9813b69d63SRafael Espindola     return;
9913b69d63SRafael Espindola 
10013b69d63SRafael Espindola   Parser->setTargetParser(*TAP);
10113b69d63SRafael Espindola   if (Parser->Run(false))
10213b69d63SRafael Espindola     return;
10313b69d63SRafael Espindola 
10413b69d63SRafael Espindola   for (auto &KV : *Streamer) {
10513b69d63SRafael Espindola     StringRef Key = KV.first();
10613b69d63SRafael Espindola     RecordStreamer::State Value = KV.second;
10713b69d63SRafael Espindola     uint32_t Res = BasicSymbolRef::SF_None;
10813b69d63SRafael Espindola     switch (Value) {
10913b69d63SRafael Espindola     case RecordStreamer::NeverSeen:
11013b69d63SRafael Espindola       llvm_unreachable("foo");
11113b69d63SRafael Espindola     case RecordStreamer::DefinedGlobal:
11213b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Global;
11313b69d63SRafael Espindola       break;
11413b69d63SRafael Espindola     case RecordStreamer::Defined:
11513b69d63SRafael Espindola       break;
11613b69d63SRafael Espindola     case RecordStreamer::Global:
11713b69d63SRafael Espindola     case RecordStreamer::Used:
11813b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Undefined;
11913b69d63SRafael Espindola       Res |= BasicSymbolRef::SF_Global;
12013b69d63SRafael Espindola       break;
12113b69d63SRafael Espindola     }
122e9cffafdSMehdi Amini     AsmUndefinedRefs(Key, BasicSymbolRef::Flags(Res));
12313b69d63SRafael Espindola   }
124f12b8282SRafael Espindola }
125f12b8282SRafael Espindola 
126dddd1fd9SRafael Espindola IRObjectFile::~IRObjectFile() {
127dddd1fd9SRafael Espindola  }
128c3f9b5a5SRafael Espindola 
129527e846eSRafael Espindola static GlobalValue *getGV(DataRefImpl &Symb) {
13013b69d63SRafael Espindola   if ((Symb.p & 3) == 3)
13113b69d63SRafael Espindola     return nullptr;
13213b69d63SRafael Espindola 
13313b69d63SRafael Espindola   return reinterpret_cast<GlobalValue*>(Symb.p & ~uintptr_t(3));
134f12b8282SRafael Espindola }
135f12b8282SRafael Espindola 
136f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_alias_iterator I, const Module &M) {
137f12b8282SRafael Espindola   if (I == M.alias_end())
138f12b8282SRafael Espindola     return 3;
139f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
140f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 2;
141f12b8282SRafael Espindola }
142f12b8282SRafael Espindola 
143f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_global_iterator I, const Module &M) {
144f12b8282SRafael Espindola   if (I == M.global_end())
145f12b8282SRafael Espindola     return skipEmpty(M.alias_begin(), M);
146f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
147f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 1;
148f12b8282SRafael Espindola }
149f12b8282SRafael Espindola 
150f12b8282SRafael Espindola static uintptr_t skipEmpty(Module::const_iterator I, const Module &M) {
151f12b8282SRafael Espindola   if (I == M.end())
152f12b8282SRafael Espindola     return skipEmpty(M.global_begin(), M);
153f12b8282SRafael Espindola   const GlobalValue *GV = &*I;
154f12b8282SRafael Espindola   return reinterpret_cast<uintptr_t>(GV) | 0;
155f12b8282SRafael Espindola }
156f12b8282SRafael Espindola 
15713b69d63SRafael Espindola static unsigned getAsmSymIndex(DataRefImpl Symb) {
15813b69d63SRafael Espindola   assert((Symb.p & uintptr_t(3)) == 3);
15913b69d63SRafael Espindola   uintptr_t Index = Symb.p & ~uintptr_t(3);
16013b69d63SRafael Espindola   Index >>= 2;
16113b69d63SRafael Espindola   return Index;
16213b69d63SRafael Espindola }
16313b69d63SRafael Espindola 
164f12b8282SRafael Espindola void IRObjectFile::moveSymbolNext(DataRefImpl &Symb) const {
16513b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
166f12b8282SRafael Espindola   uintptr_t Res;
16713b69d63SRafael Espindola 
168f12b8282SRafael Espindola   switch (Symb.p & 3) {
169f12b8282SRafael Espindola   case 0: {
170f12b8282SRafael Espindola     Module::const_iterator Iter(static_cast<const Function*>(GV));
171f12b8282SRafael Espindola     ++Iter;
17213b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
173f12b8282SRafael Espindola     break;
174f12b8282SRafael Espindola   }
175f12b8282SRafael Espindola   case 1: {
176f12b8282SRafael Espindola     Module::const_global_iterator Iter(static_cast<const GlobalVariable*>(GV));
177f12b8282SRafael Espindola     ++Iter;
17813b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
179f12b8282SRafael Espindola     break;
180f12b8282SRafael Espindola   }
181f12b8282SRafael Espindola   case 2: {
182f12b8282SRafael Espindola     Module::const_alias_iterator Iter(static_cast<const GlobalAlias*>(GV));
183f12b8282SRafael Espindola     ++Iter;
18413b69d63SRafael Espindola     Res = skipEmpty(Iter, *M);
185f12b8282SRafael Espindola     break;
186f12b8282SRafael Espindola   }
18713b69d63SRafael Espindola   case 3: {
18813b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
18913b69d63SRafael Espindola     assert(Index < AsmSymbols.size());
19013b69d63SRafael Espindola     ++Index;
19113b69d63SRafael Espindola     Res = (Index << 2) | 3;
19213b69d63SRafael Espindola     break;
19313b69d63SRafael Espindola   }
194addddc44SMichael Ilseman   default:
195addddc44SMichael Ilseman     llvm_unreachable("unreachable case");
196f12b8282SRafael Espindola   }
197f12b8282SRafael Espindola 
198f12b8282SRafael Espindola   Symb.p = Res;
199f12b8282SRafael Espindola }
200f12b8282SRafael Espindola 
201db4ed0bdSRafael Espindola std::error_code IRObjectFile::printSymbolName(raw_ostream &OS,
202f12b8282SRafael Espindola                                               DataRefImpl Symb) const {
20313b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
20413b69d63SRafael Espindola   if (!GV) {
20513b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
20613b69d63SRafael Espindola     assert(Index <= AsmSymbols.size());
20713b69d63SRafael Espindola     OS << AsmSymbols[Index].first;
2087d099195SRui Ueyama     return std::error_code();
20913b69d63SRafael Espindola   }
210a51f0f83SRafael Espindola 
21182e657b5SPeter Collingbourne   if (GV->hasDLLImportStorageClass())
21282e657b5SPeter Collingbourne     OS << "__imp_";
21382e657b5SPeter Collingbourne 
214a51f0f83SRafael Espindola   if (Mang)
21513b69d63SRafael Espindola     Mang->getNameWithPrefix(OS, GV, false);
216a51f0f83SRafael Espindola   else
21713b69d63SRafael Espindola     OS << GV->getName();
218a51f0f83SRafael Espindola 
2197d099195SRui Ueyama   return std::error_code();
220f12b8282SRafael Espindola }
221f12b8282SRafael Espindola 
222f12b8282SRafael Espindola uint32_t IRObjectFile::getSymbolFlags(DataRefImpl Symb) const {
22313b69d63SRafael Espindola   const GlobalValue *GV = getGV(Symb);
22413b69d63SRafael Espindola 
22513b69d63SRafael Espindola   if (!GV) {
22613b69d63SRafael Espindola     unsigned Index = getAsmSymIndex(Symb);
22713b69d63SRafael Espindola     assert(Index <= AsmSymbols.size());
22813b69d63SRafael Espindola     return AsmSymbols[Index].second;
22913b69d63SRafael Espindola   }
230f12b8282SRafael Espindola 
231f12b8282SRafael Espindola   uint32_t Res = BasicSymbolRef::SF_None;
232d4bcefc7SRafael Espindola   if (GV->isDeclarationForLinker())
233f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Undefined;
234dc0dbe1fSKevin Enderby   else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
235dc0dbe1fSKevin Enderby     Res |= BasicSymbolRef::SF_Hidden;
236dc0dbe1fSKevin Enderby   if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
237dc0dbe1fSKevin Enderby     if (GVar->isConstant())
238dc0dbe1fSKevin Enderby       Res |= BasicSymbolRef::SF_Const;
239dc0dbe1fSKevin Enderby   }
24013b69d63SRafael Espindola   if (GV->hasPrivateLinkage())
241f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_FormatSpecific;
24213b69d63SRafael Espindola   if (!GV->hasLocalLinkage())
243f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Global;
24413b69d63SRafael Espindola   if (GV->hasCommonLinkage())
245f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Common;
2468d6fbc3aSRafael Espindola   if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
2478d6fbc3aSRafael Espindola       GV->hasExternalWeakLinkage())
248f12b8282SRafael Espindola     Res |= BasicSymbolRef::SF_Weak;
249f12b8282SRafael Espindola 
2502dc0d9bdSRafael Espindola   if (GV->getName().startswith("llvm."))
251b674c17dSRafael Espindola     Res |= BasicSymbolRef::SF_FormatSpecific;
2522dc0d9bdSRafael Espindola   else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
2532dc0d9bdSRafael Espindola     if (Var->getSection() == StringRef("llvm.metadata"))
2543885090bSRafael Espindola       Res |= BasicSymbolRef::SF_FormatSpecific;
2553885090bSRafael Espindola   }
2563885090bSRafael Espindola 
257f12b8282SRafael Espindola   return Res;
258f12b8282SRafael Espindola }
259f12b8282SRafael Espindola 
260527e846eSRafael Espindola GlobalValue *IRObjectFile::getSymbolGV(DataRefImpl Symb) { return getGV(Symb); }
261f12b8282SRafael Espindola 
26225a7e0a8SRafael Espindola std::unique_ptr<Module> IRObjectFile::takeModule() { return std::move(M); }
26325a7e0a8SRafael Espindola 
264f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_begin_impl() const {
265f12b8282SRafael Espindola   Module::const_iterator I = M->begin();
266f12b8282SRafael Espindola   DataRefImpl Ret;
267f12b8282SRafael Espindola   Ret.p = skipEmpty(I, *M);
268f12b8282SRafael Espindola   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
269f12b8282SRafael Espindola }
270f12b8282SRafael Espindola 
271f12b8282SRafael Espindola basic_symbol_iterator IRObjectFile::symbol_end_impl() const {
272f12b8282SRafael Espindola   DataRefImpl Ret;
27313b69d63SRafael Espindola   uint64_t NumAsm = AsmSymbols.size();
27413b69d63SRafael Espindola   NumAsm <<= 2;
27513b69d63SRafael Espindola   Ret.p = 3 | NumAsm;
276f12b8282SRafael Espindola   return basic_symbol_iterator(BasicSymbolRef(Ret, this));
277f12b8282SRafael Espindola }
278f12b8282SRafael Espindola 
27910039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInObject(const ObjectFile &Obj) {
28010039c02SPeter Collingbourne   for (const SectionRef &Sec : Obj.sections()) {
281f2fe0141SSteven Wu     if (Sec.isBitcode()) {
28210039c02SPeter Collingbourne       StringRef SecContents;
28310039c02SPeter Collingbourne       if (std::error_code EC = Sec.getContents(SecContents))
28410039c02SPeter Collingbourne         return EC;
28510039c02SPeter Collingbourne       return MemoryBufferRef(SecContents, Obj.getFileName());
28610039c02SPeter Collingbourne     }
28710039c02SPeter Collingbourne   }
28810039c02SPeter Collingbourne 
28910039c02SPeter Collingbourne   return object_error::bitcode_section_not_found;
29010039c02SPeter Collingbourne }
29110039c02SPeter Collingbourne 
29210039c02SPeter Collingbourne ErrorOr<MemoryBufferRef> IRObjectFile::findBitcodeInMemBuffer(MemoryBufferRef Object) {
29310039c02SPeter Collingbourne   sys::fs::file_magic Type = sys::fs::identify_magic(Object.getBuffer());
29410039c02SPeter Collingbourne   switch (Type) {
29510039c02SPeter Collingbourne   case sys::fs::file_magic::bitcode:
29610039c02SPeter Collingbourne     return Object;
29710039c02SPeter Collingbourne   case sys::fs::file_magic::elf_relocatable:
29810039c02SPeter Collingbourne   case sys::fs::file_magic::macho_object:
29910039c02SPeter Collingbourne   case sys::fs::file_magic::coff_object: {
3003fcdf6aeSKevin Enderby     Expected<std::unique_ptr<ObjectFile>> ObjFile =
30110039c02SPeter Collingbourne         ObjectFile::createObjectFile(Object, Type);
30210039c02SPeter Collingbourne     if (!ObjFile)
3033fcdf6aeSKevin Enderby       return errorToErrorCode(ObjFile.takeError());
30410039c02SPeter Collingbourne     return findBitcodeInObject(*ObjFile->get());
30510039c02SPeter Collingbourne   }
30610039c02SPeter Collingbourne   default:
30710039c02SPeter Collingbourne     return object_error::invalid_file_type;
30810039c02SPeter Collingbourne   }
30910039c02SPeter Collingbourne }
31010039c02SPeter Collingbourne 
31110a27df8SDavid Blaikie ErrorOr<std::unique_ptr<IRObjectFile>>
3125dec7eaaSRafael Espindola llvm::object::IRObjectFile::create(MemoryBufferRef Object,
31348af1c2aSRafael Espindola                                    LLVMContext &Context) {
31410039c02SPeter Collingbourne   ErrorOr<MemoryBufferRef> BCOrErr = findBitcodeInMemBuffer(Object);
31510039c02SPeter Collingbourne   if (!BCOrErr)
31610039c02SPeter Collingbourne     return BCOrErr.getError();
31748af1c2aSRafael Espindola 
318cf981625SRafael Espindola   std::unique_ptr<MemoryBuffer> Buff =
319cf981625SRafael Espindola       MemoryBuffer::getMemBuffer(BCOrErr.get(), false);
32048af1c2aSRafael Espindola 
321dcd1dca2SRafael Espindola   ErrorOr<std::unique_ptr<Module>> MOrErr =
3229d2bfc48SRafael Espindola       getLazyBitcodeModule(std::move(Buff), Context,
323cba833a0SRafael Espindola                            /*ShouldLazyLoadMetadata*/ true);
324dddd1fd9SRafael Espindola   if (std::error_code EC = MOrErr.getError())
325f12b8282SRafael Espindola     return EC;
326dddd1fd9SRafael Espindola 
327dcd1dca2SRafael Espindola   std::unique_ptr<Module> &M = MOrErr.get();
32810a27df8SDavid Blaikie   return llvm::make_unique<IRObjectFile>(Object, std::move(M));
329f12b8282SRafael Espindola }
330