11df42facSEugene Zelenko //===- ModuleSymbolTable.cpp - symbol table for in-memory IR --------------===//
2863cbfbeSPeter Collingbourne //
32946cd70SChandler Carruth // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
42946cd70SChandler Carruth // See https://llvm.org/LICENSE.txt for license information.
52946cd70SChandler Carruth // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6863cbfbeSPeter Collingbourne //
7863cbfbeSPeter Collingbourne //===----------------------------------------------------------------------===//
8863cbfbeSPeter Collingbourne //
9863cbfbeSPeter Collingbourne // This class represents a symbol table built from in-memory IR. It provides
10863cbfbeSPeter Collingbourne // access to GlobalValues and should only be used if such access is required
11863cbfbeSPeter Collingbourne // (e.g. in the LTO implementation).
12863cbfbeSPeter Collingbourne //
13863cbfbeSPeter Collingbourne //===----------------------------------------------------------------------===//
14863cbfbeSPeter Collingbourne 
156bda14b3SChandler Carruth #include "llvm/Object/ModuleSymbolTable.h"
16863cbfbeSPeter Collingbourne #include "RecordStreamer.h"
17863cbfbeSPeter Collingbourne #include "llvm/ADT/STLExtras.h"
186bda14b3SChandler Carruth #include "llvm/ADT/SmallString.h"
191df42facSEugene Zelenko #include "llvm/ADT/StringMap.h"
201df42facSEugene Zelenko #include "llvm/ADT/StringRef.h"
211df42facSEugene Zelenko #include "llvm/ADT/Triple.h"
221df42facSEugene Zelenko #include "llvm/IR/Function.h"
231df42facSEugene Zelenko #include "llvm/IR/GlobalAlias.h"
241df42facSEugene Zelenko #include "llvm/IR/GlobalValue.h"
251df42facSEugene Zelenko #include "llvm/IR/GlobalVariable.h"
26a8e582c8SHans Wennborg #include "llvm/IR/InlineAsm.h"
27863cbfbeSPeter Collingbourne #include "llvm/IR/Module.h"
28863cbfbeSPeter Collingbourne #include "llvm/MC/MCAsmInfo.h"
29863cbfbeSPeter Collingbourne #include "llvm/MC/MCContext.h"
301df42facSEugene Zelenko #include "llvm/MC/MCDirectives.h"
31863cbfbeSPeter Collingbourne #include "llvm/MC/MCInstrInfo.h"
32863cbfbeSPeter Collingbourne #include "llvm/MC/MCObjectFileInfo.h"
33863cbfbeSPeter Collingbourne #include "llvm/MC/MCParser/MCAsmParser.h"
34863cbfbeSPeter Collingbourne #include "llvm/MC/MCParser/MCTargetAsmParser.h"
35863cbfbeSPeter Collingbourne #include "llvm/MC/MCRegisterInfo.h"
36863cbfbeSPeter Collingbourne #include "llvm/MC/MCSubtargetInfo.h"
371df42facSEugene Zelenko #include "llvm/MC/MCSymbol.h"
381df42facSEugene Zelenko #include "llvm/MC/MCTargetOptions.h"
391df42facSEugene Zelenko #include "llvm/Object/SymbolicFile.h"
401df42facSEugene Zelenko #include "llvm/Support/Casting.h"
411df42facSEugene Zelenko #include "llvm/Support/CodeGen.h"
421df42facSEugene Zelenko #include "llvm/Support/ErrorHandling.h"
43863cbfbeSPeter Collingbourne #include "llvm/Support/MemoryBuffer.h"
441df42facSEugene Zelenko #include "llvm/Support/SMLoc.h"
45863cbfbeSPeter Collingbourne #include "llvm/Support/SourceMgr.h"
46863cbfbeSPeter Collingbourne #include "llvm/Support/TargetRegistry.h"
476bda14b3SChandler Carruth #include "llvm/Support/raw_ostream.h"
481df42facSEugene Zelenko #include <algorithm>
491df42facSEugene Zelenko #include <cassert>
501df42facSEugene Zelenko #include <cstdint>
511df42facSEugene Zelenko #include <memory>
521df42facSEugene Zelenko #include <string>
531df42facSEugene Zelenko 
54863cbfbeSPeter Collingbourne using namespace llvm;
55863cbfbeSPeter Collingbourne using namespace object;
56863cbfbeSPeter Collingbourne 
57863cbfbeSPeter Collingbourne void ModuleSymbolTable::addModule(Module *M) {
58863cbfbeSPeter Collingbourne   if (FirstMod)
59863cbfbeSPeter Collingbourne     assert(FirstMod->getTargetTriple() == M->getTargetTriple());
60863cbfbeSPeter Collingbourne   else
61863cbfbeSPeter Collingbourne     FirstMod = M;
62863cbfbeSPeter Collingbourne 
63b26bc7fdSRafael Espindola   for (GlobalValue &GV : M->global_values())
64863cbfbeSPeter Collingbourne     SymTab.push_back(&GV);
65863cbfbeSPeter Collingbourne 
66d8204472STeresa Johnson   CollectAsmSymbols(*M, [this](StringRef Name, BasicSymbolRef::Flags Flags) {
67a9bc7b83SBenjamin Kramer     SymTab.push_back(new (AsmSymbols.Allocate())
68a9bc7b83SBenjamin Kramer                          AsmSymbol(std::string(Name), Flags));
69863cbfbeSPeter Collingbourne   });
70863cbfbeSPeter Collingbourne }
71863cbfbeSPeter Collingbourne 
72230b2567SVlad Tsyrklevich static void
73230b2567SVlad Tsyrklevich initializeRecordStreamer(const Module &M,
74230b2567SVlad Tsyrklevich                          function_ref<void(RecordStreamer &)> Init) {
75d8204472STeresa Johnson   StringRef InlineAsm = M.getModuleInlineAsm();
76863cbfbeSPeter Collingbourne   if (InlineAsm.empty())
77863cbfbeSPeter Collingbourne     return;
78863cbfbeSPeter Collingbourne 
79863cbfbeSPeter Collingbourne   std::string Err;
80d8204472STeresa Johnson   const Triple TT(M.getTargetTriple());
81863cbfbeSPeter Collingbourne   const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
82863cbfbeSPeter Collingbourne   assert(T && T->hasMCAsmParser());
83863cbfbeSPeter Collingbourne 
84863cbfbeSPeter Collingbourne   std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
85863cbfbeSPeter Collingbourne   if (!MRI)
86863cbfbeSPeter Collingbourne     return;
87863cbfbeSPeter Collingbourne 
884b63ca13SMirko Brkusanin   MCTargetOptions MCOptions;
894b63ca13SMirko Brkusanin   std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str(), MCOptions));
90863cbfbeSPeter Collingbourne   if (!MAI)
91863cbfbeSPeter Collingbourne     return;
92863cbfbeSPeter Collingbourne 
93863cbfbeSPeter Collingbourne   std::unique_ptr<MCSubtargetInfo> STI(
94863cbfbeSPeter Collingbourne       T->createMCSubtargetInfo(TT.str(), "", ""));
95863cbfbeSPeter Collingbourne   if (!STI)
96863cbfbeSPeter Collingbourne     return;
97863cbfbeSPeter Collingbourne 
98863cbfbeSPeter Collingbourne   std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
99863cbfbeSPeter Collingbourne   if (!MCII)
100863cbfbeSPeter Collingbourne     return;
101863cbfbeSPeter Collingbourne 
102*c2f819afSPhilipp Krones   MCContext MCCtx(TT, MAI.get(), MRI.get(), STI.get());
103*c2f819afSPhilipp Krones   std::unique_ptr<MCObjectFileInfo> MOFI(
104*c2f819afSPhilipp Krones       T->createMCObjectFileInfo(MCCtx, /*PIC=*/false));
105*c2f819afSPhilipp Krones   MOFI->setSDKVersion(M.getSDKVersion());
106*c2f819afSPhilipp Krones   MCCtx.setObjectFileInfo(MOFI.get());
1070d03881eSVitaly Buka   RecordStreamer Streamer(MCCtx, M);
108863cbfbeSPeter Collingbourne   T->createNullTargetStreamer(Streamer);
109863cbfbeSPeter Collingbourne 
110863cbfbeSPeter Collingbourne   std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
111863cbfbeSPeter Collingbourne   SourceMgr SrcMgr;
112863cbfbeSPeter Collingbourne   SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
113863cbfbeSPeter Collingbourne   std::unique_ptr<MCAsmParser> Parser(
114863cbfbeSPeter Collingbourne       createMCAsmParser(SrcMgr, MCCtx, Streamer, *MAI));
115863cbfbeSPeter Collingbourne 
116863cbfbeSPeter Collingbourne   std::unique_ptr<MCTargetAsmParser> TAP(
117863cbfbeSPeter Collingbourne       T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
118863cbfbeSPeter Collingbourne   if (!TAP)
119863cbfbeSPeter Collingbourne     return;
120863cbfbeSPeter Collingbourne 
121a8e582c8SHans Wennborg   // Module-level inline asm is assumed to use At&t syntax (see
122a8e582c8SHans Wennborg   // AsmPrinter::doInitialization()).
123a8e582c8SHans Wennborg   Parser->setAssemblerDialect(InlineAsm::AD_ATT);
124a8e582c8SHans Wennborg 
125863cbfbeSPeter Collingbourne   Parser->setTargetParser(*TAP);
126863cbfbeSPeter Collingbourne   if (Parser->Run(false))
127863cbfbeSPeter Collingbourne     return;
128863cbfbeSPeter Collingbourne 
129230b2567SVlad Tsyrklevich   Init(Streamer);
130230b2567SVlad Tsyrklevich }
131230b2567SVlad Tsyrklevich 
132230b2567SVlad Tsyrklevich void ModuleSymbolTable::CollectAsmSymbols(
133230b2567SVlad Tsyrklevich     const Module &M,
134230b2567SVlad Tsyrklevich     function_ref<void(StringRef, BasicSymbolRef::Flags)> AsmSymbol) {
135230b2567SVlad Tsyrklevich   initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
1360d03881eSVitaly Buka     Streamer.flushSymverDirectives();
137d8204472STeresa Johnson 
138863cbfbeSPeter Collingbourne     for (auto &KV : Streamer) {
139863cbfbeSPeter Collingbourne       StringRef Key = KV.first();
140863cbfbeSPeter Collingbourne       RecordStreamer::State Value = KV.second;
141e2f1b4a6SPeter Collingbourne       // FIXME: For now we just assume that all asm symbols are executable.
142e2f1b4a6SPeter Collingbourne       uint32_t Res = BasicSymbolRef::SF_Executable;
143863cbfbeSPeter Collingbourne       switch (Value) {
144863cbfbeSPeter Collingbourne       case RecordStreamer::NeverSeen:
145863cbfbeSPeter Collingbourne         llvm_unreachable("NeverSeen should have been replaced earlier");
146863cbfbeSPeter Collingbourne       case RecordStreamer::DefinedGlobal:
147863cbfbeSPeter Collingbourne         Res |= BasicSymbolRef::SF_Global;
148863cbfbeSPeter Collingbourne         break;
149863cbfbeSPeter Collingbourne       case RecordStreamer::Defined:
150863cbfbeSPeter Collingbourne         break;
151863cbfbeSPeter Collingbourne       case RecordStreamer::Global:
152863cbfbeSPeter Collingbourne       case RecordStreamer::Used:
153863cbfbeSPeter Collingbourne         Res |= BasicSymbolRef::SF_Undefined;
154863cbfbeSPeter Collingbourne         Res |= BasicSymbolRef::SF_Global;
155863cbfbeSPeter Collingbourne         break;
156863cbfbeSPeter Collingbourne       case RecordStreamer::DefinedWeak:
157863cbfbeSPeter Collingbourne         Res |= BasicSymbolRef::SF_Weak;
158863cbfbeSPeter Collingbourne         Res |= BasicSymbolRef::SF_Global;
159863cbfbeSPeter Collingbourne         break;
160863cbfbeSPeter Collingbourne       case RecordStreamer::UndefinedWeak:
161863cbfbeSPeter Collingbourne         Res |= BasicSymbolRef::SF_Weak;
162863cbfbeSPeter Collingbourne         Res |= BasicSymbolRef::SF_Undefined;
163863cbfbeSPeter Collingbourne       }
164863cbfbeSPeter Collingbourne       AsmSymbol(Key, BasicSymbolRef::Flags(Res));
165863cbfbeSPeter Collingbourne     }
166230b2567SVlad Tsyrklevich   });
167230b2567SVlad Tsyrklevich }
168230b2567SVlad Tsyrklevich 
169230b2567SVlad Tsyrklevich void ModuleSymbolTable::CollectAsmSymvers(
170230b2567SVlad Tsyrklevich     const Module &M, function_ref<void(StringRef, StringRef)> AsmSymver) {
171230b2567SVlad Tsyrklevich   initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
172230b2567SVlad Tsyrklevich     for (auto &KV : Streamer.symverAliases())
173230b2567SVlad Tsyrklevich       for (auto &Alias : KV.second)
174230b2567SVlad Tsyrklevich         AsmSymver(KV.first->getName(), Alias);
175230b2567SVlad Tsyrklevich   });
176863cbfbeSPeter Collingbourne }
177863cbfbeSPeter Collingbourne 
178863cbfbeSPeter Collingbourne void ModuleSymbolTable::printSymbolName(raw_ostream &OS, Symbol S) const {
179863cbfbeSPeter Collingbourne   if (S.is<AsmSymbol *>()) {
180863cbfbeSPeter Collingbourne     OS << S.get<AsmSymbol *>()->first;
181863cbfbeSPeter Collingbourne     return;
182863cbfbeSPeter Collingbourne   }
183863cbfbeSPeter Collingbourne 
184863cbfbeSPeter Collingbourne   auto *GV = S.get<GlobalValue *>();
185863cbfbeSPeter Collingbourne   if (GV->hasDLLImportStorageClass())
186863cbfbeSPeter Collingbourne     OS << "__imp_";
187863cbfbeSPeter Collingbourne 
188863cbfbeSPeter Collingbourne   Mang.getNameWithPrefix(OS, GV, false);
189863cbfbeSPeter Collingbourne }
190863cbfbeSPeter Collingbourne 
191863cbfbeSPeter Collingbourne uint32_t ModuleSymbolTable::getSymbolFlags(Symbol S) const {
192863cbfbeSPeter Collingbourne   if (S.is<AsmSymbol *>())
193863cbfbeSPeter Collingbourne     return S.get<AsmSymbol *>()->second;
194863cbfbeSPeter Collingbourne 
195863cbfbeSPeter Collingbourne   auto *GV = S.get<GlobalValue *>();
196863cbfbeSPeter Collingbourne 
197863cbfbeSPeter Collingbourne   uint32_t Res = BasicSymbolRef::SF_None;
198863cbfbeSPeter Collingbourne   if (GV->isDeclarationForLinker())
199863cbfbeSPeter Collingbourne     Res |= BasicSymbolRef::SF_Undefined;
200863cbfbeSPeter Collingbourne   else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
201863cbfbeSPeter Collingbourne     Res |= BasicSymbolRef::SF_Hidden;
202863cbfbeSPeter Collingbourne   if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
203863cbfbeSPeter Collingbourne     if (GVar->isConstant())
204863cbfbeSPeter Collingbourne       Res |= BasicSymbolRef::SF_Const;
205863cbfbeSPeter Collingbourne   }
206e2f1b4a6SPeter Collingbourne   if (dyn_cast_or_null<Function>(GV->getBaseObject()))
207e2f1b4a6SPeter Collingbourne     Res |= BasicSymbolRef::SF_Executable;
208d64ecf26SPeter Collingbourne   if (isa<GlobalAlias>(GV))
209d64ecf26SPeter Collingbourne     Res |= BasicSymbolRef::SF_Indirect;
210863cbfbeSPeter Collingbourne   if (GV->hasPrivateLinkage())
211863cbfbeSPeter Collingbourne     Res |= BasicSymbolRef::SF_FormatSpecific;
212863cbfbeSPeter Collingbourne   if (!GV->hasLocalLinkage())
213863cbfbeSPeter Collingbourne     Res |= BasicSymbolRef::SF_Global;
214863cbfbeSPeter Collingbourne   if (GV->hasCommonLinkage())
215863cbfbeSPeter Collingbourne     Res |= BasicSymbolRef::SF_Common;
216863cbfbeSPeter Collingbourne   if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
217863cbfbeSPeter Collingbourne       GV->hasExternalWeakLinkage())
218863cbfbeSPeter Collingbourne     Res |= BasicSymbolRef::SF_Weak;
219863cbfbeSPeter Collingbourne 
220863cbfbeSPeter Collingbourne   if (GV->getName().startswith("llvm."))
221863cbfbeSPeter Collingbourne     Res |= BasicSymbolRef::SF_FormatSpecific;
222863cbfbeSPeter Collingbourne   else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
223863cbfbeSPeter Collingbourne     if (Var->getSection() == "llvm.metadata")
224863cbfbeSPeter Collingbourne       Res |= BasicSymbolRef::SF_FormatSpecific;
225863cbfbeSPeter Collingbourne   }
226863cbfbeSPeter Collingbourne 
227863cbfbeSPeter Collingbourne   return Res;
228863cbfbeSPeter Collingbourne }
229