//===- ModuleSymbolTable.cpp - symbol table for in-memory IR --------------===//
//
// The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This class represents a symbol table built from in-memory IR. It provides
// access to GlobalValues and should only be used if such access is required
// (e.g. in the LTO implementation).
//
//===----------------------------------------------------------------------===//
15d88c1a5aSDimitry Andric
16db17bf38SDimitry Andric #include "llvm/Object/ModuleSymbolTable.h"
17d88c1a5aSDimitry Andric #include "RecordStreamer.h"
18d88c1a5aSDimitry Andric #include "llvm/ADT/STLExtras.h"
19db17bf38SDimitry Andric #include "llvm/ADT/SmallString.h"
2051690af2SDimitry Andric #include "llvm/ADT/StringMap.h"
2151690af2SDimitry Andric #include "llvm/ADT/StringRef.h"
2251690af2SDimitry Andric #include "llvm/ADT/Triple.h"
2351690af2SDimitry Andric #include "llvm/IR/Function.h"
2451690af2SDimitry Andric #include "llvm/IR/GlobalAlias.h"
2551690af2SDimitry Andric #include "llvm/IR/GlobalValue.h"
2651690af2SDimitry Andric #include "llvm/IR/GlobalVariable.h"
27d88c1a5aSDimitry Andric #include "llvm/IR/Module.h"
28d88c1a5aSDimitry Andric #include "llvm/MC/MCAsmInfo.h"
29d88c1a5aSDimitry Andric #include "llvm/MC/MCContext.h"
3051690af2SDimitry Andric #include "llvm/MC/MCDirectives.h"
31d88c1a5aSDimitry Andric #include "llvm/MC/MCInstrInfo.h"
32d88c1a5aSDimitry Andric #include "llvm/MC/MCObjectFileInfo.h"
33d88c1a5aSDimitry Andric #include "llvm/MC/MCParser/MCAsmParser.h"
34d88c1a5aSDimitry Andric #include "llvm/MC/MCParser/MCTargetAsmParser.h"
35d88c1a5aSDimitry Andric #include "llvm/MC/MCRegisterInfo.h"
36d88c1a5aSDimitry Andric #include "llvm/MC/MCSubtargetInfo.h"
3751690af2SDimitry Andric #include "llvm/MC/MCSymbol.h"
3851690af2SDimitry Andric #include "llvm/MC/MCTargetOptions.h"
3951690af2SDimitry Andric #include "llvm/Object/SymbolicFile.h"
4051690af2SDimitry Andric #include "llvm/Support/Casting.h"
4151690af2SDimitry Andric #include "llvm/Support/CodeGen.h"
4251690af2SDimitry Andric #include "llvm/Support/ErrorHandling.h"
43d88c1a5aSDimitry Andric #include "llvm/Support/MemoryBuffer.h"
4451690af2SDimitry Andric #include "llvm/Support/SMLoc.h"
45d88c1a5aSDimitry Andric #include "llvm/Support/SourceMgr.h"
46d88c1a5aSDimitry Andric #include "llvm/Support/TargetRegistry.h"
47db17bf38SDimitry Andric #include "llvm/Support/raw_ostream.h"
4851690af2SDimitry Andric #include <algorithm>
4951690af2SDimitry Andric #include <cassert>
5051690af2SDimitry Andric #include <cstdint>
5151690af2SDimitry Andric #include <memory>
5251690af2SDimitry Andric #include <string>
5351690af2SDimitry Andric
54d88c1a5aSDimitry Andric using namespace llvm;
55d88c1a5aSDimitry Andric using namespace object;
56d88c1a5aSDimitry Andric
addModule(Module * M)57d88c1a5aSDimitry Andric void ModuleSymbolTable::addModule(Module *M) {
58d88c1a5aSDimitry Andric if (FirstMod)
59d88c1a5aSDimitry Andric assert(FirstMod->getTargetTriple() == M->getTargetTriple());
60d88c1a5aSDimitry Andric else
61d88c1a5aSDimitry Andric FirstMod = M;
62d88c1a5aSDimitry Andric
637a7e6055SDimitry Andric for (GlobalValue &GV : M->global_values())
64d88c1a5aSDimitry Andric SymTab.push_back(&GV);
65d88c1a5aSDimitry Andric
667a7e6055SDimitry Andric CollectAsmSymbols(*M, [this](StringRef Name, BasicSymbolRef::Flags Flags) {
677a7e6055SDimitry Andric SymTab.push_back(new (AsmSymbols.Allocate()) AsmSymbol(Name, Flags));
68d88c1a5aSDimitry Andric });
69d88c1a5aSDimitry Andric }
70d88c1a5aSDimitry Andric
714ba319b5SDimitry Andric static void
initializeRecordStreamer(const Module & M,function_ref<void (RecordStreamer &)> Init)724ba319b5SDimitry Andric initializeRecordStreamer(const Module &M,
734ba319b5SDimitry Andric function_ref<void(RecordStreamer &)> Init) {
747a7e6055SDimitry Andric StringRef InlineAsm = M.getModuleInlineAsm();
75d88c1a5aSDimitry Andric if (InlineAsm.empty())
76d88c1a5aSDimitry Andric return;
77d88c1a5aSDimitry Andric
78d88c1a5aSDimitry Andric std::string Err;
797a7e6055SDimitry Andric const Triple TT(M.getTargetTriple());
80d88c1a5aSDimitry Andric const Target *T = TargetRegistry::lookupTarget(TT.str(), Err);
81d88c1a5aSDimitry Andric assert(T && T->hasMCAsmParser());
82d88c1a5aSDimitry Andric
83d88c1a5aSDimitry Andric std::unique_ptr<MCRegisterInfo> MRI(T->createMCRegInfo(TT.str()));
84d88c1a5aSDimitry Andric if (!MRI)
85d88c1a5aSDimitry Andric return;
86d88c1a5aSDimitry Andric
87d88c1a5aSDimitry Andric std::unique_ptr<MCAsmInfo> MAI(T->createMCAsmInfo(*MRI, TT.str()));
88d88c1a5aSDimitry Andric if (!MAI)
89d88c1a5aSDimitry Andric return;
90d88c1a5aSDimitry Andric
91d88c1a5aSDimitry Andric std::unique_ptr<MCSubtargetInfo> STI(
92d88c1a5aSDimitry Andric T->createMCSubtargetInfo(TT.str(), "", ""));
93d88c1a5aSDimitry Andric if (!STI)
94d88c1a5aSDimitry Andric return;
95d88c1a5aSDimitry Andric
96d88c1a5aSDimitry Andric std::unique_ptr<MCInstrInfo> MCII(T->createMCInstrInfo());
97d88c1a5aSDimitry Andric if (!MCII)
98d88c1a5aSDimitry Andric return;
99d88c1a5aSDimitry Andric
100d88c1a5aSDimitry Andric MCObjectFileInfo MOFI;
101d88c1a5aSDimitry Andric MCContext MCCtx(MAI.get(), MRI.get(), &MOFI);
1022cab237bSDimitry Andric MOFI.InitMCObjectFileInfo(TT, /*PIC*/ false, MCCtx);
103*b5893f02SDimitry Andric MOFI.setSDKVersion(M.getSDKVersion());
104ad414d86SDimitry Andric RecordStreamer Streamer(MCCtx, M);
105d88c1a5aSDimitry Andric T->createNullTargetStreamer(Streamer);
106d88c1a5aSDimitry Andric
107d88c1a5aSDimitry Andric std::unique_ptr<MemoryBuffer> Buffer(MemoryBuffer::getMemBuffer(InlineAsm));
108d88c1a5aSDimitry Andric SourceMgr SrcMgr;
109d88c1a5aSDimitry Andric SrcMgr.AddNewSourceBuffer(std::move(Buffer), SMLoc());
110d88c1a5aSDimitry Andric std::unique_ptr<MCAsmParser> Parser(
111d88c1a5aSDimitry Andric createMCAsmParser(SrcMgr, MCCtx, Streamer, *MAI));
112d88c1a5aSDimitry Andric
113d88c1a5aSDimitry Andric MCTargetOptions MCOptions;
114d88c1a5aSDimitry Andric std::unique_ptr<MCTargetAsmParser> TAP(
115d88c1a5aSDimitry Andric T->createMCAsmParser(*STI, *Parser, *MCII, MCOptions));
116d88c1a5aSDimitry Andric if (!TAP)
117d88c1a5aSDimitry Andric return;
118d88c1a5aSDimitry Andric
119d88c1a5aSDimitry Andric Parser->setTargetParser(*TAP);
120d88c1a5aSDimitry Andric if (Parser->Run(false))
121d88c1a5aSDimitry Andric return;
122d88c1a5aSDimitry Andric
1234ba319b5SDimitry Andric Init(Streamer);
1244ba319b5SDimitry Andric }
1254ba319b5SDimitry Andric
CollectAsmSymbols(const Module & M,function_ref<void (StringRef,BasicSymbolRef::Flags)> AsmSymbol)1264ba319b5SDimitry Andric void ModuleSymbolTable::CollectAsmSymbols(
1274ba319b5SDimitry Andric const Module &M,
1284ba319b5SDimitry Andric function_ref<void(StringRef, BasicSymbolRef::Flags)> AsmSymbol) {
1294ba319b5SDimitry Andric initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
130ad414d86SDimitry Andric Streamer.flushSymverDirectives();
1317a7e6055SDimitry Andric
132d88c1a5aSDimitry Andric for (auto &KV : Streamer) {
133d88c1a5aSDimitry Andric StringRef Key = KV.first();
134d88c1a5aSDimitry Andric RecordStreamer::State Value = KV.second;
135d88c1a5aSDimitry Andric // FIXME: For now we just assume that all asm symbols are executable.
136d88c1a5aSDimitry Andric uint32_t Res = BasicSymbolRef::SF_Executable;
137d88c1a5aSDimitry Andric switch (Value) {
138d88c1a5aSDimitry Andric case RecordStreamer::NeverSeen:
139d88c1a5aSDimitry Andric llvm_unreachable("NeverSeen should have been replaced earlier");
140d88c1a5aSDimitry Andric case RecordStreamer::DefinedGlobal:
141d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Global;
142d88c1a5aSDimitry Andric break;
143d88c1a5aSDimitry Andric case RecordStreamer::Defined:
144d88c1a5aSDimitry Andric break;
145d88c1a5aSDimitry Andric case RecordStreamer::Global:
146d88c1a5aSDimitry Andric case RecordStreamer::Used:
147d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Undefined;
148d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Global;
149d88c1a5aSDimitry Andric break;
150d88c1a5aSDimitry Andric case RecordStreamer::DefinedWeak:
151d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Weak;
152d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Global;
153d88c1a5aSDimitry Andric break;
154d88c1a5aSDimitry Andric case RecordStreamer::UndefinedWeak:
155d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Weak;
156d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Undefined;
157d88c1a5aSDimitry Andric }
158d88c1a5aSDimitry Andric AsmSymbol(Key, BasicSymbolRef::Flags(Res));
159d88c1a5aSDimitry Andric }
1604ba319b5SDimitry Andric });
1614ba319b5SDimitry Andric }
1624ba319b5SDimitry Andric
CollectAsmSymvers(const Module & M,function_ref<void (StringRef,StringRef)> AsmSymver)1634ba319b5SDimitry Andric void ModuleSymbolTable::CollectAsmSymvers(
1644ba319b5SDimitry Andric const Module &M, function_ref<void(StringRef, StringRef)> AsmSymver) {
1654ba319b5SDimitry Andric initializeRecordStreamer(M, [&](RecordStreamer &Streamer) {
1664ba319b5SDimitry Andric for (auto &KV : Streamer.symverAliases())
1674ba319b5SDimitry Andric for (auto &Alias : KV.second)
1684ba319b5SDimitry Andric AsmSymver(KV.first->getName(), Alias);
1694ba319b5SDimitry Andric });
170d88c1a5aSDimitry Andric }
171d88c1a5aSDimitry Andric
printSymbolName(raw_ostream & OS,Symbol S) const172d88c1a5aSDimitry Andric void ModuleSymbolTable::printSymbolName(raw_ostream &OS, Symbol S) const {
173d88c1a5aSDimitry Andric if (S.is<AsmSymbol *>()) {
174d88c1a5aSDimitry Andric OS << S.get<AsmSymbol *>()->first;
175d88c1a5aSDimitry Andric return;
176d88c1a5aSDimitry Andric }
177d88c1a5aSDimitry Andric
178d88c1a5aSDimitry Andric auto *GV = S.get<GlobalValue *>();
179d88c1a5aSDimitry Andric if (GV->hasDLLImportStorageClass())
180d88c1a5aSDimitry Andric OS << "__imp_";
181d88c1a5aSDimitry Andric
182d88c1a5aSDimitry Andric Mang.getNameWithPrefix(OS, GV, false);
183d88c1a5aSDimitry Andric }
184d88c1a5aSDimitry Andric
getSymbolFlags(Symbol S) const185d88c1a5aSDimitry Andric uint32_t ModuleSymbolTable::getSymbolFlags(Symbol S) const {
186d88c1a5aSDimitry Andric if (S.is<AsmSymbol *>())
187d88c1a5aSDimitry Andric return S.get<AsmSymbol *>()->second;
188d88c1a5aSDimitry Andric
189d88c1a5aSDimitry Andric auto *GV = S.get<GlobalValue *>();
190d88c1a5aSDimitry Andric
191d88c1a5aSDimitry Andric uint32_t Res = BasicSymbolRef::SF_None;
192d88c1a5aSDimitry Andric if (GV->isDeclarationForLinker())
193d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Undefined;
194d88c1a5aSDimitry Andric else if (GV->hasHiddenVisibility() && !GV->hasLocalLinkage())
195d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Hidden;
196d88c1a5aSDimitry Andric if (const GlobalVariable *GVar = dyn_cast<GlobalVariable>(GV)) {
197d88c1a5aSDimitry Andric if (GVar->isConstant())
198d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Const;
199d88c1a5aSDimitry Andric }
200d88c1a5aSDimitry Andric if (dyn_cast_or_null<Function>(GV->getBaseObject()))
201d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Executable;
202d88c1a5aSDimitry Andric if (isa<GlobalAlias>(GV))
203d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Indirect;
204d88c1a5aSDimitry Andric if (GV->hasPrivateLinkage())
205d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_FormatSpecific;
206d88c1a5aSDimitry Andric if (!GV->hasLocalLinkage())
207d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Global;
208d88c1a5aSDimitry Andric if (GV->hasCommonLinkage())
209d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Common;
210d88c1a5aSDimitry Andric if (GV->hasLinkOnceLinkage() || GV->hasWeakLinkage() ||
211d88c1a5aSDimitry Andric GV->hasExternalWeakLinkage())
212d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_Weak;
213d88c1a5aSDimitry Andric
214d88c1a5aSDimitry Andric if (GV->getName().startswith("llvm."))
215d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_FormatSpecific;
216d88c1a5aSDimitry Andric else if (auto *Var = dyn_cast<GlobalVariable>(GV)) {
217d88c1a5aSDimitry Andric if (Var->getSection() == "llvm.metadata")
218d88c1a5aSDimitry Andric Res |= BasicSymbolRef::SF_FormatSpecific;
219d88c1a5aSDimitry Andric }
220d88c1a5aSDimitry Andric
221d88c1a5aSDimitry Andric return Res;
222d88c1a5aSDimitry Andric }
223