1d88c1a5aSDimitry Andric //===- ThinLTOBitcodeWriter.cpp - Bitcode writing pass for ThinLTO --------===//
2d88c1a5aSDimitry Andric //
3d88c1a5aSDimitry Andric //                     The LLVM Compiler Infrastructure
4d88c1a5aSDimitry Andric //
5d88c1a5aSDimitry Andric // This file is distributed under the University of Illinois Open Source
6d88c1a5aSDimitry Andric // License. See LICENSE.TXT for details.
7d88c1a5aSDimitry Andric //
8d88c1a5aSDimitry Andric //===----------------------------------------------------------------------===//
9d88c1a5aSDimitry Andric 
10f9448bf3SDimitry Andric #include "llvm/Transforms/IPO/ThinLTOBitcodeWriter.h"
117a7e6055SDimitry Andric #include "llvm/Analysis/BasicAliasAnalysis.h"
12d88c1a5aSDimitry Andric #include "llvm/Analysis/ModuleSummaryAnalysis.h"
135517e702SDimitry Andric #include "llvm/Analysis/ProfileSummaryInfo.h"
14d88c1a5aSDimitry Andric #include "llvm/Analysis/TypeMetadataUtils.h"
15d88c1a5aSDimitry Andric #include "llvm/Bitcode/BitcodeWriter.h"
16d88c1a5aSDimitry Andric #include "llvm/IR/Constants.h"
177a7e6055SDimitry Andric #include "llvm/IR/DebugInfo.h"
18d88c1a5aSDimitry Andric #include "llvm/IR/Intrinsics.h"
19d88c1a5aSDimitry Andric #include "llvm/IR/Module.h"
20d88c1a5aSDimitry Andric #include "llvm/IR/PassManager.h"
214ba319b5SDimitry Andric #include "llvm/Object/ModuleSymbolTable.h"
22d88c1a5aSDimitry Andric #include "llvm/Pass.h"
23d88c1a5aSDimitry Andric #include "llvm/Support/ScopedPrinter.h"
247a7e6055SDimitry Andric #include "llvm/Support/raw_ostream.h"
257a7e6055SDimitry Andric #include "llvm/Transforms/IPO.h"
267a7e6055SDimitry Andric #include "llvm/Transforms/IPO/FunctionAttrs.h"
274ba319b5SDimitry Andric #include "llvm/Transforms/IPO/FunctionImport.h"
28d88c1a5aSDimitry Andric #include "llvm/Transforms/Utils/Cloning.h"
29f37b6182SDimitry Andric #include "llvm/Transforms/Utils/ModuleUtils.h"
30d88c1a5aSDimitry Andric using namespace llvm;
31d88c1a5aSDimitry Andric 
32d88c1a5aSDimitry Andric namespace {
33d88c1a5aSDimitry Andric 
34d88c1a5aSDimitry Andric // Promote each local-linkage entity defined by ExportM and used by ImportM by
35d88c1a5aSDimitry Andric // changing visibility and appending the given ModuleId.
promoteInternals(Module & ExportM,Module & ImportM,StringRef ModuleId,SetVector<GlobalValue * > & PromoteExtra)3624d58133SDimitry Andric void promoteInternals(Module &ExportM, Module &ImportM, StringRef ModuleId,
3724d58133SDimitry Andric                       SetVector<GlobalValue *> &PromoteExtra) {
387a7e6055SDimitry Andric   DenseMap<const Comdat *, Comdat *> RenamedComdats;
397a7e6055SDimitry Andric   for (auto &ExportGV : ExportM.global_values()) {
40d88c1a5aSDimitry Andric     if (!ExportGV.hasLocalLinkage())
417a7e6055SDimitry Andric       continue;
42d88c1a5aSDimitry Andric 
437a7e6055SDimitry Andric     auto Name = ExportGV.getName();
442cab237bSDimitry Andric     GlobalValue *ImportGV = nullptr;
452cab237bSDimitry Andric     if (!PromoteExtra.count(&ExportGV)) {
462cab237bSDimitry Andric       ImportGV = ImportM.getNamedValue(Name);
472cab237bSDimitry Andric       if (!ImportGV)
487a7e6055SDimitry Andric         continue;
492cab237bSDimitry Andric       ImportGV->removeDeadConstantUsers();
502cab237bSDimitry Andric       if (ImportGV->use_empty()) {
512cab237bSDimitry Andric         ImportGV->eraseFromParent();
522cab237bSDimitry Andric         continue;
532cab237bSDimitry Andric       }
542cab237bSDimitry Andric     }
55d88c1a5aSDimitry Andric 
567a7e6055SDimitry Andric     std::string NewName = (Name + ModuleId).str();
577a7e6055SDimitry Andric 
587a7e6055SDimitry Andric     if (const auto *C = ExportGV.getComdat())
597a7e6055SDimitry Andric       if (C->getName() == Name)
607a7e6055SDimitry Andric         RenamedComdats.try_emplace(C, ExportM.getOrInsertComdat(NewName));
61d88c1a5aSDimitry Andric 
62d88c1a5aSDimitry Andric     ExportGV.setName(NewName);
63d88c1a5aSDimitry Andric     ExportGV.setLinkage(GlobalValue::ExternalLinkage);
64d88c1a5aSDimitry Andric     ExportGV.setVisibility(GlobalValue::HiddenVisibility);
65d88c1a5aSDimitry Andric 
6624d58133SDimitry Andric     if (ImportGV) {
67d88c1a5aSDimitry Andric       ImportGV->setName(NewName);
68d88c1a5aSDimitry Andric       ImportGV->setVisibility(GlobalValue::HiddenVisibility);
697a7e6055SDimitry Andric     }
7024d58133SDimitry Andric   }
71d88c1a5aSDimitry Andric 
727a7e6055SDimitry Andric   if (!RenamedComdats.empty())
737a7e6055SDimitry Andric     for (auto &GO : ExportM.global_objects())
747a7e6055SDimitry Andric       if (auto *C = GO.getComdat()) {
757a7e6055SDimitry Andric         auto Replacement = RenamedComdats.find(C);
767a7e6055SDimitry Andric         if (Replacement != RenamedComdats.end())
777a7e6055SDimitry Andric           GO.setComdat(Replacement->second);
787a7e6055SDimitry Andric       }
79d88c1a5aSDimitry Andric }
80d88c1a5aSDimitry Andric 
81d88c1a5aSDimitry Andric // Promote all internal (i.e. distinct) type ids used by the module by replacing
82d88c1a5aSDimitry Andric // them with external type ids formed using the module id.
83d88c1a5aSDimitry Andric //
84d88c1a5aSDimitry Andric // Note that this needs to be done before we clone the module because each clone
85d88c1a5aSDimitry Andric // will receive its own set of distinct metadata nodes.
promoteTypeIds(Module & M,StringRef ModuleId)86d88c1a5aSDimitry Andric void promoteTypeIds(Module &M, StringRef ModuleId) {
87d88c1a5aSDimitry Andric   DenseMap<Metadata *, Metadata *> LocalToGlobal;
88d88c1a5aSDimitry Andric   auto ExternalizeTypeId = [&](CallInst *CI, unsigned ArgNo) {
89d88c1a5aSDimitry Andric     Metadata *MD =
90d88c1a5aSDimitry Andric         cast<MetadataAsValue>(CI->getArgOperand(ArgNo))->getMetadata();
91d88c1a5aSDimitry Andric 
92d88c1a5aSDimitry Andric     if (isa<MDNode>(MD) && cast<MDNode>(MD)->isDistinct()) {
93d88c1a5aSDimitry Andric       Metadata *&GlobalMD = LocalToGlobal[MD];
94d88c1a5aSDimitry Andric       if (!GlobalMD) {
95fe4fed2eSDimitry Andric         std::string NewName = (Twine(LocalToGlobal.size()) + ModuleId).str();
96d88c1a5aSDimitry Andric         GlobalMD = MDString::get(M.getContext(), NewName);
97d88c1a5aSDimitry Andric       }
98d88c1a5aSDimitry Andric 
99d88c1a5aSDimitry Andric       CI->setArgOperand(ArgNo,
100d88c1a5aSDimitry Andric                         MetadataAsValue::get(M.getContext(), GlobalMD));
101d88c1a5aSDimitry Andric     }
102d88c1a5aSDimitry Andric   };
103d88c1a5aSDimitry Andric 
104d88c1a5aSDimitry Andric   if (Function *TypeTestFunc =
105d88c1a5aSDimitry Andric           M.getFunction(Intrinsic::getName(Intrinsic::type_test))) {
106d88c1a5aSDimitry Andric     for (const Use &U : TypeTestFunc->uses()) {
107d88c1a5aSDimitry Andric       auto CI = cast<CallInst>(U.getUser());
108d88c1a5aSDimitry Andric       ExternalizeTypeId(CI, 1);
109d88c1a5aSDimitry Andric     }
110d88c1a5aSDimitry Andric   }
111d88c1a5aSDimitry Andric 
112d88c1a5aSDimitry Andric   if (Function *TypeCheckedLoadFunc =
113d88c1a5aSDimitry Andric           M.getFunction(Intrinsic::getName(Intrinsic::type_checked_load))) {
114d88c1a5aSDimitry Andric     for (const Use &U : TypeCheckedLoadFunc->uses()) {
115d88c1a5aSDimitry Andric       auto CI = cast<CallInst>(U.getUser());
116d88c1a5aSDimitry Andric       ExternalizeTypeId(CI, 2);
117d88c1a5aSDimitry Andric     }
118d88c1a5aSDimitry Andric   }
119d88c1a5aSDimitry Andric 
120d88c1a5aSDimitry Andric   for (GlobalObject &GO : M.global_objects()) {
121d88c1a5aSDimitry Andric     SmallVector<MDNode *, 1> MDs;
122d88c1a5aSDimitry Andric     GO.getMetadata(LLVMContext::MD_type, MDs);
123d88c1a5aSDimitry Andric 
124d88c1a5aSDimitry Andric     GO.eraseMetadata(LLVMContext::MD_type);
125d88c1a5aSDimitry Andric     for (auto MD : MDs) {
126d88c1a5aSDimitry Andric       auto I = LocalToGlobal.find(MD->getOperand(1));
127d88c1a5aSDimitry Andric       if (I == LocalToGlobal.end()) {
128d88c1a5aSDimitry Andric         GO.addMetadata(LLVMContext::MD_type, *MD);
129d88c1a5aSDimitry Andric         continue;
130d88c1a5aSDimitry Andric       }
131d88c1a5aSDimitry Andric       GO.addMetadata(
132d88c1a5aSDimitry Andric           LLVMContext::MD_type,
1334ba319b5SDimitry Andric           *MDNode::get(M.getContext(), {MD->getOperand(0), I->second}));
134d88c1a5aSDimitry Andric     }
135d88c1a5aSDimitry Andric   }
136d88c1a5aSDimitry Andric }
137d88c1a5aSDimitry Andric 
138d88c1a5aSDimitry Andric // Drop unused globals, and drop type information from function declarations.
139d88c1a5aSDimitry Andric // FIXME: If we made functions typeless then there would be no need to do this.
simplifyExternals(Module & M)140d88c1a5aSDimitry Andric void simplifyExternals(Module &M) {
141d88c1a5aSDimitry Andric   FunctionType *EmptyFT =
142d88c1a5aSDimitry Andric       FunctionType::get(Type::getVoidTy(M.getContext()), false);
143d88c1a5aSDimitry Andric 
144d88c1a5aSDimitry Andric   for (auto I = M.begin(), E = M.end(); I != E;) {
145d88c1a5aSDimitry Andric     Function &F = *I++;
146d88c1a5aSDimitry Andric     if (F.isDeclaration() && F.use_empty()) {
147d88c1a5aSDimitry Andric       F.eraseFromParent();
148d88c1a5aSDimitry Andric       continue;
149d88c1a5aSDimitry Andric     }
150d88c1a5aSDimitry Andric 
1512cab237bSDimitry Andric     if (!F.isDeclaration() || F.getFunctionType() == EmptyFT ||
1522cab237bSDimitry Andric         // Changing the type of an intrinsic may invalidate the IR.
1532cab237bSDimitry Andric         F.getName().startswith("llvm."))
154d88c1a5aSDimitry Andric       continue;
155d88c1a5aSDimitry Andric 
156d88c1a5aSDimitry Andric     Function *NewF =
157*b5893f02SDimitry Andric         Function::Create(EmptyFT, GlobalValue::ExternalLinkage,
158*b5893f02SDimitry Andric                          F.getAddressSpace(), "", &M);
159d88c1a5aSDimitry Andric     NewF->setVisibility(F.getVisibility());
160d88c1a5aSDimitry Andric     NewF->takeName(&F);
161d88c1a5aSDimitry Andric     F.replaceAllUsesWith(ConstantExpr::getBitCast(NewF, F.getType()));
162d88c1a5aSDimitry Andric     F.eraseFromParent();
163d88c1a5aSDimitry Andric   }
164d88c1a5aSDimitry Andric 
165d88c1a5aSDimitry Andric   for (auto I = M.global_begin(), E = M.global_end(); I != E;) {
166d88c1a5aSDimitry Andric     GlobalVariable &GV = *I++;
167d88c1a5aSDimitry Andric     if (GV.isDeclaration() && GV.use_empty()) {
168d88c1a5aSDimitry Andric       GV.eraseFromParent();
169d88c1a5aSDimitry Andric       continue;
170d88c1a5aSDimitry Andric     }
171d88c1a5aSDimitry Andric   }
172d88c1a5aSDimitry Andric }
173d88c1a5aSDimitry Andric 
1744ba319b5SDimitry Andric static void
filterModule(Module * M,function_ref<bool (const GlobalValue *)> ShouldKeepDefinition)1754ba319b5SDimitry Andric filterModule(Module *M,
1764ba319b5SDimitry Andric              function_ref<bool(const GlobalValue *)> ShouldKeepDefinition) {
1774ba319b5SDimitry Andric   std::vector<GlobalValue *> V;
1784ba319b5SDimitry Andric   for (GlobalValue &GV : M->global_values())
1794ba319b5SDimitry Andric     if (!ShouldKeepDefinition(&GV))
1804ba319b5SDimitry Andric       V.push_back(&GV);
181d88c1a5aSDimitry Andric 
1824ba319b5SDimitry Andric   for (GlobalValue *GV : V)
1834ba319b5SDimitry Andric     if (!convertToDeclaration(*GV))
1844ba319b5SDimitry Andric       GV->eraseFromParent();
1857a7e6055SDimitry Andric }
1867a7e6055SDimitry Andric 
forEachVirtualFunction(Constant * C,function_ref<void (Function *)> Fn)1877a7e6055SDimitry Andric void forEachVirtualFunction(Constant *C, function_ref<void(Function *)> Fn) {
1887a7e6055SDimitry Andric   if (auto *F = dyn_cast<Function>(C))
1897a7e6055SDimitry Andric     return Fn(F);
1907a7e6055SDimitry Andric   if (isa<GlobalValue>(C))
1917a7e6055SDimitry Andric     return;
1927a7e6055SDimitry Andric   for (Value *Op : C->operands())
1937a7e6055SDimitry Andric     forEachVirtualFunction(cast<Constant>(Op), Fn);
194d88c1a5aSDimitry Andric }
195d88c1a5aSDimitry Andric 
196d88c1a5aSDimitry Andric // If it's possible to split M into regular and thin LTO parts, do so and write
197d88c1a5aSDimitry Andric // a multi-module bitcode file with the two parts to OS. Otherwise, write only a
198d88c1a5aSDimitry Andric // regular LTO bitcode file to OS.
splitAndWriteThinLTOBitcode(raw_ostream & OS,raw_ostream * ThinLinkOS,function_ref<AAResults & (Function &)> AARGetter,Module & M)1997a7e6055SDimitry Andric void splitAndWriteThinLTOBitcode(
2007a7e6055SDimitry Andric     raw_ostream &OS, raw_ostream *ThinLinkOS,
2017a7e6055SDimitry Andric     function_ref<AAResults &(Function &)> AARGetter, Module &M) {
202f37b6182SDimitry Andric   std::string ModuleId = getUniqueModuleId(&M);
203d88c1a5aSDimitry Andric   if (ModuleId.empty()) {
2044ba319b5SDimitry Andric     // We couldn't generate a module ID for this module, write it out as a
2054ba319b5SDimitry Andric     // regular LTO module with an index for summary-based dead stripping.
2064ba319b5SDimitry Andric     ProfileSummaryInfo PSI(M);
2074ba319b5SDimitry Andric     M.addModuleFlag(Module::Error, "ThinLTO", uint32_t(0));
2084ba319b5SDimitry Andric     ModuleSummaryIndex Index = buildModuleSummaryIndex(M, nullptr, &PSI);
2094ba319b5SDimitry Andric     WriteBitcodeToFile(M, OS, /*ShouldPreserveUseListOrder=*/false, &Index);
2104ba319b5SDimitry Andric 
2117a7e6055SDimitry Andric     if (ThinLinkOS)
2127a7e6055SDimitry Andric       // We don't have a ThinLTO part, but still write the module to the
2137a7e6055SDimitry Andric       // ThinLinkOS if requested so that the expected output file is produced.
2144ba319b5SDimitry Andric       WriteBitcodeToFile(M, *ThinLinkOS, /*ShouldPreserveUseListOrder=*/false,
2154ba319b5SDimitry Andric                          &Index);
2164ba319b5SDimitry Andric 
217d88c1a5aSDimitry Andric     return;
218d88c1a5aSDimitry Andric   }
219d88c1a5aSDimitry Andric 
220d88c1a5aSDimitry Andric   promoteTypeIds(M, ModuleId);
221d88c1a5aSDimitry Andric 
2227a7e6055SDimitry Andric   // Returns whether a global has attached type metadata. Such globals may
2237a7e6055SDimitry Andric   // participate in CFI or whole-program devirtualization, so they need to
2247a7e6055SDimitry Andric   // appear in the merged module instead of the thin LTO module.
2254ba319b5SDimitry Andric   auto HasTypeMetadata = [](const GlobalObject *GO) {
2264ba319b5SDimitry Andric     return GO->hasMetadata(LLVMContext::MD_type);
227d88c1a5aSDimitry Andric   };
228d88c1a5aSDimitry Andric 
2297a7e6055SDimitry Andric   // Collect the set of virtual functions that are eligible for virtual constant
2307a7e6055SDimitry Andric   // propagation. Each eligible function must not access memory, must return
2317a7e6055SDimitry Andric   // an integer of width <=64 bits, must take at least one argument, must not
2327a7e6055SDimitry Andric   // use its first argument (assumed to be "this") and all arguments other than
2337a7e6055SDimitry Andric   // the first one must be of <=64 bit integer type.
2347a7e6055SDimitry Andric   //
2357a7e6055SDimitry Andric   // Note that we test whether this copy of the function is readnone, rather
2367a7e6055SDimitry Andric   // than testing function attributes, which must hold for any copy of the
2377a7e6055SDimitry Andric   // function, even a less optimized version substituted at link time. This is
2387a7e6055SDimitry Andric   // sound because the virtual constant propagation optimizations effectively
2397a7e6055SDimitry Andric   // inline all implementations of the virtual function into each call site,
2407a7e6055SDimitry Andric   // rather than using function attributes to perform local optimization.
241*b5893f02SDimitry Andric   DenseSet<const Function *> EligibleVirtualFns;
2427a7e6055SDimitry Andric   // If any member of a comdat lives in MergedM, put all members of that
2437a7e6055SDimitry Andric   // comdat in MergedM to keep the comdat together.
2447a7e6055SDimitry Andric   DenseSet<const Comdat *> MergedMComdats;
2457a7e6055SDimitry Andric   for (GlobalVariable &GV : M.globals())
2467a7e6055SDimitry Andric     if (HasTypeMetadata(&GV)) {
2477a7e6055SDimitry Andric       if (const auto *C = GV.getComdat())
2487a7e6055SDimitry Andric         MergedMComdats.insert(C);
2497a7e6055SDimitry Andric       forEachVirtualFunction(GV.getInitializer(), [&](Function *F) {
2507a7e6055SDimitry Andric         auto *RT = dyn_cast<IntegerType>(F->getReturnType());
2517a7e6055SDimitry Andric         if (!RT || RT->getBitWidth() > 64 || F->arg_empty() ||
2527a7e6055SDimitry Andric             !F->arg_begin()->use_empty())
2537a7e6055SDimitry Andric           return;
2547a7e6055SDimitry Andric         for (auto &Arg : make_range(std::next(F->arg_begin()), F->arg_end())) {
2557a7e6055SDimitry Andric           auto *ArgT = dyn_cast<IntegerType>(Arg.getType());
2567a7e6055SDimitry Andric           if (!ArgT || ArgT->getBitWidth() > 64)
2577a7e6055SDimitry Andric             return;
2587a7e6055SDimitry Andric         }
259c4394386SDimitry Andric         if (!F->isDeclaration() &&
260c4394386SDimitry Andric             computeFunctionBodyMemoryAccess(*F, AARGetter(*F)) == MAK_ReadNone)
2617a7e6055SDimitry Andric           EligibleVirtualFns.insert(F);
2627a7e6055SDimitry Andric       });
2637a7e6055SDimitry Andric     }
264d88c1a5aSDimitry Andric 
2657a7e6055SDimitry Andric   ValueToValueMapTy VMap;
2667a7e6055SDimitry Andric   std::unique_ptr<Module> MergedM(
2674ba319b5SDimitry Andric       CloneModule(M, VMap, [&](const GlobalValue *GV) -> bool {
2687a7e6055SDimitry Andric         if (const auto *C = GV->getComdat())
2697a7e6055SDimitry Andric           if (MergedMComdats.count(C))
2707a7e6055SDimitry Andric             return true;
2717a7e6055SDimitry Andric         if (auto *F = dyn_cast<Function>(GV))
2727a7e6055SDimitry Andric           return EligibleVirtualFns.count(F);
2737a7e6055SDimitry Andric         if (auto *GVar = dyn_cast_or_null<GlobalVariable>(GV->getBaseObject()))
2747a7e6055SDimitry Andric           return HasTypeMetadata(GVar);
2757a7e6055SDimitry Andric         return false;
2767a7e6055SDimitry Andric       }));
2777a7e6055SDimitry Andric   StripDebugInfo(*MergedM);
2784ba319b5SDimitry Andric   MergedM->setModuleInlineAsm("");
2797a7e6055SDimitry Andric 
2807a7e6055SDimitry Andric   for (Function &F : *MergedM)
2817a7e6055SDimitry Andric     if (!F.isDeclaration()) {
2827a7e6055SDimitry Andric       // Reset the linkage of all functions eligible for virtual constant
2837a7e6055SDimitry Andric       // propagation. The canonical definitions live in the thin LTO module so
2847a7e6055SDimitry Andric       // that they can be imported.
2857a7e6055SDimitry Andric       F.setLinkage(GlobalValue::AvailableExternallyLinkage);
2867a7e6055SDimitry Andric       F.setComdat(nullptr);
2877a7e6055SDimitry Andric     }
2887a7e6055SDimitry Andric 
28924d58133SDimitry Andric   SetVector<GlobalValue *> CfiFunctions;
29024d58133SDimitry Andric   for (auto &F : M)
29124d58133SDimitry Andric     if ((!F.hasLocalLinkage() || F.hasAddressTaken()) && HasTypeMetadata(&F))
29224d58133SDimitry Andric       CfiFunctions.insert(&F);
29324d58133SDimitry Andric 
2947a7e6055SDimitry Andric   // Remove all globals with type metadata, globals with comdats that live in
2957a7e6055SDimitry Andric   // MergedM, and aliases pointing to such globals from the thin LTO module.
2967a7e6055SDimitry Andric   filterModule(&M, [&](const GlobalValue *GV) {
2977a7e6055SDimitry Andric     if (auto *GVar = dyn_cast_or_null<GlobalVariable>(GV->getBaseObject()))
2987a7e6055SDimitry Andric       if (HasTypeMetadata(GVar))
2997a7e6055SDimitry Andric         return false;
3007a7e6055SDimitry Andric     if (const auto *C = GV->getComdat())
3017a7e6055SDimitry Andric       if (MergedMComdats.count(C))
3027a7e6055SDimitry Andric         return false;
3037a7e6055SDimitry Andric     return true;
3047a7e6055SDimitry Andric   });
305d88c1a5aSDimitry Andric 
30624d58133SDimitry Andric   promoteInternals(*MergedM, M, ModuleId, CfiFunctions);
30724d58133SDimitry Andric   promoteInternals(M, *MergedM, ModuleId, CfiFunctions);
30824d58133SDimitry Andric 
3094ba319b5SDimitry Andric   auto &Ctx = MergedM->getContext();
31024d58133SDimitry Andric   SmallVector<MDNode *, 8> CfiFunctionMDs;
31124d58133SDimitry Andric   for (auto V : CfiFunctions) {
31224d58133SDimitry Andric     Function &F = *cast<Function>(V);
31324d58133SDimitry Andric     SmallVector<MDNode *, 2> Types;
31424d58133SDimitry Andric     F.getMetadata(LLVMContext::MD_type, Types);
31524d58133SDimitry Andric 
31624d58133SDimitry Andric     SmallVector<Metadata *, 4> Elts;
31724d58133SDimitry Andric     Elts.push_back(MDString::get(Ctx, F.getName()));
31824d58133SDimitry Andric     CfiFunctionLinkage Linkage;
31924d58133SDimitry Andric     if (!F.isDeclarationForLinker())
32024d58133SDimitry Andric       Linkage = CFL_Definition;
32124d58133SDimitry Andric     else if (F.isWeakForLinker())
32224d58133SDimitry Andric       Linkage = CFL_WeakDeclaration;
32324d58133SDimitry Andric     else
32424d58133SDimitry Andric       Linkage = CFL_Declaration;
32524d58133SDimitry Andric     Elts.push_back(ConstantAsMetadata::get(
32624d58133SDimitry Andric         llvm::ConstantInt::get(Type::getInt8Ty(Ctx), Linkage)));
32724d58133SDimitry Andric     for (auto Type : Types)
32824d58133SDimitry Andric       Elts.push_back(Type);
32924d58133SDimitry Andric     CfiFunctionMDs.push_back(MDTuple::get(Ctx, Elts));
33024d58133SDimitry Andric   }
33124d58133SDimitry Andric 
33224d58133SDimitry Andric   if(!CfiFunctionMDs.empty()) {
33324d58133SDimitry Andric     NamedMDNode *NMD = MergedM->getOrInsertNamedMetadata("cfi.functions");
33424d58133SDimitry Andric     for (auto MD : CfiFunctionMDs)
33524d58133SDimitry Andric       NMD->addOperand(MD);
33624d58133SDimitry Andric   }
337d88c1a5aSDimitry Andric 
3384ba319b5SDimitry Andric   SmallVector<MDNode *, 8> FunctionAliases;
3394ba319b5SDimitry Andric   for (auto &A : M.aliases()) {
3404ba319b5SDimitry Andric     if (!isa<Function>(A.getAliasee()))
3414ba319b5SDimitry Andric       continue;
3424ba319b5SDimitry Andric 
3434ba319b5SDimitry Andric     auto *F = cast<Function>(A.getAliasee());
3444ba319b5SDimitry Andric 
3454ba319b5SDimitry Andric     Metadata *Elts[] = {
3464ba319b5SDimitry Andric         MDString::get(Ctx, A.getName()),
3474ba319b5SDimitry Andric         MDString::get(Ctx, F->getName()),
3484ba319b5SDimitry Andric         ConstantAsMetadata::get(
3494ba319b5SDimitry Andric             ConstantInt::get(Type::getInt8Ty(Ctx), A.getVisibility())),
3504ba319b5SDimitry Andric         ConstantAsMetadata::get(
3514ba319b5SDimitry Andric             ConstantInt::get(Type::getInt8Ty(Ctx), A.isWeakForLinker())),
3524ba319b5SDimitry Andric     };
3534ba319b5SDimitry Andric 
3544ba319b5SDimitry Andric     FunctionAliases.push_back(MDTuple::get(Ctx, Elts));
3554ba319b5SDimitry Andric   }
3564ba319b5SDimitry Andric 
3574ba319b5SDimitry Andric   if (!FunctionAliases.empty()) {
3584ba319b5SDimitry Andric     NamedMDNode *NMD = MergedM->getOrInsertNamedMetadata("aliases");
3594ba319b5SDimitry Andric     for (auto MD : FunctionAliases)
3604ba319b5SDimitry Andric       NMD->addOperand(MD);
3614ba319b5SDimitry Andric   }
3624ba319b5SDimitry Andric 
3634ba319b5SDimitry Andric   SmallVector<MDNode *, 8> Symvers;
3644ba319b5SDimitry Andric   ModuleSymbolTable::CollectAsmSymvers(M, [&](StringRef Name, StringRef Alias) {
3654ba319b5SDimitry Andric     Function *F = M.getFunction(Name);
3664ba319b5SDimitry Andric     if (!F || F->use_empty())
3674ba319b5SDimitry Andric       return;
3684ba319b5SDimitry Andric 
3694ba319b5SDimitry Andric     Symvers.push_back(MDTuple::get(
3704ba319b5SDimitry Andric         Ctx, {MDString::get(Ctx, Name), MDString::get(Ctx, Alias)}));
3714ba319b5SDimitry Andric   });
3724ba319b5SDimitry Andric 
3734ba319b5SDimitry Andric   if (!Symvers.empty()) {
3744ba319b5SDimitry Andric     NamedMDNode *NMD = MergedM->getOrInsertNamedMetadata("symvers");
3754ba319b5SDimitry Andric     for (auto MD : Symvers)
3764ba319b5SDimitry Andric       NMD->addOperand(MD);
3774ba319b5SDimitry Andric   }
3784ba319b5SDimitry Andric 
379d88c1a5aSDimitry Andric   simplifyExternals(*MergedM);
380d88c1a5aSDimitry Andric 
381d88c1a5aSDimitry Andric   // FIXME: Try to re-use BSI and PFI from the original module here.
3825517e702SDimitry Andric   ProfileSummaryInfo PSI(M);
3835517e702SDimitry Andric   ModuleSummaryIndex Index = buildModuleSummaryIndex(M, nullptr, &PSI);
3847a7e6055SDimitry Andric 
385db17bf38SDimitry Andric   // Mark the merged module as requiring full LTO. We still want an index for
386db17bf38SDimitry Andric   // it though, so that it can participate in summary-based dead stripping.
387db17bf38SDimitry Andric   MergedM->addModuleFlag(Module::Error, "ThinLTO", uint32_t(0));
388db17bf38SDimitry Andric   ModuleSummaryIndex MergedMIndex =
389db17bf38SDimitry Andric       buildModuleSummaryIndex(*MergedM, nullptr, &PSI);
390db17bf38SDimitry Andric 
3917a7e6055SDimitry Andric   SmallVector<char, 0> Buffer;
3927a7e6055SDimitry Andric 
3937a7e6055SDimitry Andric   BitcodeWriter W(Buffer);
3947a7e6055SDimitry Andric   // Save the module hash produced for the full bitcode, which will
3957a7e6055SDimitry Andric   // be used in the backends, and use that in the minimized bitcode
3967a7e6055SDimitry Andric   // produced for the full link.
3977a7e6055SDimitry Andric   ModuleHash ModHash = {{0}};
3984ba319b5SDimitry Andric   W.writeModule(M, /*ShouldPreserveUseListOrder=*/false, &Index,
3997a7e6055SDimitry Andric                 /*GenerateHash=*/true, &ModHash);
4004ba319b5SDimitry Andric   W.writeModule(*MergedM, /*ShouldPreserveUseListOrder=*/false, &MergedMIndex);
401a580b014SDimitry Andric   W.writeSymtab();
4026bc11b14SDimitry Andric   W.writeStrtab();
403d88c1a5aSDimitry Andric   OS << Buffer;
4047a7e6055SDimitry Andric 
4052cab237bSDimitry Andric   // If a minimized bitcode module was requested for the thin link, only
4062cab237bSDimitry Andric   // the information that is needed by thin link will be written in the
4072cab237bSDimitry Andric   // given OS (the merged module will be written as usual).
4087a7e6055SDimitry Andric   if (ThinLinkOS) {
4097a7e6055SDimitry Andric     Buffer.clear();
4107a7e6055SDimitry Andric     BitcodeWriter W2(Buffer);
4117a7e6055SDimitry Andric     StripDebugInfo(M);
4124ba319b5SDimitry Andric     W2.writeThinLinkBitcode(M, Index, ModHash);
4134ba319b5SDimitry Andric     W2.writeModule(*MergedM, /*ShouldPreserveUseListOrder=*/false,
414db17bf38SDimitry Andric                    &MergedMIndex);
415a580b014SDimitry Andric     W2.writeSymtab();
4166bc11b14SDimitry Andric     W2.writeStrtab();
4177a7e6055SDimitry Andric     *ThinLinkOS << Buffer;
4187a7e6055SDimitry Andric   }
419d88c1a5aSDimitry Andric }
420d88c1a5aSDimitry Andric 
421*b5893f02SDimitry Andric // Returns whether this module needs to be split because splitting is
422*b5893f02SDimitry Andric // enabled and it uses type metadata.
requiresSplit(Module & M)423d88c1a5aSDimitry Andric bool requiresSplit(Module &M) {
424*b5893f02SDimitry Andric   // First check if the LTO Unit splitting has been enabled.
425*b5893f02SDimitry Andric   bool EnableSplitLTOUnit = false;
426*b5893f02SDimitry Andric   if (auto *MD = mdconst::extract_or_null<ConstantInt>(
427*b5893f02SDimitry Andric           M.getModuleFlag("EnableSplitLTOUnit")))
428*b5893f02SDimitry Andric     EnableSplitLTOUnit = MD->getZExtValue();
429*b5893f02SDimitry Andric   if (!EnableSplitLTOUnit)
430*b5893f02SDimitry Andric     return false;
431*b5893f02SDimitry Andric 
432*b5893f02SDimitry Andric   // Module only needs to be split if it contains type metadata.
433d88c1a5aSDimitry Andric   for (auto &GO : M.global_objects()) {
4344ba319b5SDimitry Andric     if (GO.hasMetadata(LLVMContext::MD_type))
435d88c1a5aSDimitry Andric       return true;
436d88c1a5aSDimitry Andric   }
437d88c1a5aSDimitry Andric 
438d88c1a5aSDimitry Andric   return false;
439d88c1a5aSDimitry Andric }
440d88c1a5aSDimitry Andric 
writeThinLTOBitcode(raw_ostream & OS,raw_ostream * ThinLinkOS,function_ref<AAResults & (Function &)> AARGetter,Module & M,const ModuleSummaryIndex * Index)4417a7e6055SDimitry Andric void writeThinLTOBitcode(raw_ostream &OS, raw_ostream *ThinLinkOS,
4427a7e6055SDimitry Andric                          function_ref<AAResults &(Function &)> AARGetter,
4437a7e6055SDimitry Andric                          Module &M, const ModuleSummaryIndex *Index) {
444*b5893f02SDimitry Andric   // Split module if splitting is enabled and it contains any type metadata.
445d88c1a5aSDimitry Andric   if (requiresSplit(M))
4467a7e6055SDimitry Andric     return splitAndWriteThinLTOBitcode(OS, ThinLinkOS, AARGetter, M);
447d88c1a5aSDimitry Andric 
448d88c1a5aSDimitry Andric   // Otherwise we can just write it out as a regular module.
4497a7e6055SDimitry Andric 
4507a7e6055SDimitry Andric   // Save the module hash produced for the full bitcode, which will
4517a7e6055SDimitry Andric   // be used in the backends, and use that in the minimized bitcode
4527a7e6055SDimitry Andric   // produced for the full link.
4537a7e6055SDimitry Andric   ModuleHash ModHash = {{0}};
4544ba319b5SDimitry Andric   WriteBitcodeToFile(M, OS, /*ShouldPreserveUseListOrder=*/false, Index,
4557a7e6055SDimitry Andric                      /*GenerateHash=*/true, &ModHash);
4562cab237bSDimitry Andric   // If a minimized bitcode module was requested for the thin link, only
4572cab237bSDimitry Andric   // the information that is needed by thin link will be written in the
4582cab237bSDimitry Andric   // given OS.
4592cab237bSDimitry Andric   if (ThinLinkOS && Index)
4604ba319b5SDimitry Andric     WriteThinLinkBitcodeToFile(M, *ThinLinkOS, *Index, ModHash);
461d88c1a5aSDimitry Andric }
462d88c1a5aSDimitry Andric 
463d88c1a5aSDimitry Andric class WriteThinLTOBitcode : public ModulePass {
464d88c1a5aSDimitry Andric   raw_ostream &OS; // raw_ostream to print on
4657a7e6055SDimitry Andric   // The output stream on which to emit a minimized module for use
4667a7e6055SDimitry Andric   // just in the thin link, if requested.
4677a7e6055SDimitry Andric   raw_ostream *ThinLinkOS;
468d88c1a5aSDimitry Andric 
469d88c1a5aSDimitry Andric public:
470d88c1a5aSDimitry Andric   static char ID; // Pass identification, replacement for typeid
WriteThinLTOBitcode()4717a7e6055SDimitry Andric   WriteThinLTOBitcode() : ModulePass(ID), OS(dbgs()), ThinLinkOS(nullptr) {
472d88c1a5aSDimitry Andric     initializeWriteThinLTOBitcodePass(*PassRegistry::getPassRegistry());
473d88c1a5aSDimitry Andric   }
474d88c1a5aSDimitry Andric 
WriteThinLTOBitcode(raw_ostream & o,raw_ostream * ThinLinkOS)4757a7e6055SDimitry Andric   explicit WriteThinLTOBitcode(raw_ostream &o, raw_ostream *ThinLinkOS)
4767a7e6055SDimitry Andric       : ModulePass(ID), OS(o), ThinLinkOS(ThinLinkOS) {
477d88c1a5aSDimitry Andric     initializeWriteThinLTOBitcodePass(*PassRegistry::getPassRegistry());
478d88c1a5aSDimitry Andric   }
479d88c1a5aSDimitry Andric 
getPassName() const480d88c1a5aSDimitry Andric   StringRef getPassName() const override { return "ThinLTO Bitcode Writer"; }
481d88c1a5aSDimitry Andric 
runOnModule(Module & M)482d88c1a5aSDimitry Andric   bool runOnModule(Module &M) override {
483d88c1a5aSDimitry Andric     const ModuleSummaryIndex *Index =
484d88c1a5aSDimitry Andric         &(getAnalysis<ModuleSummaryIndexWrapperPass>().getIndex());
4857a7e6055SDimitry Andric     writeThinLTOBitcode(OS, ThinLinkOS, LegacyAARGetter(*this), M, Index);
486d88c1a5aSDimitry Andric     return true;
487d88c1a5aSDimitry Andric   }
getAnalysisUsage(AnalysisUsage & AU) const488d88c1a5aSDimitry Andric   void getAnalysisUsage(AnalysisUsage &AU) const override {
489d88c1a5aSDimitry Andric     AU.setPreservesAll();
4907a7e6055SDimitry Andric     AU.addRequired<AssumptionCacheTracker>();
491d88c1a5aSDimitry Andric     AU.addRequired<ModuleSummaryIndexWrapperPass>();
4927a7e6055SDimitry Andric     AU.addRequired<TargetLibraryInfoWrapperPass>();
493d88c1a5aSDimitry Andric   }
494d88c1a5aSDimitry Andric };
495d88c1a5aSDimitry Andric } // anonymous namespace
496d88c1a5aSDimitry Andric 
497d88c1a5aSDimitry Andric char WriteThinLTOBitcode::ID = 0;
498d88c1a5aSDimitry Andric INITIALIZE_PASS_BEGIN(WriteThinLTOBitcode, "write-thinlto-bitcode",
499d88c1a5aSDimitry Andric                       "Write ThinLTO Bitcode", false, true)
INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)5007a7e6055SDimitry Andric INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker)
501d88c1a5aSDimitry Andric INITIALIZE_PASS_DEPENDENCY(ModuleSummaryIndexWrapperPass)
5027a7e6055SDimitry Andric INITIALIZE_PASS_DEPENDENCY(TargetLibraryInfoWrapperPass)
503d88c1a5aSDimitry Andric INITIALIZE_PASS_END(WriteThinLTOBitcode, "write-thinlto-bitcode",
504d88c1a5aSDimitry Andric                     "Write ThinLTO Bitcode", false, true)
505d88c1a5aSDimitry Andric 
5067a7e6055SDimitry Andric ModulePass *llvm::createWriteThinLTOBitcodePass(raw_ostream &Str,
5077a7e6055SDimitry Andric                                                 raw_ostream *ThinLinkOS) {
5087a7e6055SDimitry Andric   return new WriteThinLTOBitcode(Str, ThinLinkOS);
509d88c1a5aSDimitry Andric }
510f9448bf3SDimitry Andric 
511f9448bf3SDimitry Andric PreservedAnalyses
run(Module & M,ModuleAnalysisManager & AM)512f9448bf3SDimitry Andric llvm::ThinLTOBitcodeWriterPass::run(Module &M, ModuleAnalysisManager &AM) {
513f9448bf3SDimitry Andric   FunctionAnalysisManager &FAM =
514f9448bf3SDimitry Andric       AM.getResult<FunctionAnalysisManagerModuleProxy>(M).getManager();
515f9448bf3SDimitry Andric   writeThinLTOBitcode(OS, ThinLinkOS,
516f9448bf3SDimitry Andric                       [&FAM](Function &F) -> AAResults & {
517f9448bf3SDimitry Andric                         return FAM.getResult<AAManager>(F);
518f9448bf3SDimitry Andric                       },
519f9448bf3SDimitry Andric                       M, &AM.getResult<ModuleSummaryIndexAnalysis>(M));
520f9448bf3SDimitry Andric   return PreservedAnalyses::all();
521f9448bf3SDimitry Andric }
522