xref: /llvm-project-15.0.7/llvm/lib/LTO/LTO.cpp (revision 9ffe5a35)
1 //===-LTO.cpp - LLVM Link Time Optimizer ----------------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file implements functions and classes used to support LTO.
11 //
12 //===----------------------------------------------------------------------===//
13 
14 #include "llvm/LTO/LTO.h"
15 #include "llvm/Analysis/TargetLibraryInfo.h"
16 #include "llvm/Analysis/TargetTransformInfo.h"
17 #include "llvm/Bitcode/BitcodeReader.h"
18 #include "llvm/Bitcode/BitcodeWriter.h"
19 #include "llvm/CodeGen/Analysis.h"
20 #include "llvm/IR/AutoUpgrade.h"
21 #include "llvm/IR/DiagnosticPrinter.h"
22 #include "llvm/IR/LegacyPassManager.h"
23 #include "llvm/LTO/LTOBackend.h"
24 #include "llvm/Linker/IRMover.h"
25 #include "llvm/Object/ModuleSummaryIndexObjectFile.h"
26 #include "llvm/Support/ManagedStatic.h"
27 #include "llvm/Support/MemoryBuffer.h"
28 #include "llvm/Support/Path.h"
29 #include "llvm/Support/SHA1.h"
30 #include "llvm/Support/SourceMgr.h"
31 #include "llvm/Support/TargetRegistry.h"
32 #include "llvm/Support/ThreadPool.h"
33 #include "llvm/Support/Threading.h"
34 #include "llvm/Support/raw_ostream.h"
35 #include "llvm/Target/TargetMachine.h"
36 #include "llvm/Target/TargetOptions.h"
37 #include "llvm/Transforms/IPO.h"
38 #include "llvm/Transforms/IPO/PassManagerBuilder.h"
39 #include "llvm/Transforms/Utils/SplitModule.h"
40 
41 #include <set>
42 
43 using namespace llvm;
44 using namespace lto;
45 using namespace object;
46 
47 #define DEBUG_TYPE "lto"
48 
49 // Returns a unique hash for the Module considering the current list of
50 // export/import and other global analysis results.
51 // The hash is produced in \p Key.
52 static void computeCacheKey(
53     SmallString<40> &Key, const Config &Conf, const ModuleSummaryIndex &Index,
54     StringRef ModuleID, const FunctionImporter::ImportMapTy &ImportList,
55     const FunctionImporter::ExportSetTy &ExportList,
56     const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
57     const GVSummaryMapTy &DefinedGlobals) {
58   // Compute the unique hash for this entry.
59   // This is based on the current compiler version, the module itself, the
60   // export list, the hash for every single module in the import list, the
61   // list of ResolvedODR for the module, and the list of preserved symbols.
62   SHA1 Hasher;
63 
64   // Start with the compiler revision
65   Hasher.update(LLVM_VERSION_STRING);
66 #ifdef HAVE_LLVM_REVISION
67   Hasher.update(LLVM_REVISION);
68 #endif
69 
70   // Include the parts of the LTO configuration that affect code generation.
71   auto AddString = [&](StringRef Str) {
72     Hasher.update(Str);
73     Hasher.update(ArrayRef<uint8_t>{0});
74   };
75   auto AddUnsigned = [&](unsigned I) {
76     uint8_t Data[4];
77     Data[0] = I;
78     Data[1] = I >> 8;
79     Data[2] = I >> 16;
80     Data[3] = I >> 24;
81     Hasher.update(ArrayRef<uint8_t>{Data, 4});
82   };
83   AddString(Conf.CPU);
84   // FIXME: Hash more of Options. For now all clients initialize Options from
85   // command-line flags (which is unsupported in production), but may set
86   // RelaxELFRelocations. The clang driver can also pass FunctionSections,
87   // DataSections and DebuggerTuning via command line flags.
88   AddUnsigned(Conf.Options.RelaxELFRelocations);
89   AddUnsigned(Conf.Options.FunctionSections);
90   AddUnsigned(Conf.Options.DataSections);
91   AddUnsigned((unsigned)Conf.Options.DebuggerTuning);
92   for (auto &A : Conf.MAttrs)
93     AddString(A);
94   AddUnsigned(Conf.RelocModel);
95   AddUnsigned(Conf.CodeModel);
96   AddUnsigned(Conf.CGOptLevel);
97   AddUnsigned(Conf.OptLevel);
98   AddString(Conf.OptPipeline);
99   AddString(Conf.AAPipeline);
100   AddString(Conf.OverrideTriple);
101   AddString(Conf.DefaultTriple);
102 
103   // Include the hash for the current module
104   auto ModHash = Index.getModuleHash(ModuleID);
105   Hasher.update(ArrayRef<uint8_t>((uint8_t *)&ModHash[0], sizeof(ModHash)));
106   for (auto F : ExportList)
107     // The export list can impact the internalization, be conservative here
108     Hasher.update(ArrayRef<uint8_t>((uint8_t *)&F, sizeof(F)));
109 
110   // Include the hash for every module we import functions from
111   for (auto &Entry : ImportList) {
112     auto ModHash = Index.getModuleHash(Entry.first());
113     Hasher.update(ArrayRef<uint8_t>((uint8_t *)&ModHash[0], sizeof(ModHash)));
114   }
115 
116   // Include the hash for the resolved ODR.
117   for (auto &Entry : ResolvedODR) {
118     Hasher.update(ArrayRef<uint8_t>((const uint8_t *)&Entry.first,
119                                     sizeof(GlobalValue::GUID)));
120     Hasher.update(ArrayRef<uint8_t>((const uint8_t *)&Entry.second,
121                                     sizeof(GlobalValue::LinkageTypes)));
122   }
123 
124   // Include the hash for the linkage type to reflect internalization and weak
125   // resolution.
126   for (auto &GS : DefinedGlobals) {
127     GlobalValue::LinkageTypes Linkage = GS.second->linkage();
128     Hasher.update(
129         ArrayRef<uint8_t>((const uint8_t *)&Linkage, sizeof(Linkage)));
130   }
131 
132   if (!Conf.SampleProfile.empty()) {
133     auto FileOrErr = MemoryBuffer::getFile(Conf.SampleProfile);
134     if (FileOrErr)
135       Hasher.update(FileOrErr.get()->getBuffer());
136   }
137 
138   Key = toHex(Hasher.result());
139 }
140 
141 static void thinLTOResolveWeakForLinkerGUID(
142     GlobalValueSummaryList &GVSummaryList, GlobalValue::GUID GUID,
143     DenseSet<GlobalValueSummary *> &GlobalInvolvedWithAlias,
144     function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)>
145         isPrevailing,
146     function_ref<void(StringRef, GlobalValue::GUID, GlobalValue::LinkageTypes)>
147         recordNewLinkage) {
148   for (auto &S : GVSummaryList) {
149     GlobalValue::LinkageTypes OriginalLinkage = S->linkage();
150     if (!GlobalValue::isWeakForLinker(OriginalLinkage))
151       continue;
152     // We need to emit only one of these. The prevailing module will keep it,
153     // but turned into a weak, while the others will drop it when possible.
154     // This is both a compile-time optimization and a correctness
155     // transformation. This is necessary for correctness when we have exported
156     // a reference - we need to convert the linkonce to weak to
157     // ensure a copy is kept to satisfy the exported reference.
158     // FIXME: We may want to split the compile time and correctness
159     // aspects into separate routines.
160     if (isPrevailing(GUID, S.get())) {
161       if (GlobalValue::isLinkOnceLinkage(OriginalLinkage))
162         S->setLinkage(GlobalValue::getWeakLinkage(
163             GlobalValue::isLinkOnceODRLinkage(OriginalLinkage)));
164     }
165     // Alias and aliasee can't be turned into available_externally.
166     else if (!isa<AliasSummary>(S.get()) &&
167              !GlobalInvolvedWithAlias.count(S.get()))
168       S->setLinkage(GlobalValue::AvailableExternallyLinkage);
169     if (S->linkage() != OriginalLinkage)
170       recordNewLinkage(S->modulePath(), GUID, S->linkage());
171   }
172 }
173 
174 // Resolve Weak and LinkOnce values in the \p Index.
175 //
176 // We'd like to drop these functions if they are no longer referenced in the
177 // current module. However there is a chance that another module is still
178 // referencing them because of the import. We make sure we always emit at least
179 // one copy.
180 void llvm::thinLTOResolveWeakForLinkerInIndex(
181     ModuleSummaryIndex &Index,
182     function_ref<bool(GlobalValue::GUID, const GlobalValueSummary *)>
183         isPrevailing,
184     function_ref<void(StringRef, GlobalValue::GUID, GlobalValue::LinkageTypes)>
185         recordNewLinkage) {
186   // We won't optimize the globals that are referenced by an alias for now
187   // Ideally we should turn the alias into a global and duplicate the definition
188   // when needed.
189   DenseSet<GlobalValueSummary *> GlobalInvolvedWithAlias;
190   for (auto &I : Index)
191     for (auto &S : I.second)
192       if (auto AS = dyn_cast<AliasSummary>(S.get()))
193         GlobalInvolvedWithAlias.insert(&AS->getAliasee());
194 
195   for (auto &I : Index)
196     thinLTOResolveWeakForLinkerGUID(I.second, I.first, GlobalInvolvedWithAlias,
197                                     isPrevailing, recordNewLinkage);
198 }
199 
200 static void thinLTOInternalizeAndPromoteGUID(
201     GlobalValueSummaryList &GVSummaryList, GlobalValue::GUID GUID,
202     function_ref<bool(StringRef, GlobalValue::GUID)> isExported) {
203   for (auto &S : GVSummaryList) {
204     if (isExported(S->modulePath(), GUID)) {
205       if (GlobalValue::isLocalLinkage(S->linkage()))
206         S->setLinkage(GlobalValue::ExternalLinkage);
207     } else if (!GlobalValue::isLocalLinkage(S->linkage()))
208       S->setLinkage(GlobalValue::InternalLinkage);
209   }
210 }
211 
212 // Update the linkages in the given \p Index to mark exported values
213 // as external and non-exported values as internal.
214 void llvm::thinLTOInternalizeAndPromoteInIndex(
215     ModuleSummaryIndex &Index,
216     function_ref<bool(StringRef, GlobalValue::GUID)> isExported) {
217   for (auto &I : Index)
218     thinLTOInternalizeAndPromoteGUID(I.second, I.first, isExported);
219 }
220 
221 struct InputFile::InputModule {
222   BitcodeModule BM;
223   std::unique_ptr<Module> Mod;
224 
225   // The range of ModuleSymbolTable entries for this input module.
226   size_t SymBegin, SymEnd;
227 };
228 
// Out-of-line defaulted destructor, placed after the definition of
// InputFile::InputModule above.
229 // Requires a destructor for std::vector<InputModule>.
230 InputFile::~InputFile() = default;
231 
232 Expected<std::unique_ptr<InputFile>> InputFile::create(MemoryBufferRef Object) {
233   std::unique_ptr<InputFile> File(new InputFile);
234 
235   ErrorOr<MemoryBufferRef> BCOrErr =
236       IRObjectFile::findBitcodeInMemBuffer(Object);
237   if (!BCOrErr)
238     return errorCodeToError(BCOrErr.getError());
239 
240   Expected<std::vector<BitcodeModule>> BMsOrErr =
241       getBitcodeModuleList(*BCOrErr);
242   if (!BMsOrErr)
243     return BMsOrErr.takeError();
244 
245   if (BMsOrErr->empty())
246     return make_error<StringError>("Bitcode file does not contain any modules",
247                                    inconvertibleErrorCode());
248 
249   // Create an InputModule for each module in the InputFile, and add it to the
250   // ModuleSymbolTable.
251   for (auto BM : *BMsOrErr) {
252     Expected<std::unique_ptr<Module>> MOrErr =
253         BM.getLazyModule(File->Ctx, /*ShouldLazyLoadMetadata*/ true,
254                          /*IsImporting*/ false);
255     if (!MOrErr)
256       return MOrErr.takeError();
257 
258     size_t SymBegin = File->SymTab.symbols().size();
259     File->SymTab.addModule(MOrErr->get());
260     size_t SymEnd = File->SymTab.symbols().size();
261 
262     for (const auto &C : (*MOrErr)->getComdatSymbolTable()) {
263       auto P = File->ComdatMap.insert(
264           std::make_pair(&C.second, File->Comdats.size()));
265       assert(P.second);
266       (void)P;
267       File->Comdats.push_back(C.first());
268     }
269 
270     File->Mods.push_back({BM, std::move(*MOrErr), SymBegin, SymEnd});
271   }
272 
273   return std::move(File);
274 }
275 
276 Expected<int> InputFile::Symbol::getComdatIndex() const {
277   if (!isGV())
278     return -1;
279   const GlobalObject *GO = getGV()->getBaseObject();
280   if (!GO)
281     return make_error<StringError>("Unable to determine comdat of alias!",
282                                    inconvertibleErrorCode());
283   if (const Comdat *C = GO->getComdat()) {
284     auto I = File->ComdatMap.find(C);
285     assert(I != File->ComdatMap.end());
286     return I->second;
287   }
288   return -1;
289 }
290 
291 StringRef InputFile::getName() const {
292   return Mods[0].BM.getModuleIdentifier();
293 }
294 
295 StringRef InputFile::getSourceFileName() const {
296   return Mods[0].Mod->getSourceFileName();
297 }
298 
299 iterator_range<InputFile::symbol_iterator>
300 InputFile::module_symbols(InputModule &IM) {
301   return llvm::make_range(
302       symbol_iterator(SymTab.symbols().data() + IM.SymBegin, SymTab, this),
303       symbol_iterator(SymTab.symbols().data() + IM.SymEnd, SymTab, this));
304 }
305 
// Stores the requested parallelism level for regular LTO code generation and
// constructs the context Ctx from \p Conf.
306 LTO::RegularLTOState::RegularLTOState(unsigned ParallelCodeGenParallelismLevel,
307                                       Config &Conf)
308     : ParallelCodeGenParallelismLevel(ParallelCodeGenParallelismLevel),
309       Ctx(Conf) {}
310 
311 LTO::ThinLTOState::ThinLTOState(ThinBackend Backend) : Backend(Backend) {
312   if (!Backend)
313     this->Backend =
314         createInProcessThinBackend(llvm::heavyweight_hardware_concurrency());
315 }
316 
// Takes over \p Conf and \p Backend by moving them into the new object.
// RegularLTO is handed the member this->Conf, not the moved-from parameter of
// the same name.
317 LTO::LTO(Config Conf, ThinBackend Backend,
318          unsigned ParallelCodeGenParallelismLevel)
319     : Conf(std::move(Conf)),
320       RegularLTO(ParallelCodeGenParallelismLevel, this->Conf),
321       ThinLTO(std::move(Backend)) {}
322 
// Out-of-line defaulted destructor.
323 // Requires a destructor for MapVector<BitcodeModule>.
324 LTO::~LTO() = default;
325 
326 // Add the given symbol to the GlobalResolutions map, and resolve its partition.
327 void LTO::addSymbolToGlobalRes(SmallPtrSet<GlobalValue *, 8> &Used,
328                                const InputFile::Symbol &Sym,
329                                SymbolResolution Res, unsigned Partition) {
330   GlobalValue *GV = Sym.isGV() ? Sym.getGV() : nullptr;
331 
332   auto &GlobalRes = GlobalResolutions[Sym.getName()];
333   if (GV) {
334     GlobalRes.UnnamedAddr &= GV->hasGlobalUnnamedAddr();
335     if (Res.Prevailing)
336       GlobalRes.IRName = GV->getName();
337   }
338   // Set the partition to external if we know it is used elsewhere, e.g.
339   // it is visible to a regular object, is referenced from llvm.compiler_used,
340   // or was already recorded as being referenced from a different partition.
341   if (Res.VisibleToRegularObj || (GV && Used.count(GV)) ||
342       (GlobalRes.Partition != GlobalResolution::Unknown &&
343        GlobalRes.Partition != Partition)) {
344     GlobalRes.Partition = GlobalResolution::External;
345   } else
346     // First recorded reference, save the current partition.
347     GlobalRes.Partition = Partition;
348 
349   // Flag as visible outside of ThinLTO if visible from a regular object or
350   // if this is a reference in the regular LTO partition.
351   GlobalRes.VisibleOutsideThinLTO |=
352       (Res.VisibleToRegularObj || (Partition == GlobalResolution::RegularLTO));
353 }
354 
355 static void writeToResolutionFile(raw_ostream &OS, InputFile *Input,
356                                   ArrayRef<SymbolResolution> Res) {
357   StringRef Path = Input->getName();
358   OS << Path << '\n';
359   auto ResI = Res.begin();
360   for (const InputFile::Symbol &Sym : Input->symbols()) {
361     assert(ResI != Res.end());
362     SymbolResolution Res = *ResI++;
363 
364     OS << "-r=" << Path << ',' << Sym.getName() << ',';
365     if (Res.Prevailing)
366       OS << 'p';
367     if (Res.FinalDefinitionInLinkageUnit)
368       OS << 'l';
369     if (Res.VisibleToRegularObj)
370       OS << 'x';
371     OS << '\n';
372   }
373   OS.flush();
374   assert(ResI == Res.end());
375 }
376 
377 Error LTO::add(std::unique_ptr<InputFile> Input,
378                ArrayRef<SymbolResolution> Res) {
379   assert(!CalledGetMaxTasks);
380 
381   if (Conf.ResolutionFile)
382     writeToResolutionFile(*Conf.ResolutionFile, Input.get(), Res);
383 
384   const SymbolResolution *ResI = Res.begin();
385   for (InputFile::InputModule &IM : Input->Mods)
386     if (Error Err = addModule(*Input, IM, ResI, Res.end()))
387       return Err;
388 
389   assert(ResI == Res.end());
390   return Error::success();
391 }
392 
393 Error LTO::addModule(InputFile &Input, InputFile::InputModule &IM,
394                      const SymbolResolution *&ResI,
395                      const SymbolResolution *ResE) {
396   // FIXME: move to backend
397   Module &M = *IM.Mod;
398 
399   if (M.getDataLayoutStr().empty())
400     return make_error<StringError>("input module has no datalayout",
401                                     inconvertibleErrorCode());
402 
403   if (!Conf.OverrideTriple.empty())
404     M.setTargetTriple(Conf.OverrideTriple);
405   else if (M.getTargetTriple().empty())
406     M.setTargetTriple(Conf.DefaultTriple);
407 
408   Expected<bool> HasThinLTOSummary = IM.BM.hasSummary();
409   if (!HasThinLTOSummary)
410     return HasThinLTOSummary.takeError();
411 
412   if (*HasThinLTOSummary)
413     return addThinLTO(IM.BM, M, Input.module_symbols(IM), ResI, ResE);
414   else
415     return addRegularLTO(IM.BM, ResI, ResE);
416 }
417 
418 // Add a regular LTO object to the link.
419 Error LTO::addRegularLTO(BitcodeModule BM, const SymbolResolution *&ResI,
420                          const SymbolResolution *ResE) {
421   if (!RegularLTO.CombinedModule) {
422     RegularLTO.CombinedModule =
423         llvm::make_unique<Module>("ld-temp.o", RegularLTO.Ctx);
424     RegularLTO.Mover = llvm::make_unique<IRMover>(*RegularLTO.CombinedModule);
425   }
426   Expected<std::unique_ptr<Module>> MOrErr =
427       BM.getLazyModule(RegularLTO.Ctx, /*ShouldLazyLoadMetadata*/ true,
428                        /*IsImporting*/ false);
429   if (!MOrErr)
430     return MOrErr.takeError();
431 
432   Module &M = **MOrErr;
433   if (Error Err = M.materializeMetadata())
434     return Err;
435   UpgradeDebugInfo(M);
436 
437   ModuleSymbolTable SymTab;
438   SymTab.addModule(&M);
439 
440   SmallPtrSet<GlobalValue *, 8> Used;
441   collectUsedGlobalVariables(M, Used, /*CompilerUsed*/ false);
442 
443   std::vector<GlobalValue *> Keep;
444 
445   for (GlobalVariable &GV : M.globals())
446     if (GV.hasAppendingLinkage())
447       Keep.push_back(&GV);
448 
449   for (const InputFile::Symbol &Sym :
450        make_range(InputFile::symbol_iterator(SymTab.symbols().begin(), SymTab,
451                                              nullptr),
452                   InputFile::symbol_iterator(SymTab.symbols().end(), SymTab,
453                                              nullptr))) {
454     assert(ResI != ResE);
455     SymbolResolution Res = *ResI++;
456     addSymbolToGlobalRes(Used, Sym, Res, 0);
457 
458     if (Sym.getFlags() & object::BasicSymbolRef::SF_Undefined)
459       continue;
460     if (Res.Prevailing && Sym.isGV()) {
461       GlobalValue *GV = Sym.getGV();
462       Keep.push_back(GV);
463       switch (GV->getLinkage()) {
464       default:
465         break;
466       case GlobalValue::LinkOnceAnyLinkage:
467         GV->setLinkage(GlobalValue::WeakAnyLinkage);
468         break;
469       case GlobalValue::LinkOnceODRLinkage:
470         GV->setLinkage(GlobalValue::WeakODRLinkage);
471         break;
472       }
473     }
474     // Common resolution: collect the maximum size/alignment over all commons.
475     // We also record if we see an instance of a common as prevailing, so that
476     // if none is prevailing we can ignore it later.
477     if (Sym.getFlags() & object::BasicSymbolRef::SF_Common) {
478       // FIXME: We should figure out what to do about commons defined by asm.
479       // For now they aren't reported correctly by ModuleSymbolTable.
480       auto &CommonRes = RegularLTO.Commons[Sym.getGV()->getName()];
481       CommonRes.Size = std::max(CommonRes.Size, Sym.getCommonSize());
482       CommonRes.Align = std::max(CommonRes.Align, Sym.getCommonAlignment());
483       CommonRes.Prevailing |= Res.Prevailing;
484     }
485 
486     // FIXME: use proposed local attribute for FinalDefinitionInLinkageUnit.
487   }
488 
489   return RegularLTO.Mover->move(std::move(*MOrErr), Keep,
490                                 [](GlobalValue &, IRMover::ValueAdder) {},
491                                 /* LinkModuleInlineAsm */ true,
492                                 /* IsPerformingImport */ false);
493 }
494 
495 // Add a ThinLTO object to the link.
496 // FIXME: This function should not need to take as many parameters once we have
497 // a bitcode symbol table.
498 Error LTO::addThinLTO(BitcodeModule BM, Module &M,
499                       iterator_range<InputFile::symbol_iterator> Syms,
500                       const SymbolResolution *&ResI,
501                       const SymbolResolution *ResE) {
502   SmallPtrSet<GlobalValue *, 8> Used;
503   collectUsedGlobalVariables(M, Used, /*CompilerUsed*/ false);
504 
505   Expected<std::unique_ptr<ModuleSummaryIndex>> SummaryOrErr = BM.getSummary();
506   if (!SummaryOrErr)
507     return SummaryOrErr.takeError();
508   ThinLTO.CombinedIndex.mergeFrom(std::move(*SummaryOrErr),
509                                   ThinLTO.ModuleMap.size());
510 
511   for (const InputFile::Symbol &Sym : Syms) {
512     assert(ResI != ResE);
513     SymbolResolution Res = *ResI++;
514     addSymbolToGlobalRes(Used, Sym, Res, ThinLTO.ModuleMap.size() + 1);
515 
516     if (Res.Prevailing && Sym.isGV())
517       ThinLTO.PrevailingModuleForGUID[Sym.getGV()->getGUID()] =
518           BM.getModuleIdentifier();
519   }
520 
521   if (!ThinLTO.ModuleMap.insert({BM.getModuleIdentifier(), BM}).second)
522     return make_error<StringError>(
523         "Expected at most one ThinLTO module per bitcode file",
524         inconvertibleErrorCode());
525 
526   return Error::success();
527 }
528 
529 unsigned LTO::getMaxTasks() const {
530   CalledGetMaxTasks = true;
531   return RegularLTO.ParallelCodeGenParallelismLevel + ThinLTO.ModuleMap.size();
532 }
533 
534 Error LTO::run(AddStreamFn AddStream, NativeObjectCache Cache) {
535   // Save the status of having a regularLTO combined module, as
536   // this is needed for generating the ThinLTO Task ID, and
537   // the CombinedModule will be moved at the end of runRegularLTO.
538   bool HasRegularLTO = RegularLTO.CombinedModule != nullptr;
539   // Invoke regular LTO if there was a regular LTO module to start with.
540   if (HasRegularLTO)
541     if (auto E = runRegularLTO(AddStream))
542       return E;
543   return runThinLTO(AddStream, Cache, HasRegularLTO);
544 }
545 
546 Error LTO::runRegularLTO(AddStreamFn AddStream) {
547   // Make sure commons have the right size/alignment: we kept the largest from
548   // all the prevailing when adding the inputs, and we apply it here.
549   const DataLayout &DL = RegularLTO.CombinedModule->getDataLayout();
550   for (auto &I : RegularLTO.Commons) {
551     if (!I.second.Prevailing)
552       // Don't do anything if no instance of this common was prevailing.
553       continue;
554     GlobalVariable *OldGV = RegularLTO.CombinedModule->getNamedGlobal(I.first);
555     if (OldGV && DL.getTypeAllocSize(OldGV->getValueType()) == I.second.Size) {
556       // Don't create a new global if the type is already correct, just make
557       // sure the alignment is correct.
558       OldGV->setAlignment(I.second.Align);
559       continue;
560     }
561     ArrayType *Ty =
562         ArrayType::get(Type::getInt8Ty(RegularLTO.Ctx), I.second.Size);
563     auto *GV = new GlobalVariable(*RegularLTO.CombinedModule, Ty, false,
564                                   GlobalValue::CommonLinkage,
565                                   ConstantAggregateZero::get(Ty), "");
566     GV->setAlignment(I.second.Align);
567     if (OldGV) {
568       OldGV->replaceAllUsesWith(ConstantExpr::getBitCast(GV, OldGV->getType()));
569       GV->takeName(OldGV);
570       OldGV->eraseFromParent();
571     } else {
572       GV->setName(I.first);
573     }
574   }
575 
576   if (Conf.PreOptModuleHook &&
577       !Conf.PreOptModuleHook(0, *RegularLTO.CombinedModule))
578     return Error::success();
579 
580   if (!Conf.CodeGenOnly) {
581     for (const auto &R : GlobalResolutions) {
582       if (R.second.IRName.empty())
583         continue;
584       if (R.second.Partition != 0 &&
585           R.second.Partition != GlobalResolution::External)
586         continue;
587 
588       GlobalValue *GV =
589           RegularLTO.CombinedModule->getNamedValue(R.second.IRName);
590       // Ignore symbols defined in other partitions.
591       if (!GV || GV->hasLocalLinkage())
592         continue;
593       GV->setUnnamedAddr(R.second.UnnamedAddr ? GlobalValue::UnnamedAddr::Global
594                                               : GlobalValue::UnnamedAddr::None);
595       if (R.second.Partition == 0)
596         GV->setLinkage(GlobalValue::InternalLinkage);
597     }
598 
599     if (Conf.PostInternalizeModuleHook &&
600         !Conf.PostInternalizeModuleHook(0, *RegularLTO.CombinedModule))
601       return Error::success();
602   }
603   return backend(Conf, AddStream, RegularLTO.ParallelCodeGenParallelismLevel,
604                  std::move(RegularLTO.CombinedModule), ThinLTO.CombinedIndex);
605 }
606 
607 /// This class defines the interface to the ThinLTO backend.
608 class lto::ThinBackendProc {
609 protected:
610   Config &Conf;
611   ModuleSummaryIndex &CombinedIndex;
612   const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries;
613 
614 public:
615   ThinBackendProc(Config &Conf, ModuleSummaryIndex &CombinedIndex,
616                   const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries)
617       : Conf(Conf), CombinedIndex(CombinedIndex),
618         ModuleToDefinedGVSummaries(ModuleToDefinedGVSummaries) {}
619 
620   virtual ~ThinBackendProc() {}
621   virtual Error start(
622       unsigned Task, BitcodeModule BM,
623       const FunctionImporter::ImportMapTy &ImportList,
624       const FunctionImporter::ExportSetTy &ExportList,
625       const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
626       MapVector<StringRef, BitcodeModule> &ModuleMap) = 0;
627   virtual Error wait() = 0;
628 };
629 
630 namespace {
631 class InProcessThinBackend : public ThinBackendProc {
632   ThreadPool BackendThreadPool;
633   AddStreamFn AddStream;
634   NativeObjectCache Cache;
635 
636   Optional<Error> Err;
637   std::mutex ErrMu;
638 
639 public:
640   InProcessThinBackend(
641       Config &Conf, ModuleSummaryIndex &CombinedIndex,
642       unsigned ThinLTOParallelismLevel,
643       const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
644       AddStreamFn AddStream, NativeObjectCache Cache)
645       : ThinBackendProc(Conf, CombinedIndex, ModuleToDefinedGVSummaries),
646         BackendThreadPool(ThinLTOParallelismLevel),
647         AddStream(std::move(AddStream)), Cache(std::move(Cache)) {}
648 
649   Error runThinLTOBackendThread(
650       AddStreamFn AddStream, NativeObjectCache Cache, unsigned Task,
651       BitcodeModule BM, ModuleSummaryIndex &CombinedIndex,
652       const FunctionImporter::ImportMapTy &ImportList,
653       const FunctionImporter::ExportSetTy &ExportList,
654       const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
655       const GVSummaryMapTy &DefinedGlobals,
656       MapVector<StringRef, BitcodeModule> &ModuleMap) {
657     auto RunThinBackend = [&](AddStreamFn AddStream) {
658       LTOLLVMContext BackendContext(Conf);
659       Expected<std::unique_ptr<Module>> MOrErr = BM.parseModule(BackendContext);
660       if (!MOrErr)
661         return MOrErr.takeError();
662 
663       return thinBackend(Conf, Task, AddStream, **MOrErr, CombinedIndex,
664                          ImportList, DefinedGlobals, ModuleMap);
665     };
666 
667     auto ModuleID = BM.getModuleIdentifier();
668 
669     if (!Cache || !CombinedIndex.modulePaths().count(ModuleID) ||
670         all_of(CombinedIndex.getModuleHash(ModuleID),
671                [](uint32_t V) { return V == 0; }))
672       // Cache disabled or no entry for this module in the combined index or
673       // no module hash.
674       return RunThinBackend(AddStream);
675 
676     SmallString<40> Key;
677     // The module may be cached, this helps handling it.
678     computeCacheKey(Key, Conf, CombinedIndex, ModuleID, ImportList, ExportList,
679                     ResolvedODR, DefinedGlobals);
680     if (AddStreamFn CacheAddStream = Cache(Task, Key))
681       return RunThinBackend(CacheAddStream);
682 
683     return Error::success();
684   }
685 
686   Error start(
687       unsigned Task, BitcodeModule BM,
688       const FunctionImporter::ImportMapTy &ImportList,
689       const FunctionImporter::ExportSetTy &ExportList,
690       const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
691       MapVector<StringRef, BitcodeModule> &ModuleMap) override {
692     StringRef ModulePath = BM.getModuleIdentifier();
693     assert(ModuleToDefinedGVSummaries.count(ModulePath));
694     const GVSummaryMapTy &DefinedGlobals =
695         ModuleToDefinedGVSummaries.find(ModulePath)->second;
696     BackendThreadPool.async(
697         [=](BitcodeModule BM, ModuleSummaryIndex &CombinedIndex,
698             const FunctionImporter::ImportMapTy &ImportList,
699             const FunctionImporter::ExportSetTy &ExportList,
700             const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes>
701                 &ResolvedODR,
702             const GVSummaryMapTy &DefinedGlobals,
703             MapVector<StringRef, BitcodeModule> &ModuleMap) {
704           Error E = runThinLTOBackendThread(
705               AddStream, Cache, Task, BM, CombinedIndex, ImportList,
706               ExportList, ResolvedODR, DefinedGlobals, ModuleMap);
707           if (E) {
708             std::unique_lock<std::mutex> L(ErrMu);
709             if (Err)
710               Err = joinErrors(std::move(*Err), std::move(E));
711             else
712               Err = std::move(E);
713           }
714         },
715         BM, std::ref(CombinedIndex), std::ref(ImportList),
716         std::ref(ExportList), std::ref(ResolvedODR), std::ref(DefinedGlobals),
717         std::ref(ModuleMap));
718     return Error::success();
719   }
720 
721   Error wait() override {
722     BackendThreadPool.wait();
723     if (Err)
724       return std::move(*Err);
725     else
726       return Error::success();
727   }
728 };
729 } // end anonymous namespace
730 
731 ThinBackend lto::createInProcessThinBackend(unsigned ParallelismLevel) {
732   return [=](Config &Conf, ModuleSummaryIndex &CombinedIndex,
733              const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
734              AddStreamFn AddStream, NativeObjectCache Cache) {
735     return llvm::make_unique<InProcessThinBackend>(
736         Conf, CombinedIndex, ParallelismLevel, ModuleToDefinedGVSummaries,
737         AddStream, Cache);
738   };
739 }
740 
741 // Given the original \p Path to an output file, replace any path
742 // prefix matching \p OldPrefix with \p NewPrefix. Also, create the
743 // resulting directory if it does not yet exist.
744 std::string lto::getThinLTOOutputFile(const std::string &Path,
745                                       const std::string &OldPrefix,
746                                       const std::string &NewPrefix) {
747   if (OldPrefix.empty() && NewPrefix.empty())
748     return Path;
749   SmallString<128> NewPath(Path);
750   llvm::sys::path::replace_path_prefix(NewPath, OldPrefix, NewPrefix);
751   StringRef ParentPath = llvm::sys::path::parent_path(NewPath.str());
752   if (!ParentPath.empty()) {
753     // Make sure the new directory exists, creating it if necessary.
754     if (std::error_code EC = llvm::sys::fs::create_directories(ParentPath))
755       llvm::errs() << "warning: could not create directory '" << ParentPath
756                    << "': " << EC.message() << '\n';
757   }
758   return NewPath.str();
759 }
760 
761 namespace {
762 class WriteIndexesThinBackend : public ThinBackendProc {
763   std::string OldPrefix, NewPrefix;
764   bool ShouldEmitImportsFiles;
765 
766   std::string LinkedObjectsFileName;
767   std::unique_ptr<llvm::raw_fd_ostream> LinkedObjectsFile;
768 
769 public:
770   WriteIndexesThinBackend(
771       Config &Conf, ModuleSummaryIndex &CombinedIndex,
772       const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
773       std::string OldPrefix, std::string NewPrefix, bool ShouldEmitImportsFiles,
774       std::string LinkedObjectsFileName)
775       : ThinBackendProc(Conf, CombinedIndex, ModuleToDefinedGVSummaries),
776         OldPrefix(OldPrefix), NewPrefix(NewPrefix),
777         ShouldEmitImportsFiles(ShouldEmitImportsFiles),
778         LinkedObjectsFileName(LinkedObjectsFileName) {}
779 
780   Error start(
781       unsigned Task, BitcodeModule BM,
782       const FunctionImporter::ImportMapTy &ImportList,
783       const FunctionImporter::ExportSetTy &ExportList,
784       const std::map<GlobalValue::GUID, GlobalValue::LinkageTypes> &ResolvedODR,
785       MapVector<StringRef, BitcodeModule> &ModuleMap) override {
786     StringRef ModulePath = BM.getModuleIdentifier();
787     std::string NewModulePath =
788         getThinLTOOutputFile(ModulePath, OldPrefix, NewPrefix);
789 
790     std::error_code EC;
791     if (!LinkedObjectsFileName.empty()) {
792       if (!LinkedObjectsFile) {
793         LinkedObjectsFile = llvm::make_unique<raw_fd_ostream>(
794             LinkedObjectsFileName, EC, sys::fs::OpenFlags::F_None);
795         if (EC)
796           return errorCodeToError(EC);
797       }
798       *LinkedObjectsFile << NewModulePath << '\n';
799     }
800 
801     std::map<std::string, GVSummaryMapTy> ModuleToSummariesForIndex;
802     gatherImportedSummariesForModule(ModulePath, ModuleToDefinedGVSummaries,
803                                      ImportList, ModuleToSummariesForIndex);
804 
805     raw_fd_ostream OS(NewModulePath + ".thinlto.bc", EC,
806                       sys::fs::OpenFlags::F_None);
807     if (EC)
808       return errorCodeToError(EC);
809     WriteIndexToFile(CombinedIndex, OS, &ModuleToSummariesForIndex);
810 
811     if (ShouldEmitImportsFiles)
812       return errorCodeToError(
813           EmitImportsFiles(ModulePath, NewModulePath + ".imports", ImportList));
814     return Error::success();
815   }
816 
817   Error wait() override { return Error::success(); }
818 };
819 } // end anonymous namespace
820 
821 ThinBackend lto::createWriteIndexesThinBackend(std::string OldPrefix,
822                                                std::string NewPrefix,
823                                                bool ShouldEmitImportsFiles,
824                                                std::string LinkedObjectsFile) {
825   return [=](Config &Conf, ModuleSummaryIndex &CombinedIndex,
826              const StringMap<GVSummaryMapTy> &ModuleToDefinedGVSummaries,
827              AddStreamFn AddStream, NativeObjectCache Cache) {
828     return llvm::make_unique<WriteIndexesThinBackend>(
829         Conf, CombinedIndex, ModuleToDefinedGVSummaries, OldPrefix, NewPrefix,
830         ShouldEmitImportsFiles, LinkedObjectsFile);
831   };
832 }
833 
834 Error LTO::runThinLTO(AddStreamFn AddStream, NativeObjectCache Cache,
835                       bool HasRegularLTO) {
836   if (ThinLTO.ModuleMap.empty())
837     return Error::success();
838 
839   if (Conf.CombinedIndexHook && !Conf.CombinedIndexHook(ThinLTO.CombinedIndex))
840     return Error::success();
841 
842   // Collect for each module the list of function it defines (GUID ->
843   // Summary).
844   StringMap<std::map<GlobalValue::GUID, GlobalValueSummary *>>
845       ModuleToDefinedGVSummaries(ThinLTO.ModuleMap.size());
846   ThinLTO.CombinedIndex.collectDefinedGVSummariesPerModule(
847       ModuleToDefinedGVSummaries);
848   // Create entries for any modules that didn't have any GV summaries
849   // (either they didn't have any GVs to start with, or we suppressed
850   // generation of the summaries because they e.g. had inline assembly
851   // uses that couldn't be promoted/renamed on export). This is so
852   // InProcessThinBackend::start can still launch a backend thread, which
853   // is passed the map of summaries for the module, without any special
854   // handling for this case.
855   for (auto &Mod : ThinLTO.ModuleMap)
856     if (!ModuleToDefinedGVSummaries.count(Mod.first))
857       ModuleToDefinedGVSummaries.try_emplace(Mod.first);
858 
859   StringMap<FunctionImporter::ImportMapTy> ImportLists(
860       ThinLTO.ModuleMap.size());
861   StringMap<FunctionImporter::ExportSetTy> ExportLists(
862       ThinLTO.ModuleMap.size());
863   StringMap<std::map<GlobalValue::GUID, GlobalValue::LinkageTypes>> ResolvedODR;
864 
865   if (Conf.OptLevel > 0) {
866     // Compute "dead" symbols, we don't want to import/export these!
867     DenseSet<GlobalValue::GUID> GUIDPreservedSymbols;
868     for (auto &Res : GlobalResolutions) {
869       if (Res.second.VisibleOutsideThinLTO &&
870           // IRName will be defined if we have seen the prevailing copy of
871           // this value. If not, no need to preserve any ThinLTO copies.
872           !Res.second.IRName.empty())
873         GUIDPreservedSymbols.insert(GlobalValue::getGUID(Res.second.IRName));
874     }
875 
876     auto DeadSymbols =
877         computeDeadSymbols(ThinLTO.CombinedIndex, GUIDPreservedSymbols);
878 
879     ComputeCrossModuleImport(ThinLTO.CombinedIndex, ModuleToDefinedGVSummaries,
880                              ImportLists, ExportLists, &DeadSymbols);
881 
882     std::set<GlobalValue::GUID> ExportedGUIDs;
883     for (auto &Res : GlobalResolutions) {
884       // First check if the symbol was flagged as having external references.
885       if (Res.second.Partition != GlobalResolution::External)
886         continue;
887       // IRName will be defined if we have seen the prevailing copy of
888       // this value. If not, no need to mark as exported from a ThinLTO
889       // partition (and we can't get the GUID).
890       if (Res.second.IRName.empty())
891         continue;
892       auto GUID = GlobalValue::getGUID(Res.second.IRName);
893       // Mark exported unless index-based analysis determined it to be dead.
894       if (!DeadSymbols.count(GUID))
895         ExportedGUIDs.insert(GlobalValue::getGUID(Res.second.IRName));
896     }
897 
898     auto isPrevailing = [&](GlobalValue::GUID GUID,
899                             const GlobalValueSummary *S) {
900       return ThinLTO.PrevailingModuleForGUID[GUID] == S->modulePath();
901     };
902     auto isExported = [&](StringRef ModuleIdentifier, GlobalValue::GUID GUID) {
903       const auto &ExportList = ExportLists.find(ModuleIdentifier);
904       return (ExportList != ExportLists.end() &&
905               ExportList->second.count(GUID)) ||
906              ExportedGUIDs.count(GUID);
907     };
908     thinLTOInternalizeAndPromoteInIndex(ThinLTO.CombinedIndex, isExported);
909 
910     auto recordNewLinkage = [&](StringRef ModuleIdentifier,
911                                 GlobalValue::GUID GUID,
912                                 GlobalValue::LinkageTypes NewLinkage) {
913       ResolvedODR[ModuleIdentifier][GUID] = NewLinkage;
914     };
915 
916     thinLTOResolveWeakForLinkerInIndex(ThinLTO.CombinedIndex, isPrevailing,
917                                        recordNewLinkage);
918   }
919 
920   std::unique_ptr<ThinBackendProc> BackendProc =
921       ThinLTO.Backend(Conf, ThinLTO.CombinedIndex, ModuleToDefinedGVSummaries,
922                       AddStream, Cache);
923 
924   // Task numbers start at ParallelCodeGenParallelismLevel if an LTO
925   // module is present, as tasks 0 through ParallelCodeGenParallelismLevel-1
926   // are reserved for parallel code generation partitions.
927   unsigned Task =
928       HasRegularLTO ? RegularLTO.ParallelCodeGenParallelismLevel : 0;
929   for (auto &Mod : ThinLTO.ModuleMap) {
930     if (Error E = BackendProc->start(Task, Mod.second, ImportLists[Mod.first],
931                                      ExportLists[Mod.first],
932                                      ResolvedODR[Mod.first], ThinLTO.ModuleMap))
933       return E;
934     ++Task;
935   }
936 
937   return BackendProc->wait();
938 }
939