1 //===-- ModuleUtils.cpp - Functions to manipulate Modules -----------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This family of functions perform manipulations on Modules.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "llvm/Transforms/Utils/ModuleUtils.h"
14 #include "llvm/Analysis/TargetLibraryInfo.h"
15 #include "llvm/Analysis/VectorUtils.h"
16 #include "llvm/IR/DerivedTypes.h"
17 #include "llvm/IR/Function.h"
18 #include "llvm/IR/IRBuilder.h"
19 #include "llvm/IR/Module.h"
20 #include "llvm/Support/raw_ostream.h"
21 using namespace llvm;
22 
23 #define DEBUG_TYPE "moduleutils"
24 
25 static void appendToGlobalArray(const char *Array, Module &M, Function *F,
26                                 int Priority, Constant *Data) {
27   IRBuilder<> IRB(M.getContext());
28   FunctionType *FnTy = FunctionType::get(IRB.getVoidTy(), false);
29 
30   // Get the current set of static global constructors and add the new ctor
31   // to the list.
32   SmallVector<Constant *, 16> CurrentCtors;
33   StructType *EltTy = StructType::get(
34       IRB.getInt32Ty(), PointerType::getUnqual(FnTy), IRB.getInt8PtrTy());
35   if (GlobalVariable *GVCtor = M.getNamedGlobal(Array)) {
36     if (Constant *Init = GVCtor->getInitializer()) {
37       unsigned n = Init->getNumOperands();
38       CurrentCtors.reserve(n + 1);
39       for (unsigned i = 0; i != n; ++i)
40         CurrentCtors.push_back(cast<Constant>(Init->getOperand(i)));
41     }
42     GVCtor->eraseFromParent();
43   }
44 
45   // Build a 3 field global_ctor entry.  We don't take a comdat key.
46   Constant *CSVals[3];
47   CSVals[0] = IRB.getInt32(Priority);
48   CSVals[1] = F;
49   CSVals[2] = Data ? ConstantExpr::getPointerCast(Data, IRB.getInt8PtrTy())
50                    : Constant::getNullValue(IRB.getInt8PtrTy());
51   Constant *RuntimeCtorInit =
52       ConstantStruct::get(EltTy, makeArrayRef(CSVals, EltTy->getNumElements()));
53 
54   CurrentCtors.push_back(RuntimeCtorInit);
55 
56   // Create a new initializer.
57   ArrayType *AT = ArrayType::get(EltTy, CurrentCtors.size());
58   Constant *NewInit = ConstantArray::get(AT, CurrentCtors);
59 
60   // Create the new global variable and replace all uses of
61   // the old global variable with the new one.
62   (void)new GlobalVariable(M, NewInit->getType(), false,
63                            GlobalValue::AppendingLinkage, NewInit, Array);
64 }
65 
66 void llvm::appendToGlobalCtors(Module &M, Function *F, int Priority, Constant *Data) {
67   appendToGlobalArray("llvm.global_ctors", M, F, Priority, Data);
68 }
69 
70 void llvm::appendToGlobalDtors(Module &M, Function *F, int Priority, Constant *Data) {
71   appendToGlobalArray("llvm.global_dtors", M, F, Priority, Data);
72 }
73 
74 static void appendToUsedList(Module &M, StringRef Name, ArrayRef<GlobalValue *> Values) {
75   GlobalVariable *GV = M.getGlobalVariable(Name);
76   SmallPtrSet<Constant *, 16> InitAsSet;
77   SmallVector<Constant *, 16> Init;
78   if (GV) {
79     if (GV->hasInitializer()) {
80       auto *CA = cast<ConstantArray>(GV->getInitializer());
81       for (auto &Op : CA->operands()) {
82         Constant *C = cast_or_null<Constant>(Op);
83         if (InitAsSet.insert(C).second)
84           Init.push_back(C);
85       }
86     }
87     GV->eraseFromParent();
88   }
89 
90   Type *Int8PtrTy = llvm::Type::getInt8PtrTy(M.getContext());
91   for (auto *V : Values) {
92     Constant *C = ConstantExpr::getPointerBitCastOrAddrSpaceCast(V, Int8PtrTy);
93     if (InitAsSet.insert(C).second)
94       Init.push_back(C);
95   }
96 
97   if (Init.empty())
98     return;
99 
100   ArrayType *ATy = ArrayType::get(Int8PtrTy, Init.size());
101   GV = new llvm::GlobalVariable(M, ATy, false, GlobalValue::AppendingLinkage,
102                                 ConstantArray::get(ATy, Init), Name);
103   GV->setSection("llvm.metadata");
104 }
105 
106 void llvm::appendToUsed(Module &M, ArrayRef<GlobalValue *> Values) {
107   appendToUsedList(M, "llvm.used", Values);
108 }
109 
110 void llvm::appendToCompilerUsed(Module &M, ArrayRef<GlobalValue *> Values) {
111   appendToUsedList(M, "llvm.compiler.used", Values);
112 }
113 
114 FunctionCallee
115 llvm::declareSanitizerInitFunction(Module &M, StringRef InitName,
116                                    ArrayRef<Type *> InitArgTypes) {
117   assert(!InitName.empty() && "Expected init function name");
118   return M.getOrInsertFunction(
119       InitName,
120       FunctionType::get(Type::getVoidTy(M.getContext()), InitArgTypes, false),
121       AttributeList());
122 }
123 
124 Function *llvm::createSanitizerCtor(Module &M, StringRef CtorName) {
125   Function *Ctor = Function::createWithDefaultAttr(
126       FunctionType::get(Type::getVoidTy(M.getContext()), false),
127       GlobalValue::InternalLinkage, 0, CtorName, &M);
128   Ctor->addAttribute(AttributeList::FunctionIndex, Attribute::NoUnwind);
129   BasicBlock *CtorBB = BasicBlock::Create(M.getContext(), "", Ctor);
130   ReturnInst::Create(M.getContext(), CtorBB);
131   // Ensure Ctor cannot be discarded, even if in a comdat.
132   appendToUsed(M, {Ctor});
133   return Ctor;
134 }
135 
136 std::pair<Function *, FunctionCallee> llvm::createSanitizerCtorAndInitFunctions(
137     Module &M, StringRef CtorName, StringRef InitName,
138     ArrayRef<Type *> InitArgTypes, ArrayRef<Value *> InitArgs,
139     StringRef VersionCheckName) {
140   assert(!InitName.empty() && "Expected init function name");
141   assert(InitArgs.size() == InitArgTypes.size() &&
142          "Sanitizer's init function expects different number of arguments");
143   FunctionCallee InitFunction =
144       declareSanitizerInitFunction(M, InitName, InitArgTypes);
145   Function *Ctor = createSanitizerCtor(M, CtorName);
146   IRBuilder<> IRB(Ctor->getEntryBlock().getTerminator());
147   IRB.CreateCall(InitFunction, InitArgs);
148   if (!VersionCheckName.empty()) {
149     FunctionCallee VersionCheckFunction = M.getOrInsertFunction(
150         VersionCheckName, FunctionType::get(IRB.getVoidTy(), {}, false),
151         AttributeList());
152     IRB.CreateCall(VersionCheckFunction, {});
153   }
154   return std::make_pair(Ctor, InitFunction);
155 }
156 
157 std::pair<Function *, FunctionCallee>
158 llvm::getOrCreateSanitizerCtorAndInitFunctions(
159     Module &M, StringRef CtorName, StringRef InitName,
160     ArrayRef<Type *> InitArgTypes, ArrayRef<Value *> InitArgs,
161     function_ref<void(Function *, FunctionCallee)> FunctionsCreatedCallback,
162     StringRef VersionCheckName) {
163   assert(!CtorName.empty() && "Expected ctor function name");
164 
165   if (Function *Ctor = M.getFunction(CtorName))
166     // FIXME: Sink this logic into the module, similar to the handling of
167     // globals. This will make moving to a concurrent model much easier.
168     if (Ctor->arg_size() == 0 ||
169         Ctor->getReturnType() == Type::getVoidTy(M.getContext()))
170       return {Ctor, declareSanitizerInitFunction(M, InitName, InitArgTypes)};
171 
172   Function *Ctor;
173   FunctionCallee InitFunction;
174   std::tie(Ctor, InitFunction) = llvm::createSanitizerCtorAndInitFunctions(
175       M, CtorName, InitName, InitArgTypes, InitArgs, VersionCheckName);
176   FunctionsCreatedCallback(Ctor, InitFunction);
177   return std::make_pair(Ctor, InitFunction);
178 }
179 
180 Function *llvm::getOrCreateInitFunction(Module &M, StringRef Name) {
181   assert(!Name.empty() && "Expected init function name");
182   if (Function *F = M.getFunction(Name)) {
183     if (F->arg_size() != 0 ||
184         F->getReturnType() != Type::getVoidTy(M.getContext())) {
185       std::string Err;
186       raw_string_ostream Stream(Err);
187       Stream << "Sanitizer interface function defined with wrong type: " << *F;
188       report_fatal_error(Err);
189     }
190     return F;
191   }
192   Function *F =
193       cast<Function>(M.getOrInsertFunction(Name, AttributeList(),
194                                            Type::getVoidTy(M.getContext()))
195                          .getCallee());
196 
197   appendToGlobalCtors(M, F, 0);
198 
199   return F;
200 }
201 
202 void llvm::filterDeadComdatFunctions(
203     Module &M, SmallVectorImpl<Function *> &DeadComdatFunctions) {
204   // Build a map from the comdat to the number of entries in that comdat we
205   // think are dead. If this fully covers the comdat group, then the entire
206   // group is dead. If we find another entry in the comdat group though, we'll
207   // have to preserve the whole group.
208   SmallDenseMap<Comdat *, int, 16> ComdatEntriesCovered;
209   for (Function *F : DeadComdatFunctions) {
210     Comdat *C = F->getComdat();
211     assert(C && "Expected all input GVs to be in a comdat!");
212     ComdatEntriesCovered[C] += 1;
213   }
214 
215   auto CheckComdat = [&](Comdat &C) {
216     auto CI = ComdatEntriesCovered.find(&C);
217     if (CI == ComdatEntriesCovered.end())
218       return;
219 
220     // If this could have been covered by a dead entry, just subtract one to
221     // account for it.
222     if (CI->second > 0) {
223       CI->second -= 1;
224       return;
225     }
226 
227     // If we've already accounted for all the entries that were dead, the
228     // entire comdat is alive so remove it from the map.
229     ComdatEntriesCovered.erase(CI);
230   };
231 
232   auto CheckAllComdats = [&] {
233     for (Function &F : M.functions())
234       if (Comdat *C = F.getComdat()) {
235         CheckComdat(*C);
236         if (ComdatEntriesCovered.empty())
237           return;
238       }
239     for (GlobalVariable &GV : M.globals())
240       if (Comdat *C = GV.getComdat()) {
241         CheckComdat(*C);
242         if (ComdatEntriesCovered.empty())
243           return;
244       }
245     for (GlobalAlias &GA : M.aliases())
246       if (Comdat *C = GA.getComdat()) {
247         CheckComdat(*C);
248         if (ComdatEntriesCovered.empty())
249           return;
250       }
251   };
252   CheckAllComdats();
253 
254   if (ComdatEntriesCovered.empty()) {
255     DeadComdatFunctions.clear();
256     return;
257   }
258 
259   // Remove the entries that were not covering.
260   erase_if(DeadComdatFunctions, [&](GlobalValue *GV) {
261     return ComdatEntriesCovered.find(GV->getComdat()) ==
262            ComdatEntriesCovered.end();
263   });
264 }
265 
266 std::string llvm::getUniqueModuleId(Module *M) {
267   MD5 Md5;
268   bool ExportsSymbols = false;
269   auto AddGlobal = [&](GlobalValue &GV) {
270     if (GV.isDeclaration() || GV.getName().startswith("llvm.") ||
271         !GV.hasExternalLinkage() || GV.hasComdat())
272       return;
273     ExportsSymbols = true;
274     Md5.update(GV.getName());
275     Md5.update(ArrayRef<uint8_t>{0});
276   };
277 
278   for (auto &F : *M)
279     AddGlobal(F);
280   for (auto &GV : M->globals())
281     AddGlobal(GV);
282   for (auto &GA : M->aliases())
283     AddGlobal(GA);
284   for (auto &IF : M->ifuncs())
285     AddGlobal(IF);
286 
287   if (!ExportsSymbols)
288     return "";
289 
290   MD5::MD5Result R;
291   Md5.final(R);
292 
293   SmallString<32> Str;
294   MD5::stringifyResult(R, Str);
295   return ("." + Str).str();
296 }
297 
298 void VFABI::setVectorVariantNames(
299     CallInst *CI, const SmallVector<std::string, 8> &VariantMappings) {
300   if (VariantMappings.empty())
301     return;
302 
303   SmallString<256> Buffer;
304   llvm::raw_svector_ostream Out(Buffer);
305   for (const std::string &VariantMapping : VariantMappings)
306     Out << VariantMapping << ",";
307   // Get rid of the trailing ','.
308   assert(!Buffer.str().empty() && "Must have at least one char.");
309   Buffer.pop_back();
310 
311   Module *M = CI->getModule();
312 #ifndef NDEBUG
313   for (const std::string &VariantMapping : VariantMappings) {
314     LLVM_DEBUG(dbgs() << "VFABI: adding mapping '" << VariantMapping << "'\n");
315     Optional<VFInfo> VI = VFABI::tryDemangleForVFABI(VariantMapping, *M);
316     assert(VI.hasValue() && "Cannot add an invalid VFABI name.");
317     assert(M->getNamedValue(VI.getValue().VectorName) &&
318            "Cannot add variant to attribute: "
319            "vector function declaration is missing.");
320   }
321 #endif
322   CI->addAttribute(
323       AttributeList::FunctionIndex,
324       Attribute::get(M->getContext(), MappingsAttrName, Buffer.str()));
325 }
326