xref: /llvm-project-15.0.7/lld/COFF/DLL.cpp (revision b3eef01e)
1 //===- DLL.cpp ------------------------------------------------------------===//
2 //
3 //                             The LLVM Linker
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file defines various types of chunks for the DLL import or export
11 // descriptor tables. They are inherently Windows-specific.
12 // You need to read Microsoft PE/COFF spec to understand details
13 // about the data structures.
14 //
15 // If you are not particularly interested in linking against Windows
16 // DLL, you can skip this file, and you should still be able to
17 // understand the rest of the linker.
18 //
19 //===----------------------------------------------------------------------===//
20 
21 #include "Chunks.h"
22 #include "DLL.h"
23 #include "llvm/Object/COFF.h"
24 #include "llvm/Support/Endian.h"
25 #include "llvm/Support/Path.h"
26 
27 using namespace llvm;
28 using namespace llvm::object;
29 using namespace llvm::support::endian;
30 using namespace llvm::COFF;
31 
32 namespace lld {
33 namespace coff {
34 namespace {
35 
36 // Import table
37 
38 static int ptrSize() { return Config->is64() ? 8 : 4; }
39 
40 // A chunk for the import descriptor table.
41 class HintNameChunk : public Chunk {
42 public:
43   HintNameChunk(StringRef N, uint16_t H) : Name(N), Hint(H) {}
44 
45   size_t getSize() const override {
46     // Starts with 2 byte Hint field, followed by a null-terminated string,
47     // ends with 0 or 1 byte padding.
48     return RoundUpToAlignment(Name.size() + 3, 2);
49   }
50 
51   void writeTo(uint8_t *Buf) const override {
52     write16le(Buf + OutputSectionOff, Hint);
53     memcpy(Buf + OutputSectionOff + 2, Name.data(), Name.size());
54   }
55 
56 private:
57   StringRef Name;
58   uint16_t Hint;
59 };
60 
61 // A chunk for the import descriptor table.
62 class LookupChunk : public Chunk {
63 public:
64   explicit LookupChunk(Chunk *C) : HintName(C) {}
65   size_t getSize() const override { return ptrSize(); }
66 
67   void writeTo(uint8_t *Buf) const override {
68     write32le(Buf + OutputSectionOff, HintName->getRVA());
69   }
70 
71   Chunk *HintName;
72 };
73 
74 // A chunk for the import descriptor table.
75 // This chunk represent import-by-ordinal symbols.
76 // See Microsoft PE/COFF spec 7.1. Import Header for details.
77 class OrdinalOnlyChunk : public Chunk {
78 public:
79   explicit OrdinalOnlyChunk(uint16_t V) : Ordinal(V) {}
80   size_t getSize() const override { return ptrSize(); }
81 
82   void writeTo(uint8_t *Buf) const override {
83     // An import-by-ordinal slot has MSB 1 to indicate that
84     // this is import-by-ordinal (and not import-by-name).
85     if (Config->is64()) {
86       write64le(Buf + OutputSectionOff, (1ULL << 63) | Ordinal);
87     } else {
88       write32le(Buf + OutputSectionOff, (1ULL << 31) | Ordinal);
89     }
90   }
91 
92   uint16_t Ordinal;
93 };
94 
95 // A chunk for the import descriptor table.
96 class ImportDirectoryChunk : public Chunk {
97 public:
98   explicit ImportDirectoryChunk(Chunk *N) : DLLName(N) {}
99   size_t getSize() const override { return sizeof(ImportDirectoryTableEntry); }
100 
101   void writeTo(uint8_t *Buf) const override {
102     auto *E = (coff_import_directory_table_entry *)(Buf + OutputSectionOff);
103     E->ImportLookupTableRVA = LookupTab->getRVA();
104     E->NameRVA = DLLName->getRVA();
105     E->ImportAddressTableRVA = AddressTab->getRVA();
106   }
107 
108   Chunk *DLLName;
109   Chunk *LookupTab;
110   Chunk *AddressTab;
111 };
112 
113 // A chunk representing null terminator in the import table.
114 // Contents of this chunk is always null bytes.
115 class NullChunk : public Chunk {
116 public:
117   explicit NullChunk(size_t N) : Size(N) {}
118   bool hasData() const override { return false; }
119   size_t getSize() const override { return Size; }
120   void setAlign(size_t N) { Align = N; }
121 
122 private:
123   size_t Size;
124 };
125 
126 static std::vector<std::vector<DefinedImportData *>>
127 binImports(const std::vector<DefinedImportData *> &Imports) {
128   // Group DLL-imported symbols by DLL name because that's how
129   // symbols are layed out in the import descriptor table.
130   auto Less = [](const std::string &A, const std::string &B) {
131     return Config->DLLOrder[A] < Config->DLLOrder[B];
132   };
133   std::map<std::string, std::vector<DefinedImportData *>,
134            bool(*)(const std::string &, const std::string &)> M(Less);
135   for (DefinedImportData *Sym : Imports)
136     M[Sym->getDLLName().lower()].push_back(Sym);
137 
138   std::vector<std::vector<DefinedImportData *>> V;
139   for (auto &P : M) {
140     // Sort symbols by name for each group.
141     std::vector<DefinedImportData *> &Syms = P.second;
142     std::sort(Syms.begin(), Syms.end(),
143               [](DefinedImportData *A, DefinedImportData *B) {
144                 return A->getName() < B->getName();
145               });
146     V.push_back(std::move(Syms));
147   }
148   return V;
149 }
150 
151 // Export table
152 // See Microsoft PE/COFF spec 4.3 for details.
153 
154 // A chunk for the delay import descriptor table etnry.
155 class DelayDirectoryChunk : public Chunk {
156 public:
157   explicit DelayDirectoryChunk(Chunk *N) : DLLName(N) {}
158 
159   size_t getSize() const override {
160     return sizeof(delay_import_directory_table_entry);
161   }
162 
163   void writeTo(uint8_t *Buf) const override {
164     auto *E = (delay_import_directory_table_entry *)(Buf + OutputSectionOff);
165     E->Attributes = 1;
166     E->Name = DLLName->getRVA();
167     E->ModuleHandle = ModuleHandle->getRVA();
168     E->DelayImportAddressTable = AddressTab->getRVA();
169     E->DelayImportNameTable = NameTab->getRVA();
170   }
171 
172   Chunk *DLLName;
173   Chunk *ModuleHandle;
174   Chunk *AddressTab;
175   Chunk *NameTab;
176 };
177 
178 // Initial contents for delay-loaded functions.
179 // This code calls __delayLoadHelper2 function to resolve a symbol
180 // and then overwrites its jump table slot with the result
181 // for subsequent function calls.
182 static const uint8_t ThunkX64[] = {
183     0x51,                               // push    rcx
184     0x52,                               // push    rdx
185     0x41, 0x50,                         // push    r8
186     0x41, 0x51,                         // push    r9
187     0x48, 0x83, 0xEC, 0x48,             // sub     rsp, 48h
188     0x66, 0x0F, 0x7F, 0x04, 0x24,       // movdqa  xmmword ptr [rsp], xmm0
189     0x66, 0x0F, 0x7F, 0x4C, 0x24, 0x10, // movdqa  xmmword ptr [rsp+10h], xmm1
190     0x66, 0x0F, 0x7F, 0x54, 0x24, 0x20, // movdqa  xmmword ptr [rsp+20h], xmm2
191     0x66, 0x0F, 0x7F, 0x5C, 0x24, 0x30, // movdqa  xmmword ptr [rsp+30h], xmm3
192     0x48, 0x8D, 0x15, 0, 0, 0, 0,       // lea     rdx, [__imp_<FUNCNAME>]
193     0x48, 0x8D, 0x0D, 0, 0, 0, 0,       // lea     rcx, [___DELAY_IMPORT_...]
194     0xE8, 0, 0, 0, 0,                   // call    __delayLoadHelper2
195     0x66, 0x0F, 0x6F, 0x04, 0x24,       // movdqa  xmm0, xmmword ptr [rsp]
196     0x66, 0x0F, 0x6F, 0x4C, 0x24, 0x10, // movdqa  xmm1, xmmword ptr [rsp+10h]
197     0x66, 0x0F, 0x6F, 0x54, 0x24, 0x20, // movdqa  xmm2, xmmword ptr [rsp+20h]
198     0x66, 0x0F, 0x6F, 0x5C, 0x24, 0x30, // movdqa  xmm3, xmmword ptr [rsp+30h]
199     0x48, 0x83, 0xC4, 0x48,             // add     rsp, 48h
200     0x41, 0x59,                         // pop     r9
201     0x41, 0x58,                         // pop     r8
202     0x5A,                               // pop     rdx
203     0x59,                               // pop     rcx
204     0xFF, 0xE0,                         // jmp     rax
205 };
206 
207 static const uint8_t ThunkX86[] = {
208     0x51,              // push  ecx
209     0x52,              // push  edx
210     0x68, 0, 0, 0, 0,  // push  offset ___imp__<FUNCNAME>
211     0x68, 0, 0, 0, 0,  // push  offset ___DELAY_IMPORT_DESCRIPTOR_<DLLNAME>_dll
212     0xE8, 0, 0, 0, 0,  // call  ___delayLoadHelper2@8
213     0x5A,              // pop   edx
214     0x59,              // pop   ecx
215     0xFF, 0xE0,        // jmp   eax
216 };
217 
218 // A chunk for the delay import thunk.
219 class ThunkChunkX64 : public Chunk {
220 public:
221   ThunkChunkX64(Defined *I, Chunk *D, Defined *H)
222       : Imp(I), Desc(D), Helper(H) {}
223 
224   size_t getSize() const override { return sizeof(ThunkX64); }
225 
226   void writeTo(uint8_t *Buf) const override {
227     memcpy(Buf + OutputSectionOff, ThunkX64, sizeof(ThunkX64));
228     write32le(Buf + OutputSectionOff + 36, Imp->getRVA() - RVA - 40);
229     write32le(Buf + OutputSectionOff + 43, Desc->getRVA() - RVA - 47);
230     write32le(Buf + OutputSectionOff + 48, Helper->getRVA() - RVA - 52);
231   }
232 
233   Defined *Imp = nullptr;
234   Chunk *Desc = nullptr;
235   Defined *Helper = nullptr;
236 };
237 
238 class ThunkChunkX86 : public Chunk {
239 public:
240   ThunkChunkX86(Defined *I, Chunk *D, Defined *H)
241       : Imp(I), Desc(D), Helper(H) {}
242 
243   size_t getSize() const override { return sizeof(ThunkX86); }
244 
245   void writeTo(uint8_t *Buf) const override {
246     memcpy(Buf + OutputSectionOff, ThunkX86, sizeof(ThunkX86));
247     write32le(Buf + OutputSectionOff + 3, Imp->getRVA() + Config->ImageBase);
248     write32le(Buf + OutputSectionOff + 8, Desc->getRVA() + Config->ImageBase);
249     write32le(Buf + OutputSectionOff + 13, Helper->getRVA() - RVA - 17);
250   }
251 
252   void getBaserels(std::vector<Baserel> *Res) override {
253     Res->emplace_back(RVA + 3);
254     Res->emplace_back(RVA + 8);
255   }
256 
257   Defined *Imp = nullptr;
258   Chunk *Desc = nullptr;
259   Defined *Helper = nullptr;
260 };
261 
262 // A chunk for the import descriptor table.
263 class DelayAddressChunk : public Chunk {
264 public:
265   explicit DelayAddressChunk(Chunk *C) : Thunk(C) {}
266   size_t getSize() const override { return ptrSize(); }
267 
268   void writeTo(uint8_t *Buf) const override {
269     if (Config->is64()) {
270       write64le(Buf + OutputSectionOff, Thunk->getRVA() + Config->ImageBase);
271     } else {
272       write32le(Buf + OutputSectionOff, Thunk->getRVA() + Config->ImageBase);
273     }
274   }
275 
276   void getBaserels(std::vector<Baserel> *Res) override {
277     Res->emplace_back(RVA);
278   }
279 
280   Chunk *Thunk;
281 };
282 
283 // Export table
284 // Read Microsoft PE/COFF spec 5.3 for details.
285 
286 // A chunk for the export descriptor table.
287 class ExportDirectoryChunk : public Chunk {
288 public:
289   ExportDirectoryChunk(int I, int J, Chunk *D, Chunk *A, Chunk *N, Chunk *O)
290       : MaxOrdinal(I), NameTabSize(J), DLLName(D), AddressTab(A), NameTab(N),
291         OrdinalTab(O) {}
292 
293   size_t getSize() const override {
294     return sizeof(export_directory_table_entry);
295   }
296 
297   void writeTo(uint8_t *Buf) const override {
298     auto *E = (export_directory_table_entry *)(Buf + OutputSectionOff);
299     E->NameRVA = DLLName->getRVA();
300     E->OrdinalBase = 0;
301     E->AddressTableEntries = MaxOrdinal + 1;
302     E->NumberOfNamePointers = NameTabSize;
303     E->ExportAddressTableRVA = AddressTab->getRVA();
304     E->NamePointerRVA = NameTab->getRVA();
305     E->OrdinalTableRVA = OrdinalTab->getRVA();
306   }
307 
308   uint16_t MaxOrdinal;
309   uint16_t NameTabSize;
310   Chunk *DLLName;
311   Chunk *AddressTab;
312   Chunk *NameTab;
313   Chunk *OrdinalTab;
314 };
315 
316 class AddressTableChunk : public Chunk {
317 public:
318   explicit AddressTableChunk(size_t MaxOrdinal) : Size(MaxOrdinal + 1) {}
319   size_t getSize() const override { return Size * 4; }
320 
321   void writeTo(uint8_t *Buf) const override {
322     for (Export &E : Config->Exports) {
323       auto *D = cast<Defined>(E.Sym->repl());
324       write32le(Buf + OutputSectionOff + E.Ordinal * 4, D->getRVA());
325     }
326   }
327 
328 private:
329   size_t Size;
330 };
331 
332 class NamePointersChunk : public Chunk {
333 public:
334   explicit NamePointersChunk(std::vector<Chunk *> &V) : Chunks(V) {}
335   size_t getSize() const override { return Chunks.size() * 4; }
336 
337   void writeTo(uint8_t *Buf) const override {
338     uint8_t *P = Buf + OutputSectionOff;
339     for (Chunk *C : Chunks) {
340       write32le(P, C->getRVA());
341       P += 4;
342     }
343   }
344 
345 private:
346   std::vector<Chunk *> Chunks;
347 };
348 
349 class ExportOrdinalChunk : public Chunk {
350 public:
351   explicit ExportOrdinalChunk(size_t I) : Size(I) {}
352   size_t getSize() const override { return Size * 2; }
353 
354   void writeTo(uint8_t *Buf) const override {
355     uint8_t *P = Buf + OutputSectionOff;
356     for (Export &E : Config->Exports) {
357       if (E.Noname)
358         continue;
359       write16le(P, E.Ordinal);
360       P += 2;
361     }
362   }
363 
364 private:
365   size_t Size;
366 };
367 
368 } // anonymous namespace
369 
370 uint64_t IdataContents::getDirSize() {
371   return Dirs.size() * sizeof(ImportDirectoryTableEntry);
372 }
373 
374 uint64_t IdataContents::getIATSize() {
375   return Addresses.size() * ptrSize();
376 }
377 
378 // Returns a list of .idata contents.
379 // See Microsoft PE/COFF spec 5.4 for details.
380 std::vector<Chunk *> IdataContents::getChunks() {
381   create();
382   std::vector<Chunk *> V;
383   // The loader assumes a specific order of data.
384   // Add each type in the correct order.
385   for (std::unique_ptr<Chunk> &C : Dirs)
386     V.push_back(C.get());
387   for (std::unique_ptr<Chunk> &C : Lookups)
388     V.push_back(C.get());
389   for (std::unique_ptr<Chunk> &C : Addresses)
390     V.push_back(C.get());
391   for (std::unique_ptr<Chunk> &C : Hints)
392     V.push_back(C.get());
393   for (auto &P : DLLNames) {
394     std::unique_ptr<Chunk> &C = P.second;
395     V.push_back(C.get());
396   }
397   return V;
398 }
399 
400 void IdataContents::create() {
401   std::vector<std::vector<DefinedImportData *>> V = binImports(Imports);
402 
403   // Create .idata contents for each DLL.
404   for (std::vector<DefinedImportData *> &Syms : V) {
405     StringRef Name = Syms[0]->getDLLName();
406 
407     // Create lookup and address tables. If they have external names,
408     // we need to create HintName chunks to store the names.
409     // If they don't (if they are import-by-ordinals), we store only
410     // ordinal values to the table.
411     size_t Base = Lookups.size();
412     for (DefinedImportData *S : Syms) {
413       uint16_t Ord = S->getOrdinal();
414       if (S->getExternalName().empty()) {
415         Lookups.push_back(make_unique<OrdinalOnlyChunk>(Ord));
416         Addresses.push_back(make_unique<OrdinalOnlyChunk>(Ord));
417         continue;
418       }
419       auto C = make_unique<HintNameChunk>(S->getExternalName(), Ord);
420       Lookups.push_back(make_unique<LookupChunk>(C.get()));
421       Addresses.push_back(make_unique<LookupChunk>(C.get()));
422       Hints.push_back(std::move(C));
423     }
424     // Terminate with null values.
425     Lookups.push_back(make_unique<NullChunk>(ptrSize()));
426     Addresses.push_back(make_unique<NullChunk>(ptrSize()));
427 
428     for (int I = 0, E = Syms.size(); I < E; ++I)
429       Syms[I]->setLocation(Addresses[Base + I].get());
430 
431     // Create the import table header.
432     if (!DLLNames.count(Name))
433       DLLNames[Name] = make_unique<StringChunk>(Name);
434     auto Dir = make_unique<ImportDirectoryChunk>(DLLNames[Name].get());
435     Dir->LookupTab = Lookups[Base].get();
436     Dir->AddressTab = Addresses[Base].get();
437     Dirs.push_back(std::move(Dir));
438   }
439   // Add null terminator.
440   Dirs.push_back(make_unique<NullChunk>(sizeof(ImportDirectoryTableEntry)));
441 }
442 
443 std::vector<Chunk *> DelayLoadContents::getChunks() {
444   std::vector<Chunk *> V;
445   for (std::unique_ptr<Chunk> &C : Dirs)
446     V.push_back(C.get());
447   for (std::unique_ptr<Chunk> &C : Names)
448     V.push_back(C.get());
449   for (std::unique_ptr<Chunk> &C : HintNames)
450     V.push_back(C.get());
451   for (auto &P : DLLNames) {
452     std::unique_ptr<Chunk> &C = P.second;
453     V.push_back(C.get());
454   }
455   return V;
456 }
457 
458 std::vector<Chunk *> DelayLoadContents::getDataChunks() {
459   std::vector<Chunk *> V;
460   for (std::unique_ptr<Chunk> &C : ModuleHandles)
461     V.push_back(C.get());
462   for (std::unique_ptr<Chunk> &C : Addresses)
463     V.push_back(C.get());
464   return V;
465 }
466 
467 uint64_t DelayLoadContents::getDirSize() {
468   return Dirs.size() * sizeof(delay_import_directory_table_entry);
469 }
470 
471 void DelayLoadContents::create(Defined *H) {
472   Helper = H;
473   std::vector<std::vector<DefinedImportData *>> V = binImports(Imports);
474 
475   // Create .didat contents for each DLL.
476   for (std::vector<DefinedImportData *> &Syms : V) {
477     StringRef Name = Syms[0]->getDLLName();
478 
479     // Create the delay import table header.
480     if (!DLLNames.count(Name))
481       DLLNames[Name] = make_unique<StringChunk>(Name);
482     auto Dir = make_unique<DelayDirectoryChunk>(DLLNames[Name].get());
483 
484     size_t Base = Addresses.size();
485     for (DefinedImportData *S : Syms) {
486       Chunk *T = newThunkChunk(S, Dir.get());
487       auto A = make_unique<DelayAddressChunk>(T);
488       Addresses.push_back(std::move(A));
489       Thunks.push_back(std::unique_ptr<Chunk>(T));
490       StringRef ExtName = S->getExternalName();
491       if (ExtName.empty()) {
492         Names.push_back(make_unique<OrdinalOnlyChunk>(S->getOrdinal()));
493       } else {
494         auto C = make_unique<HintNameChunk>(ExtName, 0);
495         Names.push_back(make_unique<LookupChunk>(C.get()));
496         HintNames.push_back(std::move(C));
497       }
498     }
499     // Terminate with null values.
500     Addresses.push_back(make_unique<NullChunk>(8));
501     Names.push_back(make_unique<NullChunk>(8));
502 
503     for (int I = 0, E = Syms.size(); I < E; ++I)
504       Syms[I]->setLocation(Addresses[Base + I].get());
505     auto *MH = new NullChunk(8);
506     MH->setAlign(8);
507     ModuleHandles.push_back(std::unique_ptr<Chunk>(MH));
508 
509     // Fill the delay import table header fields.
510     Dir->ModuleHandle = MH;
511     Dir->AddressTab = Addresses[Base].get();
512     Dir->NameTab = Names[Base].get();
513     Dirs.push_back(std::move(Dir));
514   }
515   // Add null terminator.
516   Dirs.push_back(
517       make_unique<NullChunk>(sizeof(delay_import_directory_table_entry)));
518 }
519 
520 Chunk *DelayLoadContents::newThunkChunk(DefinedImportData *S, Chunk *Dir) {
521   switch (Config->Machine) {
522   case AMD64:
523     return new ThunkChunkX64(S, Dir, Helper);
524   case I386:
525     return new ThunkChunkX86(S, Dir, Helper);
526   default:
527     llvm_unreachable("unsupported machine type");
528   }
529 }
530 
531 EdataContents::EdataContents() {
532   uint16_t MaxOrdinal = 0;
533   for (Export &E : Config->Exports)
534     MaxOrdinal = std::max(MaxOrdinal, E.Ordinal);
535 
536   auto *DLLName = new StringChunk(sys::path::filename(Config->OutputFile));
537   auto *AddressTab = new AddressTableChunk(MaxOrdinal);
538   std::vector<Chunk *> Names;
539   for (Export &E : Config->Exports)
540     if (!E.Noname)
541       Names.push_back(new StringChunk(E.ExportName));
542   auto *NameTab = new NamePointersChunk(Names);
543   auto *OrdinalTab = new ExportOrdinalChunk(Names.size());
544   auto *Dir = new ExportDirectoryChunk(MaxOrdinal, Names.size(), DLLName,
545                                        AddressTab, NameTab, OrdinalTab);
546   Chunks.push_back(std::unique_ptr<Chunk>(Dir));
547   Chunks.push_back(std::unique_ptr<Chunk>(DLLName));
548   Chunks.push_back(std::unique_ptr<Chunk>(AddressTab));
549   Chunks.push_back(std::unique_ptr<Chunk>(NameTab));
550   Chunks.push_back(std::unique_ptr<Chunk>(OrdinalTab));
551   for (Chunk *C : Names)
552     Chunks.push_back(std::unique_ptr<Chunk>(C));
553 }
554 
555 } // namespace coff
556 } // namespace lld
557