//===-- Implementation of crt for x86_64 ----------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

95d59385bSSiva Chandra Reddy #include "config/linux/app.h"
103cc2161cSSiva Chandra Reddy #include "src/__support/OSUtil/syscall.h"
11*8dc42802SSiva Chandra Reddy #include "src/__support/threads/thread.h"
12b950a0d4SSiva Chandra Reddy #include "src/string/memory_utils/memcpy_implementations.h"
13f6ccb4feSSiva Chandra Reddy
145d59385bSSiva Chandra Reddy #include <asm/prctl.h>
15f6ccb4feSSiva Chandra Reddy #include <linux/auxvec.h>
165d59385bSSiva Chandra Reddy #include <linux/elf.h>
17f6ccb4feSSiva Chandra Reddy #include <stdint.h>
1886bebe1aSSiva Chandra Reddy #include <sys/mman.h>
1986bebe1aSSiva Chandra Reddy #include <sys/syscall.h>
20f6ccb4feSSiva Chandra Reddy
21f6ccb4feSSiva Chandra Reddy extern "C" int main(int, char **, char **);
22f6ccb4feSSiva Chandra Reddy
235d59385bSSiva Chandra Reddy namespace __llvm_libc {
245d59385bSSiva Chandra Reddy
// Select the syscall number used to map anonymous memory. SYS_mmap2 is
// preferred when the platform defines it; otherwise SYS_mmap is used. Both
// branches test whether the macro is *defined* (not its numeric value), so the
// selection does not depend on what number a platform assigns to the syscall.
#if defined(SYS_mmap2)
static constexpr long mmapSyscallNumber = SYS_mmap2;
#elif defined(SYS_mmap)
static constexpr long mmapSyscallNumber = SYS_mmap;
#else
#error "Target platform does not have SYS_mmap or SYS_mmap2 defined"
#endif
325d59385bSSiva Chandra Reddy
335d59385bSSiva Chandra Reddy AppProperties app;
345d59385bSSiva Chandra Reddy
35*8dc42802SSiva Chandra Reddy static ThreadAttributes main_thread_attrib;
36*8dc42802SSiva Chandra Reddy
375d59385bSSiva Chandra Reddy // TODO: The function is x86_64 specific. Move it to config/linux/app.h
385d59385bSSiva Chandra Reddy // and generalize it. Also, dynamic loading is not handled currently.
init_tls(TLSDescriptor & tls_descriptor)39859c1897SSiva Chandra Reddy void init_tls(TLSDescriptor &tls_descriptor) {
40859c1897SSiva Chandra Reddy if (app.tls.size == 0) {
41859c1897SSiva Chandra Reddy tls_descriptor.size = 0;
42859c1897SSiva Chandra Reddy tls_descriptor.tp = 0;
435d59385bSSiva Chandra Reddy return;
44859c1897SSiva Chandra Reddy }
455d59385bSSiva Chandra Reddy
465d59385bSSiva Chandra Reddy // We will assume the alignment is always a power of two.
47c74c3442SSiva Chandra Reddy uintptr_t tlsSize = app.tls.size & -app.tls.align;
48c74c3442SSiva Chandra Reddy if (tlsSize != app.tls.size)
49c74c3442SSiva Chandra Reddy tlsSize += app.tls.align;
505d59385bSSiva Chandra Reddy
515d59385bSSiva Chandra Reddy // Per the x86_64 TLS ABI, the entry pointed to by the thread pointer is the
525d59385bSSiva Chandra Reddy // address of the TLS block. So, we add more size to accomodate this address
535d59385bSSiva Chandra Reddy // entry.
54859c1897SSiva Chandra Reddy uintptr_t tlsSizeWithAddr = tlsSize + sizeof(uintptr_t);
555d59385bSSiva Chandra Reddy
565d59385bSSiva Chandra Reddy // We cannot call the mmap function here as the functions set errno on
575d59385bSSiva Chandra Reddy // failure. Since errno is implemented via a thread local variable, we cannot
585d59385bSSiva Chandra Reddy // use errno before TLS is setup.
595d59385bSSiva Chandra Reddy long mmapRetVal = __llvm_libc::syscall(
605d59385bSSiva Chandra Reddy mmapSyscallNumber, nullptr, tlsSizeWithAddr, PROT_READ | PROT_WRITE,
615d59385bSSiva Chandra Reddy MAP_ANONYMOUS | MAP_PRIVATE, -1, 0);
625d59385bSSiva Chandra Reddy // We cannot check the return value with MAP_FAILED as that is the return
635d59385bSSiva Chandra Reddy // of the mmap function and not the mmap syscall.
645d59385bSSiva Chandra Reddy if (mmapRetVal < 0 && static_cast<uintptr_t>(mmapRetVal) > -app.pageSize)
655d59385bSSiva Chandra Reddy __llvm_libc::syscall(SYS_exit, 1);
665d59385bSSiva Chandra Reddy uintptr_t *tlsAddr = reinterpret_cast<uintptr_t *>(mmapRetVal);
675d59385bSSiva Chandra Reddy
685d59385bSSiva Chandra Reddy // x86_64 TLS faces down from the thread pointer with the first entry
695d59385bSSiva Chandra Reddy // pointing to the address of the first real TLS byte.
705d59385bSSiva Chandra Reddy uintptr_t endPtr = reinterpret_cast<uintptr_t>(tlsAddr) + tlsSize;
715d59385bSSiva Chandra Reddy *reinterpret_cast<uintptr_t *>(endPtr) = endPtr;
725d59385bSSiva Chandra Reddy
73b950a0d4SSiva Chandra Reddy __llvm_libc::inline_memcpy(reinterpret_cast<char *>(tlsAddr),
74b950a0d4SSiva Chandra Reddy reinterpret_cast<const char *>(app.tls.address),
75be6af89fSSiva Chandra app.tls.init_size);
76859c1897SSiva Chandra Reddy
77859c1897SSiva Chandra Reddy tls_descriptor = {tlsSizeWithAddr, uintptr_t(tlsAddr), endPtr};
78859c1897SSiva Chandra Reddy return;
79859c1897SSiva Chandra Reddy }
80859c1897SSiva Chandra Reddy
cleanup_tls(uintptr_t addr,uintptr_t size)81859c1897SSiva Chandra Reddy void cleanup_tls(uintptr_t addr, uintptr_t size) {
82859c1897SSiva Chandra Reddy if (size == 0)
83859c1897SSiva Chandra Reddy return;
84859c1897SSiva Chandra Reddy __llvm_libc::syscall(SYS_munmap, addr, size);
85859c1897SSiva Chandra Reddy }
86859c1897SSiva Chandra Reddy
87859c1897SSiva Chandra Reddy // Sets the thread pointer to |val|. Returns true on success, false on failure.
set_thread_ptr(uintptr_t val)88859c1897SSiva Chandra Reddy static bool set_thread_ptr(uintptr_t val) {
89859c1897SSiva Chandra Reddy return __llvm_libc::syscall(SYS_arch_prctl, ARCH_SET_FS, val) == -1 ? false
90859c1897SSiva Chandra Reddy : true;
915d59385bSSiva Chandra Reddy }
925d59385bSSiva Chandra Reddy
935d59385bSSiva Chandra Reddy } // namespace __llvm_libc
945d59385bSSiva Chandra Reddy
955d59385bSSiva Chandra Reddy using __llvm_libc::app;
965d59385bSSiva Chandra Reddy
// TODO: Would be nice to use the aux entry structure from elf.h when available.
//
// One entry of the auxiliary vector as walked by _start: a pair of 64-bit
// words, the first identifying the entry (compared against the AT_* constants)
// and the second carrying its value.
struct AuxEntry {
  uint64_t type;  // Entry kind, e.g. AT_PHDR, AT_PHNUM, AT_PAGESZ, AT_NULL.
  uint64_t value; // Payload whose meaning depends on |type|.
};
102f6ccb4feSSiva Chandra Reddy
_start()103f6ccb4feSSiva Chandra Reddy extern "C" void _start() {
104f6ccb4feSSiva Chandra Reddy // This TU is compiled with -fno-omit-frame-pointer. Hence, the previous value
105f6ccb4feSSiva Chandra Reddy // of the base pointer is pushed on to the stack. So, we step over it (the
106f6ccb4feSSiva Chandra Reddy // "+ 1" below) to get to the args.
107fe2cc14aSSiva Chandra Reddy app.args = reinterpret_cast<__llvm_libc::Args *>(
108fe2cc14aSSiva Chandra Reddy reinterpret_cast<uintptr_t *>(__builtin_frame_address(0)) + 1);
109fe2cc14aSSiva Chandra Reddy
110fe2cc14aSSiva Chandra Reddy // The x86_64 ABI requires that the stack pointer is aligned to a 16-byte
111fe2cc14aSSiva Chandra Reddy // boundary. We align it here but we cannot use any local variables created
112fe2cc14aSSiva Chandra Reddy // before the following alignment. Best would be to not create any local
113fe2cc14aSSiva Chandra Reddy // variables before the alignment. Also, note that we are aligning the stack
114fe2cc14aSSiva Chandra Reddy // downwards as the x86_64 stack grows downwards. This ensures that we don't
115fe2cc14aSSiva Chandra Reddy // tread on argc, argv etc.
116fe2cc14aSSiva Chandra Reddy // NOTE: Compiler attributes for alignment do not help here as the stack
117fe2cc14aSSiva Chandra Reddy // pointer on entry to this _start function is controlled by the OS. In fact,
118fe2cc14aSSiva Chandra Reddy // compilers can generate code assuming the alignment as required by the ABI.
119fe2cc14aSSiva Chandra Reddy // If the stack pointers as setup by the OS are already aligned, then the
120fe2cc14aSSiva Chandra Reddy // following code is a NOP.
121fe2cc14aSSiva Chandra Reddy __asm__ __volatile__("andq $0xfffffffffffffff0, %%rsp\n\t" ::: "%rsp");
122fe2cc14aSSiva Chandra Reddy __asm__ __volatile__("andq $0xfffffffffffffff0, %%rbp\n\t" ::: "%rbp");
123f6ccb4feSSiva Chandra Reddy
124*8dc42802SSiva Chandra Reddy auto tid = __llvm_libc::syscall(SYS_gettid);
125*8dc42802SSiva Chandra Reddy if (tid <= 0)
126*8dc42802SSiva Chandra Reddy __llvm_libc::syscall(SYS_exit, 1);
127*8dc42802SSiva Chandra Reddy __llvm_libc::main_thread_attrib.tid = tid;
128*8dc42802SSiva Chandra Reddy
129f6ccb4feSSiva Chandra Reddy // After the argv array, is a 8-byte long NULL value before the array of env
130f6ccb4feSSiva Chandra Reddy // values. The end of the env values is marked by another 8-byte long NULL
131f6ccb4feSSiva Chandra Reddy // value. We step over it (the "+ 1" below) to get to the env values.
132fe2cc14aSSiva Chandra Reddy uint64_t *env_ptr = app.args->argv + app.args->argc + 1;
133f6ccb4feSSiva Chandra Reddy uint64_t *env_end_marker = env_ptr;
134f2a7f835SRaman Tenneti app.envPtr = env_ptr;
135f6ccb4feSSiva Chandra Reddy while (*env_end_marker)
136f6ccb4feSSiva Chandra Reddy ++env_end_marker;
137f6ccb4feSSiva Chandra Reddy
138f6ccb4feSSiva Chandra Reddy // After the env array, is the aux-vector. The end of the aux-vector is
139f6ccb4feSSiva Chandra Reddy // denoted by an AT_NULL entry.
1405d59385bSSiva Chandra Reddy Elf64_Phdr *programHdrTable = nullptr;
1415d59385bSSiva Chandra Reddy uintptr_t programHdrCount;
142f6ccb4feSSiva Chandra Reddy for (AuxEntry *aux_entry = reinterpret_cast<AuxEntry *>(env_end_marker + 1);
143f6ccb4feSSiva Chandra Reddy aux_entry->type != AT_NULL; ++aux_entry) {
1445d59385bSSiva Chandra Reddy switch (aux_entry->type) {
1455d59385bSSiva Chandra Reddy case AT_PHDR:
1465d59385bSSiva Chandra Reddy programHdrTable = reinterpret_cast<Elf64_Phdr *>(aux_entry->value);
1475d59385bSSiva Chandra Reddy break;
1485d59385bSSiva Chandra Reddy case AT_PHNUM:
1495d59385bSSiva Chandra Reddy programHdrCount = aux_entry->value;
1505d59385bSSiva Chandra Reddy break;
1515d59385bSSiva Chandra Reddy case AT_PAGESZ:
1525d59385bSSiva Chandra Reddy app.pageSize = aux_entry->value;
1535d59385bSSiva Chandra Reddy break;
1545d59385bSSiva Chandra Reddy default:
1555d59385bSSiva Chandra Reddy break; // TODO: Read other useful entries from the aux vector.
156f6ccb4feSSiva Chandra Reddy }
1575d59385bSSiva Chandra Reddy }
1585d59385bSSiva Chandra Reddy
159be6af89fSSiva Chandra app.tls.size = 0;
1605d59385bSSiva Chandra Reddy for (uintptr_t i = 0; i < programHdrCount; ++i) {
1615d59385bSSiva Chandra Reddy Elf64_Phdr *phdr = programHdrTable + i;
1625d59385bSSiva Chandra Reddy if (phdr->p_type != PT_TLS)
1635d59385bSSiva Chandra Reddy continue;
1645d59385bSSiva Chandra Reddy // TODO: p_vaddr value has to be adjusted for static-pie executables.
1655d59385bSSiva Chandra Reddy app.tls.address = phdr->p_vaddr;
1665d59385bSSiva Chandra Reddy app.tls.size = phdr->p_memsz;
167be6af89fSSiva Chandra app.tls.init_size = phdr->p_filesz;
1685d59385bSSiva Chandra Reddy app.tls.align = phdr->p_align;
1695d59385bSSiva Chandra Reddy }
1705d59385bSSiva Chandra Reddy
171859c1897SSiva Chandra Reddy __llvm_libc::TLSDescriptor tls;
172859c1897SSiva Chandra Reddy __llvm_libc::init_tls(tls);
173859c1897SSiva Chandra Reddy if (tls.size != 0 && !__llvm_libc::set_thread_ptr(tls.tp))
174859c1897SSiva Chandra Reddy __llvm_libc::syscall(SYS_exit, 1);
175f6ccb4feSSiva Chandra Reddy
176*8dc42802SSiva Chandra Reddy __llvm_libc::self.attrib = &__llvm_libc::main_thread_attrib;
177*8dc42802SSiva Chandra Reddy
178859c1897SSiva Chandra Reddy int retval = main(app.args->argc, reinterpret_cast<char **>(app.args->argv),
179859c1897SSiva Chandra Reddy reinterpret_cast<char **>(env_ptr));
180859c1897SSiva Chandra Reddy __llvm_libc::cleanup_tls(tls.addr, tls.size);
181859c1897SSiva Chandra Reddy __llvm_libc::syscall(SYS_exit, retval);
182f6ccb4feSSiva Chandra Reddy }
183