xref: /oneTBB/src/tbbmalloc_proxy/proxy.cpp (revision 8827ea7d)
151c0b2f7Stbbdev /*
2b15aabb3Stbbdev     Copyright (c) 2005-2021 Intel Corporation
351c0b2f7Stbbdev 
451c0b2f7Stbbdev     Licensed under the Apache License, Version 2.0 (the "License");
551c0b2f7Stbbdev     you may not use this file except in compliance with the License.
651c0b2f7Stbbdev     You may obtain a copy of the License at
751c0b2f7Stbbdev 
851c0b2f7Stbbdev         http://www.apache.org/licenses/LICENSE-2.0
951c0b2f7Stbbdev 
1051c0b2f7Stbbdev     Unless required by applicable law or agreed to in writing, software
1151c0b2f7Stbbdev     distributed under the License is distributed on an "AS IS" BASIS,
1251c0b2f7Stbbdev     WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
1351c0b2f7Stbbdev     See the License for the specific language governing permissions and
1451c0b2f7Stbbdev     limitations under the License.
1551c0b2f7Stbbdev */
1651c0b2f7Stbbdev 
17734f0bc0SPablo Romero #if __unix__ && !__ANDROID__
1851c0b2f7Stbbdev // include <bits/c++config.h> indirectly so that <cstdlib> is not included
1951c0b2f7Stbbdev #include <cstddef>
2051c0b2f7Stbbdev // include <features.h> indirectly so that <stdlib.h> is not included
2151c0b2f7Stbbdev #include <unistd.h>
2251c0b2f7Stbbdev // Working around compiler issue with Anaconda's gcc 7.3 compiler package.
2351c0b2f7Stbbdev // New gcc ported for old libc may provide their inline implementation
2451c0b2f7Stbbdev // of aligned_alloc as required by new C++ standard, this makes it hard to
2551c0b2f7Stbbdev // redefine aligned_alloc here. However, running on systems with new libc
2651c0b2f7Stbbdev // version, it still needs it to be redefined, thus tricking system headers
27734f0bc0SPablo Romero #if defined(__GLIBC_PREREQ)
28734f0bc0SPablo Romero #if !__GLIBC_PREREQ(2, 16) && _GLIBCXX_HAVE_ALIGNED_ALLOC
2951c0b2f7Stbbdev // tell <cstdlib> that there is no aligned_alloc
3051c0b2f7Stbbdev #undef _GLIBCXX_HAVE_ALIGNED_ALLOC
3151c0b2f7Stbbdev // trick <stdlib.h> to define another symbol instead
3251c0b2f7Stbbdev #define aligned_alloc __hidden_redefined_aligned_alloc
3351c0b2f7Stbbdev // Fix the state and undefine the trick
3451c0b2f7Stbbdev #include <cstdlib>
3551c0b2f7Stbbdev #undef aligned_alloc
36734f0bc0SPablo Romero #endif // !__GLIBC_PREREQ(2, 16) && _GLIBCXX_HAVE_ALIGNED_ALLOC
37734f0bc0SPablo Romero #endif // defined(__GLIBC_PREREQ)
38734f0bc0SPablo Romero #include <cstdlib>
39734f0bc0SPablo Romero #endif // __unix__ && !__ANDROID__
4051c0b2f7Stbbdev 
4151c0b2f7Stbbdev #include "proxy.h"
4251c0b2f7Stbbdev 
4349e08aacStbbdev #include "oneapi/tbb/detail/_config.h"
44*8827ea7dSLong Nguyen #include "oneapi/tbb/scalable_allocator.h"
4551c0b2f7Stbbdev #include "../tbb/environment.h"
4651c0b2f7Stbbdev 
4751c0b2f7Stbbdev #if !defined(__EXCEPTIONS) && !defined(_CPPUNWIND) && !defined(__SUNPRO_CC)
4851c0b2f7Stbbdev     #if TBB_USE_EXCEPTIONS
4951c0b2f7Stbbdev         #error Compilation settings do not support exception handling. Please do not set TBB_USE_EXCEPTIONS macro or set it to 0.
5051c0b2f7Stbbdev     #elif !defined(TBB_USE_EXCEPTIONS)
5151c0b2f7Stbbdev         #define TBB_USE_EXCEPTIONS 0
5251c0b2f7Stbbdev     #endif
5351c0b2f7Stbbdev #elif !defined(TBB_USE_EXCEPTIONS)
5451c0b2f7Stbbdev     #define TBB_USE_EXCEPTIONS 1
5551c0b2f7Stbbdev #endif
5651c0b2f7Stbbdev 
5751c0b2f7Stbbdev #if MALLOC_UNIXLIKE_OVERLOAD_ENABLED || _WIN32 && !__TBB_WIN8UI_SUPPORT
5851c0b2f7Stbbdev /*** internal global operator new implementation (Linux, Windows) ***/
5951c0b2f7Stbbdev #include <new>
6051c0b2f7Stbbdev 
6151c0b2f7Stbbdev // Synchronization primitives to protect original library pointers and new_handler
6251c0b2f7Stbbdev #include "../tbbmalloc/Synchronize.h"
6351c0b2f7Stbbdev // Use MallocMutex implementation
6451c0b2f7Stbbdev typedef MallocMutex ProxyMutex;
6551c0b2f7Stbbdev 
66478de5b1Stbbdev // Adds aliasing and copy attributes to function if available
67478de5b1Stbbdev #if defined(__has_attribute)
68478de5b1Stbbdev     #if __has_attribute(__copy__)
69478de5b1Stbbdev         #define __TBB_ALIAS_ATTR_COPY(name) __attribute__((alias (#name), __copy__(name)))
70478de5b1Stbbdev     #endif
71478de5b1Stbbdev #endif
72478de5b1Stbbdev 
73478de5b1Stbbdev #ifndef __TBB_ALIAS_ATTR_COPY
74478de5b1Stbbdev     #define __TBB_ALIAS_ATTR_COPY(name) __attribute__((alias (#name)))
75478de5b1Stbbdev #endif
76478de5b1Stbbdev 
7751c0b2f7Stbbdev // In case there is no std::get_new_handler function
7851c0b2f7Stbbdev // which provides synchronized access to std::new_handler
7951c0b2f7Stbbdev #if !__TBB_CPP11_GET_NEW_HANDLER_PRESENT
8051c0b2f7Stbbdev static ProxyMutex new_lock;
8151c0b2f7Stbbdev #endif
8251c0b2f7Stbbdev 
8351c0b2f7Stbbdev static inline void* InternalOperatorNew(size_t sz) {
8451c0b2f7Stbbdev     void* res = scalable_malloc(sz);
8551c0b2f7Stbbdev #if TBB_USE_EXCEPTIONS
8651c0b2f7Stbbdev     while (!res) {
8751c0b2f7Stbbdev         std::new_handler handler;
8851c0b2f7Stbbdev #if __TBB_CPP11_GET_NEW_HANDLER_PRESENT
8951c0b2f7Stbbdev         handler = std::get_new_handler();
9051c0b2f7Stbbdev #else
9151c0b2f7Stbbdev         {
9251c0b2f7Stbbdev             ProxyMutex::scoped_lock lock(new_lock);
9351c0b2f7Stbbdev             handler = std::set_new_handler(0);
9451c0b2f7Stbbdev             std::set_new_handler(handler);
9551c0b2f7Stbbdev         }
9651c0b2f7Stbbdev #endif
9751c0b2f7Stbbdev         if (handler) {
9851c0b2f7Stbbdev             (*handler)();
9951c0b2f7Stbbdev         } else {
10051c0b2f7Stbbdev             throw std::bad_alloc();
10151c0b2f7Stbbdev         }
10251c0b2f7Stbbdev         res = scalable_malloc(sz);
10351c0b2f7Stbbdev }
10451c0b2f7Stbbdev #endif /* TBB_USE_EXCEPTIONS */
10551c0b2f7Stbbdev     return res;
10651c0b2f7Stbbdev }
10751c0b2f7Stbbdev /*** end of internal global operator new implementation ***/
10851c0b2f7Stbbdev #endif // MALLOC_UNIXLIKE_OVERLOAD_ENABLED || _WIN32 && !__TBB_WIN8UI_SUPPORT
10951c0b2f7Stbbdev 
11051c0b2f7Stbbdev #if MALLOC_UNIXLIKE_OVERLOAD_ENABLED || MALLOC_ZONE_OVERLOAD_ENABLED
11151c0b2f7Stbbdev 
11251c0b2f7Stbbdev #ifndef __THROW
11351c0b2f7Stbbdev #define __THROW
11451c0b2f7Stbbdev #endif
11551c0b2f7Stbbdev 
11651c0b2f7Stbbdev /*** service functions and variables ***/
11751c0b2f7Stbbdev #include <string.h> // for memset
11851c0b2f7Stbbdev #include <unistd.h> // for sysconf
11951c0b2f7Stbbdev 
12051c0b2f7Stbbdev static long memoryPageSize;
12151c0b2f7Stbbdev 
12251c0b2f7Stbbdev static inline void initPageSize()
12351c0b2f7Stbbdev {
12451c0b2f7Stbbdev     memoryPageSize = sysconf(_SC_PAGESIZE);
12551c0b2f7Stbbdev }
12651c0b2f7Stbbdev 
12751c0b2f7Stbbdev #if MALLOC_UNIXLIKE_OVERLOAD_ENABLED
12851c0b2f7Stbbdev #include <dlfcn.h>
12951c0b2f7Stbbdev #include <malloc.h>    // mallinfo
13051c0b2f7Stbbdev 
13151c0b2f7Stbbdev /* __TBB_malloc_proxy used as a weak symbol by libtbbmalloc for:
13251c0b2f7Stbbdev    1) detection that the proxy library is loaded
13351c0b2f7Stbbdev    2) check that dlsym("malloc") found something different from our replacement malloc
13451c0b2f7Stbbdev */
13551c0b2f7Stbbdev 
136478de5b1Stbbdev extern "C" void *__TBB_malloc_proxy(size_t) __TBB_ALIAS_ATTR_COPY(malloc);
13751c0b2f7Stbbdev 
13851c0b2f7Stbbdev static void *orig_msize;
13951c0b2f7Stbbdev 
14051c0b2f7Stbbdev #elif MALLOC_ZONE_OVERLOAD_ENABLED
14151c0b2f7Stbbdev 
14251c0b2f7Stbbdev #include "proxy_overload_osx.h"
14351c0b2f7Stbbdev 
14451c0b2f7Stbbdev #endif // MALLOC_ZONE_OVERLOAD_ENABLED
14551c0b2f7Stbbdev 
14651c0b2f7Stbbdev // Original (i.e., replaced) functions,
14751c0b2f7Stbbdev // they are never changed for MALLOC_ZONE_OVERLOAD_ENABLED.
14851c0b2f7Stbbdev static void *orig_free,
14951c0b2f7Stbbdev     *orig_realloc;
15051c0b2f7Stbbdev 
15151c0b2f7Stbbdev #if MALLOC_UNIXLIKE_OVERLOAD_ENABLED
15251c0b2f7Stbbdev #define ZONE_ARG
15351c0b2f7Stbbdev #define PREFIX(name) name
15451c0b2f7Stbbdev 
15551c0b2f7Stbbdev static void *orig_libc_free,
15651c0b2f7Stbbdev     *orig_libc_realloc;
15751c0b2f7Stbbdev 
15851c0b2f7Stbbdev // We already tried to find ptr to original functions.
15951c0b2f7Stbbdev static std::atomic<bool> origFuncSearched{false};
16051c0b2f7Stbbdev 
16151c0b2f7Stbbdev inline void InitOrigPointers()
16251c0b2f7Stbbdev {
16351c0b2f7Stbbdev     // race is OK here, as different threads found same functions
16451c0b2f7Stbbdev     if (!origFuncSearched.load(std::memory_order_acquire)) {
16551c0b2f7Stbbdev         orig_free = dlsym(RTLD_NEXT, "free");
16651c0b2f7Stbbdev         orig_realloc = dlsym(RTLD_NEXT, "realloc");
16751c0b2f7Stbbdev         orig_msize = dlsym(RTLD_NEXT, "malloc_usable_size");
16851c0b2f7Stbbdev         orig_libc_free = dlsym(RTLD_NEXT, "__libc_free");
16951c0b2f7Stbbdev         orig_libc_realloc = dlsym(RTLD_NEXT, "__libc_realloc");
17051c0b2f7Stbbdev 
17151c0b2f7Stbbdev         origFuncSearched.store(true, std::memory_order_release);
17251c0b2f7Stbbdev     }
17351c0b2f7Stbbdev }
17451c0b2f7Stbbdev 
17551c0b2f7Stbbdev /*** replacements for malloc and the family ***/
17651c0b2f7Stbbdev extern "C" {
17751c0b2f7Stbbdev #elif MALLOC_ZONE_OVERLOAD_ENABLED
17851c0b2f7Stbbdev 
17951c0b2f7Stbbdev // each impl_* function has such 1st argument, it's unused
18051c0b2f7Stbbdev #define ZONE_ARG struct _malloc_zone_t *,
18151c0b2f7Stbbdev #define PREFIX(name) impl_##name
18251c0b2f7Stbbdev // not interested in original functions for zone overload
18351c0b2f7Stbbdev inline void InitOrigPointers() {}
18451c0b2f7Stbbdev 
18551c0b2f7Stbbdev #endif // MALLOC_UNIXLIKE_OVERLOAD_ENABLED and MALLOC_ZONE_OVERLOAD_ENABLED
18651c0b2f7Stbbdev 
18751c0b2f7Stbbdev void *PREFIX(malloc)(ZONE_ARG size_t size) __THROW
18851c0b2f7Stbbdev {
18951c0b2f7Stbbdev     return scalable_malloc(size);
19051c0b2f7Stbbdev }
19151c0b2f7Stbbdev 
19251c0b2f7Stbbdev void *PREFIX(calloc)(ZONE_ARG size_t num, size_t size) __THROW
19351c0b2f7Stbbdev {
19451c0b2f7Stbbdev     return scalable_calloc(num, size);
19551c0b2f7Stbbdev }
19651c0b2f7Stbbdev 
19751c0b2f7Stbbdev void PREFIX(free)(ZONE_ARG void *object) __THROW
19851c0b2f7Stbbdev {
19951c0b2f7Stbbdev     InitOrigPointers();
20051c0b2f7Stbbdev     __TBB_malloc_safer_free(object, (void (*)(void*))orig_free);
20151c0b2f7Stbbdev }
20251c0b2f7Stbbdev 
20351c0b2f7Stbbdev void *PREFIX(realloc)(ZONE_ARG void* ptr, size_t sz) __THROW
20451c0b2f7Stbbdev {
20551c0b2f7Stbbdev     InitOrigPointers();
20651c0b2f7Stbbdev     return __TBB_malloc_safer_realloc(ptr, sz, orig_realloc);
20751c0b2f7Stbbdev }
20851c0b2f7Stbbdev 
20951c0b2f7Stbbdev /* The older *NIX interface for aligned allocations;
21051c0b2f7Stbbdev    it's formally substituted by posix_memalign and deprecated,
21151c0b2f7Stbbdev    so we do not expect it to cause cyclic dependency with C RTL. */
21251c0b2f7Stbbdev void *PREFIX(memalign)(ZONE_ARG size_t alignment, size_t size) __THROW
21351c0b2f7Stbbdev {
21451c0b2f7Stbbdev     return scalable_aligned_malloc(size, alignment);
21551c0b2f7Stbbdev }
21651c0b2f7Stbbdev 
21751c0b2f7Stbbdev /* valloc allocates memory aligned on a page boundary */
21851c0b2f7Stbbdev void *PREFIX(valloc)(ZONE_ARG size_t size) __THROW
21951c0b2f7Stbbdev {
22051c0b2f7Stbbdev     if (! memoryPageSize) initPageSize();
22151c0b2f7Stbbdev 
22251c0b2f7Stbbdev     return scalable_aligned_malloc(size, memoryPageSize);
22351c0b2f7Stbbdev }
22451c0b2f7Stbbdev 
22551c0b2f7Stbbdev #undef ZONE_ARG
22651c0b2f7Stbbdev #undef PREFIX
22751c0b2f7Stbbdev 
22851c0b2f7Stbbdev #if MALLOC_UNIXLIKE_OVERLOAD_ENABLED
22951c0b2f7Stbbdev 
23051c0b2f7Stbbdev // match prototype from system headers
23151c0b2f7Stbbdev #if __ANDROID__
23251c0b2f7Stbbdev size_t malloc_usable_size(const void *ptr) __THROW
23351c0b2f7Stbbdev #else
23451c0b2f7Stbbdev size_t malloc_usable_size(void *ptr) __THROW
23551c0b2f7Stbbdev #endif
23651c0b2f7Stbbdev {
23751c0b2f7Stbbdev     InitOrigPointers();
23851c0b2f7Stbbdev     return __TBB_malloc_safer_msize(const_cast<void*>(ptr), (size_t (*)(void*))orig_msize);
23951c0b2f7Stbbdev }
24051c0b2f7Stbbdev 
24151c0b2f7Stbbdev int posix_memalign(void **memptr, size_t alignment, size_t size) __THROW
24251c0b2f7Stbbdev {
24351c0b2f7Stbbdev     return scalable_posix_memalign(memptr, alignment, size);
24451c0b2f7Stbbdev }
24551c0b2f7Stbbdev 
24651c0b2f7Stbbdev /* pvalloc allocates smallest set of complete pages which can hold
24751c0b2f7Stbbdev    the requested number of bytes. Result is aligned on page boundary. */
24851c0b2f7Stbbdev void *pvalloc(size_t size) __THROW
24951c0b2f7Stbbdev {
25051c0b2f7Stbbdev     if (! memoryPageSize) initPageSize();
25151c0b2f7Stbbdev     // align size up to the page size,
25251c0b2f7Stbbdev     // pvalloc(0) returns 1 page, see man libmpatrol
25351c0b2f7Stbbdev     size = size? ((size-1) | (memoryPageSize-1)) + 1 : memoryPageSize;
25451c0b2f7Stbbdev 
25551c0b2f7Stbbdev     return scalable_aligned_malloc(size, memoryPageSize);
25651c0b2f7Stbbdev }
25751c0b2f7Stbbdev 
25851c0b2f7Stbbdev int mallopt(int /*param*/, int /*value*/) __THROW
25951c0b2f7Stbbdev {
26051c0b2f7Stbbdev     return 1;
26151c0b2f7Stbbdev }
26251c0b2f7Stbbdev 
26351c0b2f7Stbbdev struct mallinfo mallinfo() __THROW
26451c0b2f7Stbbdev {
26551c0b2f7Stbbdev     struct mallinfo m;
26651c0b2f7Stbbdev     memset(&m, 0, sizeof(struct mallinfo));
26751c0b2f7Stbbdev 
26851c0b2f7Stbbdev     return m;
26951c0b2f7Stbbdev }
27051c0b2f7Stbbdev 
27151c0b2f7Stbbdev #if __ANDROID__
27251c0b2f7Stbbdev // Android doesn't have malloc_usable_size, provide it to be compatible
27351c0b2f7Stbbdev // with Linux, in addition overload dlmalloc_usable_size() that presented
27451c0b2f7Stbbdev // under Android.
275478de5b1Stbbdev size_t dlmalloc_usable_size(const void *ptr) __TBB_ALIAS_ATTR_COPY(malloc_usable_size);
27651c0b2f7Stbbdev #else // __ANDROID__
277478de5b1Stbbdev // TODO: consider using __typeof__ to guarantee the correct declaration types
27851c0b2f7Stbbdev // C11 function, supported starting GLIBC 2.16
279478de5b1Stbbdev void *aligned_alloc(size_t alignment, size_t size) __TBB_ALIAS_ATTR_COPY(memalign);
28051c0b2f7Stbbdev // Those non-standard functions are exported by GLIBC, and might be used
281478de5b1Stbbdev // in conjunction with standard malloc/free, so we must overload them.
28251c0b2f7Stbbdev // Bionic doesn't have them. Not removing from the linker scripts,
28351c0b2f7Stbbdev // as absent entry points are ignored by the linker.
28451c0b2f7Stbbdev 
285478de5b1Stbbdev void *__libc_malloc(size_t size) __TBB_ALIAS_ATTR_COPY(malloc);
286478de5b1Stbbdev void *__libc_calloc(size_t num, size_t size) __TBB_ALIAS_ATTR_COPY(calloc);
287478de5b1Stbbdev void *__libc_memalign(size_t alignment, size_t size) __TBB_ALIAS_ATTR_COPY(memalign);
288478de5b1Stbbdev void *__libc_pvalloc(size_t size) __TBB_ALIAS_ATTR_COPY(pvalloc);
289478de5b1Stbbdev void *__libc_valloc(size_t size) __TBB_ALIAS_ATTR_COPY(valloc);
29051c0b2f7Stbbdev 
29151c0b2f7Stbbdev // call original __libc_* to support naive replacement of free via __libc_free etc
29251c0b2f7Stbbdev void __libc_free(void *ptr)
29351c0b2f7Stbbdev {
29451c0b2f7Stbbdev     InitOrigPointers();
29551c0b2f7Stbbdev     __TBB_malloc_safer_free(ptr, (void (*)(void*))orig_libc_free);
29651c0b2f7Stbbdev }
29751c0b2f7Stbbdev 
29851c0b2f7Stbbdev void *__libc_realloc(void *ptr, size_t size)
29951c0b2f7Stbbdev {
30051c0b2f7Stbbdev     InitOrigPointers();
30151c0b2f7Stbbdev     return __TBB_malloc_safer_realloc(ptr, size, orig_libc_realloc);
30251c0b2f7Stbbdev }
30351c0b2f7Stbbdev #endif // !__ANDROID__
30451c0b2f7Stbbdev 
30551c0b2f7Stbbdev } /* extern "C" */
30651c0b2f7Stbbdev 
30751c0b2f7Stbbdev /*** replacements for global operators new and delete ***/
30851c0b2f7Stbbdev 
30951c0b2f7Stbbdev void* operator new(size_t sz) {
31051c0b2f7Stbbdev     return InternalOperatorNew(sz);
31151c0b2f7Stbbdev }
31251c0b2f7Stbbdev void* operator new[](size_t sz) {
31351c0b2f7Stbbdev     return InternalOperatorNew(sz);
31451c0b2f7Stbbdev }
31551c0b2f7Stbbdev void operator delete(void* ptr) noexcept {
31651c0b2f7Stbbdev     InitOrigPointers();
31751c0b2f7Stbbdev     __TBB_malloc_safer_free(ptr, (void (*)(void*))orig_free);
31851c0b2f7Stbbdev }
31951c0b2f7Stbbdev void operator delete[](void* ptr) noexcept {
32051c0b2f7Stbbdev     InitOrigPointers();
32151c0b2f7Stbbdev     __TBB_malloc_safer_free(ptr, (void (*)(void*))orig_free);
32251c0b2f7Stbbdev }
32351c0b2f7Stbbdev void* operator new(size_t sz, const std::nothrow_t&) noexcept {
32451c0b2f7Stbbdev     return scalable_malloc(sz);
32551c0b2f7Stbbdev }
32651c0b2f7Stbbdev void* operator new[](std::size_t sz, const std::nothrow_t&) noexcept {
32751c0b2f7Stbbdev     return scalable_malloc(sz);
32851c0b2f7Stbbdev }
32951c0b2f7Stbbdev void operator delete(void* ptr, const std::nothrow_t&) noexcept {
33051c0b2f7Stbbdev     InitOrigPointers();
33151c0b2f7Stbbdev     __TBB_malloc_safer_free(ptr, (void (*)(void*))orig_free);
33251c0b2f7Stbbdev }
33351c0b2f7Stbbdev void operator delete[](void* ptr, const std::nothrow_t&) noexcept {
33451c0b2f7Stbbdev     InitOrigPointers();
33551c0b2f7Stbbdev     __TBB_malloc_safer_free(ptr, (void (*)(void*))orig_free);
33651c0b2f7Stbbdev }
33751c0b2f7Stbbdev 
33851c0b2f7Stbbdev #endif /* MALLOC_UNIXLIKE_OVERLOAD_ENABLED */
33951c0b2f7Stbbdev #endif /* MALLOC_UNIXLIKE_OVERLOAD_ENABLED || MALLOC_ZONE_OVERLOAD_ENABLED */
34051c0b2f7Stbbdev 
34151c0b2f7Stbbdev #ifdef _WIN32
34251c0b2f7Stbbdev #include <windows.h>
34351c0b2f7Stbbdev 
34451c0b2f7Stbbdev #if !__TBB_WIN8UI_SUPPORT
34551c0b2f7Stbbdev 
34651c0b2f7Stbbdev #include <stdio.h>
34751c0b2f7Stbbdev 
34851c0b2f7Stbbdev #include "function_replacement.h"
34951c0b2f7Stbbdev 
35051c0b2f7Stbbdev template<typename T, size_t N> // generic function to find length of array
35151c0b2f7Stbbdev inline size_t arrayLength(const T(&)[N]) {
35251c0b2f7Stbbdev     return N;
35351c0b2f7Stbbdev }
35451c0b2f7Stbbdev 
35551c0b2f7Stbbdev void __TBB_malloc_safer_delete( void *ptr)
35651c0b2f7Stbbdev {
35751c0b2f7Stbbdev     __TBB_malloc_safer_free( ptr, NULL );
35851c0b2f7Stbbdev }
35951c0b2f7Stbbdev 
36051c0b2f7Stbbdev void* safer_aligned_malloc( size_t size, size_t alignment )
36151c0b2f7Stbbdev {
36251c0b2f7Stbbdev     // workaround for "is power of 2 pow N" bug that accepts zeros
36351c0b2f7Stbbdev     return scalable_aligned_malloc( size, alignment>sizeof(size_t*)?alignment:sizeof(size_t*) );
36451c0b2f7Stbbdev }
36551c0b2f7Stbbdev 
36651c0b2f7Stbbdev // we do not support _expand();
36751c0b2f7Stbbdev void* safer_expand( void *, size_t )
36851c0b2f7Stbbdev {
36951c0b2f7Stbbdev     return NULL;
37051c0b2f7Stbbdev }
37151c0b2f7Stbbdev 
37251c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(CRTLIB)                                             \
37351c0b2f7Stbbdev void (*orig_free_##CRTLIB)(void*);                                                                   \
37451c0b2f7Stbbdev void __TBB_malloc_safer_free_##CRTLIB(void *ptr)                                                     \
37551c0b2f7Stbbdev {                                                                                                    \
37651c0b2f7Stbbdev     __TBB_malloc_safer_free( ptr, orig_free_##CRTLIB );                                              \
37751c0b2f7Stbbdev }                                                                                                    \
37851c0b2f7Stbbdev                                                                                                      \
37951c0b2f7Stbbdev void (*orig__aligned_free_##CRTLIB)(void*);                                                          \
38051c0b2f7Stbbdev void __TBB_malloc_safer__aligned_free_##CRTLIB(void *ptr)                                            \
38151c0b2f7Stbbdev {                                                                                                    \
38251c0b2f7Stbbdev     __TBB_malloc_safer_free( ptr, orig__aligned_free_##CRTLIB );                                     \
38351c0b2f7Stbbdev }                                                                                                    \
38451c0b2f7Stbbdev                                                                                                      \
38551c0b2f7Stbbdev size_t (*orig__msize_##CRTLIB)(void*);                                                               \
38651c0b2f7Stbbdev size_t __TBB_malloc_safer__msize_##CRTLIB(void *ptr)                                                 \
38751c0b2f7Stbbdev {                                                                                                    \
38851c0b2f7Stbbdev     return __TBB_malloc_safer_msize( ptr, orig__msize_##CRTLIB );                                    \
38951c0b2f7Stbbdev }                                                                                                    \
39051c0b2f7Stbbdev                                                                                                      \
39151c0b2f7Stbbdev size_t (*orig__aligned_msize_##CRTLIB)(void*, size_t, size_t);                                       \
39251c0b2f7Stbbdev size_t __TBB_malloc_safer__aligned_msize_##CRTLIB( void *ptr, size_t alignment, size_t offset)       \
39351c0b2f7Stbbdev {                                                                                                    \
39451c0b2f7Stbbdev     return __TBB_malloc_safer_aligned_msize( ptr, alignment, offset, orig__aligned_msize_##CRTLIB ); \
39551c0b2f7Stbbdev }                                                                                                    \
39651c0b2f7Stbbdev                                                                                                      \
39751c0b2f7Stbbdev void* __TBB_malloc_safer_realloc_##CRTLIB( void *ptr, size_t size )                                  \
39851c0b2f7Stbbdev {                                                                                                    \
39951c0b2f7Stbbdev     orig_ptrs func_ptrs = {orig_free_##CRTLIB, orig__msize_##CRTLIB};                                \
40051c0b2f7Stbbdev     return __TBB_malloc_safer_realloc( ptr, size, &func_ptrs );                                      \
40151c0b2f7Stbbdev }                                                                                                    \
40251c0b2f7Stbbdev                                                                                                      \
40351c0b2f7Stbbdev void* __TBB_malloc_safer__aligned_realloc_##CRTLIB( void *ptr, size_t size, size_t alignment )       \
40451c0b2f7Stbbdev {                                                                                                    \
40551c0b2f7Stbbdev     orig_aligned_ptrs func_ptrs = {orig__aligned_free_##CRTLIB, orig__aligned_msize_##CRTLIB};       \
40651c0b2f7Stbbdev     return __TBB_malloc_safer_aligned_realloc( ptr, size, alignment, &func_ptrs );                   \
40751c0b2f7Stbbdev }
40851c0b2f7Stbbdev 
40951c0b2f7Stbbdev // Only for ucrtbase: substitution for _o_free
41051c0b2f7Stbbdev void (*orig__o_free)(void*);
41151c0b2f7Stbbdev void __TBB_malloc__o_free(void *ptr)
41251c0b2f7Stbbdev {
41351c0b2f7Stbbdev     __TBB_malloc_safer_free( ptr, orig__o_free );
41451c0b2f7Stbbdev }
41551c0b2f7Stbbdev // Only for ucrtbase: substitution for _free_base
41651c0b2f7Stbbdev void(*orig__free_base)(void*);
41751c0b2f7Stbbdev void __TBB_malloc__free_base(void *ptr)
41851c0b2f7Stbbdev {
41951c0b2f7Stbbdev     __TBB_malloc_safer_free(ptr, orig__free_base);
42051c0b2f7Stbbdev }
42151c0b2f7Stbbdev 
42251c0b2f7Stbbdev // Size limit is MAX_PATTERN_SIZE (28) byte codes / 56 symbols per line.
42351c0b2f7Stbbdev // * can be used to match any digit in byte codes.
42451c0b2f7Stbbdev // # followed by several * indicate a relative address that needs to be corrected.
42551c0b2f7Stbbdev // Purpose of the pattern is to mark an instruction bound; it should consist of several
42651c0b2f7Stbbdev // full instructions plus one extra byte code. It's not required for the patterns
42751c0b2f7Stbbdev // to be unique (i.e., it's OK to have same pattern for unrelated functions).
42851c0b2f7Stbbdev // TODO: use hot patch prologues if exist
42951c0b2f7Stbbdev const char* known_bytecodes[] = {
43051c0b2f7Stbbdev #if _WIN64
43151c0b2f7Stbbdev //  "========================================================" - 56 symbols
43251c0b2f7Stbbdev     "4883EC284885C974",       // release free()
43351c0b2f7Stbbdev     "4883EC284885C975",       // release _msize()
43451c0b2f7Stbbdev     "4885C974375348",         // release free() 8.0.50727.42, 10.0
43551c0b2f7Stbbdev     "E907000000CCCC",         // release _aligned_msize(), _aligned_free() ucrtbase.dll
43651c0b2f7Stbbdev     "C7442410000000008B",     // release free() ucrtbase.dll 10.0.14393.33
43751c0b2f7Stbbdev     "E90B000000CCCC",         // release _msize() ucrtbase.dll 10.0.14393.33
43851c0b2f7Stbbdev     "48895C24085748",         // release _aligned_msize() ucrtbase.dll 10.0.14393.33
43951c0b2f7Stbbdev     "E903000000CCCC",         // release _aligned_msize() ucrtbase.dll 10.0.16299.522
44051c0b2f7Stbbdev     "48894C24084883EC28BA",   // debug prologue
44151c0b2f7Stbbdev     "4C894424184889542410",   // debug _aligned_msize() 10.0
44251c0b2f7Stbbdev     "48894C24084883EC2848",   // debug _aligned_free 10.0
44351c0b2f7Stbbdev     "488BD1488D0D#*******E9", // _o_free(), ucrtbase.dll
44451c0b2f7Stbbdev  #if __TBB_OVERLOAD_OLD_MSVCR
44551c0b2f7Stbbdev     "48895C2408574883EC3049", // release _aligned_msize 9.0
44651c0b2f7Stbbdev     "4883EC384885C975",       // release _msize() 9.0
44751c0b2f7Stbbdev     "4C8BC1488B0DA6E4040033", // an old win64 SDK
44851c0b2f7Stbbdev  #endif
44951c0b2f7Stbbdev #else // _WIN32
45051c0b2f7Stbbdev //  "========================================================" - 56 symbols
45151c0b2f7Stbbdev     "8BFF558BEC8B",           // multiple
45251c0b2f7Stbbdev     "8BFF558BEC83",           // release free() & _msize() 10.0.40219.325, _msize() ucrtbase.dll
45351c0b2f7Stbbdev     "8BFF558BECFF",           // release _aligned_msize ucrtbase.dll
45451c0b2f7Stbbdev     "8BFF558BEC51",           // release free() & _msize() ucrtbase.dll 10.0.14393.33
45551c0b2f7Stbbdev     "558BEC8B450885C074",     // release _aligned_free 11.0
45651c0b2f7Stbbdev     "558BEC837D08000F",       // release _msize() 11.0.51106.1
45751c0b2f7Stbbdev     "558BEC837D08007419FF",   // release free() 11.0.50727.1
45851c0b2f7Stbbdev     "558BEC8B450885C075",     // release _aligned_msize() 11.0.50727.1
45951c0b2f7Stbbdev     "558BEC6A018B",           // debug free() & _msize() 11.0
46051c0b2f7Stbbdev     "558BEC8B451050",         // debug _aligned_msize() 11.0
46151c0b2f7Stbbdev     "558BEC8B450850",         // debug _aligned_free 11.0
46251c0b2f7Stbbdev     "8BFF558BEC6A",           // debug free() & _msize() 10.0.40219.325
46351c0b2f7Stbbdev  #if __TBB_OVERLOAD_OLD_MSVCR
46451c0b2f7Stbbdev     "6A1868********E8",       // release free() 8.0.50727.4053, 9.0
46551c0b2f7Stbbdev     "6A1C68********E8",       // release _msize() 8.0.50727.4053, 9.0
46651c0b2f7Stbbdev  #endif
46751c0b2f7Stbbdev #endif // _WIN64/_WIN32
46851c0b2f7Stbbdev     NULL
46951c0b2f7Stbbdev     };
47051c0b2f7Stbbdev 
47151c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY(CRT_VER,function_name,dbgsuffix) \
47251c0b2f7Stbbdev     ReplaceFunctionWithStore( #CRT_VER #dbgsuffix ".dll", #function_name, \
47351c0b2f7Stbbdev       (FUNCPTR)__TBB_malloc_safer_##function_name##_##CRT_VER##dbgsuffix, \
47451c0b2f7Stbbdev       known_bytecodes, (FUNCPTR*)&orig_##function_name##_##CRT_VER##dbgsuffix );
47551c0b2f7Stbbdev 
47651c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY_NO_FALLBACK(CRT_VER,function_name,dbgsuffix) \
47751c0b2f7Stbbdev     ReplaceFunctionWithStore( #CRT_VER #dbgsuffix ".dll", #function_name, \
47851c0b2f7Stbbdev       (FUNCPTR)__TBB_malloc_safer_##function_name##_##CRT_VER##dbgsuffix, 0, NULL );
47951c0b2f7Stbbdev 
48051c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY_REDIRECT(CRT_VER,function_name,dest_func,dbgsuffix) \
48151c0b2f7Stbbdev     ReplaceFunctionWithStore( #CRT_VER #dbgsuffix ".dll", #function_name, \
48251c0b2f7Stbbdev       (FUNCPTR)__TBB_malloc_safer_##dest_func##_##CRT_VER##dbgsuffix, 0, NULL );
48351c0b2f7Stbbdev 
48451c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_IMPL(CRT_VER,dbgsuffix)                             \
48551c0b2f7Stbbdev     if (BytecodesAreKnown(#CRT_VER #dbgsuffix ".dll")) {                                          \
48651c0b2f7Stbbdev       __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY(CRT_VER,free,dbgsuffix)                         \
48751c0b2f7Stbbdev       __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY(CRT_VER,_msize,dbgsuffix)                       \
48851c0b2f7Stbbdev       __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY_NO_FALLBACK(CRT_VER,realloc,dbgsuffix)          \
48951c0b2f7Stbbdev       __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY(CRT_VER,_aligned_free,dbgsuffix)                \
49051c0b2f7Stbbdev       __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY(CRT_VER,_aligned_msize,dbgsuffix)               \
49151c0b2f7Stbbdev       __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_ENTRY_NO_FALLBACK(CRT_VER,_aligned_realloc,dbgsuffix) \
49251c0b2f7Stbbdev     } else                                                                                        \
49351c0b2f7Stbbdev         SkipReplacement(#CRT_VER #dbgsuffix ".dll");
49451c0b2f7Stbbdev 
49551c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_RELEASE(CRT_VER) __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_IMPL(CRT_VER,)
49651c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_DEBUG(CRT_VER) __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_IMPL(CRT_VER,d)
49751c0b2f7Stbbdev 
49851c0b2f7Stbbdev #define __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(CRT_VER)     \
49951c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_RELEASE(CRT_VER) \
50051c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_DEBUG(CRT_VER)
50151c0b2f7Stbbdev 
50251c0b2f7Stbbdev #if __TBB_OVERLOAD_OLD_MSVCR
50351c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr70d);
50451c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr70);
50551c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr71d);
50651c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr71);
50751c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr80d);
50851c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr80);
50951c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr90d);
51051c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr90);
51151c0b2f7Stbbdev #endif
51251c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr100d);
51351c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr100);
51451c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr110d);
51551c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr110);
51651c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr120d);
51751c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(msvcr120);
51851c0b2f7Stbbdev __TBB_ORIG_ALLOCATOR_REPLACEMENT_WRAPPER(ucrtbase);
51951c0b2f7Stbbdev 
52051c0b2f7Stbbdev /*** replacements for global operators new and delete ***/
52151c0b2f7Stbbdev 
52251c0b2f7Stbbdev #if _MSC_VER && !defined(__INTEL_COMPILER)
52351c0b2f7Stbbdev #pragma warning( push )
52451c0b2f7Stbbdev #pragma warning( disable : 4290 )
52551c0b2f7Stbbdev #endif
52651c0b2f7Stbbdev 
52751c0b2f7Stbbdev /*** operator new overloads internals (Linux, Windows) ***/
52851c0b2f7Stbbdev 
52951c0b2f7Stbbdev void* operator_new(size_t sz) {
53051c0b2f7Stbbdev     return InternalOperatorNew(sz);
53151c0b2f7Stbbdev }
53251c0b2f7Stbbdev void* operator_new_arr(size_t sz) {
53351c0b2f7Stbbdev     return InternalOperatorNew(sz);
53451c0b2f7Stbbdev }
53551c0b2f7Stbbdev void operator_delete(void* ptr) noexcept {
53651c0b2f7Stbbdev     __TBB_malloc_safer_delete(ptr);
53751c0b2f7Stbbdev }
53851c0b2f7Stbbdev #if _MSC_VER && !defined(__INTEL_COMPILER)
53951c0b2f7Stbbdev #pragma warning( pop )
54051c0b2f7Stbbdev #endif
54151c0b2f7Stbbdev 
54251c0b2f7Stbbdev void operator_delete_arr(void* ptr) noexcept {
54351c0b2f7Stbbdev     __TBB_malloc_safer_delete(ptr);
54451c0b2f7Stbbdev }
54551c0b2f7Stbbdev void* operator_new_t(size_t sz, const std::nothrow_t&) noexcept {
54651c0b2f7Stbbdev     return scalable_malloc(sz);
54751c0b2f7Stbbdev }
54851c0b2f7Stbbdev void* operator_new_arr_t(std::size_t sz, const std::nothrow_t&) noexcept {
54951c0b2f7Stbbdev     return scalable_malloc(sz);
55051c0b2f7Stbbdev }
55151c0b2f7Stbbdev void operator_delete_t(void* ptr, const std::nothrow_t&) noexcept {
55251c0b2f7Stbbdev     __TBB_malloc_safer_delete(ptr);
55351c0b2f7Stbbdev }
55451c0b2f7Stbbdev void operator_delete_arr_t(void* ptr, const std::nothrow_t&) noexcept {
55551c0b2f7Stbbdev     __TBB_malloc_safer_delete(ptr);
55651c0b2f7Stbbdev }
55751c0b2f7Stbbdev 
55851c0b2f7Stbbdev struct Module {
55951c0b2f7Stbbdev     const char *name;
56051c0b2f7Stbbdev     bool        doFuncReplacement; // do replacement in the DLL
56151c0b2f7Stbbdev };
56251c0b2f7Stbbdev 
56351c0b2f7Stbbdev Module modules_to_replace[] = {
56451c0b2f7Stbbdev     {"msvcr100d.dll", true},
56551c0b2f7Stbbdev     {"msvcr100.dll", true},
56651c0b2f7Stbbdev     {"msvcr110d.dll", true},
56751c0b2f7Stbbdev     {"msvcr110.dll", true},
56851c0b2f7Stbbdev     {"msvcr120d.dll", true},
56951c0b2f7Stbbdev     {"msvcr120.dll", true},
57051c0b2f7Stbbdev     {"ucrtbase.dll", true},
57151c0b2f7Stbbdev //    "ucrtbased.dll" is not supported because of problems with _dbg functions
57251c0b2f7Stbbdev #if __TBB_OVERLOAD_OLD_MSVCR
57351c0b2f7Stbbdev     {"msvcr90d.dll", true},
57451c0b2f7Stbbdev     {"msvcr90.dll", true},
57551c0b2f7Stbbdev     {"msvcr80d.dll", true},
57651c0b2f7Stbbdev     {"msvcr80.dll", true},
57751c0b2f7Stbbdev     {"msvcr70d.dll", true},
57851c0b2f7Stbbdev     {"msvcr70.dll", true},
57951c0b2f7Stbbdev     {"msvcr71d.dll", true},
58051c0b2f7Stbbdev     {"msvcr71.dll", true},
58151c0b2f7Stbbdev #endif
58251c0b2f7Stbbdev #if __TBB_TODO
58351c0b2f7Stbbdev     // TODO: Try enabling replacement for non-versioned system binaries below
58451c0b2f7Stbbdev     {"msvcrtd.dll", true},
58551c0b2f7Stbbdev     {"msvcrt.dll", true},
58651c0b2f7Stbbdev #endif
58751c0b2f7Stbbdev     };
58851c0b2f7Stbbdev 
58951c0b2f7Stbbdev /*
59051c0b2f7Stbbdev We need to replace following functions:
59151c0b2f7Stbbdev malloc
59251c0b2f7Stbbdev calloc
59351c0b2f7Stbbdev _aligned_malloc
59451c0b2f7Stbbdev _expand (by dummy implementation)
59551c0b2f7Stbbdev ??2@YAPAXI@Z      operator new                         (ia32)
59651c0b2f7Stbbdev ??_U@YAPAXI@Z     void * operator new[] (size_t size)  (ia32)
59751c0b2f7Stbbdev ??3@YAXPAX@Z      operator delete                      (ia32)
59851c0b2f7Stbbdev ??_V@YAXPAX@Z     operator delete[]                    (ia32)
59951c0b2f7Stbbdev ??2@YAPEAX_K@Z    void * operator new(unsigned __int64)   (intel64)
60051c0b2f7Stbbdev ??_V@YAXPEAX@Z    void * operator new[](unsigned __int64) (intel64)
60151c0b2f7Stbbdev ??3@YAXPEAX@Z     operator delete                         (intel64)
60251c0b2f7Stbbdev ??_V@YAXPEAX@Z    operator delete[]                       (intel64)
60351c0b2f7Stbbdev ??2@YAPAXIABUnothrow_t@std@@@Z      void * operator new (size_t sz, const std::nothrow_t&) throw()  (optional)
60451c0b2f7Stbbdev ??_U@YAPAXIABUnothrow_t@std@@@Z     void * operator new[] (size_t sz, const std::nothrow_t&) throw() (optional)
60551c0b2f7Stbbdev 
60651c0b2f7Stbbdev and these functions have runtime-specific replacement:
60751c0b2f7Stbbdev realloc
60851c0b2f7Stbbdev free
60951c0b2f7Stbbdev _msize
61051c0b2f7Stbbdev _aligned_realloc
61151c0b2f7Stbbdev _aligned_free
61251c0b2f7Stbbdev _aligned_msize
61351c0b2f7Stbbdev */
61451c0b2f7Stbbdev 
61551c0b2f7Stbbdev typedef struct FRData_t {
61651c0b2f7Stbbdev     //char *_module;
61751c0b2f7Stbbdev     const char *_func;
61851c0b2f7Stbbdev     FUNCPTR _fptr;
61951c0b2f7Stbbdev     FRR_ON_ERROR _on_error;
62051c0b2f7Stbbdev } FRDATA;
62151c0b2f7Stbbdev 
62251c0b2f7Stbbdev FRDATA c_routines_to_replace[] = {
62351c0b2f7Stbbdev     { "malloc",  (FUNCPTR)scalable_malloc, FRR_FAIL },
62451c0b2f7Stbbdev     { "calloc",  (FUNCPTR)scalable_calloc, FRR_FAIL },
62551c0b2f7Stbbdev     { "_aligned_malloc",  (FUNCPTR)safer_aligned_malloc, FRR_FAIL },
62651c0b2f7Stbbdev     { "_expand",  (FUNCPTR)safer_expand, FRR_IGNORE },
62751c0b2f7Stbbdev };
62851c0b2f7Stbbdev 
62951c0b2f7Stbbdev FRDATA cxx_routines_to_replace[] = {
63051c0b2f7Stbbdev #if _WIN64
63151c0b2f7Stbbdev     { "??2@YAPEAX_K@Z", (FUNCPTR)operator_new, FRR_FAIL },
63251c0b2f7Stbbdev     { "??_U@YAPEAX_K@Z", (FUNCPTR)operator_new_arr, FRR_FAIL },
63351c0b2f7Stbbdev     { "??3@YAXPEAX@Z", (FUNCPTR)operator_delete, FRR_FAIL },
63451c0b2f7Stbbdev     { "??_V@YAXPEAX@Z", (FUNCPTR)operator_delete_arr, FRR_FAIL },
63551c0b2f7Stbbdev #else
63651c0b2f7Stbbdev     { "??2@YAPAXI@Z", (FUNCPTR)operator_new, FRR_FAIL },
63751c0b2f7Stbbdev     { "??_U@YAPAXI@Z", (FUNCPTR)operator_new_arr, FRR_FAIL },
63851c0b2f7Stbbdev     { "??3@YAXPAX@Z", (FUNCPTR)operator_delete, FRR_FAIL },
63951c0b2f7Stbbdev     { "??_V@YAXPAX@Z", (FUNCPTR)operator_delete_arr, FRR_FAIL },
64051c0b2f7Stbbdev #endif
64151c0b2f7Stbbdev     { "??2@YAPAXIABUnothrow_t@std@@@Z", (FUNCPTR)operator_new_t, FRR_IGNORE },
64251c0b2f7Stbbdev     { "??_U@YAPAXIABUnothrow_t@std@@@Z", (FUNCPTR)operator_new_arr_t, FRR_IGNORE }
64351c0b2f7Stbbdev };
64451c0b2f7Stbbdev 
64551c0b2f7Stbbdev #ifndef UNICODE
64651c0b2f7Stbbdev typedef char unicode_char_t;
64751c0b2f7Stbbdev #define WCHAR_SPEC "%s"
64851c0b2f7Stbbdev #else
64951c0b2f7Stbbdev typedef wchar_t unicode_char_t;
65051c0b2f7Stbbdev #define WCHAR_SPEC "%ls"
65151c0b2f7Stbbdev #endif
65251c0b2f7Stbbdev 
65351c0b2f7Stbbdev // Check that we recognize bytecodes that should be replaced by trampolines.
65451c0b2f7Stbbdev // If some functions have unknown prologue patterns, replacement should not be done.
65551c0b2f7Stbbdev bool BytecodesAreKnown(const unicode_char_t *dllName)
65651c0b2f7Stbbdev {
65751c0b2f7Stbbdev     const char *funcName[] = {"free", "_msize", "_aligned_free", "_aligned_msize", 0};
65851c0b2f7Stbbdev     HMODULE module = GetModuleHandle(dllName);
65951c0b2f7Stbbdev 
66051c0b2f7Stbbdev     if (!module)
66151c0b2f7Stbbdev         return false;
66251c0b2f7Stbbdev     for (int i=0; funcName[i]; i++)
66351c0b2f7Stbbdev         if (! IsPrologueKnown(dllName, funcName[i], known_bytecodes, module)) {
66451c0b2f7Stbbdev             fprintf(stderr, "TBBmalloc: skip allocation functions replacement in " WCHAR_SPEC
66551c0b2f7Stbbdev                     ": unknown prologue for function " WCHAR_SPEC "\n", dllName, funcName[i]);
66651c0b2f7Stbbdev             return false;
66751c0b2f7Stbbdev         }
66851c0b2f7Stbbdev     return true;
66951c0b2f7Stbbdev }
67051c0b2f7Stbbdev 
67151c0b2f7Stbbdev void SkipReplacement(const unicode_char_t *dllName)
67251c0b2f7Stbbdev {
67351c0b2f7Stbbdev #ifndef UNICODE
67451c0b2f7Stbbdev     const char *dllStr = dllName;
67551c0b2f7Stbbdev #else
67651c0b2f7Stbbdev     const size_t sz = 128; // all DLL name must fit
67751c0b2f7Stbbdev 
67851c0b2f7Stbbdev     char buffer[sz];
67951c0b2f7Stbbdev     size_t real_sz;
68051c0b2f7Stbbdev     char *dllStr = buffer;
68151c0b2f7Stbbdev 
68251c0b2f7Stbbdev     errno_t ret = wcstombs_s(&real_sz, dllStr, sz, dllName, sz-1);
68351c0b2f7Stbbdev     __TBB_ASSERT(!ret, "Dll name conversion failed");
68451c0b2f7Stbbdev #endif
68551c0b2f7Stbbdev 
68651c0b2f7Stbbdev     for (size_t i=0; i<arrayLength(modules_to_replace); i++)
68751c0b2f7Stbbdev         if (!strcmp(modules_to_replace[i].name, dllStr)) {
68851c0b2f7Stbbdev             modules_to_replace[i].doFuncReplacement = false;
68951c0b2f7Stbbdev             break;
69051c0b2f7Stbbdev         }
69151c0b2f7Stbbdev }
69251c0b2f7Stbbdev 
69351c0b2f7Stbbdev void ReplaceFunctionWithStore( const unicode_char_t *dllName, const char *funcName, FUNCPTR newFunc, const char ** opcodes, FUNCPTR* origFunc,  FRR_ON_ERROR on_error = FRR_FAIL )
69451c0b2f7Stbbdev {
69551c0b2f7Stbbdev     FRR_TYPE res = ReplaceFunction( dllName, funcName, newFunc, opcodes, origFunc );
69651c0b2f7Stbbdev 
69751c0b2f7Stbbdev     if (res == FRR_OK || res == FRR_NODLL || (res == FRR_NOFUNC && on_error == FRR_IGNORE))
69851c0b2f7Stbbdev         return;
69951c0b2f7Stbbdev 
70051c0b2f7Stbbdev     fprintf(stderr, "Failed to %s function %s in module %s\n",
70151c0b2f7Stbbdev             res==FRR_NOFUNC? "find" : "replace", funcName, dllName);
70251c0b2f7Stbbdev 
70351c0b2f7Stbbdev     // Unable to replace a required function
70451c0b2f7Stbbdev     // Aborting because incomplete replacement of memory management functions
70551c0b2f7Stbbdev     // may leave the program in an invalid state
70651c0b2f7Stbbdev     abort();
70751c0b2f7Stbbdev }
70851c0b2f7Stbbdev 
70951c0b2f7Stbbdev void doMallocReplacement()
71051c0b2f7Stbbdev {
71151c0b2f7Stbbdev     // Replace functions and keep backup of original code (separate for each runtime)
71251c0b2f7Stbbdev #if __TBB_OVERLOAD_OLD_MSVCR
71351c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(msvcr70)
71451c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(msvcr71)
71551c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(msvcr80)
71651c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(msvcr90)
71751c0b2f7Stbbdev #endif
71851c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(msvcr100)
71951c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(msvcr110)
72051c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL(msvcr120)
72151c0b2f7Stbbdev     __TBB_ORIG_ALLOCATOR_REPLACEMENT_CALL_RELEASE(ucrtbase)
72251c0b2f7Stbbdev 
72351c0b2f7Stbbdev     // Replace functions without storing original code
72451c0b2f7Stbbdev     for (size_t j = 0; j < arrayLength(modules_to_replace); j++) {
72551c0b2f7Stbbdev         if (!modules_to_replace[j].doFuncReplacement)
72651c0b2f7Stbbdev             continue;
72751c0b2f7Stbbdev         for (size_t i = 0; i < arrayLength(c_routines_to_replace); i++)
72851c0b2f7Stbbdev         {
72951c0b2f7Stbbdev             ReplaceFunctionWithStore( modules_to_replace[j].name, c_routines_to_replace[i]._func, c_routines_to_replace[i]._fptr, NULL, NULL,  c_routines_to_replace[i]._on_error );
73051c0b2f7Stbbdev         }
73151c0b2f7Stbbdev         if ( strcmp(modules_to_replace[j].name, "ucrtbase.dll") == 0 ) {
73251c0b2f7Stbbdev             HMODULE ucrtbase_handle = GetModuleHandle("ucrtbase.dll");
73351c0b2f7Stbbdev             if (!ucrtbase_handle)
73451c0b2f7Stbbdev                 continue;
73551c0b2f7Stbbdev             // If _o_free function is present and patchable, redirect it to tbbmalloc as well
73651c0b2f7Stbbdev             // This prevents issues with other _o_* functions which might allocate memory with malloc
73751c0b2f7Stbbdev             if ( IsPrologueKnown("ucrtbase.dll", "_o_free", known_bytecodes, ucrtbase_handle)) {
73851c0b2f7Stbbdev                 ReplaceFunctionWithStore( "ucrtbase.dll", "_o_free", (FUNCPTR)__TBB_malloc__o_free, known_bytecodes, (FUNCPTR*)&orig__o_free,  FRR_FAIL );
73951c0b2f7Stbbdev             }
74051c0b2f7Stbbdev             // Similarly for _free_base
74151c0b2f7Stbbdev             if (IsPrologueKnown("ucrtbase.dll", "_free_base", known_bytecodes, ucrtbase_handle)) {
74251c0b2f7Stbbdev                 ReplaceFunctionWithStore("ucrtbase.dll", "_free_base", (FUNCPTR)__TBB_malloc__free_base, known_bytecodes, (FUNCPTR*)&orig__free_base, FRR_FAIL);
74351c0b2f7Stbbdev             }
74451c0b2f7Stbbdev             // ucrtbase.dll does not export operator new/delete, so skip the rest of the loop.
74551c0b2f7Stbbdev             continue;
74651c0b2f7Stbbdev         }
74751c0b2f7Stbbdev 
74851c0b2f7Stbbdev         for (size_t i = 0; i < arrayLength(cxx_routines_to_replace); i++)
74951c0b2f7Stbbdev         {
75051c0b2f7Stbbdev #if !_WIN64
75151c0b2f7Stbbdev             // in Microsoft* Visual Studio* 2012 and 2013 32-bit operator delete consists of 2 bytes only: short jump to free(ptr);
75251c0b2f7Stbbdev             // replacement should be skipped for this particular case.
75351c0b2f7Stbbdev             if ( ((strcmp(modules_to_replace[j].name, "msvcr110.dll") == 0) || (strcmp(modules_to_replace[j].name, "msvcr120.dll") == 0)) && (strcmp(cxx_routines_to_replace[i]._func, "??3@YAXPAX@Z") == 0) ) continue;
75451c0b2f7Stbbdev             // in Microsoft* Visual Studio* 2013 32-bit operator delete[] consists of 2 bytes only: short jump to free(ptr);
75551c0b2f7Stbbdev             // replacement should be skipped for this particular case.
75651c0b2f7Stbbdev             if ( (strcmp(modules_to_replace[j].name, "msvcr120.dll") == 0) && (strcmp(cxx_routines_to_replace[i]._func, "??_V@YAXPAX@Z") == 0) ) continue;
75751c0b2f7Stbbdev #endif
75851c0b2f7Stbbdev             ReplaceFunctionWithStore( modules_to_replace[j].name, cxx_routines_to_replace[i]._func, cxx_routines_to_replace[i]._fptr, NULL, NULL,  cxx_routines_to_replace[i]._on_error );
75951c0b2f7Stbbdev         }
76051c0b2f7Stbbdev     }
76151c0b2f7Stbbdev }
76251c0b2f7Stbbdev 
76351c0b2f7Stbbdev #endif // !__TBB_WIN8UI_SUPPORT
76451c0b2f7Stbbdev 
76551c0b2f7Stbbdev #if defined(_MSC_VER) && !defined(__INTEL_COMPILER)
76651c0b2f7Stbbdev     // Suppress warning for UWP build ('main' signature found without threading model)
76751c0b2f7Stbbdev     #pragma warning(push)
76851c0b2f7Stbbdev     #pragma warning(disable:4447)
76951c0b2f7Stbbdev #endif
77051c0b2f7Stbbdev 
77151c0b2f7Stbbdev extern "C" BOOL WINAPI DllMain( HINSTANCE hInst, DWORD callReason, LPVOID reserved )
77251c0b2f7Stbbdev {
77351c0b2f7Stbbdev 
77451c0b2f7Stbbdev     if ( callReason==DLL_PROCESS_ATTACH && reserved && hInst ) {
77551c0b2f7Stbbdev #if !__TBB_WIN8UI_SUPPORT
77651c0b2f7Stbbdev         if (!tbb::detail::r1::GetBoolEnvironmentVariable("TBB_MALLOC_DISABLE_REPLACEMENT"))
77751c0b2f7Stbbdev         {
77851c0b2f7Stbbdev             doMallocReplacement();
77951c0b2f7Stbbdev         }
78051c0b2f7Stbbdev #endif // !__TBB_WIN8UI_SUPPORT
78151c0b2f7Stbbdev     }
78251c0b2f7Stbbdev 
78351c0b2f7Stbbdev     return TRUE;
78451c0b2f7Stbbdev }
78551c0b2f7Stbbdev 
78651c0b2f7Stbbdev #if defined(_MSC_VER) && !defined(__INTEL_COMPILER)
78751c0b2f7Stbbdev     #pragma warning(pop)
78851c0b2f7Stbbdev #endif
78951c0b2f7Stbbdev 
79051c0b2f7Stbbdev // Just to make the linker happy and link the DLL to the application
79151c0b2f7Stbbdev extern "C" __declspec(dllexport) void __TBB_malloc_proxy()
79251c0b2f7Stbbdev {
79351c0b2f7Stbbdev 
79451c0b2f7Stbbdev }
79551c0b2f7Stbbdev 
79651c0b2f7Stbbdev #endif //_WIN32
797