| /* ===---------- emutls.c - Implements __emutls_get_address ---------------=== |
| * |
| * The LLVM Compiler Infrastructure |
| * |
| * This file is dual licensed under the MIT and the University of Illinois Open |
| * Source Licenses. See LICENSE.TXT for details. |
| * |
| * ===----------------------------------------------------------------------=== |
| */ |
| #include <stdint.h> |
| #include <stdlib.h> |
| #include <string.h> |
| |
| #include "int_lib.h" |
| #include "int_util.h" |
| |
| #ifdef __BIONIC__ |
| /* There are 4 pthread key cleanup rounds on Bionic. Delay emutls deallocation |
| to round 2. We need to delay deallocation because: |
| - Android versions older than M lack __cxa_thread_atexit_impl, so apps |
| use a pthread key destructor to call C++ destructors. |
| - Apps might use __thread/thread_local variables in pthread destructors. |
| We can't wait until the final two rounds, because jemalloc needs two rounds |
| after the final malloc/free call to free its thread-specific data (see |
| https://reviews.llvm.org/D46978#1107507). */ |
| #define EMUTLS_SKIP_DESTRUCTOR_ROUNDS 1 |
| #else |
| #define EMUTLS_SKIP_DESTRUCTOR_ROUNDS 0 |
| #endif |
| |
| typedef struct emutls_address_array { |
| uintptr_t skip_destructor_rounds; |
| uintptr_t size; /* number of elements in the 'data' array */ |
| void* data[]; |
| } emutls_address_array; |
| |
| static void emutls_shutdown(emutls_address_array *array); |
| |
| #ifndef _WIN32 |
| |
| #include <pthread.h> |
| |
| static pthread_mutex_t emutls_mutex = PTHREAD_MUTEX_INITIALIZER; |
| static pthread_key_t emutls_pthread_key; |
| |
| typedef unsigned int gcc_word __attribute__((mode(word))); |
| typedef unsigned int gcc_pointer __attribute__((mode(pointer))); |
| |
| /* Default is not to use posix_memalign, so systems like Android |
| * can use thread local data without heavier POSIX memory allocators. |
| */ |
| #ifndef EMUTLS_USE_POSIX_MEMALIGN |
| #define EMUTLS_USE_POSIX_MEMALIGN 0 |
| #endif |
| |
| static __inline void *emutls_memalign_alloc(size_t align, size_t size) { |
| void *base; |
| #if EMUTLS_USE_POSIX_MEMALIGN |
| if (posix_memalign(&base, align, size) != 0) |
| abort(); |
| #else |
| #define EXTRA_ALIGN_PTR_BYTES (align - 1 + sizeof(void*)) |
| char* object; |
| if ((object = (char*)malloc(EXTRA_ALIGN_PTR_BYTES + size)) == NULL) |
| abort(); |
| base = (void*)(((uintptr_t)(object + EXTRA_ALIGN_PTR_BYTES)) |
| & ~(uintptr_t)(align - 1)); |
| |
| ((void**)base)[-1] = object; |
| #endif |
| return base; |
| } |
| |
| static __inline void emutls_memalign_free(void *base) { |
| #if EMUTLS_USE_POSIX_MEMALIGN |
| free(base); |
| #else |
| /* The mallocated address is in ((void**)base)[-1] */ |
| free(((void**)base)[-1]); |
| #endif |
| } |
| |
| static __inline void emutls_setspecific(emutls_address_array *value) { |
| pthread_setspecific(emutls_pthread_key, (void*) value); |
| } |
| |
| static __inline emutls_address_array* emutls_getspecific() { |
| return (emutls_address_array*) pthread_getspecific(emutls_pthread_key); |
| } |
| |
| static void emutls_key_destructor(void* ptr) { |
| emutls_address_array *array = (emutls_address_array*)ptr; |
| if (array->skip_destructor_rounds > 0) { |
| /* emutls is deallocated using a pthread key destructor. These |
| * destructors are called in several rounds to accommodate destructor |
| * functions that (re)initialize key values with pthread_setspecific. |
| * Delay the emutls deallocation to accommodate other end-of-thread |
| * cleanup tasks like calling thread_local destructors (e.g. the |
| * __cxa_thread_atexit fallback in libc++abi). |
| */ |
| array->skip_destructor_rounds--; |
| emutls_setspecific(array); |
| } else { |
| emutls_shutdown(array); |
| free(ptr); |
| } |
| } |
| |
| static __inline void emutls_init(void) { |
| if (pthread_key_create(&emutls_pthread_key, emutls_key_destructor) != 0) |
| abort(); |
| } |
| |
| static __inline void emutls_init_once(void) { |
| static pthread_once_t once = PTHREAD_ONCE_INIT; |
| pthread_once(&once, emutls_init); |
| } |
| |
| static __inline void emutls_lock() { |
| pthread_mutex_lock(&emutls_mutex); |
| } |
| |
| static __inline void emutls_unlock() { |
| pthread_mutex_unlock(&emutls_mutex); |
| } |
| |
| #else /* _WIN32 */ |
| |
| #include <windows.h> |
| #include <malloc.h> |
| #include <stdio.h> |
| #include <assert.h> |
| |
| static LPCRITICAL_SECTION emutls_mutex; |
| static DWORD emutls_tls_index = TLS_OUT_OF_INDEXES; |
| |
| typedef uintptr_t gcc_word; |
| typedef void * gcc_pointer; |
| |
| static void win_error(DWORD last_err, const char *hint) { |
| char *buffer = NULL; |
| if (FormatMessageA(FORMAT_MESSAGE_ALLOCATE_BUFFER | |
| FORMAT_MESSAGE_FROM_SYSTEM | |
| FORMAT_MESSAGE_MAX_WIDTH_MASK, |
| NULL, last_err, 0, (LPSTR)&buffer, 1, NULL)) { |
| fprintf(stderr, "Windows error: %s\n", buffer); |
| } else { |
| fprintf(stderr, "Unkown Windows error: %s\n", hint); |
| } |
| LocalFree(buffer); |
| } |
| |
| static __inline void win_abort(DWORD last_err, const char *hint) { |
| win_error(last_err, hint); |
| abort(); |
| } |
| |
| static __inline void *emutls_memalign_alloc(size_t align, size_t size) { |
| void *base = _aligned_malloc(size, align); |
| if (!base) |
| win_abort(GetLastError(), "_aligned_malloc"); |
| return base; |
| } |
| |
| static __inline void emutls_memalign_free(void *base) { |
| _aligned_free(base); |
| } |
| |
| static void emutls_exit(void) { |
| if (emutls_mutex) { |
| DeleteCriticalSection(emutls_mutex); |
| _aligned_free(emutls_mutex); |
| emutls_mutex = NULL; |
| } |
| if (emutls_tls_index != TLS_OUT_OF_INDEXES) { |
| emutls_shutdown((emutls_address_array*)TlsGetValue(emutls_tls_index)); |
| TlsFree(emutls_tls_index); |
| emutls_tls_index = TLS_OUT_OF_INDEXES; |
| } |
| } |
| |
| #pragma warning (push) |
| #pragma warning (disable : 4100) |
| static BOOL CALLBACK emutls_init(PINIT_ONCE p0, PVOID p1, PVOID *p2) { |
| emutls_mutex = (LPCRITICAL_SECTION)_aligned_malloc(sizeof(CRITICAL_SECTION), 16); |
| if (!emutls_mutex) { |
| win_error(GetLastError(), "_aligned_malloc"); |
| return FALSE; |
| } |
| InitializeCriticalSection(emutls_mutex); |
| |
| emutls_tls_index = TlsAlloc(); |
| if (emutls_tls_index == TLS_OUT_OF_INDEXES) { |
| emutls_exit(); |
| win_error(GetLastError(), "TlsAlloc"); |
| return FALSE; |
| } |
| atexit(&emutls_exit); |
| return TRUE; |
| } |
| |
| static __inline void emutls_init_once(void) { |
| static INIT_ONCE once; |
| InitOnceExecuteOnce(&once, emutls_init, NULL, NULL); |
| } |
| |
| static __inline void emutls_lock() { |
| EnterCriticalSection(emutls_mutex); |
| } |
| |
| static __inline void emutls_unlock() { |
| LeaveCriticalSection(emutls_mutex); |
| } |
| |
| static __inline void emutls_setspecific(emutls_address_array *value) { |
| if (TlsSetValue(emutls_tls_index, (LPVOID) value) == 0) |
| win_abort(GetLastError(), "TlsSetValue"); |
| } |
| |
| static __inline emutls_address_array* emutls_getspecific() { |
| LPVOID value = TlsGetValue(emutls_tls_index); |
| if (value == NULL) { |
| const DWORD err = GetLastError(); |
| if (err != ERROR_SUCCESS) |
| win_abort(err, "TlsGetValue"); |
| } |
| return (emutls_address_array*) value; |
| } |
| |
| /* Provide atomic load/store functions for emutls_get_index if built with MSVC. |
| */ |
| #if !defined(__ATOMIC_RELEASE) |
| #include <intrin.h> |
| |
| enum { __ATOMIC_ACQUIRE = 2, __ATOMIC_RELEASE = 3 }; |
| |
| static __inline uintptr_t __atomic_load_n(void *ptr, unsigned type) { |
| assert(type == __ATOMIC_ACQUIRE); |
| // These return the previous value - but since we do an OR with 0, |
| // it's equivalent to a plain load. |
| #ifdef _WIN64 |
| return InterlockedOr64(ptr, 0); |
| #else |
| return InterlockedOr(ptr, 0); |
| #endif |
| } |
| |
| static __inline void __atomic_store_n(void *ptr, uintptr_t val, unsigned type) { |
| assert(type == __ATOMIC_RELEASE); |
| InterlockedExchangePointer((void *volatile *)ptr, (void *)val); |
| } |
| |
| #endif /* __ATOMIC_RELEASE */ |
| |
| #pragma warning (pop) |
| |
| #endif /* _WIN32 */ |
| |
| static size_t emutls_num_object = 0; /* number of allocated TLS objects */ |
| |
| /* Free the allocated TLS data |
| */ |
| static void emutls_shutdown(emutls_address_array *array) { |
| if (array) { |
| uintptr_t i; |
| for (i = 0; i < array->size; ++i) { |
| if (array->data[i]) |
| emutls_memalign_free(array->data[i]); |
| } |
| } |
| } |
| |
| /* For every TLS variable xyz, |
| * there is one __emutls_control variable named __emutls_v.xyz. |
| * If xyz has non-zero initial value, __emutls_v.xyz's "value" |
| * will point to __emutls_t.xyz, which has the initial value. |
| */ |
| typedef struct __emutls_control { |
| /* Must use gcc_word here, instead of size_t, to match GCC. When |
| gcc_word is larger than size_t, the upper extra bits are all |
| zeros. We can use variables of size_t to operate on size and |
| align. */ |
| gcc_word size; /* size of the object in bytes */ |
| gcc_word align; /* alignment of the object in bytes */ |
| union { |
| uintptr_t index; /* data[index-1] is the object address */ |
| void* address; /* object address, when in single thread env */ |
| } object; |
| void* value; /* null or non-zero initial value for the object */ |
| } __emutls_control; |
| |
| /* Emulated TLS objects are always allocated at run-time. */ |
| static __inline void *emutls_allocate_object(__emutls_control *control) { |
| /* Use standard C types, check with gcc's emutls.o. */ |
| COMPILE_TIME_ASSERT(sizeof(uintptr_t) == sizeof(gcc_pointer)); |
| COMPILE_TIME_ASSERT(sizeof(uintptr_t) == sizeof(void*)); |
| |
| size_t size = control->size; |
| size_t align = control->align; |
| void* base; |
| if (align < sizeof(void*)) |
| align = sizeof(void*); |
| /* Make sure that align is power of 2. */ |
| if ((align & (align - 1)) != 0) |
| abort(); |
| |
| base = emutls_memalign_alloc(align, size); |
| if (control->value) |
| memcpy(base, control->value, size); |
| else |
| memset(base, 0, size); |
| return base; |
| } |
| |
| |
| /* Returns control->object.index; set index if not allocated yet. */ |
| static __inline uintptr_t emutls_get_index(__emutls_control *control) { |
| uintptr_t index = __atomic_load_n(&control->object.index, __ATOMIC_ACQUIRE); |
| if (!index) { |
| emutls_init_once(); |
| emutls_lock(); |
| index = control->object.index; |
| if (!index) { |
| index = ++emutls_num_object; |
| __atomic_store_n(&control->object.index, index, __ATOMIC_RELEASE); |
| } |
| emutls_unlock(); |
| } |
| return index; |
| } |
| |
| /* Updates newly allocated thread local emutls_address_array. */ |
| static __inline void emutls_check_array_set_size(emutls_address_array *array, |
| uintptr_t size) { |
| if (array == NULL) |
| abort(); |
| array->size = size; |
| emutls_setspecific(array); |
| } |
| |
| /* Returns the new 'data' array size, number of elements, |
| * which must be no smaller than the given index. |
| */ |
| static __inline uintptr_t emutls_new_data_array_size(uintptr_t index) { |
| /* Need to allocate emutls_address_array with extra slots |
| * to store the header. |
| * Round up the emutls_address_array size to multiple of 16. |
| */ |
| uintptr_t header_words = sizeof(emutls_address_array) / sizeof(void *); |
| return ((index + header_words + 15) & ~((uintptr_t)15)) - header_words; |
| } |
| |
| /* Returns the size in bytes required for an emutls_address_array with |
| * N number of elements for data field. |
| */ |
| static __inline uintptr_t emutls_asize(uintptr_t N) { |
| return N * sizeof(void *) + sizeof(emutls_address_array); |
| } |
| |
| /* Returns the thread local emutls_address_array. |
| * Extends its size if necessary to hold address at index. |
| */ |
| static __inline emutls_address_array * |
| emutls_get_address_array(uintptr_t index) { |
| emutls_address_array* array = emutls_getspecific(); |
| if (array == NULL) { |
| uintptr_t new_size = emutls_new_data_array_size(index); |
| array = (emutls_address_array*) malloc(emutls_asize(new_size)); |
| if (array) { |
| memset(array->data, 0, new_size * sizeof(void*)); |
| array->skip_destructor_rounds = EMUTLS_SKIP_DESTRUCTOR_ROUNDS; |
| } |
| emutls_check_array_set_size(array, new_size); |
| } else if (index > array->size) { |
| uintptr_t orig_size = array->size; |
| uintptr_t new_size = emutls_new_data_array_size(index); |
| array = (emutls_address_array*) realloc(array, emutls_asize(new_size)); |
| if (array) |
| memset(array->data + orig_size, 0, |
| (new_size - orig_size) * sizeof(void*)); |
| emutls_check_array_set_size(array, new_size); |
| } |
| return array; |
| } |
| |
| void* __emutls_get_address(__emutls_control* control) { |
| uintptr_t index = emutls_get_index(control); |
| emutls_address_array* array = emutls_get_address_array(index--); |
| if (array->data[index] == NULL) |
| array->data[index] = emutls_allocate_object(control); |
| return array->data[index]; |
| } |