/*
* Fast TLS access for compatmalloc.
*
* Uses __thread with initial-exec TLS model to get direct fs: segment
* loads (~1-3 cycles) instead of __tls_get_addr PLT calls (~25 cycles)
* or pthread_getspecific PLT calls (~10-15 cycles).
*
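* The initial-exec model is safe for shared libraries that are loaded at
* program start (via LD_PRELOAD or DT_NEEDED), because their TLS is placed
* in the static TLS block. It is NOT safe for dlopen'd libraries: static
* TLS space may no longer be available when they are loaded.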
*/
/* Thread-local pointer: each thread gets its own instance, initialized to 0.
 * NOTE(review): no identifier is visible between the pointer type and the
 * initializer on this line, so the declaration does not compile as shown --
 * confirm the variable name against the original file. */
__thread void * = 0;
void *
void