src/jemalloc.c - platform/external/jemalloc_new - Git at Google

 #include "jemalloc/internal/jemalloc_preamble.h"
 #include "jemalloc/internal/jemalloc_internal_includes.h"

 #include "jemalloc/internal/assert.h"
 #include "jemalloc/internal/atomic.h"
 #include "jemalloc/internal/buf_writer.h"
 #include "jemalloc/internal/ctl.h"
 #include "jemalloc/internal/emap.h"
 #include "jemalloc/internal/extent_dss.h"
 #include "jemalloc/internal/extent_mmap.h"
 #include "jemalloc/internal/fxp.h"
 #include "jemalloc/internal/san.h"
 #include "jemalloc/internal/hook.h"
 #include "jemalloc/internal/jemalloc_internal_types.h"
 #include "jemalloc/internal/log.h"
 #include "jemalloc/internal/malloc_io.h"
 #include "jemalloc/internal/mutex.h"
 #include "jemalloc/internal/nstime.h"
 #include "jemalloc/internal/rtree.h"
 #include "jemalloc/internal/safety_check.h"
 #include "jemalloc/internal/sc.h"
 #include "jemalloc/internal/spin.h"
 #include "jemalloc/internal/sz.h"
 #include "jemalloc/internal/ticker.h"
 #include "jemalloc/internal/thread_event.h"
 #include "jemalloc/internal/util.h"

 #include "jemalloc/internal/conf.h"

 /******************************************************************************/
 /* Data. */

 /* Runtime configuration options. */
 const char *je_malloc_conf
 #ifndef _WIN32
     JEMALLOC_ATTR(weak)
 #endif
         ;
 /*
  * The usual rule is that the closer to runtime you are, the higher priority
  * your configuration settings are (so the jemalloc config options get lower
  * priority than the per-binary setting, which gets lower priority than the /etc
  * setting, which gets lower priority than the environment settings).
  *
  * But it's a fairly common use case in some testing environments for a user to
  * be able to control the binary, but nothing else (e.g. a performancy canary
  * uses the production OS and environment variables, but can run any binary in
  * those circumstances).  For these use cases, it's handy to have an in-binary
  * mechanism for overriding environment variable settings, with the idea that if
  * the results are positive they get promoted to the official settings, and
  * moved from the binary to the environment variable.
  *
  * We don't actually want this to be widespread, so we'll give it a silly name
  * and not mention it in headers or documentation.
  */
 const char *je_malloc_conf_2_conf_harder
 #ifndef _WIN32
     JEMALLOC_ATTR(weak)
 #endif
         ;

 const char *opt_malloc_conf_symlink = NULL;
 const char *opt_malloc_conf_env_var = NULL;

 bool opt_abort =
 #ifdef JEMALLOC_DEBUG
     true
 #else
     false
 #endif
     ;
 bool opt_abort_conf =
 #ifdef JEMALLOC_DEBUG
     true
 #else
     false
 #endif
     ;
 /* Intentionally default off, even with debug builds. */
 bool        opt_confirm_conf = false;
 const char *opt_junk =
 #if (defined(JEMALLOC_DEBUG) && defined(JEMALLOC_FILL))
     "true"
 #else
     "false"
 #endif
     ;
 bool opt_junk_alloc =
 #if (defined(JEMALLOC_DEBUG) && defined(JEMALLOC_FILL))
     true
 #else
     false
 #endif
     ;
 bool opt_junk_free =
 #if (defined(JEMALLOC_DEBUG) && defined(JEMALLOC_FILL))
     true
 #else
     false
 #endif
     ;
 bool opt_trust_madvise =
 #ifdef JEMALLOC_PURGE_MADVISE_DONTNEED_ZEROS
     false
 #else
     true
 #endif
     ;

 bool opt_cache_oblivious =
 #ifdef JEMALLOC_CACHE_OBLIVIOUS
     true
 #else
     false
 #endif
     ;

 zero_realloc_action_t opt_zero_realloc_action =
 #ifdef JEMALLOC_ZERO_REALLOC_DEFAULT_FREE
     zero_realloc_action_free
 #else
     zero_realloc_action_alloc
 #endif
     ;

 atomic_zu_t zero_realloc_count = ATOMIC_INIT(0);

 /*
  * Disable large size classes is now the default behavior in jemalloc.
  * Although it is configurable in MALLOC_CONF, this is mainly for debugging
  * purposes and should not be tuned.
  */
 bool opt_disable_large_size_classes = true;

 const char *const zero_realloc_mode_names[] = {
     "alloc",
     "free",
     "abort",
 };

 /*
  * These are the documented values for junk fill debugging facilities -- see the
  * man page.
  */
 static const uint8_t junk_alloc_byte = 0xa5;
 static const uint8_t junk_free_byte = 0x5a;

 static void
 default_junk_alloc(void *ptr, size_t usize) {
 	memset(ptr, junk_alloc_byte, usize);
 }

 static void
 default_junk_free(void *ptr, size_t usize) {
 	memset(ptr, junk_free_byte, usize);
 }

 void (*JET_MUTABLE junk_alloc_callback)(
     void *ptr, size_t size) = &default_junk_alloc;
 void (*JET_MUTABLE junk_free_callback)(
     void *ptr, size_t size) = &default_junk_free;
 void (*JET_MUTABLE invalid_conf_abort)(void) = &abort;

 bool         opt_utrace = false;
 bool         opt_xmalloc = false;
 bool         opt_experimental_infallible_new = false;
 bool         opt_experimental_tcache_gc = true;
 bool         opt_zero = false;
 unsigned     opt_narenas = 0;
 fxp_t opt_narenas_ratio = FXP_INIT_INT(4);

 unsigned ncpus;

 unsigned opt_debug_double_free_max_scan =
     SAFETY_CHECK_DOUBLE_FREE_MAX_SCAN_DEFAULT;

 size_t opt_calloc_madvise_threshold = CALLOC_MADVISE_THRESHOLD_DEFAULT;

 /* Protects arenas initialization. */
 static malloc_mutex_t arenas_lock;

 /* The global hpa, and whether it's on. */
 bool             opt_hpa = false;
 hpa_shard_opts_t opt_hpa_opts = HPA_SHARD_OPTS_DEFAULT;
 sec_opts_t       opt_hpa_sec_opts = SEC_OPTS_DEFAULT;

 /*
  * Arenas that are used to service external requests.  Not all elements of the
  * arenas array are necessarily used; arenas are created lazily as needed.
  *
  * arenas[0..narenas_auto) are used for automatic multiplexing of threads and
  * arenas.  arenas[narenas_auto..narenas_total) are only used if the application
  * takes some action to create them and allocate from them.
  *
  * Points to an arena_t.
  */
 JEMALLOC_ALIGNED(CACHELINE)
 atomic_p_t        arenas[MALLOCX_ARENA_LIMIT];
 static atomic_u_t narenas_total; /* Use narenas_total_*(). */
 /* Below three are read-only after initialization. */
 static arena_t *a0; /* arenas[0]. */
 unsigned        narenas_auto;
 unsigned        manual_arena_base;

 malloc_init_t malloc_init_state = malloc_init_uninitialized;

 /* False should be the common case.  Set to true to trigger initialization. */
 bool malloc_slow = true;

 /* When malloc_slow is true, set the corresponding bits for sanity check. */
 enum {
 	flag_opt_junk_alloc = (1U),
 	flag_opt_junk_free = (1U << 1),
 	flag_opt_zero = (1U << 2),
 	flag_opt_utrace = (1U << 3),
 	flag_opt_xmalloc = (1U << 4)
 };
 static uint8_t malloc_slow_flags;

 #ifdef JEMALLOC_THREADED_INIT
 /* Used to let the initializing thread recursively allocate. */
 #	define NO_INITIALIZER ((unsigned long)0)
 #	define INITIALIZER pthread_self()
 #	define IS_INITIALIZER                                                 \
 		(pthread_equal(malloc_initializer, pthread_self()))
 static pthread_t malloc_initializer = NO_INITIALIZER;
 #else
 #	define NO_INITIALIZER false
 #	define INITIALIZER true
 #	define IS_INITIALIZER malloc_initializer
 static bool malloc_initializer = NO_INITIALIZER;
 #endif

 /* Used to avoid initialization races. */
 #ifdef _WIN32
 #	if _WIN32_WINNT >= 0x0600
 static malloc_mutex_t init_lock = SRWLOCK_INIT;
 #	else
 static malloc_mutex_t init_lock;
 static bool           init_lock_initialized = false;

 JEMALLOC_ATTR(constructor)
 static void WINAPI
 _init_init_lock(void) {
 	/*
 	 * If another constructor in the same binary is using mallctl to e.g.
 	 * set up extent hooks, it may end up running before this one, and
 	 * malloc_init_hard will crash trying to lock the uninitialized lock. So
 	 * we force an initialization of the lock in malloc_init_hard as well.
 	 * We don't try to care about atomicity of the accessed to the
 	 * init_lock_initialized boolean, since it really only matters early in
 	 * the process creation, before any separate thread normally starts
 	 * doing anything.
 	 */
 	if (!init_lock_initialized) {
 		malloc_mutex_init(&init_lock, "init", WITNESS_RANK_INIT,
 		    malloc_mutex_rank_exclusive);
 	}
 	init_lock_initialized = true;
 }

 #		ifdef _MSC_VER
 #			pragma section(".CRT$XCU", read)
 JEMALLOC_SECTION(".CRT$XCU")
 JEMALLOC_ATTR(used)
 static const void(WINAPI *init_init_lock)(void) = _init_init_lock;
 #		endif
 #	endif
 #else
 static malloc_mutex_t init_lock = MALLOC_MUTEX_INITIALIZER;
 #endif

 typedef struct {
 	void  *p; /* Input pointer (as in realloc(p, s)). */
 	size_t s; /* Request size. */
 	void  *r; /* Result pointer. */
 } malloc_utrace_t;

 #ifdef JEMALLOC_UTRACE
 #	define UTRACE(a, b, c)                                                \
 		do {                                                           \
 			if (unlikely(opt_utrace)) {                            \
 				int             utrace_serrno = errno;         \
 				malloc_utrace_t ut;                            \
 				ut.p = (a);                                    \
 				ut.s = (b);                                    \
 				ut.r = (c);                                    \
 				UTRACE_CALL(&ut, sizeof(ut));                  \
 				errno = utrace_serrno;                         \
 			}                                                      \
 		} while (0)
 #else
 #	define UTRACE(a, b, c)
 #endif


 /******************************************************************************/
 /*
  * Function prototypes for static functions that are referenced prior to
  * definition.
  */

 static bool malloc_init_hard_a0(void);
 static bool malloc_init_hard(void);

 /******************************************************************************/
 /*
  * Begin miscellaneous support functions.
  */

 JEMALLOC_ALWAYS_INLINE bool
 malloc_init_a0(void) {
 	if (unlikely(malloc_init_state == malloc_init_uninitialized)) {
 		return malloc_init_hard_a0();
 	}
 	return false;
 }

 JEMALLOC_ALWAYS_INLINE bool
 malloc_init(void) {
 	if (unlikely(!malloc_initialized()) && malloc_init_hard()) {
 		return true;
 	}
 	return false;
 }

 /*
  * The a0*() functions are used instead of i{d,}alloc() in situations that
  * cannot tolerate TLS variable access.
  */

 static void *
 a0ialloc(size_t size, bool zero, bool is_internal) {
 	if (unlikely(malloc_init_a0())) {
 		return NULL;
 	}

 	return iallocztm(TSDN_NULL, size, sz_size2index(size), zero, NULL,
 	    is_internal, arena_get(TSDN_NULL, 0, true), true);
 }

 static void
 a0idalloc(void *ptr, bool is_internal) {
 	idalloctm(TSDN_NULL, ptr, NULL, NULL, is_internal, true);
 }

 void *
 a0malloc(size_t size) {
 	return a0ialloc(size, false, true);
 }

 void
 a0dalloc(void *ptr) {
 	a0idalloc(ptr, true);
 }

 /*
  * FreeBSD's libc uses the bootstrap_*() functions in bootstrap-sensitive
  * situations that cannot tolerate TLS variable access (TLS allocation and very
  * early internal data structure initialization).
  */

 void *
 bootstrap_malloc(size_t size) {
 	if (unlikely(size == 0)) {
 		size = 1;
 	}

 	return a0ialloc(size, false, false);
 }

 void *
 bootstrap_calloc(size_t num, size_t size) {
 	size_t num_size;

 	num_size = num * size;
 	if (unlikely(num_size == 0)) {
 		assert(num == 0 || size == 0);
 		num_size = 1;
 	}

 	return a0ialloc(num_size, true, false);
 }

 void
 bootstrap_free(void *ptr) {
 	if (unlikely(ptr == NULL)) {
 		return;
 	}

 	a0idalloc(ptr, false);
 }

 void
 arena_set(unsigned ind, arena_t *arena) {
 	atomic_store_p(&arenas[ind], arena, ATOMIC_RELEASE);
 }

 static void
 narenas_total_set(unsigned narenas) {
 	atomic_store_u(&narenas_total, narenas, ATOMIC_RELEASE);
 }

 static void
 narenas_total_inc(void) {
 	atomic_fetch_add_u(&narenas_total, 1, ATOMIC_RELEASE);
 }

 unsigned
 narenas_total_get(void) {
 	return atomic_load_u(&narenas_total, ATOMIC_ACQUIRE);
 }

 /* Create a new arena and insert it into the arenas array at index ind. */
 static arena_t *
 arena_init_locked(tsdn_t *tsdn, unsigned ind, const arena_config_t *config) {
 	arena_t *arena;

 	assert(ind <= narenas_total_get());
 	if (ind >= MALLOCX_ARENA_LIMIT) {
 		return NULL;
 	}
 	if (ind == narenas_total_get()) {
 		narenas_total_inc();
 	}

 	/*
 	 * Another thread may have already initialized arenas[ind] if it's an
 	 * auto arena.
 	 */
 	arena = arena_get(tsdn, ind, false);
 	if (arena != NULL) {
 		assert(arena_is_auto(arena));
 		return arena;
 	}

 	/* Actually initialize the arena. */
 	arena = arena_new(tsdn, ind, config);

 	return arena;
 }

 static void
 arena_new_create_background_thread(tsdn_t *tsdn, unsigned ind) {
 	if (ind == 0) {
 		return;
 	}

 	if (have_background_thread) {
 		if (background_thread_create(tsdn_tsd(tsdn), ind)) {
 			malloc_printf(
 			    "<jemalloc>: error in background thread "
 			    "creation for arena %u. Abort.\n",
 			    ind);
 			abort();
 		}
 	}
 }

 arena_t *
 arena_init(tsdn_t *tsdn, unsigned ind, const arena_config_t *config) {
 	arena_t *arena;

 	malloc_mutex_lock(tsdn, &arenas_lock);
 	arena = arena_init_locked(tsdn, ind, config);
 	malloc_mutex_unlock(tsdn, &arenas_lock);

 	arena_new_create_background_thread(tsdn, ind);

 	return arena;
 }

 static void
 arena_bind(tsd_t *tsd, unsigned ind, bool internal) {
 	arena_t *arena = arena_get(tsd_tsdn(tsd), ind, false);
 	arena_nthreads_inc(arena, internal);

 	if (internal) {
 		tsd_iarena_set(tsd, arena);
 	} else {
 		tsd_arena_set(tsd, arena);
 		/*
 		 * While shard acts as a random seed, the cast below should
 		 * not make much difference.
 		 */
 		uint8_t shard = (uint8_t)atomic_fetch_add_u(
 		    &arena->binshard_next, 1, ATOMIC_RELAXED);
 		tsd_binshards_t *bins = tsd_binshardsp_get(tsd);
 		for (unsigned i = 0; i < SC_NBINS; i++) {
 			assert(bin_infos[i].n_shards > 0
 			    && bin_infos[i].n_shards <= BIN_SHARDS_MAX);
 			bins->binshard[i] = shard % bin_infos[i].n_shards;
 		}
 	}
 }

 void
 arena_migrate(tsd_t *tsd, arena_t *oldarena, arena_t *newarena) {
 	assert(oldarena != NULL);
 	assert(newarena != NULL);

 	arena_nthreads_dec(oldarena, false);
 	arena_nthreads_inc(newarena, false);
 	tsd_arena_set(tsd, newarena);

 	if (arena_nthreads_get(oldarena, false) == 0
 	    && !background_thread_enabled()) {
 		/*
 		 * Purge if the old arena has no associated threads anymore and
 		 * no background threads.
 		 */
 		arena_decay(tsd_tsdn(tsd), oldarena,
 		    /* is_background_thread */ false, /* all */ true);
 	}
 }

 static void
 arena_unbind(tsd_t *tsd, unsigned ind, bool internal) {
 	arena_t *arena;

 	arena = arena_get(tsd_tsdn(tsd), ind, false);
 	arena_nthreads_dec(arena, internal);

 	if (internal) {
 		tsd_iarena_set(tsd, NULL);
 	} else {
 		tsd_arena_set(tsd, NULL);
 	}
 }

 /* Slow path, called only by arena_choose(). */
 arena_t *
 arena_choose_hard(tsd_t *tsd, bool internal) {
 	arena_t *ret JEMALLOC_CC_SILENCE_INIT(NULL);

 	if (have_percpu_arena && PERCPU_ARENA_ENABLED(opt_percpu_arena)) {
 		unsigned choose = percpu_arena_choose();
 		ret = arena_get(tsd_tsdn(tsd), choose, true);
 		assert(ret != NULL);
 		arena_bind(tsd, arena_ind_get(ret), false);
 		arena_bind(tsd, arena_ind_get(ret), true);

 		return ret;
 	}

 	if (narenas_auto > 1) {
 		unsigned i, j, choose[2], first_null;
 		bool     is_new_arena[2];

 		/*
 		 * Determine binding for both non-internal and internal
 		 * allocation.
 		 *
 		 *   choose[0]: For application allocation.
 		 *   choose[1]: For internal metadata allocation.
 		 */

 		for (j = 0; j < 2; j++) {
 			choose[j] = 0;
 			is_new_arena[j] = false;
 		}

 		first_null = narenas_auto;
 		malloc_mutex_lock(tsd_tsdn(tsd), &arenas_lock);
 		assert(arena_get(tsd_tsdn(tsd), 0, false) != NULL);
 		for (i = 1; i < narenas_auto; i++) {
 			if (arena_get(tsd_tsdn(tsd), i, false) != NULL) {
 				/*
 				 * Choose the first arena that has the lowest
 				 * number of threads assigned to it.
 				 */
 				for (j = 0; j < 2; j++) {
 					if (arena_nthreads_get(
 					        arena_get(
 					            tsd_tsdn(tsd), i, false),
 					        !!j)
 					    < arena_nthreads_get(
 					        arena_get(tsd_tsdn(tsd),
 					            choose[j], false),
 					        !!j)) {
 						choose[j] = i;
 					}
 				}
 			} else if (first_null == narenas_auto) {
 				/*
 				 * Record the index of the first uninitialized
 				 * arena, in case all extant arenas are in use.
 				 *
 				 * NB: It is possible for there to be
 				 * discontinuities in terms of initialized
 				 * versus uninitialized arenas, due to the
 				 * "thread.arena" mallctl.
 				 */
 				first_null = i;
 			}
 		}

 		for (j = 0; j < 2; j++) {
 			if (arena_nthreads_get(
 			        arena_get(tsd_tsdn(tsd), choose[j], false), !!j)
 			        == 0
 			    || first_null == narenas_auto) {
 				/*
 				 * Use an unloaded arena, or the least loaded
 				 * arena if all arenas are already initialized.
 				 */
 				if (!!j == internal) {
 					ret = arena_get(
 					    tsd_tsdn(tsd), choose[j], false);
 				}
 			} else {
 				arena_t *arena;

 				/* Initialize a new arena. */
 				choose[j] = first_null;
 				arena = arena_init_locked(tsd_tsdn(tsd),
 				    choose[j], &arena_config_default);
 				if (arena == NULL) {
 					malloc_mutex_unlock(
 					    tsd_tsdn(tsd), &arenas_lock);
 					return NULL;
 				}
 				is_new_arena[j] = true;
 				if (!!j == internal) {
 					ret = arena;
 				}
 			}
 			arena_bind(tsd, choose[j], !!j);
 		}
 		malloc_mutex_unlock(tsd_tsdn(tsd), &arenas_lock);

 		for (j = 0; j < 2; j++) {
 			if (is_new_arena[j]) {
 				assert(choose[j] > 0);
 				arena_new_create_background_thread(
 				    tsd_tsdn(tsd), choose[j]);
 			}
 		}

 	} else {
 		ret = arena_get(tsd_tsdn(tsd), 0, false);
 		arena_bind(tsd, 0, false);
 		arena_bind(tsd, 0, true);
 	}

 	return ret;
 }

 void
 iarena_cleanup(tsd_t *tsd) {
 	arena_t *iarena;

 	iarena = tsd_iarena_get(tsd);
 	if (iarena != NULL) {
 		arena_unbind(tsd, arena_ind_get(iarena), true);
 	}
 }

 void
 arena_cleanup(tsd_t *tsd) {
 	arena_t *arena;

 	arena = tsd_arena_get(tsd);
 	if (arena != NULL) {
 		arena_unbind(tsd, arena_ind_get(arena), false);
 	}
 }

 static void
 stats_print_atexit(void) {
 	if (config_stats) {
 		tsdn_t  *tsdn;
 		unsigned narenas, i;

 		tsdn = tsdn_fetch();

 		/*
 		 * Merge stats from extant threads.  This is racy, since
 		 * individual threads do not lock when recording tcache stats
 		 * events.  As a consequence, the final stats may be slightly
 		 * out of date by the time they are reported, if other threads
 		 * continue to allocate.
 		 */
 		for (i = 0, narenas = narenas_total_get(); i < narenas; i++) {
 			arena_t *arena = arena_get(tsdn, i, false);
 			if (arena != NULL) {
 				tcache_slow_t *tcache_slow;

 				malloc_mutex_lock(tsdn, &arena->tcache_ql_mtx);
 				ql_foreach (
 				    tcache_slow, &arena->tcache_ql, link) {
 					tcache_stats_merge(
 					    tsdn, tcache_slow->tcache, arena);
 				}
 				malloc_mutex_unlock(
 				    tsdn, &arena->tcache_ql_mtx);
 			}
 		}
 	}
 	je_malloc_stats_print(NULL, NULL, opt_stats_print_opts);
 }

 /*
  * Ensure that we don't hold any locks upon entry to or exit from allocator
  * code (in a "broad" sense that doesn't count a reentrant allocation as an
  * entrance or exit).
  */
 JEMALLOC_ALWAYS_INLINE void
 check_entry_exit_locking(tsdn_t *tsdn) {
 	if (!config_debug) {
 		return;
 	}
 	if (tsdn_null(tsdn)) {
 		return;
 	}
 	tsd_t *tsd = tsdn_tsd(tsdn);
 	/*
 	 * It's possible we hold locks at entry/exit if we're in a nested
 	 * allocation.
 	 */
 	int8_t reentrancy_level = tsd_reentrancy_level_get(tsd);
 	if (reentrancy_level != 0) {
 		return;
 	}
 	witness_assert_lockless(tsdn_witness_tsdp_get(tsdn));
 }

 /*
  * End miscellaneous support functions.
  */
 /******************************************************************************/
 /*
  * Begin initialization functions.
  */

 static unsigned
 malloc_ncpus(void) {
 	long result;

 #ifdef _WIN32
 	SYSTEM_INFO si;
 	GetSystemInfo(&si);
 	result = si.dwNumberOfProcessors;
 #elif defined(CPU_COUNT)
 	/*
 	 * glibc >= 2.6 has the CPU_COUNT macro.
 	 *
 	 * glibc's sysconf() uses isspace().  glibc allocates for the first time
 	 * *before* setting up the isspace tables.  Therefore we need a
 	 * different method to get the number of CPUs.
 	 *
 	 * The getaffinity approach is also preferred when only a subset of CPUs
 	 * is available, to avoid using more arenas than necessary.
 	 */
 	{
 #	if defined(__FreeBSD__) || defined(__DragonFly__)
 		cpuset_t set;
 #	else
 		cpu_set_t set;
 #	endif
 #	if defined(JEMALLOC_HAVE_SCHED_SETAFFINITY)
 		sched_getaffinity(0, sizeof(set), &set);
 #	else
 		pthread_getaffinity_np(pthread_self(), sizeof(set), &set);
 #	endif
 		result = CPU_COUNT(&set);
 	}
 #else
 	result = sysconf(_SC_NPROCESSORS_ONLN);
 #endif
 	return ((result == -1) ? 1 : (unsigned)result);
 }

 /*
  * Ensure that number of CPUs is determistinc, i.e. it is the same based on:
  * - sched_getaffinity()
  * - _SC_NPROCESSORS_ONLN
  * - _SC_NPROCESSORS_CONF
  * Since otherwise tricky things is possible with percpu arenas in use.
  */
 static bool
 malloc_cpu_count_is_deterministic(void) {
 #ifdef _WIN32
 	return true;
 #else
 	long cpu_onln = sysconf(_SC_NPROCESSORS_ONLN);
 	long cpu_conf = sysconf(_SC_NPROCESSORS_CONF);
 	if (cpu_onln != cpu_conf) {
 		return false;
 	}
 #	if defined(CPU_COUNT)
 #		if defined(__FreeBSD__) || defined(__DragonFly__)
 	cpuset_t set;
 #		else
 	cpu_set_t set;
 #		endif /* __FreeBSD__ */
 #		if defined(JEMALLOC_HAVE_SCHED_SETAFFINITY)
 	sched_getaffinity(0, sizeof(set), &set);
 #		else  /* !JEMALLOC_HAVE_SCHED_SETAFFINITY */
 	pthread_getaffinity_np(pthread_self(), sizeof(set), &set);
 #		endif /* JEMALLOC_HAVE_SCHED_SETAFFINITY */
 	long cpu_affinity = CPU_COUNT(&set);
 	if (cpu_affinity != cpu_conf) {
 		return false;
 	}
 #	endif         /* CPU_COUNT */
 	return true;
 #endif
 }

 static void
 malloc_slow_flag_init(void) {
 	/*
 	 * Combine the runtime options into malloc_slow for fast path.  Called
 	 * after processing all the options.
 	 */
 	malloc_slow_flags |= (opt_junk_alloc ? flag_opt_junk_alloc : 0)
 	    | (opt_junk_free ? flag_opt_junk_free : 0)
 	    | (opt_zero ? flag_opt_zero : 0)
 	    | (opt_utrace ? flag_opt_utrace : 0)
 	    | (opt_xmalloc ? flag_opt_xmalloc : 0);

 	malloc_slow = (malloc_slow_flags != 0);
 }

 static bool
 malloc_init_hard_needed(void) {
 	if (malloc_initialized()
 	    || (IS_INITIALIZER
 	        && malloc_init_state == malloc_init_recursible)) {
 		/*
 		 * Another thread initialized the allocator before this one
 		 * acquired init_lock, or this thread is the initializing
 		 * thread, and it is recursively allocating.
 		 */
 		return false;
 	}
 #ifdef JEMALLOC_THREADED_INIT
 	if (malloc_initializer != NO_INITIALIZER && !IS_INITIALIZER) {
 		/* Busy-wait until the initializing thread completes. */
 		spin_t spinner = SPIN_INITIALIZER;
 		do {
 			malloc_mutex_unlock(TSDN_NULL, &init_lock);
 			spin_adaptive(&spinner);
 			malloc_mutex_lock(TSDN_NULL, &init_lock);
 		} while (!malloc_initialized());
 		return false;
 	}
 #endif
 	return true;
 }

 static bool
 malloc_init_hard_a0_locked(void) {
 	malloc_initializer = INITIALIZER;

 	JEMALLOC_DIAGNOSTIC_PUSH
 	JEMALLOC_DIAGNOSTIC_IGNORE_MISSING_STRUCT_FIELD_INITIALIZERS
 	sc_data_t sc_data = {0};
 	JEMALLOC_DIAGNOSTIC_POP

 	/*
 	 * Ordering here is somewhat tricky; we need sc_boot() first, since that
 	 * determines what the size classes will be, and then
 	 * malloc_conf_init(), since any slab size tweaking will need to be done
 	 * before sz_boot and bin_info_boot, which assume that the values they
 	 * read out of sc_data_global are final.
 	 */
 	sc_boot(&sc_data);
 	unsigned bin_shard_sizes[SC_NBINS];
 	bin_shard_sizes_boot(bin_shard_sizes);
 	/*
 	 * prof_boot0 only initializes opt_prof_prefix.  We need to do it before
 	 * we parse malloc_conf options, in case malloc_conf parsing overwrites
 	 * it.
 	 */
 	if (config_prof) {
 		prof_boot0();
 	}
 	char readlink_buf[PATH_MAX + 1];
 	readlink_buf[0] = '\0';
 	malloc_conf_init(&sc_data, bin_shard_sizes, readlink_buf);
 	san_init(opt_lg_san_uaf_align);
 	sz_boot(&sc_data, opt_cache_oblivious);
 	bin_info_boot(&sc_data, bin_shard_sizes);

 	if (opt_stats_print) {
 		/* Print statistics at exit. */
 		if (atexit(stats_print_atexit) != 0) {
 			malloc_write("<jemalloc>: Error in atexit()\n");
 			if (opt_abort) {
 				abort();
 			}
 		}
 	}

 	if (stats_boot()) {
 		return true;
 	}
 	if (pages_boot()) {
 		return true;
 	}
 	if (base_boot(TSDN_NULL)) {
 		return true;
 	}
 	/* emap_global is static, hence zeroed. */
 	if (emap_init(&arena_emap_global, b0get(), /* zeroed */ true)) {
 		return true;
 	}
 	if (extent_boot()) {
 		return true;
 	}
 	if (ctl_boot()) {
 		return true;
 	}
 	if (config_prof) {
 		prof_boot1();
 	}
 	if (opt_hpa && !hpa_supported()) {
 		malloc_printf(
 		    "<jemalloc>: HPA not supported in the current "
 		    "configuration; %s.",
 		    opt_abort_conf ? "aborting" : "disabling");
 		if (opt_abort_conf) {
 			malloc_abort_invalid_conf();
 		} else {
 			opt_hpa = false;
 		}
 	}
 	if (arena_boot(&sc_data, b0get(), opt_hpa)) {
 		return true;
 	}
 	if (tcache_boot(TSDN_NULL, b0get())) {
 		return true;
 	}
 	if (malloc_mutex_init(&arenas_lock, "arenas", WITNESS_RANK_ARENAS,
 	        malloc_mutex_rank_exclusive)) {
 		return true;
 	}
 	hook_boot();
 	experimental_thread_events_boot();
 	/*
 	 * Create enough scaffolding to allow recursive allocation in
 	 * malloc_ncpus().
 	 */
 	narenas_auto = 1;
 	manual_arena_base = narenas_auto + 1;
 	memset(arenas, 0, sizeof(arena_t *) * narenas_auto);
 	/*
 	 * Initialize one arena here.  The rest are lazily created in
 	 * arena_choose_hard().
 	 */
 	if (arena_init(TSDN_NULL, 0, &arena_config_default) == NULL) {
 		return true;
 	}
 	a0 = arena_get(TSDN_NULL, 0, false);

 	if (opt_hpa && !hpa_supported()) {
 		malloc_printf(
 		    "<jemalloc>: HPA not supported in the current "
 		    "configuration; %s.",
 		    opt_abort_conf ? "aborting" : "disabling");
 		if (opt_abort_conf) {
 			malloc_abort_invalid_conf();
 		} else {
 			opt_hpa = false;
 		}
 	}

 	malloc_init_state = malloc_init_a0_initialized;

 	size_t buf_len = strlen(readlink_buf);
 	if (buf_len > 0) {
 		void *readlink_allocated = a0ialloc(buf_len + 1, false, true);
 		if (readlink_allocated != NULL) {
 			memcpy(readlink_allocated, readlink_buf, buf_len + 1);
 			opt_malloc_conf_symlink = readlink_allocated;
 		}
 	}

 	return false;
 }

 static bool
 malloc_init_hard_a0(void) {
 	bool ret;

 	malloc_mutex_lock(TSDN_NULL, &init_lock);
 	ret = malloc_init_hard_a0_locked();
 	malloc_mutex_unlock(TSDN_NULL, &init_lock);
 	return ret;
 }

 /* Initialize data structures which may trigger recursive allocation. */
 static bool
 malloc_init_hard_recursible(void) {
 	malloc_init_state = malloc_init_recursible;

 	ncpus = malloc_ncpus();
 	if (opt_percpu_arena != percpu_arena_disabled) {
 		bool cpu_count_is_deterministic =
 		    malloc_cpu_count_is_deterministic();
 		if (!cpu_count_is_deterministic) {
 			/*
 			 * If # of CPU is not deterministic, and narenas not
 			 * specified, disables per cpu arena since it may not
 			 * detect CPU IDs properly.
 			 */
 			if (opt_narenas == 0) {
 				opt_percpu_arena = percpu_arena_disabled;
 				malloc_write(
 				    "<jemalloc>: Number of CPUs "
 				    "detected is not deterministic. Per-CPU "
 				    "arena disabled.\n");
 				if (opt_abort_conf) {
 					malloc_abort_invalid_conf();
 				}
 				if (opt_abort) {
 					abort();
 				}
 			}
 		}
 	}

 #if (defined(JEMALLOC_HAVE_PTHREAD_ATFORK) && !defined(JEMALLOC_MUTEX_INIT_CB) \
     && !defined(JEMALLOC_ZONE) && !defined(_WIN32)                             \
     && !defined(__native_client__))
 	/* LinuxThreads' pthread_atfork() allocates. */
 	if (pthread_atfork(jemalloc_prefork, jemalloc_postfork_parent,
 	        jemalloc_postfork_child)
 	    != 0) {
 		malloc_write("<jemalloc>: Error in pthread_atfork()\n");
 		if (opt_abort) {
 			abort();
 		}
 		return true;
 	}
 #endif

 	if (background_thread_boot0()) {
 		return true;
 	}

 	return false;
 }

 static unsigned
 malloc_narenas_default(void) {
 	assert(ncpus > 0);
 	/*
 	 * For SMP systems, create more than one arena per CPU by
 	 * default.
 	 */
 	if (ncpus > 1) {
 		fxp_t    fxp_ncpus = FXP_INIT_INT(ncpus);
 		fxp_t    goal = fxp_mul(fxp_ncpus, opt_narenas_ratio);
 		uint32_t int_goal = fxp_round_nearest(goal);
 		if (int_goal == 0) {
 			return 1;
 		}
 		return int_goal;
 	} else {
 		return 1;
 	}
 }

 static percpu_arena_mode_t
 percpu_arena_as_initialized(percpu_arena_mode_t mode) {
 	assert(!malloc_initialized());
 	assert(mode <= percpu_arena_disabled);

 	if (mode != percpu_arena_disabled) {
 		mode += percpu_arena_mode_enabled_base;
 	}

 	return mode;
 }

 static bool
 malloc_init_narenas(tsdn_t *tsdn) {
 	assert(ncpus > 0);

 	if (opt_percpu_arena != percpu_arena_disabled) {
 		if (!have_percpu_arena || malloc_getcpu() < 0) {
 			opt_percpu_arena = percpu_arena_disabled;
 			malloc_printf(
 			    "<jemalloc>: perCPU arena getcpu() not "
 			    "available. Setting narenas to %u.\n",
 			    opt_narenas ? opt_narenas
 			                : malloc_narenas_default());
 			if (opt_abort) {
 				abort();
 			}
 		} else {
 			if (ncpus >= MALLOCX_ARENA_LIMIT) {
 				malloc_printf(
 				    "<jemalloc>: narenas w/ percpu"
 				    "arena beyond limit (%d)\n",
 				    ncpus);
 				if (opt_abort) {
 					abort();
 				}
 				return true;
 			}
 			/* NB: opt_percpu_arena isn't fully initialized yet. */
 			if (percpu_arena_as_initialized(opt_percpu_arena)
 			        == per_phycpu_arena
 			    && ncpus % 2 != 0) {
 				malloc_printf(
 				    "<jemalloc>: invalid "
 				    "configuration -- per physical CPU arena "
 				    "with odd number (%u) of CPUs (no hyper "
 				    "threading?).\n",
 				    ncpus);
 				if (opt_abort)
 					abort();
 			}
 			unsigned n = percpu_arena_ind_limit(
 			    percpu_arena_as_initialized(opt_percpu_arena));
 			if (opt_narenas < n) {
 				/*
 				 * If narenas is specified with percpu_arena
 				 * enabled, actual narenas is set as the greater
 				 * of the two. percpu_arena_choose will be free
 				 * to use any of the arenas based on CPU
 				 * id. This is conservative (at a small cost)
 				 * but ensures correctness.
 				 *
 				 * If for some reason the ncpus determined at
 				 * boot is not the actual number (e.g. because
 				 * of affinity setting from numactl), reserving
 				 * narenas this way provides a workaround for
 				 * percpu_arena.
 				 */
 				opt_narenas = n;
 			}
 		}
 	}
 	if (opt_narenas == 0) {
 		opt_narenas = malloc_narenas_default();
 	}
 	assert(opt_narenas > 0);

 	narenas_auto = opt_narenas;
 	/*
 	 * Limit the number of arenas to the indexing range of MALLOCX_ARENA().
 	 */
 	if (narenas_auto >= MALLOCX_ARENA_LIMIT) {
 		narenas_auto = MALLOCX_ARENA_LIMIT - 1;
 		malloc_printf("<jemalloc>: Reducing narenas to limit (%d)\n",
 		    narenas_auto);
 	}
 	narenas_total_set(narenas_auto);
 	if (arena_init_huge(tsdn, a0)) {
 		narenas_total_inc();
 	}
 	manual_arena_base = narenas_total_get();

 	return false;
 }

 static void
 malloc_init_percpu(void) {
 	opt_percpu_arena = percpu_arena_as_initialized(opt_percpu_arena);
 }

 static bool
 malloc_init_hard_finish(void) {
 	if (malloc_mutex_boot()) {
 		return true;
 	}

 	malloc_init_state = malloc_init_initialized;
 	malloc_slow_flag_init();

 	return false;
 }

 static void
 malloc_init_hard_cleanup(tsdn_t *tsdn, bool reentrancy_set) {
 	malloc_mutex_assert_owner(tsdn, &init_lock);
 	malloc_mutex_unlock(tsdn, &init_lock);
 	if (reentrancy_set) {
 		assert(!tsdn_null(tsdn));
 		tsd_t *tsd = tsdn_tsd(tsdn);
 		assert(tsd_reentrancy_level_get(tsd) > 0);
 		post_reentrancy(tsd);
 	}
 }

 static bool
 malloc_init_hard(void) {
 	tsd_t *tsd;

 	assert(TCACHE_MAXCLASS_LIMIT <= USIZE_GROW_SLOW_THRESHOLD);
 	assert(SC_LOOKUP_MAXCLASS <= USIZE_GROW_SLOW_THRESHOLD);
 	/*
 	 * This asserts an extreme case where TINY_MAXCLASS is larger
 	 * than LARGE_MINCLASS.  It could only happen if some constants
 	 * are configured miserably wrong.
 	 */
 	assert(SC_LG_TINY_MAXCLASS <= (size_t)1ULL << (LG_PAGE + SC_LG_NGROUP));

 #if defined(_WIN32) && _WIN32_WINNT < 0x0600
 	_init_init_lock();
 #endif
 	malloc_mutex_lock(TSDN_NULL, &init_lock);

 #define UNLOCK_RETURN(tsdn, ret, reentrancy)                                   \
 	malloc_init_hard_cleanup(tsdn, reentrancy);                            \
 	return ret;

 	if (!malloc_init_hard_needed()) {
 		UNLOCK_RETURN(TSDN_NULL, false, false)
 	}

 	if (malloc_init_state != malloc_init_a0_initialized
 	    && malloc_init_hard_a0_locked()) {
 		UNLOCK_RETURN(TSDN_NULL, true, false)
 	}

 	malloc_mutex_unlock(TSDN_NULL, &init_lock);
 	/* Recursive allocation relies on functional tsd. */
 	tsd = malloc_tsd_boot0();
 	if (tsd == NULL) {
 		return true;
 	}
 	if (malloc_init_hard_recursible()) {
 		return true;
 	}

 	malloc_mutex_lock(tsd_tsdn(tsd), &init_lock);
 	/* Set reentrancy level to 1 during init. */
 	pre_reentrancy(tsd, NULL);
 	/* Initialize narenas before prof_boot2 (for allocation). */
 	if (malloc_init_narenas(tsd_tsdn(tsd))
 	    || background_thread_boot1(tsd_tsdn(tsd), b0get())) {
 		UNLOCK_RETURN(tsd_tsdn(tsd), true, true)
 	}
 	if (opt_hpa) {
 		/*
 		 * We didn't initialize arena 0 hpa_shard in arena_new, because
 		 * background_thread_enabled wasn't initialized yet, but we
 		 * need it to set correct value for deferral_allowed.
 		 */
 		arena_t         *a0 = arena_get(tsd_tsdn(tsd), 0, false);
 		hpa_shard_opts_t hpa_shard_opts = opt_hpa_opts;
 		hpa_shard_opts.deferral_allowed = background_thread_enabled();
 		if (pa_shard_enable_hpa(tsd_tsdn(tsd), &a0->pa_shard,
 		        &hpa_shard_opts, &opt_hpa_sec_opts)) {
 			UNLOCK_RETURN(tsd_tsdn(tsd), true, true)
 		}
 	}
 	if (config_prof && prof_boot2(tsd, b0get())) {
 		UNLOCK_RETURN(tsd_tsdn(tsd), true, true)
 	}

 	malloc_init_percpu();

 	if (malloc_init_hard_finish()) {
 		UNLOCK_RETURN(tsd_tsdn(tsd), true, true)
 	}
 	post_reentrancy(tsd);
 	malloc_mutex_unlock(tsd_tsdn(tsd), &init_lock);

 	witness_assert_lockless(
 	    witness_tsd_tsdn(tsd_witness_tsdp_get_unsafe(tsd)));
 	malloc_tsd_boot1();
 	/* Update TSD after tsd_boot1. */
 	tsd = tsd_fetch();
 	if (opt_background_thread) {
 		assert(have_background_thread);
 		/*
 		 * Need to finish init & unlock first before creating background
 		 * threads (pthread_create depends on malloc).  ctl_init (which
 		 * sets isthreaded) needs to be called without holding any lock.
 		 */
 		background_thread_ctl_init(tsd_tsdn(tsd));
 		if (background_thread_create(tsd, 0)) {
 			return true;
 		}
 	}
 #undef UNLOCK_RETURN
 	return false;
 }

 /*
  * End initialization functions.
  */
 /******************************************************************************/
 /*
  * Begin allocation-path internal functions and data structures.
  */

 /*
  * Settings determined by the documented behavior of the allocation functions.
  */
 typedef struct static_opts_s static_opts_t;
 struct static_opts_s {
 	/* Whether or not allocation size may overflow. */
 	bool may_overflow;

 	/*
 	 * Whether or not allocations (with alignment) of size 0 should be
 	 * treated as size 1.
 	 */
 	bool bump_empty_aligned_alloc;
 	/*
 	 * Whether to assert that allocations are not of size 0 (after any
 	 * bumping).
 	 */
 	bool assert_nonempty_alloc;

 	/*
 	 * Whether or not to modify the 'result' argument to malloc in case of
 	 * error.
 	 */
 	bool null_out_result_on_error;
 	/* Whether to set errno when we encounter an error condition. */
 	bool set_errno_on_error;

 	/*
 	 * The minimum valid alignment for functions requesting aligned storage.
 	 */
 	size_t min_alignment;

 	/* The error string to use if we oom. */
 	const char *oom_string;
 	/* The error string to use if the passed-in alignment is invalid. */
 	const char *invalid_alignment_string;

 	/*
 	 * False if we're configured to skip some time-consuming operations.
 	 *
 	 * This isn't really a malloc "behavior", but it acts as a useful
 	 * summary of several other static (or at least, static after program
 	 * initialization) options.
 	 */
 	bool slow;
 	/*
 	 * Return size.
 	 */
 	bool usize;
 };

 JEMALLOC_ALWAYS_INLINE void
 static_opts_init(static_opts_t *static_opts) {
 	static_opts->may_overflow = false;
 	static_opts->bump_empty_aligned_alloc = false;
 	static_opts->assert_nonempty_alloc = false;
 	static_opts->null_out_result_on_error = false;
 	static_opts->set_errno_on_error = false;
 	static_opts->min_alignment = 0;
 	static_opts->oom_string = "";
 	static_opts->invalid_alignment_string = "";
 	static_opts->slow = false;
 	static_opts->usize = false;
 }

 typedef struct dynamic_opts_s dynamic_opts_t;
 struct dynamic_opts_s {
 	void   **result;
 	size_t   usize;
 	size_t   num_items;
 	size_t   item_size;
 	size_t   alignment;
 	bool     zero;
 	unsigned tcache_ind;
 	unsigned arena_ind;
 };

 JEMALLOC_ALWAYS_INLINE void
 dynamic_opts_init(dynamic_opts_t *dynamic_opts) {
 	dynamic_opts->result = NULL;
 	dynamic_opts->usize = 0;
 	dynamic_opts->num_items = 0;
 	dynamic_opts->item_size = 0;
 	dynamic_opts->alignment = 0;
 	dynamic_opts->zero = false;
 	dynamic_opts->tcache_ind = TCACHE_IND_AUTOMATIC;
 	dynamic_opts->arena_ind = ARENA_IND_AUTOMATIC;
 }

 /*
  * ind parameter is optional and is only checked and filled if alignment == 0;
  * return true if result is out of range.
  */
 JEMALLOC_ALWAYS_INLINE bool
 aligned_usize_get(size_t size, size_t alignment, size_t *usize, szind_t *ind,
     bool bump_empty_aligned_alloc) {
 	assert(usize != NULL);
 	if (alignment == 0) {
 		if (ind != NULL) {
 			*ind = sz_size2index(size);
 			if (unlikely(*ind >= SC_NSIZES)) {
 				return true;
 			}
 			*usize = sz_large_size_classes_disabled()
 			    ? sz_s2u(size)
 			    : sz_index2size(*ind);
 			assert(*usize > 0 && *usize <= SC_LARGE_MAXCLASS);
 			return false;
 		}
 		*usize = sz_s2u(size);
 	} else {
 		if (bump_empty_aligned_alloc && unlikely(size == 0)) {
 			size = 1;
 		}
 		*usize = sz_sa2u(size, alignment);
 	}
 	if (unlikely(*usize == 0 || *usize > SC_LARGE_MAXCLASS)) {
 		return true;
 	}
 	return false;
 }

 JEMALLOC_ALWAYS_INLINE bool
 zero_get(bool guarantee, bool slow) {
 	if (config_fill && slow && unlikely(opt_zero)) {
 		return true;
 	} else {
 		return guarantee;
 	}
 }

 /* Return true if a manual arena is specified and arena_get() OOMs. */
 JEMALLOC_ALWAYS_INLINE bool
 arena_get_from_ind(tsd_t *tsd, unsigned arena_ind, arena_t **arena_p) {
 	if (arena_ind == ARENA_IND_AUTOMATIC) {
 		/*
 		 * In case of automatic arena management, we defer arena
 		 * computation until as late as we can, hoping to fill the
 		 * allocation out of the tcache.
 		 */
 		*arena_p = NULL;
 	} else {
 		*arena_p = arena_get(tsd_tsdn(tsd), arena_ind, true);
 		if (unlikely(*arena_p == NULL) && arena_ind >= narenas_auto) {
 			return true;
 		}
 	}
 	return false;
 }

 /* ind is ignored if dopts->alignment > 0. */
 JEMALLOC_ALWAYS_INLINE void *
 imalloc_no_sample(static_opts_t *sopts, dynamic_opts_t *dopts, tsd_t *tsd,
     size_t size, size_t usize, szind_t ind, bool slab) {
 	/* Fill in the tcache. */
 	tcache_t *tcache = tcache_get_from_ind(
 	    tsd, dopts->tcache_ind, sopts->slow, /* is_alloc */ true);

 	/* Fill in the arena. */
 	arena_t *arena;
 	if (arena_get_from_ind(tsd, dopts->arena_ind, &arena)) {
 		return NULL;
 	}

 	if (unlikely(dopts->alignment != 0)) {
 		return ipalloct_explicit_slab(tsd_tsdn(tsd), usize,
 		    dopts->alignment, dopts->zero, slab, tcache, arena);
 	}

 	return iallocztm_explicit_slab(tsd_tsdn(tsd), size, ind, dopts->zero,
 	    slab, tcache, false, arena, sopts->slow);
 }

 JEMALLOC_ALWAYS_INLINE void *
 imalloc_sample(static_opts_t *sopts, dynamic_opts_t *dopts, tsd_t *tsd,
     size_t usize, szind_t ind) {
 	void *ret;

 	dopts->alignment = prof_sample_align(usize, dopts->alignment);
 	/*
 	 * If the allocation is small enough that it would normally be allocated
 	 * on a slab, we need to take additional steps to ensure that it gets
 	 * its own extent instead.
 	 */
 	if (sz_can_use_slab(usize)) {
 		assert((dopts->alignment & PROF_SAMPLE_ALIGNMENT_MASK) == 0);
 		size_t  bumped_usize = sz_sa2u(usize, dopts->alignment);
 		szind_t bumped_ind = sz_size2index(bumped_usize);
 		dopts->tcache_ind = TCACHE_IND_NONE;
 		ret = imalloc_no_sample(sopts, dopts, tsd, bumped_usize,
 		    bumped_usize, bumped_ind, /* slab */ false);
 		if (unlikely(ret == NULL)) {
 			return NULL;
 		}
 		arena_prof_promote(tsd_tsdn(tsd), ret, usize, bumped_usize);
 	} else {
 		ret = imalloc_no_sample(sopts, dopts, tsd, usize, usize, ind,
 		    /* slab */ false);
 	}
 	assert(prof_sample_aligned(ret));

 	return ret;
 }

 /*
  * Returns true if the allocation will overflow, and false otherwise.  Sets
  * *size to the product either way.
  */
 JEMALLOC_ALWAYS_INLINE bool
 compute_size_with_overflow(
     bool may_overflow, dynamic_opts_t *dopts, size_t *size) {
 	/*
 	 * This function is just num_items * item_size, except that we may have
 	 * to check for overflow.
 	 */

 	if (!may_overflow) {
 		assert(dopts->num_items == 1);
 		*size = dopts->item_size;
 		return false;
 	}

 	/* A size_t with its high-half bits all set to 1. */
 	static const size_t high_bits = SIZE_T_MAX << (sizeof(size_t) * 8 / 2);

 	*size = dopts->item_size * dopts->num_items;

 	if (unlikely(*size == 0)) {
 		return (dopts->num_items != 0 && dopts->item_size != 0);
 	}

 	/*
 	 * We got a non-zero size, but we don't know if we overflowed to get
 	 * there.  To avoid having to do a divide, we'll be clever and note that
 	 * if both A and B can be represented in N/2 bits, then their product
 	 * can be represented in N bits (without the possibility of overflow).
 	 */
 	if (likely((high_bits & (dopts->num_items | dopts->item_size)) == 0)) {
 		return false;
 	}
 	if (likely(*size / dopts->item_size == dopts->num_items)) {
 		return false;
 	}
 	return true;
 }

 JEMALLOC_ALWAYS_INLINE int
 imalloc_body(static_opts_t *sopts, dynamic_opts_t *dopts, tsd_t *tsd) {
 	/* Where the actual allocated memory will live. */
 	void *allocation = NULL;
 	/* Filled in by compute_size_with_overflow below. */
 	size_t size = 0;
 	/*
 	 * The zero initialization for ind is actually dead store, in that its
 	 * value is reset before any branch on its value is taken.  Sometimes
 	 * though, it's convenient to pass it as arguments before this point.
 	 * To avoid undefined behavior then, we initialize it with dummy stores.
 	 */
 	szind_t ind = 0;
 	/* usize will always be properly initialized. */
 	size_t usize;

 	/* Reentrancy is only checked on slow path. */
 	int8_t reentrancy_level;

 	/* Compute the amount of memory the user wants. */
 	if (unlikely(compute_size_with_overflow(
 	        sopts->may_overflow, dopts, &size))) {
 		goto label_oom;
 	}

 	if (unlikely(dopts->alignment < sopts->min_alignment
 	        || (dopts->alignment & (dopts->alignment - 1)) != 0)) {
 		goto label_invalid_alignment;
 	}

 	/* This is the beginning of the "core" algorithm. */
 	dopts->zero = zero_get(dopts->zero, sopts->slow);
 	if (aligned_usize_get(size, dopts->alignment, &usize, &ind,
 	        sopts->bump_empty_aligned_alloc)) {
 		goto label_oom;
 	}
 	dopts->usize = usize;
 	/* Validate the user input. */
 	if (sopts->assert_nonempty_alloc) {
 		assert(size != 0);
 	}

 	check_entry_exit_locking(tsd_tsdn(tsd));

 	/*
 	 * If we need to handle reentrancy, we can do it out of a
 	 * known-initialized arena (i.e. arena 0).
 	 */
 	reentrancy_level = tsd_reentrancy_level_get(tsd);
 	if (sopts->slow && unlikely(reentrancy_level > 0)) {
 		/*
 		 * We should never specify particular arenas or tcaches from
 		 * within our internal allocations.
 		 */
 		assert(dopts->tcache_ind == TCACHE_IND_AUTOMATIC
 		    || dopts->tcache_ind == TCACHE_IND_NONE);
 		assert(dopts->arena_ind == ARENA_IND_AUTOMATIC);
 		dopts->tcache_ind = TCACHE_IND_NONE;
 		/* We know that arena 0 has already been initialized. */
 		dopts->arena_ind = 0;
 	}

 	/*
 	 * If dopts->alignment > 0, then ind is still 0, but usize was computed
 	 * in the previous if statement.  Down the positive alignment path,
 	 * imalloc_no_sample and imalloc_sample will ignore ind.
 	 */

 	/* If profiling is on, get our profiling context. */
 	if (config_prof && opt_prof) {
 		bool prof_active = prof_active_get_unlocked();
 		bool sample_event = te_prof_sample_event_lookahead(tsd, usize);
 		prof_tctx_t *tctx = prof_alloc_prep(
 		    tsd, prof_active, sample_event);

 		emap_alloc_ctx_t alloc_ctx;
 		if (likely(tctx == PROF_TCTX_SENTINEL)) {
 			alloc_ctx.slab = sz_can_use_slab(usize);
 			allocation = imalloc_no_sample(sopts, dopts, tsd, usize,
 			    usize, ind, alloc_ctx.slab);
 		} else if (tctx != NULL) {
 			allocation = imalloc_sample(
 			    sopts, dopts, tsd, usize, ind);
 			alloc_ctx.slab = false;
 		} else {
 			allocation = NULL;
 		}

 		if (unlikely(allocation == NULL)) {
 			prof_alloc_rollback(tsd, tctx);
 			goto label_oom;
 		}
 		prof_malloc(tsd, allocation, size, usize, &alloc_ctx, tctx);
 	} else {
 		assert(!opt_prof);
 		allocation = imalloc_no_sample(sopts, dopts, tsd, size, usize,
 		    ind, sz_can_use_slab(usize));
 		if (unlikely(allocation == NULL)) {
 			goto label_oom;
 		}
 	}

 	/*
 	 * Allocation has been done at this point.  We still have some
 	 * post-allocation work to do though.
 	 */

 	thread_alloc_event(tsd, usize);

 	assert(dopts->alignment == 0
 	    || ((uintptr_t)allocation & (dopts->alignment - 1)) == ZU(0));

 	assert(usize == isalloc(tsd_tsdn(tsd), allocation));

 	if (config_fill && sopts->slow && !dopts->zero
 	    && unlikely(opt_junk_alloc)) {
 		junk_alloc_callback(allocation, usize);
 	}

 	if (sopts->slow) {
 		UTRACE(0, size, allocation);
 	}

 	/* Success! */
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	*dopts->result = allocation;
 	return 0;

 label_oom:
 	if (unlikely(sopts->slow) && config_xmalloc && unlikely(opt_xmalloc)) {
 		malloc_write(sopts->oom_string);
 		abort();
 	}

 	if (sopts->slow) {
 		UTRACE(NULL, size, NULL);
 	}

 	check_entry_exit_locking(tsd_tsdn(tsd));

 	if (sopts->set_errno_on_error) {
 		set_errno(ENOMEM);
 	}

 	if (sopts->null_out_result_on_error) {
 		*dopts->result = NULL;
 	}

 	return ENOMEM;

 	/*
 	 * This label is only jumped to by one goto; we move it out of line
 	 * anyways to avoid obscuring the non-error paths, and for symmetry with
 	 * the oom case.
 	 */
 label_invalid_alignment:
 	if (config_xmalloc && unlikely(opt_xmalloc)) {
 		malloc_write(sopts->invalid_alignment_string);
 		abort();
 	}

 	if (sopts->set_errno_on_error) {
 		set_errno(EINVAL);
 	}

 	if (sopts->slow) {
 		UTRACE(NULL, size, NULL);
 	}

 	check_entry_exit_locking(tsd_tsdn(tsd));

 	if (sopts->null_out_result_on_error) {
 		*dopts->result = NULL;
 	}

 	return EINVAL;
 }

 JEMALLOC_ALWAYS_INLINE bool
 imalloc_init_check(static_opts_t *sopts, dynamic_opts_t *dopts) {
 	if (unlikely(!malloc_initialized()) && unlikely(malloc_init())) {
 		if (config_xmalloc && unlikely(opt_xmalloc)) {
 			malloc_write(sopts->oom_string);
 			abort();
 		}
 		UTRACE(NULL, dopts->num_items * dopts->item_size, NULL);
 		set_errno(ENOMEM);
 		*dopts->result = NULL;

 		return false;
 	}

 	return true;
 }

 /* Returns the errno-style error code of the allocation. */
 JEMALLOC_ALWAYS_INLINE int
 imalloc(static_opts_t *sopts, dynamic_opts_t *dopts) {
 	if (tsd_get_allocates() && !imalloc_init_check(sopts, dopts)) {
 		return ENOMEM;
 	}

 	/* We always need the tsd.  Let's grab it right away. */
 	tsd_t *tsd = tsd_fetch();
 	assert(tsd);
 	if (likely(tsd_fast(tsd))) {
 		/* Fast and common path. */
 		tsd_assert_fast(tsd);
 		sopts->slow = false;
 		return imalloc_body(sopts, dopts, tsd);
 	} else {
 		if (!tsd_get_allocates() && !imalloc_init_check(sopts, dopts)) {
 			return ENOMEM;
 		}

 		sopts->slow = true;
 		return imalloc_body(sopts, dopts, tsd);
 	}
 }

 JEMALLOC_NOINLINE
 void *
 malloc_default(size_t size) {
 	void          *ret;
 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	/*
 	 * This variant has logging hook on exit but not on entry.  It's callled
 	 * only by je_malloc, below, which emits the entry one for us (and, if
 	 * it calls us, does so only via tail call).
 	 */

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.null_out_result_on_error = true;
 	sopts.set_errno_on_error = true;
 	sopts.oom_string = "<jemalloc>: Error in malloc(): out of memory\n";

 	dopts.result = &ret;
 	dopts.num_items = 1;
 	dopts.item_size = size;

 	imalloc(&sopts, &dopts);
 	/*
 	 * Note that this branch gets optimized away -- it immediately follows
 	 * the check on tsd_fast that sets sopts.slow.
 	 */
 	if (sopts.slow) {
 		uintptr_t args[3] = {size};
 		hook_invoke_alloc(hook_alloc_malloc, ret, (uintptr_t)ret, args);
 	}

 	return ret;
 }

 /******************************************************************************/
 /*
  * Begin malloc(3)-compatible functions.
  */

 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ATTR(malloc) JEMALLOC_ALLOC_SIZE(1) je_malloc(size_t size) {
 	LOG("core.malloc.entry", "size: %zu", size);

 	void *ret = imalloc_fastpath(size, &malloc_default);

 	LOG("core.malloc.exit", "result: %p", ret);
 	return ret;
 }

 JEMALLOC_EXPORT int JEMALLOC_NOTHROW
 JEMALLOC_ATTR(nonnull(1))
     je_posix_memalign(void **memptr, size_t alignment, size_t size) {
 	int            ret;
 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	LOG("core.posix_memalign.entry",
 	    "mem ptr: %p, alignment: %zu, "
 	    "size: %zu",
 	    memptr, alignment, size);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.bump_empty_aligned_alloc = true;
 	sopts.min_alignment = sizeof(void *);
 	sopts.oom_string =
 	    "<jemalloc>: Error allocating aligned memory: out of memory\n";
 	sopts.invalid_alignment_string =
 	    "<jemalloc>: Error allocating aligned memory: invalid alignment\n";

 	dopts.result = memptr;
 	dopts.num_items = 1;
 	dopts.item_size = size;
 	dopts.alignment = alignment;

 	ret = imalloc(&sopts, &dopts);
 	if (sopts.slow) {
 		uintptr_t args[3] = {
 		    (uintptr_t)memptr, (uintptr_t)alignment, (uintptr_t)size};
 		hook_invoke_alloc(
 		    hook_alloc_posix_memalign, *memptr, (uintptr_t)ret, args);
 	}

 	LOG("core.posix_memalign.exit", "result: %d, alloc ptr: %p", ret,
 	    *memptr);

 	return ret;
 }

 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ATTR(malloc) JEMALLOC_ALLOC_SIZE(2)
     je_aligned_alloc(size_t alignment, size_t size) {
 	void *ret;

 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	LOG("core.aligned_alloc.entry", "alignment: %zu, size: %zu\n",
 	    alignment, size);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.bump_empty_aligned_alloc = true;
 	sopts.null_out_result_on_error = true;
 	sopts.set_errno_on_error = true;
 	sopts.min_alignment = 1;
 	sopts.oom_string =
 	    "<jemalloc>: Error allocating aligned memory: out of memory\n";
 	sopts.invalid_alignment_string =
 	    "<jemalloc>: Error allocating aligned memory: invalid alignment\n";

 	dopts.result = &ret;
 	dopts.num_items = 1;
 	dopts.item_size = size;
 	dopts.alignment = alignment;

 	imalloc(&sopts, &dopts);
 	if (sopts.slow) {
 		uintptr_t args[3] = {(uintptr_t)alignment, (uintptr_t)size};
 		hook_invoke_alloc(
 		    hook_alloc_aligned_alloc, ret, (uintptr_t)ret, args);
 	}

 	LOG("core.aligned_alloc.exit", "result: %p", ret);

 	return ret;
 }

 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ATTR(malloc) JEMALLOC_ALLOC_SIZE2(1, 2)
     je_calloc(size_t num, size_t size) {
 	void          *ret;
 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	LOG("core.calloc.entry", "num: %zu, size: %zu", num, size);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.may_overflow = true;
 	sopts.null_out_result_on_error = true;
 	sopts.set_errno_on_error = true;
 	sopts.oom_string = "<jemalloc>: Error in calloc(): out of memory\n";

 	dopts.result = &ret;
 	dopts.num_items = num;
 	dopts.item_size = size;
 	dopts.zero = true;

 	imalloc(&sopts, &dopts);
 	if (sopts.slow) {
 		uintptr_t args[3] = {(uintptr_t)num, (uintptr_t)size};
 		hook_invoke_alloc(hook_alloc_calloc, ret, (uintptr_t)ret, args);
 	}

 	LOG("core.calloc.exit", "result: %p", ret);

 	return ret;
 }

 JEMALLOC_ALWAYS_INLINE void
 ifree(tsd_t *tsd, void *ptr, tcache_t *tcache, bool slow_path) {
 	if (!slow_path) {
 		tsd_assert_fast(tsd);
 	}
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	if (tsd_reentrancy_level_get(tsd) != 0) {
 		assert(slow_path);
 	}

 	assert(ptr != NULL);
 	assert(malloc_initialized() || IS_INITIALIZER);

 	emap_alloc_ctx_t alloc_ctx;
 	emap_alloc_ctx_lookup(
 	    tsd_tsdn(tsd), &arena_emap_global, ptr, &alloc_ctx);
 	assert(alloc_ctx.szind != SC_NSIZES);

 	size_t usize = emap_alloc_ctx_usize_get(&alloc_ctx);
 	if (config_prof && opt_prof) {
 		prof_free(tsd, ptr, usize, &alloc_ctx);
 	}

 	if (likely(!slow_path)) {
 		idalloctm(tsd_tsdn(tsd), ptr, tcache, &alloc_ctx, false, false);
 	} else {
 		if (config_fill && slow_path && opt_junk_free) {
 			junk_free_callback(ptr, usize);
 		}
 		idalloctm(tsd_tsdn(tsd), ptr, tcache, &alloc_ctx, false, true);
 	}
 	thread_dalloc_event(tsd, usize);
 }

 JEMALLOC_ALWAYS_INLINE void
 isfree(tsd_t *tsd, void *ptr, size_t usize, tcache_t *tcache, bool slow_path) {
 	if (!slow_path) {
 		tsd_assert_fast(tsd);
 	}
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	if (tsd_reentrancy_level_get(tsd) != 0) {
 		assert(slow_path);
 	}

 	assert(ptr != NULL);
 	assert(malloc_initialized() || IS_INITIALIZER);

 	emap_alloc_ctx_t alloc_ctx;
 	szind_t          szind = sz_size2index(usize);
 	if (!config_prof) {
 		emap_alloc_ctx_init(
 		    &alloc_ctx, szind, (szind < SC_NBINS), usize);
 	} else {
 		if (likely(!prof_sample_aligned(ptr))) {
 			/*
 			 * When the ptr is not page aligned, it was not sampled.
 			 * usize can be trusted to determine szind and slab.
 			 */
 			emap_alloc_ctx_init(
 			    &alloc_ctx, szind, (szind < SC_NBINS), usize);
 		} else if (opt_prof) {
 			/*
 			 * Small sampled allocs promoted can still get correct
 			 * usize here.  Check comments in edata_usize_get.
 			 */
 			emap_alloc_ctx_lookup(
 			    tsd_tsdn(tsd), &arena_emap_global, ptr, &alloc_ctx);

 			if (config_opt_safety_checks) {
 				/* Small alloc may have !slab (sampled). */
 				size_t true_size = emap_alloc_ctx_usize_get(
 				    &alloc_ctx);
 				if (unlikely(alloc_ctx.szind
 				        != sz_size2index(usize))) {
 					safety_check_fail_sized_dealloc(
 					    /* current_dealloc */ true, ptr,
 					    /* true_size */ true_size,
 					    /* input_size */ usize);
 				}
 			}
 		} else {
 			emap_alloc_ctx_init(
 			    &alloc_ctx, szind, (szind < SC_NBINS), usize);
 		}
 	}
 	bool fail = maybe_check_alloc_ctx(tsd, ptr, &alloc_ctx);
 	if (fail) {
 		/*
 		 * This is a heap corruption bug.  In real life we'll crash; for
 		 * the unit test we just want to avoid breaking anything too
 		 * badly to get a test result out.  Let's leak instead of trying
 		 * to free.
 		 */
 		return;
 	}

 	if (config_prof && opt_prof) {
 		prof_free(tsd, ptr, usize, &alloc_ctx);
 	}
 	if (likely(!slow_path)) {
 		isdalloct(tsd_tsdn(tsd), ptr, usize, tcache, &alloc_ctx, false);
 	} else {
 		if (config_fill && slow_path && opt_junk_free) {
 			junk_free_callback(ptr, usize);
 		}
 		isdalloct(tsd_tsdn(tsd), ptr, usize, tcache, &alloc_ctx, true);
 	}
 	thread_dalloc_event(tsd, usize);
 }

 JEMALLOC_NOINLINE
 void
 free_default(void *ptr) {
 	UTRACE(ptr, 0, 0);
 	if (likely(ptr != NULL)) {
 		/*
 		 * We avoid setting up tsd fully (e.g. tcache, arena binding)
 		 * based on only free() calls -- other activities trigger the
 		 * minimal to full transition.  This is because free() may
 		 * happen during thread shutdown after tls deallocation: if a
 		 * thread never had any malloc activities until then, a
 		 * fully-setup tsd won't be destructed properly.
 		 */
 		tsd_t *tsd = tsd_fetch_min();
 		check_entry_exit_locking(tsd_tsdn(tsd));

 		if (likely(tsd_fast(tsd))) {
 			tcache_t *tcache = tcache_get_from_ind(tsd,
 			    TCACHE_IND_AUTOMATIC, /* slow */ false,
 			    /* is_alloc */ false);
 			ifree(tsd, ptr, tcache, /* slow */ false);
 		} else {
 			tcache_t *tcache = tcache_get_from_ind(tsd,
 			    TCACHE_IND_AUTOMATIC, /* slow */ true,
 			    /* is_alloc */ false);
 			uintptr_t args_raw[3] = {(uintptr_t)ptr};
 			hook_invoke_dalloc(hook_dalloc_free, ptr, args_raw);
 			ifree(tsd, ptr, tcache, /* slow */ true);
 		}

 		check_entry_exit_locking(tsd_tsdn(tsd));
 	}
 }

 JEMALLOC_EXPORT void JEMALLOC_NOTHROW
 je_free(void *ptr) {
 	LOG("core.free.entry", "ptr: %p", ptr);

 	je_free_impl(ptr);

 	LOG("core.free.exit", "");
 }

 JEMALLOC_EXPORT void JEMALLOC_NOTHROW
 je_free_sized(void *ptr, size_t size) {
 	LOG("core.free_sized.entry", "ptr: %p, size: %zu", ptr, size);

 	je_sdallocx_noflags(ptr, size);

 	LOG("core.free_sized.exit", "");
 }

 JEMALLOC_EXPORT void JEMALLOC_NOTHROW
 je_free_aligned_sized(void *ptr, size_t alignment, size_t size) {
 	return je_sdallocx(ptr, size, /* flags */ MALLOCX_ALIGN(alignment));
 }

 /*
  * End malloc(3)-compatible functions.
  */
 /******************************************************************************/
 /*
  * Begin non-standard override functions.
  */

 #ifdef JEMALLOC_OVERRIDE_MEMALIGN
 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ATTR(malloc) je_memalign(size_t alignment, size_t size) {
 	void          *ret;
 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	LOG("core.memalign.entry", "alignment: %zu, size: %zu\n", alignment,
 	    size);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.bump_empty_aligned_alloc = true;
 	sopts.min_alignment = 1;
 	sopts.oom_string =
 	    "<jemalloc>: Error allocating aligned memory: out of memory\n";
 	sopts.invalid_alignment_string =
 	    "<jemalloc>: Error allocating aligned memory: invalid alignment\n";
 	sopts.null_out_result_on_error = true;

 	dopts.result = &ret;
 	dopts.num_items = 1;
 	dopts.item_size = size;
 	dopts.alignment = alignment;

 	imalloc(&sopts, &dopts);
 	if (sopts.slow) {
 		uintptr_t args[3] = {alignment, size};
 		hook_invoke_alloc(
 		    hook_alloc_memalign, ret, (uintptr_t)ret, args);
 	}

 	LOG("core.memalign.exit", "result: %p", ret);
 	return ret;
 }
 #endif

 #ifdef JEMALLOC_OVERRIDE_VALLOC
 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ATTR(malloc) je_valloc(size_t size) {
 	void *ret;

 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	LOG("core.valloc.entry", "size: %zu\n", size);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.null_out_result_on_error = true;
 	sopts.min_alignment = PAGE;
 	sopts.oom_string =
 	    "<jemalloc>: Error allocating aligned memory: out of memory\n";
 	sopts.invalid_alignment_string =
 	    "<jemalloc>: Error allocating aligned memory: invalid alignment\n";

 	dopts.result = &ret;
 	dopts.num_items = 1;
 	dopts.item_size = size;
 	dopts.alignment = PAGE;

 	imalloc(&sopts, &dopts);
 	if (sopts.slow) {
 		uintptr_t args[3] = {size};
 		hook_invoke_alloc(hook_alloc_valloc, ret, (uintptr_t)ret, args);
 	}

 	LOG("core.valloc.exit", "result: %p\n", ret);
 	return ret;
 }
 #endif

 #ifdef JEMALLOC_OVERRIDE_PVALLOC
 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ATTR(malloc) je_pvalloc(size_t size) {
 	void *ret;

 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	LOG("core.pvalloc.entry", "size: %zu\n", size);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.null_out_result_on_error = true;
 	sopts.min_alignment = PAGE;
 	sopts.oom_string =
 	    "<jemalloc>: Error allocating aligned memory: out of memory\n";
 	sopts.invalid_alignment_string =
 	    "<jemalloc>: Error allocating aligned memory: invalid alignment\n";

 	dopts.result = &ret;
 	dopts.num_items = 1;
 	/*
 	 * This is the only difference from je_valloc - size is rounded up to
 	 * a PAGE multiple.
 	 */
 	dopts.item_size = PAGE_CEILING(size);
 	dopts.alignment = PAGE;

 	imalloc(&sopts, &dopts);
 	if (sopts.slow) {
 		uintptr_t args[3] = {size};
 		hook_invoke_alloc(
 		    hook_alloc_pvalloc, ret, (uintptr_t)ret, args);
 	}

 	LOG("core.pvalloc.exit", "result: %p\n", ret);
 	return ret;
 }
 #endif

 #if defined(JEMALLOC_IS_MALLOC) && defined(JEMALLOC_GLIBC_MALLOC_HOOK)
 /*
  * glibc provides the RTLD_DEEPBIND flag for dlopen which can make it possible
  * to inconsistently reference libc's malloc(3)-compatible functions
  * (https://bugzilla.mozilla.org/show_bug.cgi?id=493541).
  *
  * These definitions interpose hooks in glibc.  The functions are actually
  * passed an extra argument for the caller return address, which will be
  * ignored.
  */
 #	include <features.h> // defines __GLIBC__ if we are compiling against glibc

 JEMALLOC_EXPORT void (*__free_hook)(void *ptr) = je_free;
 JEMALLOC_EXPORT void *(*__malloc_hook)(size_t size) = je_malloc;
 JEMALLOC_EXPORT void *(*__realloc_hook)(void *ptr, size_t size) = je_realloc;
 #	ifdef JEMALLOC_GLIBC_MEMALIGN_HOOK
 JEMALLOC_EXPORT void *(*__memalign_hook)(
     size_t alignment, size_t size) = je_memalign;
 #	endif

 #	ifdef __GLIBC__
 /*
  * To enable static linking with glibc, the libc specific malloc interface must
  * be implemented also, so none of glibc's malloc.o functions are added to the
  * link.
  */
 #		define ALIAS(je_fn) __attribute__((alias(#je_fn), used))
 /* To force macro expansion of je_ prefix before stringification. */
 #		define PREALIAS(je_fn) ALIAS(je_fn)
 #		ifdef JEMALLOC_OVERRIDE___LIBC_CALLOC
 void *__libc_calloc(size_t n, size_t size) PREALIAS(je_calloc);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_FREE
 void __libc_free(void *ptr) PREALIAS(je_free);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_FREE_SIZED
 void __libc_free_sized(void *ptr, size_t size) PREALIAS(je_free_sized);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_FREE_ALIGNED_SIZED
 void __libc_free_aligned_sized(void *ptr, size_t alignment, size_t size)
     PREALIAS(je_free_aligned_sized);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_MALLOC
 void *__libc_malloc(size_t size) PREALIAS(je_malloc);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_MEMALIGN
 void *__libc_memalign(size_t align, size_t s) PREALIAS(je_memalign);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_REALLOC
 void *__libc_realloc(void *ptr, size_t size) PREALIAS(je_realloc);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_VALLOC
 void *__libc_valloc(size_t size) PREALIAS(je_valloc);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___LIBC_PVALLOC
 void *__libc_pvalloc(size_t size) PREALIAS(je_pvalloc);
 #		endif
 #		ifdef JEMALLOC_OVERRIDE___POSIX_MEMALIGN
 int __posix_memalign(void **r, size_t a, size_t s) PREALIAS(je_posix_memalign);
 #		endif
 #		undef PREALIAS
 #		undef ALIAS
 #	endif
 #endif

 /*
  * End non-standard override functions.
  */
 /******************************************************************************/
 /*
  * Begin non-standard functions.
  */

 JEMALLOC_ALWAYS_INLINE unsigned
 mallocx_tcache_get(int flags) {
 	if (likely((flags & MALLOCX_TCACHE_MASK) == 0)) {
 		return TCACHE_IND_AUTOMATIC;
 	} else if ((flags & MALLOCX_TCACHE_MASK) == MALLOCX_TCACHE_NONE) {
 		return TCACHE_IND_NONE;
 	} else {
 		return MALLOCX_TCACHE_GET(flags);
 	}
 }

 JEMALLOC_ALWAYS_INLINE unsigned
 mallocx_arena_get(int flags) {
 	if (unlikely((flags & MALLOCX_ARENA_MASK) != 0)) {
 		return MALLOCX_ARENA_GET(flags);
 	} else {
 		return ARENA_IND_AUTOMATIC;
 	}
 }

 #ifdef JEMALLOC_EXPERIMENTAL_SMALLOCX_API

 #	define JEMALLOC_SMALLOCX_CONCAT_HELPER(x, y) x##y
 #	define JEMALLOC_SMALLOCX_CONCAT_HELPER2(x, y)                         \
 		JEMALLOC_SMALLOCX_CONCAT_HELPER(x, y)

 typedef struct {
 	void  *ptr;
 	size_t size;
 } smallocx_return_t;

 JEMALLOC_EXPORT JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN smallocx_return_t
     JEMALLOC_NOTHROW
     /*
  * The attribute JEMALLOC_ATTR(malloc) cannot be used due to:
  *  - https://gcc.gnu.org/bugzilla/show_bug.cgi?id=86488
  */
     JEMALLOC_SMALLOCX_CONCAT_HELPER2(je_smallocx_, JEMALLOC_VERSION_GID_IDENT)(
         size_t size, int flags) {
 	/*
 	 * Note: the attribute JEMALLOC_ALLOC_SIZE(1) cannot be
 	 * used here because it makes writing beyond the `size`
 	 * of the `ptr` undefined behavior, but the objective
 	 * of this function is to allow writing beyond `size`
 	 * up to `smallocx_return_t::size`.
 	 */
 	smallocx_return_t ret;
 	static_opts_t     sopts;
 	dynamic_opts_t    dopts;

 	LOG("core.smallocx.entry", "size: %zu, flags: %d", size, flags);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.assert_nonempty_alloc = true;
 	sopts.null_out_result_on_error = true;
 	sopts.oom_string = "<jemalloc>: Error in mallocx(): out of memory\n";
 	sopts.usize = true;

 	dopts.result = &ret.ptr;
 	dopts.num_items = 1;
 	dopts.item_size = size;
 	if (unlikely(flags != 0)) {
 		dopts.alignment = MALLOCX_ALIGN_GET(flags);
 		dopts.zero = MALLOCX_ZERO_GET(flags);
 		dopts.tcache_ind = mallocx_tcache_get(flags);
 		dopts.arena_ind = mallocx_arena_get(flags);
 	}

 	imalloc(&sopts, &dopts);
 	assert(dopts.usize == je_nallocx(size, flags));
 	ret.size = dopts.usize;

 	LOG("core.smallocx.exit", "result: %p, size: %zu", ret.ptr, ret.size);
 	return ret;
 }
 #	undef JEMALLOC_SMALLOCX_CONCAT_HELPER
 #	undef JEMALLOC_SMALLOCX_CONCAT_HELPER2
 #endif

 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ATTR(malloc) JEMALLOC_ALLOC_SIZE(1)
     je_mallocx(size_t size, int flags) {
 	void          *ret;
 	static_opts_t  sopts;
 	dynamic_opts_t dopts;

 	LOG("core.mallocx.entry", "size: %zu, flags: %d", size, flags);

 	static_opts_init(&sopts);
 	dynamic_opts_init(&dopts);

 	sopts.assert_nonempty_alloc = true;
 	sopts.null_out_result_on_error = true;
 	sopts.oom_string = "<jemalloc>: Error in mallocx(): out of memory\n";

 	dopts.result = &ret;
 	dopts.num_items = 1;
 	dopts.item_size = size;
 	if (unlikely(flags != 0)) {
 		dopts.alignment = MALLOCX_ALIGN_GET(flags);
 		dopts.zero = MALLOCX_ZERO_GET(flags);
 		dopts.tcache_ind = mallocx_tcache_get(flags);
 		dopts.arena_ind = mallocx_arena_get(flags);
 	}

 	imalloc(&sopts, &dopts);
 	if (sopts.slow) {
 		uintptr_t args[3] = {size, flags};
 		hook_invoke_alloc(
 		    hook_alloc_mallocx, ret, (uintptr_t)ret, args);
 	}

 	LOG("core.mallocx.exit", "result: %p", ret);
 	return ret;
 }

 static void *
 irallocx_prof_sample(tsdn_t *tsdn, void *old_ptr, size_t old_usize,
     size_t usize, size_t alignment, bool zero, tcache_t *tcache, arena_t *arena,
     prof_tctx_t *tctx, hook_ralloc_args_t *hook_args) {
 	void *p;

 	if (tctx == NULL) {
 		return NULL;
 	}

 	alignment = prof_sample_align(usize, alignment);
 	/*
 	 * If the allocation is small enough that it would normally be allocated
 	 * on a slab, we need to take additional steps to ensure that it gets
 	 * its own extent instead.
 	 */
 	if (sz_can_use_slab(usize)) {
 		size_t bumped_usize = sz_sa2u(usize, alignment);
 		p = iralloct_explicit_slab(tsdn, old_ptr, old_usize,
 		    bumped_usize, alignment, zero, /* slab */ false, tcache,
 		    arena, hook_args);
 		if (p == NULL) {
 			return NULL;
 		}
 		arena_prof_promote(tsdn, p, usize, bumped_usize);
 	} else {
 		p = iralloct_explicit_slab(tsdn, old_ptr, old_usize, usize,
 		    alignment, zero, /* slab */ false, tcache, arena,
 		    hook_args);
 	}
 	assert(prof_sample_aligned(p));

 	return p;
 }

 JEMALLOC_ALWAYS_INLINE void *
 irallocx_prof(tsd_t *tsd, void *old_ptr, size_t old_usize, size_t size,
     size_t alignment, size_t usize, bool zero, tcache_t *tcache, arena_t *arena,
     emap_alloc_ctx_t *alloc_ctx, hook_ralloc_args_t *hook_args) {
 	prof_info_t old_prof_info;
 	prof_info_get_and_reset_recent(tsd, old_ptr, alloc_ctx, &old_prof_info);
 	bool         prof_active = prof_active_get_unlocked();
 	bool         sample_event = te_prof_sample_event_lookahead(tsd, usize);
 	prof_tctx_t *tctx = prof_alloc_prep(tsd, prof_active, sample_event);
 	void        *p;
 	if (unlikely(tctx != PROF_TCTX_SENTINEL)) {
 		p = irallocx_prof_sample(tsd_tsdn(tsd), old_ptr, old_usize,
 		    usize, alignment, zero, tcache, arena, tctx, hook_args);
 	} else {
 		p = iralloct(tsd_tsdn(tsd), old_ptr, old_usize, size, alignment,
 		    usize, zero, tcache, arena, hook_args);
 	}
 	if (unlikely(p == NULL)) {
 		prof_alloc_rollback(tsd, tctx);
 		return NULL;
 	}
 	assert(usize == isalloc(tsd_tsdn(tsd), p));
 	prof_realloc(tsd, p, size, usize, tctx, prof_active, old_ptr, old_usize,
 	    &old_prof_info, sample_event);

 	return p;
 }

 static void *
 do_rallocx(void *ptr, size_t size, int flags, bool is_realloc) {
 	void    *p;
 	tsd_t   *tsd;
 	size_t   usize;
 	size_t   old_usize;
 	size_t   alignment = MALLOCX_ALIGN_GET(flags);
 	arena_t *arena;

 	assert(ptr != NULL);
 	assert(size != 0);
 	assert(malloc_initialized() || IS_INITIALIZER);
 	tsd = tsd_fetch();
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	bool zero = zero_get(MALLOCX_ZERO_GET(flags), /* slow */ true);

 	unsigned arena_ind = mallocx_arena_get(flags);
 	if (arena_get_from_ind(tsd, arena_ind, &arena)) {
 		goto label_oom;
 	}

 	unsigned  tcache_ind = mallocx_tcache_get(flags);
 	tcache_t *tcache = tcache_get_from_ind(tsd, tcache_ind,
 	    /* slow */ true, /* is_alloc */ true);

 	emap_alloc_ctx_t alloc_ctx;
 	emap_alloc_ctx_lookup(
 	    tsd_tsdn(tsd), &arena_emap_global, ptr, &alloc_ctx);
 	assert(alloc_ctx.szind != SC_NSIZES);
 	old_usize = emap_alloc_ctx_usize_get(&alloc_ctx);
 	assert(old_usize == isalloc(tsd_tsdn(tsd), ptr));
 	if (aligned_usize_get(size, alignment, &usize, NULL, false)) {
 		goto label_oom;
 	}

 	hook_ralloc_args_t hook_args = {
 	    is_realloc, {(uintptr_t)ptr, size, flags, 0}};
 	if (config_prof && opt_prof) {
 		p = irallocx_prof(tsd, ptr, old_usize, size, alignment, usize,
 		    zero, tcache, arena, &alloc_ctx, &hook_args);
 		if (unlikely(p == NULL)) {
 			goto label_oom;
 		}
 	} else {
 		p = iralloct(tsd_tsdn(tsd), ptr, old_usize, size, alignment,
 		    usize, zero, tcache, arena, &hook_args);
 		if (unlikely(p == NULL)) {
 			goto label_oom;
 		}
 		assert(usize == isalloc(tsd_tsdn(tsd), p));
 	}
 	assert(alignment == 0 || ((uintptr_t)p & (alignment - 1)) == ZU(0));
 	thread_alloc_event(tsd, usize);
 	thread_dalloc_event(tsd, old_usize);

 	UTRACE(ptr, size, p);
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	if (config_fill && unlikely(opt_junk_alloc) && usize > old_usize
 	    && !zero) {
 		size_t excess_len = usize - old_usize;
 		void  *excess_start = (void *)((byte_t *)p + old_usize);
 		junk_alloc_callback(excess_start, excess_len);
 	}

 	return p;
 label_oom:
 	if (is_realloc) {
 		set_errno(ENOMEM);
 	}
 	if (config_xmalloc && unlikely(opt_xmalloc)) {
 		malloc_write("<jemalloc>: Error in rallocx(): out of memory\n");
 		abort();
 	}
 	UTRACE(ptr, size, 0);
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	return NULL;
 }

 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ALLOC_SIZE(2) je_rallocx(void *ptr, size_t size, int flags) {
 	LOG("core.rallocx.entry", "ptr: %p, size: %zu, flags: %d", ptr, size,
 	    flags);
 	void *ret = do_rallocx(ptr, size, flags, false);
 	LOG("core.rallocx.exit", "result: %p", ret);
 	return ret;
 }

 static void *
 do_realloc_nonnull_zero(void *ptr) {
 	if (config_stats) {
 		atomic_fetch_add_zu(&zero_realloc_count, 1, ATOMIC_RELAXED);
 	}
 	if (opt_zero_realloc_action == zero_realloc_action_alloc) {
 		/*
 		 * The user might have gotten an alloc setting while expecting a
 		 * free setting.  If that's the case, we at least try to
 		 * reduce the harm, and turn off the tcache while allocating, so
 		 * that we'll get a true first fit.
 		 */
 		return do_rallocx(ptr, 1, MALLOCX_TCACHE_NONE, true);
 	} else if (opt_zero_realloc_action == zero_realloc_action_free) {
 		UTRACE(ptr, 0, 0);
 		tsd_t *tsd = tsd_fetch();
 		check_entry_exit_locking(tsd_tsdn(tsd));

 		tcache_t *tcache = tcache_get_from_ind(tsd,
 		    TCACHE_IND_AUTOMATIC, /* slow */ true,
 		    /* is_alloc */ false);
 		uintptr_t args[3] = {(uintptr_t)ptr, 0};
 		hook_invoke_dalloc(hook_dalloc_realloc, ptr, args);
 		ifree(tsd, ptr, tcache, true);

 		check_entry_exit_locking(tsd_tsdn(tsd));
 		return NULL;
 	} else {
 		safety_check_fail(
 		    "Called realloc(non-null-ptr, 0) with "
 		    "zero_realloc:abort set\n");
 		/* In real code, this will never run; the safety check failure
 		 * will call abort.  In the unit test, we just want to bail out
 		 * without corrupting internal state that the test needs to
 		 * finish.
 		 */
 		return NULL;
 	}
 }

 JEMALLOC_EXPORT
 JEMALLOC_ALLOCATOR JEMALLOC_RESTRICT_RETURN void JEMALLOC_NOTHROW *
 JEMALLOC_ALLOC_SIZE(2) je_realloc(void *ptr, size_t size) {
 	LOG("core.realloc.entry", "ptr: %p, size: %zu\n", ptr, size);

 	if (likely(ptr != NULL && size != 0)) {
 		void *ret = do_rallocx(ptr, size, 0, true);
 		LOG("core.realloc.exit", "result: %p", ret);
 		return ret;
 	} else if (ptr != NULL && size == 0) {
 		void *ret = do_realloc_nonnull_zero(ptr);
 		LOG("core.realloc.exit", "result: %p", ret);
 		return ret;
 	} else {
 		/* realloc(NULL, size) is equivalent to malloc(size). */
 		void *ret;

 		static_opts_t  sopts;
 		dynamic_opts_t dopts;

 		static_opts_init(&sopts);
 		dynamic_opts_init(&dopts);

 		sopts.null_out_result_on_error = true;
 		sopts.set_errno_on_error = true;
 		sopts.oom_string =
 		    "<jemalloc>: Error in realloc(): out of memory\n";

 		dopts.result = &ret;
 		dopts.num_items = 1;
 		dopts.item_size = size;

 		imalloc(&sopts, &dopts);
 		if (sopts.slow) {
 			uintptr_t args[3] = {(uintptr_t)ptr, size};
 			hook_invoke_alloc(
 			    hook_alloc_realloc, ret, (uintptr_t)ret, args);
 		}
 		LOG("core.realloc.exit", "result: %p", ret);
 		return ret;
 	}
 }

 JEMALLOC_ALWAYS_INLINE size_t
 ixallocx_helper(tsdn_t *tsdn, void *ptr, size_t old_usize, size_t size,
     size_t extra, size_t alignment, bool zero) {
 	size_t newsize;

 	if (ixalloc(
 	        tsdn, ptr, old_usize, size, extra, alignment, zero, &newsize)) {
 		return old_usize;
 	}

 	return newsize;
 }

 static size_t
 ixallocx_prof_sample(tsdn_t *tsdn, void *ptr, size_t old_usize, size_t size,
     size_t extra, size_t alignment, bool zero, prof_tctx_t *tctx) {
 	/* Sampled allocation needs to be page aligned. */
 	if (tctx == NULL || !prof_sample_aligned(ptr)) {
 		return old_usize;
 	}

 	return ixallocx_helper(
 	    tsdn, ptr, old_usize, size, extra, alignment, zero);
 }

 JEMALLOC_ALWAYS_INLINE size_t
 ixallocx_prof(tsd_t *tsd, void *ptr, size_t old_usize, size_t size,
     size_t extra, size_t alignment, bool zero, emap_alloc_ctx_t *alloc_ctx) {
 	/*
 	 * old_prof_info is only used for asserting that the profiling info
 	 * isn't changed by the ixalloc() call.
 	 */
 	prof_info_t old_prof_info;
 	prof_info_get(tsd, ptr, alloc_ctx, &old_prof_info);

 	/*
 	 * usize isn't knowable before ixalloc() returns when extra is non-zero.
 	 * Therefore, compute its maximum possible value and use that in
 	 * prof_alloc_prep() to decide whether to capture a backtrace.
 	 * prof_realloc() will use the actual usize to decide whether to sample.
 	 */
 	size_t usize_max;
 	if (aligned_usize_get(
 	        size + extra, alignment, &usize_max, NULL, false)) {
 		/*
 		 * usize_max is out of range, and chances are that allocation
 		 * will fail, but use the maximum possible value and carry on
 		 * with prof_alloc_prep(), just in case allocation succeeds.
 		 */
 		usize_max = SC_LARGE_MAXCLASS;
 	}
 	bool prof_active = prof_active_get_unlocked();
 	bool sample_event = te_prof_sample_event_lookahead(tsd, usize_max);
 	prof_tctx_t *tctx = prof_alloc_prep(tsd, prof_active, sample_event);

 	size_t usize;
 	if (unlikely(tctx != PROF_TCTX_SENTINEL)) {
 		usize = ixallocx_prof_sample(tsd_tsdn(tsd), ptr, old_usize,
 		    size, extra, alignment, zero, tctx);
 	} else {
 		usize = ixallocx_helper(tsd_tsdn(tsd), ptr, old_usize, size,
 		    extra, alignment, zero);
 	}

 	/*
 	 * At this point we can still safely get the original profiling
 	 * information associated with the ptr, because (a) the edata_t object
 	 * associated with the ptr still lives and (b) the profiling info
 	 * fields are not touched.  "(a)" is asserted in the outer je_xallocx()
 	 * function, and "(b)" is indirectly verified below by checking that
 	 * the alloc_tctx field is unchanged.
 	 */
 	prof_info_t prof_info;
 	if (usize == old_usize) {
 		prof_info_get(tsd, ptr, alloc_ctx, &prof_info);
 		prof_alloc_rollback(tsd, tctx);
 	} else {
 		/*
 		 * Need to retrieve the new alloc_ctx since the modification
 		 * to edata has already been done.
 		 */
 		emap_alloc_ctx_t new_alloc_ctx;
 		emap_alloc_ctx_lookup(
 		    tsd_tsdn(tsd), &arena_emap_global, ptr, &new_alloc_ctx);
 		prof_info_get_and_reset_recent(
 		    tsd, ptr, &new_alloc_ctx, &prof_info);
 		assert(usize <= usize_max);
 		sample_event = te_prof_sample_event_lookahead(tsd, usize);
 		prof_realloc(tsd, ptr, size, usize, tctx, prof_active, ptr,
 		    old_usize, &prof_info, sample_event);
 	}

 	assert(old_prof_info.alloc_tctx == prof_info.alloc_tctx);
 	return usize;
 }

 JEMALLOC_EXPORT size_t JEMALLOC_NOTHROW
 je_xallocx(void *ptr, size_t size, size_t extra, int flags) {
 	tsd_t *tsd;
 	size_t usize, old_usize;
 	size_t alignment = MALLOCX_ALIGN_GET(flags);
 	bool   zero = zero_get(MALLOCX_ZERO_GET(flags), /* slow */ true);

 	LOG("core.xallocx.entry",
 	    "ptr: %p, size: %zu, extra: %zu, "
 	    "flags: %d",
 	    ptr, size, extra, flags);

 	assert(ptr != NULL);
 	assert(size != 0);
 	assert(SIZE_T_MAX - size >= extra);
 	assert(malloc_initialized() || IS_INITIALIZER);
 	tsd = tsd_fetch();
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	/*
 	 * old_edata is only for verifying that xallocx() keeps the edata_t
 	 * object associated with the ptr (though the content of the edata_t
 	 * object can be changed).
 	 */
 	edata_t *old_edata = emap_edata_lookup(
 	    tsd_tsdn(tsd), &arena_emap_global, ptr);

 	emap_alloc_ctx_t alloc_ctx;
 	emap_alloc_ctx_lookup(
 	    tsd_tsdn(tsd), &arena_emap_global, ptr, &alloc_ctx);
 	assert(alloc_ctx.szind != SC_NSIZES);
 	old_usize = emap_alloc_ctx_usize_get(&alloc_ctx);
 	assert(old_usize == isalloc(tsd_tsdn(tsd), ptr));
 	/*
 	 * The API explicitly absolves itself of protecting against (size +
 	 * extra) numerical overflow, but we may need to clamp extra to avoid
 	 * exceeding SC_LARGE_MAXCLASS.
 	 *
 	 * Ordinarily, size limit checking is handled deeper down, but here we
 	 * have to check as part of (size + extra) clamping, since we need the
 	 * clamped value in the above helper functions.
 	 */
 	if (unlikely(size > SC_LARGE_MAXCLASS)) {
 		usize = old_usize;
 		goto label_not_resized;
 	}
 	if (unlikely(SC_LARGE_MAXCLASS - size < extra)) {
 		extra = SC_LARGE_MAXCLASS - size;
 	}

 	if (config_prof && opt_prof) {
 		usize = ixallocx_prof(tsd, ptr, old_usize, size, extra,
 		    alignment, zero, &alloc_ctx);
 	} else {
 		usize = ixallocx_helper(tsd_tsdn(tsd), ptr, old_usize, size,
 		    extra, alignment, zero);
 	}

 	/*
 	 * xallocx() should keep using the same edata_t object (though its
 	 * content can be changed).
 	 */
 	assert(emap_edata_lookup(tsd_tsdn(tsd), &arena_emap_global, ptr)
 	    == old_edata);

 	if (unlikely(usize == old_usize)) {
 		goto label_not_resized;
 	}
 	thread_alloc_event(tsd, usize);
 	thread_dalloc_event(tsd, old_usize);

 	if (config_fill && unlikely(opt_junk_alloc) && usize > old_usize
 	    && !zero) {
 		size_t excess_len = usize - old_usize;
 		void  *excess_start = (void *)((byte_t *)ptr + old_usize);
 		junk_alloc_callback(excess_start, excess_len);
 	}
 label_not_resized:
 	if (unlikely(!tsd_fast(tsd))) {
 		uintptr_t args[4] = {(uintptr_t)ptr, size, extra, flags};
 		hook_invoke_expand(hook_expand_xallocx, ptr, old_usize, usize,
 		    (uintptr_t)usize, args);
 	}

 	UTRACE(ptr, size, ptr);
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	LOG("core.xallocx.exit", "result: %zu", usize);
 	return usize;
 }

 JEMALLOC_EXPORT size_t JEMALLOC_NOTHROW
 JEMALLOC_ATTR(pure) je_sallocx(const void *ptr, int flags) {
 	size_t  usize;
 	tsdn_t *tsdn;

 	LOG("core.sallocx.entry", "ptr: %p, flags: %d", ptr, flags);

 	assert(malloc_initialized() || IS_INITIALIZER);
 	assert(ptr != NULL);

 	tsdn = tsdn_fetch();
 	check_entry_exit_locking(tsdn);

 	if (config_debug || force_ivsalloc) {
 		usize = ivsalloc(tsdn, ptr);
 		assert(force_ivsalloc || usize != 0);
 	} else {
 		usize = isalloc(tsdn, ptr);
 	}

 	check_entry_exit_locking(tsdn);

 	LOG("core.sallocx.exit", "result: %zu", usize);
 	return usize;
 }

 JEMALLOC_EXPORT void JEMALLOC_NOTHROW
 je_dallocx(void *ptr, int flags) {
 	LOG("core.dallocx.entry", "ptr: %p, flags: %d", ptr, flags);

 	assert(ptr != NULL);
 	assert(malloc_initialized() || IS_INITIALIZER);

 	tsd_t *tsd = tsd_fetch_min();
 	bool   fast = tsd_fast(tsd);
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	unsigned  tcache_ind = mallocx_tcache_get(flags);
 	tcache_t *tcache = tcache_get_from_ind(tsd, tcache_ind, !fast,
 	    /* is_alloc */ false);

 	UTRACE(ptr, 0, 0);
 	if (likely(fast)) {
 		tsd_assert_fast(tsd);
 		ifree(tsd, ptr, tcache, false);
 	} else {
 		uintptr_t args_raw[3] = {(uintptr_t)ptr, flags};
 		hook_invoke_dalloc(hook_dalloc_dallocx, ptr, args_raw);
 		ifree(tsd, ptr, tcache, true);
 	}
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	LOG("core.dallocx.exit", "");
 }

 JEMALLOC_ALWAYS_INLINE size_t
 inallocx(tsdn_t *tsdn, size_t size, int flags) {
 	check_entry_exit_locking(tsdn);
 	size_t usize;
 	/* In case of out of range, let the user see it rather than fail. */
 	aligned_usize_get(size, MALLOCX_ALIGN_GET(flags), &usize, NULL, false);
 	check_entry_exit_locking(tsdn);
 	return usize;
 }

 JEMALLOC_NOINLINE void
 sdallocx_default(void *ptr, size_t size, int flags) {
 	assert(ptr != NULL);
 	assert(malloc_initialized() || IS_INITIALIZER);

 	tsd_t *tsd = tsd_fetch_min();
 	bool   fast = tsd_fast(tsd);
 	size_t usize = inallocx(tsd_tsdn(tsd), size, flags);
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	unsigned  tcache_ind = mallocx_tcache_get(flags);
 	tcache_t *tcache = tcache_get_from_ind(tsd, tcache_ind, !fast,
 	    /* is_alloc */ false);

 	UTRACE(ptr, 0, 0);
 	if (likely(fast)) {
 		tsd_assert_fast(tsd);
 		isfree(tsd, ptr, usize, tcache, false);
 	} else {
 		uintptr_t args_raw[3] = {(uintptr_t)ptr, size, flags};
 		hook_invoke_dalloc(hook_dalloc_sdallocx, ptr, args_raw);
 		isfree(tsd, ptr, usize, tcache, true);
 	}
 	check_entry_exit_locking(tsd_tsdn(tsd));
 }

 JEMALLOC_EXPORT void JEMALLOC_NOTHROW
 je_sdallocx(void *ptr, size_t size, int flags) {
 	LOG("core.sdallocx.entry", "ptr: %p, size: %zu, flags: %d", ptr, size,
 	    flags);

 	je_sdallocx_impl(ptr, size, flags);

 	LOG("core.sdallocx.exit", "");
 }

 JEMALLOC_EXPORT size_t JEMALLOC_NOTHROW
 JEMALLOC_ATTR(pure) je_nallocx(size_t size, int flags) {
 	size_t  usize;
 	tsdn_t *tsdn;

 	assert(size != 0);

 	if (unlikely(malloc_init())) {
 		LOG("core.nallocx.exit", "result: %zu", ZU(0));
 		return 0;
 	}

 	tsdn = tsdn_fetch();
 	check_entry_exit_locking(tsdn);

 	usize = inallocx(tsdn, size, flags);
 	if (unlikely(usize > SC_LARGE_MAXCLASS)) {
 		LOG("core.nallocx.exit", "result: %zu", ZU(0));
 		return 0;
 	}

 	check_entry_exit_locking(tsdn);
 	LOG("core.nallocx.exit", "result: %zu", usize);
 	return usize;
 }

 JEMALLOC_EXPORT int JEMALLOC_NOTHROW
 je_mallctl(
     const char *name, void *oldp, size_t *oldlenp, void *newp, size_t newlen) {
 	int    ret;
 	tsd_t *tsd;

 	LOG("core.mallctl.entry", "name: %s", name);

 	if (unlikely(malloc_init())) {
 		LOG("core.mallctl.exit", "result: %d", EAGAIN);
 		return EAGAIN;
 	}

 	tsd = tsd_fetch();
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	ret = ctl_byname(tsd, name, oldp, oldlenp, newp, newlen);
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	LOG("core.mallctl.exit", "result: %d", ret);
 	return ret;
 }

 JEMALLOC_EXPORT int JEMALLOC_NOTHROW
 je_mallctlnametomib(const char *name, size_t *mibp, size_t *miblenp) {
 	int ret;

 	LOG("core.mallctlnametomib.entry", "name: %s", name);

 	if (unlikely(malloc_init())) {
 		LOG("core.mallctlnametomib.exit", "result: %d", EAGAIN);
 		return EAGAIN;
 	}

 	tsd_t *tsd = tsd_fetch();
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	ret = ctl_nametomib(tsd, name, mibp, miblenp);
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	LOG("core.mallctlnametomib.exit", "result: %d", ret);
 	return ret;
 }

 JEMALLOC_EXPORT int JEMALLOC_NOTHROW
 je_mallctlbymib(const size_t *mib, size_t miblen, void *oldp, size_t *oldlenp,
     void *newp, size_t newlen) {
 	int    ret;
 	tsd_t *tsd;

 	LOG("core.mallctlbymib.entry", "");

 	if (unlikely(malloc_init())) {
 		LOG("core.mallctlbymib.exit", "result: %d", EAGAIN);
 		return EAGAIN;
 	}

 	tsd = tsd_fetch();
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	ret = ctl_bymib(tsd, mib, miblen, oldp, oldlenp, newp, newlen);
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	LOG("core.mallctlbymib.exit", "result: %d", ret);
 	return ret;
 }

 #define STATS_PRINT_BUFSIZE 65536
 JEMALLOC_EXPORT void JEMALLOC_NOTHROW
 je_malloc_stats_print(
     void (*write_cb)(void *, const char *), void *cbopaque, const char *opts) {
 	tsdn_t *tsdn;

 	LOG("core.malloc_stats_print.entry", "");

 	tsdn = tsdn_fetch();
 	check_entry_exit_locking(tsdn);

 	if (config_debug) {
 		stats_print(write_cb, cbopaque, opts);
 	} else {
 		buf_writer_t buf_writer;
 		buf_writer_init(tsdn, &buf_writer, write_cb, cbopaque, NULL,
 		    STATS_PRINT_BUFSIZE);
 		stats_print(buf_writer_cb, &buf_writer, opts);
 		buf_writer_terminate(tsdn, &buf_writer);
 	}

 	check_entry_exit_locking(tsdn);
 	LOG("core.malloc_stats_print.exit", "");
 }
 #undef STATS_PRINT_BUFSIZE

 JEMALLOC_ALWAYS_INLINE size_t
 je_malloc_usable_size_impl(JEMALLOC_USABLE_SIZE_CONST void *ptr) {
 	assert(malloc_initialized() || IS_INITIALIZER);

 	tsdn_t *tsdn = tsdn_fetch();
 	check_entry_exit_locking(tsdn);

 	size_t ret;
 	if (unlikely(ptr == NULL)) {
 		ret = 0;
 	} else {
 		if (config_debug || force_ivsalloc) {
 			ret = ivsalloc(tsdn, ptr);
 			assert(force_ivsalloc || ret != 0);
 		} else {
 			ret = isalloc(tsdn, ptr);
 		}
 	}
 	check_entry_exit_locking(tsdn);

 	return ret;
 }

 JEMALLOC_EXPORT size_t JEMALLOC_NOTHROW
 je_malloc_usable_size(JEMALLOC_USABLE_SIZE_CONST void *ptr) {
 	LOG("core.malloc_usable_size.entry", "ptr: %p", ptr);

 	size_t ret = je_malloc_usable_size_impl(ptr);

 	LOG("core.malloc_usable_size.exit", "result: %zu", ret);
 	return ret;
 }

 #ifdef JEMALLOC_HAVE_MALLOC_SIZE
 JEMALLOC_EXPORT size_t JEMALLOC_NOTHROW
 je_malloc_size(const void *ptr) {
 	LOG("core.malloc_size.entry", "ptr: %p", ptr);

 	size_t ret = je_malloc_usable_size_impl(ptr);

 	LOG("core.malloc_size.exit", "result: %zu", ret);
 	return ret;
 }
 #endif

 static void
 batch_alloc_prof_sample_assert(tsd_t *tsd, size_t batch, size_t usize) {
 	assert(config_prof && opt_prof);
 	bool prof_sample_event = te_prof_sample_event_lookahead(
 	    tsd, batch * usize);
 	assert(!prof_sample_event);
 	size_t surplus;
 	prof_sample_event = te_prof_sample_event_lookahead_surplus(
 	    tsd, (batch + 1) * usize, &surplus);
 	assert(prof_sample_event);
 	assert(surplus < usize);
 }

 size_t
 batch_alloc(void **ptrs, size_t num, size_t size, int flags) {
 	LOG("core.batch_alloc.entry",
 	    "ptrs: %p, num: %zu, size: %zu, flags: %d", ptrs, num, size, flags);

 	tsd_t *tsd = tsd_fetch();
 	check_entry_exit_locking(tsd_tsdn(tsd));

 	size_t filled = 0;

 	if (unlikely(tsd == NULL || tsd_reentrancy_level_get(tsd) > 0)) {
 		goto label_done;
 	}

 	size_t alignment = MALLOCX_ALIGN_GET(flags);
 	size_t usize;
 	if (aligned_usize_get(size, alignment, &usize, NULL, false)) {
 		goto label_done;
 	}
 	szind_t ind = sz_size2index(usize);
 	bool    zero = zero_get(MALLOCX_ZERO_GET(flags), /* slow */ true);

 	/*
 	 * The cache bin and arena will be lazily initialized; it's hard to
 	 * know in advance whether each of them needs to be initialized.
 	 */
 	cache_bin_t *bin = NULL;
 	arena_t     *arena = NULL;

 	size_t nregs = 0;
 	if (likely(ind < SC_NBINS)) {
 		nregs = bin_infos[ind].nregs;
 		assert(nregs > 0);
 	}

 	while (filled < num) {
 		size_t batch = num - filled;
 		size_t surplus = SIZE_MAX; /* Dead store. */
 		bool   prof_sample_event = config_prof && opt_prof
 		    && prof_active_get_unlocked()
 		    && te_prof_sample_event_lookahead_surplus(
 		        tsd, batch * usize, &surplus);

 		if (prof_sample_event) {
 			/*
 			 * Adjust so that the batch does not trigger prof
 			 * sampling.
 			 */
 			batch -= surplus / usize + 1;
 			batch_alloc_prof_sample_assert(tsd, batch, usize);
 		}

 		size_t progress = 0;

 		if (likely(ind < SC_NBINS) && batch >= nregs) {
 			if (arena == NULL) {
 				unsigned arena_ind = mallocx_arena_get(flags);
 				if (arena_get_from_ind(
 				        tsd, arena_ind, &arena)) {
 					goto label_done;
 				}
 				if (arena == NULL) {
 					arena = arena_choose(tsd, NULL);
 				}
 				if (unlikely(arena == NULL)) {
 					goto label_done;
 				}
 			}
 			size_t arena_batch = batch - batch % nregs;
 			size_t n = arena_fill_small_fresh(tsd_tsdn(tsd), arena,
 			    ind, ptrs + filled, arena_batch, zero);
 			progress += n;
 			filled += n;
 		}

 		unsigned  tcache_ind = mallocx_tcache_get(flags);
 		tcache_t *tcache = tcache_get_from_ind(tsd, tcache_ind,
 		    /* slow */ true, /* is_alloc */ true);
 		if (likely(tcache != NULL
 		        && ind < tcache_nbins_get(tcache->tcache_slow)
 		        && !tcache_bin_disabled(
 		            ind, &tcache->bins[ind], tcache->tcache_slow))
 		    && progress < batch) {
 			if (bin == NULL) {
 				bin = &tcache->bins[ind];
 			}
 			/*
 			 * If we don't have a tcache bin, we don't want to
 			 * immediately give up, because there's the possibility
 			 * that the user explicitly requested to bypass the
 			 * tcache, or that the user explicitly turned off the
 			 * tcache; in such cases, we go through the slow path,
 			 * i.e. the mallocx() call at the end of the while loop.
 			 */
 			if (bin != NULL) {
 				size_t bin_batch = batch - progress;
 				/*
 				 * n can be less than bin_batch, meaning that
 				 * the cache bin does not have enough memory.
 				 * In such cases, we rely on the slow path,
 				 * i.e. the mallocx() call at the end of the
 				 * while loop, to fill in the cache, and in the
 				 * next iteration of the while loop, the tcache
 				 * will contain a lot of memory, and we can
 				 * harvest them here.  Compared to the
 				 * alternative approach where we directly go to
 				 * the arena bins here, the overhead of our
 				 * current approach should usually be minimal,
 				 * since we never try to fetch more memory than
 				 * what a slab contains via the tcache.  An
 				 * additional benefit is that the tcache will
 				 * not be empty for the next allocation request.
 				 */
 				size_t n = cache_bin_alloc_batch(
 				    bin, bin_batch, ptrs + filled);
 				if (config_stats) {
 					bin->tstats.nrequests += n;
 				}
 				if (zero) {
 					for (size_t i = 0; i < n; ++i) {
 						memset(
 						    ptrs[filled + i], 0, usize);
 					}
 				}
 				if (config_prof && opt_prof
 				    && unlikely(ind >= SC_NBINS)) {
 					for (size_t i = 0; i < n; ++i) {
 						prof_tctx_reset_sampled(
 						    tsd, ptrs[filled + i]);
 					}
 				}
 				progress += n;
 				filled += n;
 			}
 		}

 		/*
 		 * For thread events other than prof sampling, trigger them as
 		 * if there's a single allocation of size (n * usize).  This is
 		 * fine because:
 		 * (a) these events do not alter the allocation itself, and
 		 * (b) it's possible that some event would have been triggered
 		 *     multiple times, instead of only once, if the allocations
 		 *     were handled individually, but it would do no harm (or
 		 *     even be beneficial) to coalesce the triggerings.
 		 */
 		thread_alloc_event(tsd, progress * usize);

 		if (progress < batch || prof_sample_event) {
 			void *p = je_mallocx(size, flags);
 			if (p == NULL) { /* OOM */
 				break;
 			}
 			if (progress == batch) {
 				assert(prof_sampled(tsd, p));
 			}
 			ptrs[filled++] = p;
 		}
 	}

 label_done:
 	check_entry_exit_locking(tsd_tsdn(tsd));
 	LOG("core.batch_alloc.exit", "result: %zu", filled);
 	return filled;
 }

 /*
  * End non-standard functions.
  */
 /******************************************************************************/
 /*
  * The following functions are used by threading libraries for protection of
  * malloc during fork().
  */

 /*
  * If an application creates a thread before doing any allocation in the main
  * thread, then calls fork(2) in the main thread followed by memory allocation
  * in the child process, a race can occur that results in deadlock within the
  * child: the main thread may have forked while the created thread had
  * partially initialized the allocator.  Ordinarily jemalloc prevents
  * fork/malloc races via the following functions it registers during
  * initialization using pthread_atfork(), but of course that does no good if
  * the allocator isn't fully initialized at fork time.  The following library
  * constructor is a partial solution to this problem.  It may still be possible
  * to trigger the deadlock described above, but doing so would involve forking
  * via a library constructor that runs before jemalloc's runs.
  */
 #ifndef JEMALLOC_JET
 JEMALLOC_ATTR(constructor)
 static void
 jemalloc_constructor(void) {
 	malloc_init();
 }
 #endif

 #ifndef JEMALLOC_MUTEX_INIT_CB
 void
 jemalloc_prefork(void)
 #else
 JEMALLOC_EXPORT void
 _malloc_prefork(void)
 #endif
 {
 	tsd_t   *tsd;
 	unsigned i, j, narenas;
 	arena_t *arena;

 #ifdef JEMALLOC_MUTEX_INIT_CB
 	if (!malloc_initialized()) {
 		return;
 	}
 #endif
 	assert(malloc_initialized());

 	tsd = tsd_fetch();

 	narenas = narenas_total_get();

 	witness_prefork(tsd_witness_tsdp_get(tsd));
 	/* Acquire all mutexes in a safe order. */
 	ctl_prefork(tsd_tsdn(tsd));
 	tcache_prefork(tsd_tsdn(tsd));
 	malloc_mutex_prefork(tsd_tsdn(tsd), &arenas_lock);
 	if (have_background_thread) {
 		background_thread_prefork0(tsd_tsdn(tsd));
 	}
 	prof_prefork0(tsd_tsdn(tsd));
 	if (have_background_thread) {
 		background_thread_prefork1(tsd_tsdn(tsd));
 	}
 	/* Break arena prefork into stages to preserve lock order. */
 	for (i = 0; i < 9; i++) {
 		for (j = 0; j < narenas; j++) {
 			if ((arena = arena_get(tsd_tsdn(tsd), j, false))
 			    != NULL) {
 				switch (i) {
 				case 0:
 					arena_prefork0(tsd_tsdn(tsd), arena);
 					break;
 				case 1:
 					arena_prefork1(tsd_tsdn(tsd), arena);
 					break;
 				case 2:
 					arena_prefork2(tsd_tsdn(tsd), arena);
 					break;
 				case 3:
 					arena_prefork3(tsd_tsdn(tsd), arena);
 					break;
 				case 4:
 					arena_prefork4(tsd_tsdn(tsd), arena);
 					break;
 				case 5:
 					arena_prefork5(tsd_tsdn(tsd), arena);
 					break;
 				case 6:
 					arena_prefork6(tsd_tsdn(tsd), arena);
 					break;
 				case 7:
 					arena_prefork7(tsd_tsdn(tsd), arena);
 					break;
 				case 8:
 					arena_prefork8(tsd_tsdn(tsd), arena);
 					break;
 				default:
 					not_reached();
 				}
 			}
 		}
 	}
 	prof_prefork1(tsd_tsdn(tsd));
 	stats_prefork(tsd_tsdn(tsd));
 	tsd_prefork(tsd);
 }

 #ifndef JEMALLOC_MUTEX_INIT_CB
 void
 jemalloc_postfork_parent(void)
 #else
 JEMALLOC_EXPORT void
 _malloc_postfork(void)
 #endif
 {
 	tsd_t   *tsd;
 	unsigned i, narenas;

 #ifdef JEMALLOC_MUTEX_INIT_CB
 	if (!malloc_initialized()) {
 		return;
 	}
 #endif
 	assert(malloc_initialized());

 	tsd = tsd_fetch();

 	tsd_postfork_parent(tsd);

 	witness_postfork_parent(tsd_witness_tsdp_get(tsd));
 	/* Release all mutexes, now that fork() has completed. */
 	stats_postfork_parent(tsd_tsdn(tsd));
 	for (i = 0, narenas = narenas_total_get(); i < narenas; i++) {
 		arena_t *arena;

 		if ((arena = arena_get(tsd_tsdn(tsd), i, false)) != NULL) {
 			arena_postfork_parent(tsd_tsdn(tsd), arena);
 		}
 	}
 	prof_postfork_parent(tsd_tsdn(tsd));
 	if (have_background_thread) {
 		background_thread_postfork_parent(tsd_tsdn(tsd));
 	}
 	malloc_mutex_postfork_parent(tsd_tsdn(tsd), &arenas_lock);
 	tcache_postfork_parent(tsd_tsdn(tsd));
 	ctl_postfork_parent(tsd_tsdn(tsd));
 }

 void
 jemalloc_postfork_child(void) {
 	tsd_t   *tsd;
 	unsigned i, narenas;

 	assert(malloc_initialized());

 	tsd = tsd_fetch();

 	tsd_postfork_child(tsd);

 	witness_postfork_child(tsd_witness_tsdp_get(tsd));
 	/* Release all mutexes, now that fork() has completed. */
 	stats_postfork_child(tsd_tsdn(tsd));
 	for (i = 0, narenas = narenas_total_get(); i < narenas; i++) {
 		arena_t *arena;

 		if ((arena = arena_get(tsd_tsdn(tsd), i, false)) != NULL) {
 			arena_postfork_child(tsd_tsdn(tsd), arena);
 		}
 	}
 	prof_postfork_child(tsd_tsdn(tsd));
 	if (have_background_thread) {
 		background_thread_postfork_child(tsd_tsdn(tsd));
 	}
 	malloc_mutex_postfork_child(tsd_tsdn(tsd), &arenas_lock);
 	tcache_postfork_child(tsd_tsdn(tsd));
 	ctl_postfork_child(tsd_tsdn(tsd));
 }

 /******************************************************************************/