1. Add tcache_max and nhbins to tcache_t so that they are per-tcache; since there is one auto tcache per thread, they are also per-thread. 2. Add a mallctl for each thread to set its own tcache_max (that of its auto tcache). 3. Store the maximum number of items in each bin instead of using global storage. 4. Add tests for the modifications above. 5. Rename `nhbins` and `tcache_maxclass` to `global_do_not_change_nhbins` and `global_do_not_change_tcache_maxclass`.
260 lines
7.3 KiB
C
260 lines
7.3 KiB
C
#ifndef JEMALLOC_INTERNAL_TCACHE_INLINES_H
|
|
#define JEMALLOC_INTERNAL_TCACHE_INLINES_H
|
|
|
|
#include "jemalloc/internal/jemalloc_preamble.h"
|
|
#include "jemalloc/internal/arena_externs.h"
|
|
#include "jemalloc/internal/bin.h"
|
|
#include "jemalloc/internal/jemalloc_internal_inlines_b.h"
|
|
#include "jemalloc/internal/jemalloc_internal_types.h"
|
|
#include "jemalloc/internal/large_externs.h"
|
|
#include "jemalloc/internal/san.h"
|
|
#include "jemalloc/internal/sc.h"
|
|
#include "jemalloc/internal/sz.h"
|
|
#include "jemalloc/internal/tcache_externs.h"
|
|
#include "jemalloc/internal/util.h"
|
|
|
|
static inline bool
|
|
tcache_enabled_get(tsd_t *tsd) {
|
|
return tsd_tcache_enabled_get(tsd);
|
|
}
|
|
|
|
static inline void
|
|
tcache_enabled_set(tsd_t *tsd, bool enabled) {
|
|
bool was_enabled = tsd_tcache_enabled_get(tsd);
|
|
|
|
if (!was_enabled && enabled) {
|
|
tsd_tcache_data_init(tsd, NULL);
|
|
} else if (was_enabled && !enabled) {
|
|
tcache_cleanup(tsd);
|
|
}
|
|
/* Commit the state last. Above calls check current state. */
|
|
tsd_tcache_enabled_set(tsd, enabled);
|
|
tsd_slow_update(tsd);
|
|
}
|
|
|
|
static inline unsigned
|
|
tcache_nhbins_get(tcache_t *tcache) {
|
|
assert(tcache != NULL);
|
|
assert(tcache->tcache_nhbins <= TCACHE_NBINS_MAX);
|
|
return tcache->tcache_nhbins;
|
|
}
|
|
|
|
static inline size_t
|
|
tcache_max_get(tcache_t *tcache) {
|
|
assert(tcache != NULL);
|
|
assert(tcache->tcache_max <= TCACHE_MAXCLASS_LIMIT);
|
|
return tcache->tcache_max;
|
|
}
|
|
|
|
static inline void
|
|
tcache_max_and_nhbins_set(tcache_t *tcache, size_t tcache_max) {
|
|
assert(tcache != NULL);
|
|
assert(tcache_max <= TCACHE_MAXCLASS_LIMIT);
|
|
tcache->tcache_max = tcache_max;
|
|
tcache->tcache_nhbins = sz_size2index(tcache_max) + 1;
|
|
}
|
|
|
|
static inline void
|
|
thread_tcache_max_and_nhbins_set(tsd_t *tsd, size_t tcache_max) {
|
|
assert(tcache_max <= TCACHE_MAXCLASS_LIMIT);
|
|
assert(tcache_max == sz_s2u(tcache_max));
|
|
tcache_t *tcache = tsd_tcachep_get(tsd);
|
|
tcache_slow_t *tcache_slow;
|
|
assert(tcache != NULL);
|
|
|
|
bool enabled = tcache_available(tsd);
|
|
arena_t *assigned_arena;
|
|
if (enabled) {
|
|
tcache_slow = tcache_slow_get(tsd);
|
|
assert(tcache != NULL && tcache_slow != NULL);
|
|
assigned_arena = tcache_slow->arena;
|
|
/* Shutdown and reboot the tcache for a clean slate. */
|
|
tcache_cleanup(tsd);
|
|
}
|
|
|
|
/*
|
|
* Still set tcache_max and tcache_nhbins of the tcache even if
|
|
* the tcache is not available yet because the values are
|
|
* stored in tsd_t and are always available for changing.
|
|
*/
|
|
tcache_max_and_nhbins_set(tcache, tcache_max);
|
|
|
|
if (enabled) {
|
|
tsd_tcache_data_init(tsd, assigned_arena);
|
|
}
|
|
|
|
assert(tcache_nhbins_get(tcache) == sz_size2index(tcache_max) + 1);
|
|
}
|
|
|
|
JEMALLOC_ALWAYS_INLINE bool
|
|
tcache_small_bin_disabled(szind_t ind, cache_bin_t *bin) {
|
|
assert(ind < SC_NBINS);
|
|
assert(bin != NULL);
|
|
bool ret = cache_bin_info_ncached_max(&bin->bin_info) == 0;
|
|
if (ret) {
|
|
/* small size class but cache bin disabled. */
|
|
assert((uintptr_t)(*bin->stack_head) ==
|
|
cache_bin_preceding_junk);
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
JEMALLOC_ALWAYS_INLINE bool
|
|
tcache_large_bin_disabled(szind_t ind, cache_bin_t *bin) {
|
|
assert(ind >= SC_NBINS);
|
|
assert(bin != NULL);
|
|
return (cache_bin_info_ncached_max(&bin->bin_info) == 0 ||
|
|
cache_bin_still_zero_initialized(bin));
|
|
}
|
|
|
|
JEMALLOC_ALWAYS_INLINE void *
|
|
tcache_alloc_small(tsd_t *tsd, arena_t *arena, tcache_t *tcache,
|
|
size_t size, szind_t binind, bool zero, bool slow_path) {
|
|
void *ret;
|
|
bool tcache_success;
|
|
|
|
assert(binind < SC_NBINS);
|
|
cache_bin_t *bin = &tcache->bins[binind];
|
|
ret = cache_bin_alloc(bin, &tcache_success);
|
|
assert(tcache_success == (ret != NULL));
|
|
if (unlikely(!tcache_success)) {
|
|
bool tcache_hard_success;
|
|
arena = arena_choose(tsd, arena);
|
|
if (unlikely(arena == NULL)) {
|
|
return NULL;
|
|
}
|
|
if (unlikely(tcache_small_bin_disabled(binind, bin))) {
|
|
/* stats and zero are handled directly by the arena. */
|
|
return arena_malloc_hard(tsd_tsdn(tsd), arena, size,
|
|
binind, zero, /* slab */ true);
|
|
}
|
|
tcache_bin_flush_stashed(tsd, tcache, bin, binind,
|
|
/* is_small */ true);
|
|
|
|
ret = tcache_alloc_small_hard(tsd_tsdn(tsd), arena, tcache,
|
|
bin, binind, &tcache_hard_success);
|
|
if (tcache_hard_success == false) {
|
|
return NULL;
|
|
}
|
|
}
|
|
|
|
assert(ret);
|
|
if (unlikely(zero)) {
|
|
size_t usize = sz_index2size(binind);
|
|
assert(tcache_salloc(tsd_tsdn(tsd), ret) == usize);
|
|
memset(ret, 0, usize);
|
|
}
|
|
if (config_stats) {
|
|
bin->tstats.nrequests++;
|
|
}
|
|
return ret;
|
|
}
|
|
|
|
JEMALLOC_ALWAYS_INLINE void *
|
|
tcache_alloc_large(tsd_t *tsd, arena_t *arena, tcache_t *tcache, size_t size,
|
|
szind_t binind, bool zero, bool slow_path) {
|
|
void *ret;
|
|
bool tcache_success;
|
|
|
|
assert(binind >= SC_NBINS && binind < tcache_nhbins_get(tcache));
|
|
cache_bin_t *bin = &tcache->bins[binind];
|
|
ret = cache_bin_alloc(bin, &tcache_success);
|
|
assert(tcache_success == (ret != NULL));
|
|
if (unlikely(!tcache_success)) {
|
|
/*
|
|
* Only allocate one large object at a time, because it's quite
|
|
* expensive to create one and not use it.
|
|
*/
|
|
arena = arena_choose(tsd, arena);
|
|
if (unlikely(arena == NULL)) {
|
|
return NULL;
|
|
}
|
|
tcache_bin_flush_stashed(tsd, tcache, bin, binind,
|
|
/* is_small */ false);
|
|
|
|
ret = large_malloc(tsd_tsdn(tsd), arena, sz_s2u(size), zero);
|
|
if (ret == NULL) {
|
|
return NULL;
|
|
}
|
|
} else {
|
|
if (unlikely(zero)) {
|
|
size_t usize = sz_index2size(binind);
|
|
assert(usize <= tcache_max_get(tcache));
|
|
memset(ret, 0, usize);
|
|
}
|
|
|
|
if (config_stats) {
|
|
bin->tstats.nrequests++;
|
|
}
|
|
}
|
|
|
|
return ret;
|
|
}
|
|
|
|
JEMALLOC_ALWAYS_INLINE void
|
|
tcache_dalloc_small(tsd_t *tsd, tcache_t *tcache, void *ptr, szind_t binind,
|
|
bool slow_path) {
|
|
assert(tcache_salloc(tsd_tsdn(tsd), ptr) <= SC_SMALL_MAXCLASS);
|
|
|
|
cache_bin_t *bin = &tcache->bins[binind];
|
|
/*
|
|
* Not marking the branch unlikely because this is past free_fastpath()
|
|
* (which handles the most common cases), i.e. at this point it's often
|
|
* uncommon cases.
|
|
*/
|
|
if (cache_bin_nonfast_aligned(ptr)) {
|
|
/* Junk unconditionally, even if bin is full. */
|
|
san_junk_ptr(ptr, sz_index2size(binind));
|
|
if (cache_bin_stash(bin, ptr)) {
|
|
return;
|
|
}
|
|
assert(cache_bin_full(bin));
|
|
/* Bin full; fall through into the flush branch. */
|
|
}
|
|
|
|
if (unlikely(!cache_bin_dalloc_easy(bin, ptr))) {
|
|
if (unlikely(tcache_small_bin_disabled(binind, bin))) {
|
|
arena_dalloc_small(tsd_tsdn(tsd), ptr);
|
|
return;
|
|
}
|
|
cache_bin_sz_t max = cache_bin_info_ncached_max(
|
|
&bin->bin_info);
|
|
unsigned remain = max >> opt_lg_tcache_flush_small_div;
|
|
tcache_bin_flush_small(tsd, tcache, bin, binind, remain);
|
|
bool ret = cache_bin_dalloc_easy(bin, ptr);
|
|
assert(ret);
|
|
}
|
|
}
|
|
|
|
JEMALLOC_ALWAYS_INLINE void
|
|
tcache_dalloc_large(tsd_t *tsd, tcache_t *tcache, void *ptr, szind_t binind,
|
|
bool slow_path) {
|
|
|
|
assert(tcache_salloc(tsd_tsdn(tsd), ptr) > SC_SMALL_MAXCLASS);
|
|
assert(tcache_salloc(tsd_tsdn(tsd), ptr) <= tcache_max_get(tcache));
|
|
|
|
cache_bin_t *bin = &tcache->bins[binind];
|
|
if (unlikely(!cache_bin_dalloc_easy(bin, ptr))) {
|
|
unsigned remain = cache_bin_info_ncached_max(
|
|
&bin->bin_info) >> opt_lg_tcache_flush_large_div;
|
|
tcache_bin_flush_large(tsd, tcache, bin, binind, remain);
|
|
bool ret = cache_bin_dalloc_easy(bin, ptr);
|
|
assert(ret);
|
|
}
|
|
}
|
|
|
|
/*
 * Look up the explicit tcache registered at index ind of the tcaches array.
 *
 * A NULL entry is treated as an invalid id: a message is printed and the
 * process aborts.  An entry equal to TCACHES_ELM_NEED_REINIT is replaced by
 * a tcache newly created with tcache_create_explicit() before being
 * returned.  ind is not range-checked here.
 */
JEMALLOC_ALWAYS_INLINE tcache_t *
tcaches_get(tsd_t *tsd, unsigned ind) {
	tcaches_t *slot = &tcaches[ind];

	if (unlikely(slot->tcache == NULL)) {
		malloc_printf("<jemalloc>: invalid tcache id (%u).\n", ind);
		abort();
	}
	if (unlikely(slot->tcache == TCACHES_ELM_NEED_REINIT)) {
		slot->tcache = tcache_create_explicit(tsd);
	}
	return slot->tcache;
}
|
|
|
|
#endif /* JEMALLOC_INTERNAL_TCACHE_INLINES_H */
|