1102 lines
26 KiB
C
1102 lines
26 KiB
C
#include "jemalloc/internal/jemalloc_preamble.h"
|
|
#include "jemalloc/internal/jemalloc_internal_includes.h"
|
|
|
|
#include "jemalloc/internal/ctl.h"
|
|
#include "jemalloc/internal/assert.h"
|
|
#include "jemalloc/internal/mutex.h"
|
|
#include "jemalloc/internal/counter.h"
|
|
#include "jemalloc/internal/prof_data.h"
|
|
#include "jemalloc/internal/prof_log.h"
|
|
#include "jemalloc/internal/prof_recent.h"
|
|
#include "jemalloc/internal/prof_sys.h"
|
|
#include "jemalloc/internal/thread_event.h"
|
|
|
|
/*
|
|
* This file implements the profiling "APIs" needed by other parts of jemalloc,
|
|
* and also manages the relevant "operational" data, mainly options and mutexes;
|
|
* the core profiling data structures are encapsulated in prof_data.c.
|
|
*/
|
|
|
|
/******************************************************************************/
|
|
|
|
#ifdef JEMALLOC_PROF_LIBUNWIND
|
|
#define UNW_LOCAL_ONLY
|
|
#include <libunwind.h>
|
|
#endif
|
|
|
|
#ifdef JEMALLOC_PROF_LIBGCC
|
|
/*
|
|
* We have a circular dependency -- jemalloc_internal.h tells us if we should
|
|
* use libgcc's unwinding functionality, but after we've included that, we've
|
|
* already hooked _Unwind_Backtrace. We'll temporarily disable hooking.
|
|
*/
|
|
#undef _Unwind_Backtrace
|
|
#include <unwind.h>
|
|
#define _Unwind_Backtrace JEMALLOC_HOOK(_Unwind_Backtrace, test_hooks_libc_hook)
|
|
#endif
|
|
|
|
/******************************************************************************/
|
|
/* Data. */
|
|
|
|
bool opt_prof = false;
|
|
bool opt_prof_active = true;
|
|
bool opt_prof_thread_active_init = true;
|
|
size_t opt_lg_prof_sample = LG_PROF_SAMPLE_DEFAULT;
|
|
ssize_t opt_lg_prof_interval = LG_PROF_INTERVAL_DEFAULT;
|
|
bool opt_prof_gdump = false;
|
|
bool opt_prof_final = false;
|
|
bool opt_prof_leak = false;
|
|
bool opt_prof_accum = false;
|
|
char opt_prof_prefix[PROF_DUMP_FILENAME_LEN];
|
|
bool opt_prof_sys_thread_name = false;
|
|
|
|
/* Accessed via prof_sample_event_handler(). */
|
|
static counter_accum_t prof_idump_accumulated;
|
|
|
|
/*
|
|
* Initialized as opt_prof_active, and accessed via
|
|
* prof_active_[gs]et{_unlocked,}().
|
|
*/
|
|
bool prof_active;
|
|
static malloc_mutex_t prof_active_mtx;
|
|
|
|
/*
|
|
* Initialized as opt_prof_thread_active_init, and accessed via
|
|
* prof_thread_active_init_[gs]et().
|
|
*/
|
|
static bool prof_thread_active_init;
|
|
static malloc_mutex_t prof_thread_active_init_mtx;
|
|
|
|
/*
|
|
* Initialized as opt_prof_gdump, and accessed via
|
|
* prof_gdump_[gs]et{_unlocked,}().
|
|
*/
|
|
bool prof_gdump_val;
|
|
static malloc_mutex_t prof_gdump_mtx;
|
|
|
|
uint64_t prof_interval = 0;
|
|
|
|
size_t lg_prof_sample;
|
|
|
|
/* Non static to enable profiling. */
|
|
malloc_mutex_t bt2gctx_mtx;
|
|
|
|
malloc_mutex_t tdatas_mtx;
|
|
|
|
static uint64_t next_thr_uid;
|
|
static malloc_mutex_t next_thr_uid_mtx;
|
|
|
|
static malloc_mutex_t prof_dump_filename_mtx;
|
|
static uint64_t prof_dump_seq;
|
|
static uint64_t prof_dump_iseq;
|
|
static uint64_t prof_dump_mseq;
|
|
static uint64_t prof_dump_useq;
|
|
|
|
/* The fallback allocator profiling functionality will use. */
|
|
base_t *prof_base;
|
|
|
|
malloc_mutex_t prof_dump_mtx;
|
|
static char *prof_dump_prefix = NULL;
|
|
|
|
/* Do not dump any profiles until bootstrapping is complete. */
|
|
bool prof_booted = false;
|
|
|
|
/******************************************************************************/
|
|
|
|
/*
|
|
* If profiling is off, then PROF_DUMP_FILENAME_LEN is 1, so we'll end up
|
|
* calling strncpy with a size of 0, which triggers a -Wstringop-truncation
|
|
* warning (strncpy can never actually be called in this case, since we bail out
|
|
* much earlier when config_prof is false). This function works around the
|
|
* warning to let us leave the warning on.
|
|
*/
|
|
static inline void
|
|
prof_strncpy(char *UNUSED dest, const char *UNUSED src, size_t UNUSED size) {
|
|
cassert(config_prof);
|
|
#ifdef JEMALLOC_PROF
|
|
strncpy(dest, src, size);
|
|
#endif
|
|
}
|
|
|
|
void
|
|
prof_alloc_rollback(tsd_t *tsd, prof_tctx_t *tctx) {
|
|
cassert(config_prof);
|
|
|
|
if (tsd_reentrancy_level_get(tsd) > 0) {
|
|
assert((uintptr_t)tctx == (uintptr_t)1U);
|
|
return;
|
|
}
|
|
|
|
if ((uintptr_t)tctx > (uintptr_t)1U) {
|
|
malloc_mutex_lock(tsd_tsdn(tsd), tctx->tdata->lock);
|
|
tctx->prepared = false;
|
|
prof_tctx_try_destroy(tsd, tctx);
|
|
}
|
|
}
|
|
|
|
void
|
|
prof_malloc_sample_object(tsd_t *tsd, const void *ptr, size_t size,
|
|
size_t usize, prof_tctx_t *tctx) {
|
|
if (opt_prof_sys_thread_name) {
|
|
prof_sys_thread_name_fetch(tsd);
|
|
}
|
|
|
|
edata_t *edata = emap_edata_lookup(tsd_tsdn(tsd), &arena_emap_global,
|
|
ptr);
|
|
prof_info_set(tsd, edata, tctx);
|
|
|
|
malloc_mutex_lock(tsd_tsdn(tsd), tctx->tdata->lock);
|
|
tctx->cnts.curobjs++;
|
|
tctx->cnts.curbytes += usize;
|
|
if (opt_prof_accum) {
|
|
tctx->cnts.accumobjs++;
|
|
tctx->cnts.accumbytes += usize;
|
|
}
|
|
bool record_recent = prof_recent_alloc_prepare(tsd, tctx);
|
|
tctx->prepared = false;
|
|
malloc_mutex_unlock(tsd_tsdn(tsd), tctx->tdata->lock);
|
|
if (record_recent) {
|
|
assert(tctx == edata_prof_tctx_get(edata));
|
|
prof_recent_alloc(tsd, edata, size);
|
|
}
|
|
}
|
|
|
|
void
|
|
prof_free_sampled_object(tsd_t *tsd, size_t usize, prof_info_t *prof_info) {
|
|
assert(prof_info != NULL);
|
|
prof_tctx_t *tctx = prof_info->alloc_tctx;
|
|
assert((uintptr_t)tctx > (uintptr_t)1U);
|
|
|
|
malloc_mutex_lock(tsd_tsdn(tsd), tctx->tdata->lock);
|
|
|
|
assert(tctx->cnts.curobjs > 0);
|
|
assert(tctx->cnts.curbytes >= usize);
|
|
tctx->cnts.curobjs--;
|
|
tctx->cnts.curbytes -= usize;
|
|
|
|
prof_try_log(tsd, usize, prof_info);
|
|
|
|
prof_tctx_try_destroy(tsd, tctx);
|
|
}
|
|
|
|
void
|
|
bt_init(prof_bt_t *bt, void **vec) {
|
|
cassert(config_prof);
|
|
|
|
bt->vec = vec;
|
|
bt->len = 0;
|
|
}
|
|
|
|
#ifdef JEMALLOC_PROF_LIBUNWIND
|
|
static void
|
|
prof_backtrace_impl(prof_bt_t *bt) {
|
|
int nframes;
|
|
|
|
cassert(config_prof);
|
|
assert(bt->len == 0);
|
|
assert(bt->vec != NULL);
|
|
|
|
nframes = unw_backtrace(bt->vec, PROF_BT_MAX);
|
|
if (nframes <= 0) {
|
|
return;
|
|
}
|
|
bt->len = nframes;
|
|
}
|
|
#elif (defined(JEMALLOC_PROF_LIBGCC))
|
|
static _Unwind_Reason_Code
|
|
prof_unwind_init_callback(struct _Unwind_Context *context, void *arg) {
|
|
cassert(config_prof);
|
|
|
|
return _URC_NO_REASON;
|
|
}
|
|
|
|
static _Unwind_Reason_Code
|
|
prof_unwind_callback(struct _Unwind_Context *context, void *arg) {
|
|
prof_unwind_data_t *data = (prof_unwind_data_t *)arg;
|
|
void *ip;
|
|
|
|
cassert(config_prof);
|
|
|
|
ip = (void *)_Unwind_GetIP(context);
|
|
if (ip == NULL) {
|
|
return _URC_END_OF_STACK;
|
|
}
|
|
data->bt->vec[data->bt->len] = ip;
|
|
data->bt->len++;
|
|
if (data->bt->len == data->max) {
|
|
return _URC_END_OF_STACK;
|
|
}
|
|
|
|
return _URC_NO_REASON;
|
|
}
|
|
|
|
static void
|
|
prof_backtrace_impl(prof_bt_t *bt) {
|
|
prof_unwind_data_t data = {bt, PROF_BT_MAX};
|
|
|
|
cassert(config_prof);
|
|
|
|
_Unwind_Backtrace(prof_unwind_callback, &data);
|
|
}
|
|
#elif (defined(JEMALLOC_PROF_GCC))
|
|
static void
|
|
prof_backtrace_impl(prof_bt_t *bt) {
|
|
#define BT_FRAME(i) \
|
|
if ((i) < PROF_BT_MAX) { \
|
|
void *p; \
|
|
if (__builtin_frame_address(i) == 0) { \
|
|
return; \
|
|
} \
|
|
p = __builtin_return_address(i); \
|
|
if (p == NULL) { \
|
|
return; \
|
|
} \
|
|
bt->vec[(i)] = p; \
|
|
bt->len = (i) + 1; \
|
|
} else { \
|
|
return; \
|
|
}
|
|
|
|
cassert(config_prof);
|
|
|
|
BT_FRAME(0)
|
|
BT_FRAME(1)
|
|
BT_FRAME(2)
|
|
BT_FRAME(3)
|
|
BT_FRAME(4)
|
|
BT_FRAME(5)
|
|
BT_FRAME(6)
|
|
BT_FRAME(7)
|
|
BT_FRAME(8)
|
|
BT_FRAME(9)
|
|
|
|
BT_FRAME(10)
|
|
BT_FRAME(11)
|
|
BT_FRAME(12)
|
|
BT_FRAME(13)
|
|
BT_FRAME(14)
|
|
BT_FRAME(15)
|
|
BT_FRAME(16)
|
|
BT_FRAME(17)
|
|
BT_FRAME(18)
|
|
BT_FRAME(19)
|
|
|
|
BT_FRAME(20)
|
|
BT_FRAME(21)
|
|
BT_FRAME(22)
|
|
BT_FRAME(23)
|
|
BT_FRAME(24)
|
|
BT_FRAME(25)
|
|
BT_FRAME(26)
|
|
BT_FRAME(27)
|
|
BT_FRAME(28)
|
|
BT_FRAME(29)
|
|
|
|
BT_FRAME(30)
|
|
BT_FRAME(31)
|
|
BT_FRAME(32)
|
|
BT_FRAME(33)
|
|
BT_FRAME(34)
|
|
BT_FRAME(35)
|
|
BT_FRAME(36)
|
|
BT_FRAME(37)
|
|
BT_FRAME(38)
|
|
BT_FRAME(39)
|
|
|
|
BT_FRAME(40)
|
|
BT_FRAME(41)
|
|
BT_FRAME(42)
|
|
BT_FRAME(43)
|
|
BT_FRAME(44)
|
|
BT_FRAME(45)
|
|
BT_FRAME(46)
|
|
BT_FRAME(47)
|
|
BT_FRAME(48)
|
|
BT_FRAME(49)
|
|
|
|
BT_FRAME(50)
|
|
BT_FRAME(51)
|
|
BT_FRAME(52)
|
|
BT_FRAME(53)
|
|
BT_FRAME(54)
|
|
BT_FRAME(55)
|
|
BT_FRAME(56)
|
|
BT_FRAME(57)
|
|
BT_FRAME(58)
|
|
BT_FRAME(59)
|
|
|
|
BT_FRAME(60)
|
|
BT_FRAME(61)
|
|
BT_FRAME(62)
|
|
BT_FRAME(63)
|
|
BT_FRAME(64)
|
|
BT_FRAME(65)
|
|
BT_FRAME(66)
|
|
BT_FRAME(67)
|
|
BT_FRAME(68)
|
|
BT_FRAME(69)
|
|
|
|
BT_FRAME(70)
|
|
BT_FRAME(71)
|
|
BT_FRAME(72)
|
|
BT_FRAME(73)
|
|
BT_FRAME(74)
|
|
BT_FRAME(75)
|
|
BT_FRAME(76)
|
|
BT_FRAME(77)
|
|
BT_FRAME(78)
|
|
BT_FRAME(79)
|
|
|
|
BT_FRAME(80)
|
|
BT_FRAME(81)
|
|
BT_FRAME(82)
|
|
BT_FRAME(83)
|
|
BT_FRAME(84)
|
|
BT_FRAME(85)
|
|
BT_FRAME(86)
|
|
BT_FRAME(87)
|
|
BT_FRAME(88)
|
|
BT_FRAME(89)
|
|
|
|
BT_FRAME(90)
|
|
BT_FRAME(91)
|
|
BT_FRAME(92)
|
|
BT_FRAME(93)
|
|
BT_FRAME(94)
|
|
BT_FRAME(95)
|
|
BT_FRAME(96)
|
|
BT_FRAME(97)
|
|
BT_FRAME(98)
|
|
BT_FRAME(99)
|
|
|
|
BT_FRAME(100)
|
|
BT_FRAME(101)
|
|
BT_FRAME(102)
|
|
BT_FRAME(103)
|
|
BT_FRAME(104)
|
|
BT_FRAME(105)
|
|
BT_FRAME(106)
|
|
BT_FRAME(107)
|
|
BT_FRAME(108)
|
|
BT_FRAME(109)
|
|
|
|
BT_FRAME(110)
|
|
BT_FRAME(111)
|
|
BT_FRAME(112)
|
|
BT_FRAME(113)
|
|
BT_FRAME(114)
|
|
BT_FRAME(115)
|
|
BT_FRAME(116)
|
|
BT_FRAME(117)
|
|
BT_FRAME(118)
|
|
BT_FRAME(119)
|
|
|
|
BT_FRAME(120)
|
|
BT_FRAME(121)
|
|
BT_FRAME(122)
|
|
BT_FRAME(123)
|
|
BT_FRAME(124)
|
|
BT_FRAME(125)
|
|
BT_FRAME(126)
|
|
BT_FRAME(127)
|
|
#undef BT_FRAME
|
|
}
|
|
#else
|
|
static void
|
|
prof_backtrace_impl(prof_bt_t *bt) {
|
|
cassert(config_prof);
|
|
not_reached();
|
|
}
|
|
#endif
|
|
|
|
void
|
|
prof_backtrace(tsd_t *tsd, prof_bt_t *bt) {
|
|
cassert(config_prof);
|
|
pre_reentrancy(tsd, NULL);
|
|
prof_backtrace_impl(bt);
|
|
post_reentrancy(tsd);
|
|
}
|
|
|
|
/*
|
|
* The bodies of this function and prof_leakcheck() are compiled out unless heap
|
|
* profiling is enabled, so that it is possible to compile jemalloc with
|
|
* floating point support completely disabled. Avoiding floating point code is
|
|
* important on memory-constrained systems, but it also enables a workaround for
|
|
* versions of glibc that don't properly save/restore floating point registers
|
|
* during dynamic lazy symbol loading (which internally calls into whatever
|
|
* malloc implementation happens to be integrated into the application). Note
|
|
* that some compilers (e.g. gcc 4.8) may use floating point registers for fast
|
|
* memory moves, so jemalloc must be compiled with such optimizations disabled
|
|
* (e.g.
|
|
* -mno-sse) in order for the workaround to be complete.
|
|
*/
|
|
uint64_t
|
|
prof_sample_new_event_wait(tsd_t *tsd) {
|
|
#ifdef JEMALLOC_PROF
|
|
if (lg_prof_sample == 0) {
|
|
return TE_MIN_START_WAIT;
|
|
}
|
|
|
|
/*
|
|
* Compute sample interval as a geometrically distributed random
|
|
* variable with mean (2^lg_prof_sample).
|
|
*
|
|
* __ __
|
|
* | log(u) | 1
|
|
* bytes_until_sample = | -------- |, where p = ---------------
|
|
* | log(1-p) | lg_prof_sample
|
|
* 2
|
|
*
|
|
* For more information on the math, see:
|
|
*
|
|
* Non-Uniform Random Variate Generation
|
|
* Luc Devroye
|
|
* Springer-Verlag, New York, 1986
|
|
* pp 500
|
|
* (http://luc.devroye.org/rnbookindex.html)
|
|
*
|
|
* In the actual computation, there's a non-zero probability that our
|
|
* pseudo random number generator generates an exact 0, and to avoid
|
|
* log(0), we set u to 1.0 in case r is 0. Therefore u effectively is
|
|
* uniformly distributed in (0, 1] instead of [0, 1). Further, rather
|
|
* than taking the ceiling, we take the floor and then add 1, since
|
|
* otherwise bytes_until_sample would be 0 if u is exactly 1.0.
|
|
*/
|
|
uint64_t r = prng_lg_range_u64(tsd_prng_statep_get(tsd), 53);
|
|
double u = (r == 0U) ? 1.0 : (double)r * (1.0/9007199254740992.0L);
|
|
return (uint64_t)(log(u) /
|
|
log(1.0 - (1.0 / (double)((uint64_t)1U << lg_prof_sample))))
|
|
+ (uint64_t)1U;
|
|
#else
|
|
not_reached();
|
|
return TE_MAX_START_WAIT;
|
|
#endif
|
|
}
|
|
|
|
uint64_t
|
|
prof_sample_postponed_event_wait(tsd_t *tsd) {
|
|
/*
|
|
* The postponed wait time for prof sample event is computed as if we
|
|
* want a new wait time (i.e. as if the event were triggered). If we
|
|
* instead postpone to the immediate next allocation, like how we're
|
|
* handling the other events, then we can have sampling bias, if e.g.
|
|
* the allocation immediately following a reentrancy always comes from
|
|
* the same stack trace.
|
|
*/
|
|
return prof_sample_new_event_wait(tsd);
|
|
}
|
|
|
|
void
|
|
prof_sample_event_handler(tsd_t *tsd, uint64_t elapsed) {
|
|
cassert(config_prof);
|
|
assert(elapsed > 0 && elapsed != TE_INVALID_ELAPSED);
|
|
if (prof_interval == 0 || !prof_active_get_unlocked()) {
|
|
return;
|
|
}
|
|
if (counter_accum(tsd_tsdn(tsd), &prof_idump_accumulated, elapsed)) {
|
|
prof_idump(tsd_tsdn(tsd));
|
|
}
|
|
}
|
|
|
|
int
|
|
prof_getpid(void) {
|
|
#ifdef _WIN32
|
|
return GetCurrentProcessId();
|
|
#else
|
|
return getpid();
|
|
#endif
|
|
}
|
|
|
|
static const char *
|
|
prof_dump_prefix_get(tsdn_t* tsdn) {
|
|
malloc_mutex_assert_owner(tsdn, &prof_dump_filename_mtx);
|
|
|
|
return prof_dump_prefix == NULL ? opt_prof_prefix : prof_dump_prefix;
|
|
}
|
|
|
|
static bool
|
|
prof_dump_prefix_is_empty(tsdn_t *tsdn) {
|
|
malloc_mutex_lock(tsdn, &prof_dump_filename_mtx);
|
|
bool ret = (prof_dump_prefix_get(tsdn)[0] == '\0');
|
|
malloc_mutex_unlock(tsdn, &prof_dump_filename_mtx);
|
|
return ret;
|
|
}
|
|
|
|
#define DUMP_FILENAME_BUFSIZE (PATH_MAX + 1)
|
|
#define VSEQ_INVALID UINT64_C(0xffffffffffffffff)
|
|
static void
|
|
prof_dump_filename(tsd_t *tsd, char *filename, char v, uint64_t vseq) {
|
|
cassert(config_prof);
|
|
|
|
assert(tsd_reentrancy_level_get(tsd) == 0);
|
|
const char *prof_prefix = prof_dump_prefix_get(tsd_tsdn(tsd));
|
|
|
|
if (vseq != VSEQ_INVALID) {
|
|
/* "<prefix>.<pid>.<seq>.v<vseq>.heap" */
|
|
malloc_snprintf(filename, DUMP_FILENAME_BUFSIZE,
|
|
"%s.%d.%"FMTu64".%c%"FMTu64".heap",
|
|
prof_prefix, prof_getpid(), prof_dump_seq, v, vseq);
|
|
} else {
|
|
/* "<prefix>.<pid>.<seq>.<v>.heap" */
|
|
malloc_snprintf(filename, DUMP_FILENAME_BUFSIZE,
|
|
"%s.%d.%"FMTu64".%c.heap",
|
|
prof_prefix, prof_getpid(), prof_dump_seq, v);
|
|
}
|
|
prof_dump_seq++;
|
|
}
|
|
|
|
void
|
|
prof_get_default_filename(tsdn_t *tsdn, char *filename, uint64_t ind) {
|
|
malloc_mutex_lock(tsdn, &prof_dump_filename_mtx);
|
|
malloc_snprintf(filename, PROF_DUMP_FILENAME_LEN,
|
|
"%s.%d.%"FMTu64".json", prof_dump_prefix_get(tsdn), prof_getpid(),
|
|
ind);
|
|
malloc_mutex_unlock(tsdn, &prof_dump_filename_mtx);
|
|
}
|
|
|
|
static void
|
|
prof_fdump(void) {
|
|
tsd_t *tsd;
|
|
char filename[DUMP_FILENAME_BUFSIZE];
|
|
|
|
cassert(config_prof);
|
|
assert(opt_prof_final);
|
|
|
|
if (!prof_booted) {
|
|
return;
|
|
}
|
|
tsd = tsd_fetch();
|
|
assert(tsd_reentrancy_level_get(tsd) == 0);
|
|
assert(!prof_dump_prefix_is_empty(tsd_tsdn(tsd)));
|
|
|
|
malloc_mutex_lock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
prof_dump_filename(tsd, filename, 'f', VSEQ_INVALID);
|
|
malloc_mutex_unlock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
prof_dump(tsd, false, filename, opt_prof_leak);
|
|
}
|
|
|
|
static bool
|
|
prof_idump_accum_init(void) {
|
|
cassert(config_prof);
|
|
|
|
return counter_accum_init(&prof_idump_accumulated, prof_interval);
|
|
}
|
|
|
|
bool
|
|
prof_dump_prefix_set(tsdn_t *tsdn, const char *prefix) {
|
|
cassert(config_prof);
|
|
ctl_mtx_assert_held(tsdn);
|
|
malloc_mutex_lock(tsdn, &prof_dump_filename_mtx);
|
|
if (prof_dump_prefix == NULL) {
|
|
malloc_mutex_unlock(tsdn, &prof_dump_filename_mtx);
|
|
/* Everything is still guarded by ctl_mtx. */
|
|
char *buffer = base_alloc(tsdn, prof_base,
|
|
PROF_DUMP_FILENAME_LEN, QUANTUM);
|
|
if (buffer == NULL) {
|
|
return true;
|
|
}
|
|
malloc_mutex_lock(tsdn, &prof_dump_filename_mtx);
|
|
prof_dump_prefix = buffer;
|
|
}
|
|
assert(prof_dump_prefix != NULL);
|
|
|
|
prof_strncpy(prof_dump_prefix, prefix, PROF_DUMP_FILENAME_LEN - 1);
|
|
prof_dump_prefix[PROF_DUMP_FILENAME_LEN - 1] = '\0';
|
|
malloc_mutex_unlock(tsdn, &prof_dump_filename_mtx);
|
|
|
|
return false;
|
|
}
|
|
|
|
void
|
|
prof_idump(tsdn_t *tsdn) {
|
|
tsd_t *tsd;
|
|
prof_tdata_t *tdata;
|
|
|
|
cassert(config_prof);
|
|
|
|
if (!prof_booted || tsdn_null(tsdn) || !prof_active_get_unlocked()) {
|
|
return;
|
|
}
|
|
tsd = tsdn_tsd(tsdn);
|
|
if (tsd_reentrancy_level_get(tsd) > 0) {
|
|
return;
|
|
}
|
|
|
|
tdata = prof_tdata_get(tsd, true);
|
|
if (tdata == NULL) {
|
|
return;
|
|
}
|
|
if (tdata->enq) {
|
|
tdata->enq_idump = true;
|
|
return;
|
|
}
|
|
|
|
malloc_mutex_lock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
if (prof_dump_prefix_get(tsd_tsdn(tsd))[0] == '\0') {
|
|
malloc_mutex_unlock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
return;
|
|
}
|
|
char filename[PATH_MAX + 1];
|
|
prof_dump_filename(tsd, filename, 'i', prof_dump_iseq);
|
|
prof_dump_iseq++;
|
|
malloc_mutex_unlock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
prof_dump(tsd, false, filename, false);
|
|
}
|
|
|
|
bool
|
|
prof_mdump(tsd_t *tsd, const char *filename) {
|
|
cassert(config_prof);
|
|
assert(tsd_reentrancy_level_get(tsd) == 0);
|
|
|
|
if (!opt_prof || !prof_booted) {
|
|
return true;
|
|
}
|
|
char filename_buf[DUMP_FILENAME_BUFSIZE];
|
|
if (filename == NULL) {
|
|
/* No filename specified, so automatically generate one. */
|
|
malloc_mutex_lock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
if (prof_dump_prefix_get(tsd_tsdn(tsd))[0] == '\0') {
|
|
malloc_mutex_unlock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
return true;
|
|
}
|
|
prof_dump_filename(tsd, filename_buf, 'm', prof_dump_mseq);
|
|
prof_dump_mseq++;
|
|
malloc_mutex_unlock(tsd_tsdn(tsd), &prof_dump_filename_mtx);
|
|
filename = filename_buf;
|
|
}
|
|
return prof_dump(tsd, true, filename, false);
|
|
}
|
|
|
|
void
|
|
prof_gdump(tsdn_t *tsdn) {
|
|
tsd_t *tsd;
|
|
prof_tdata_t *tdata;
|
|
|
|
cassert(config_prof);
|
|
|
|
if (!prof_booted || tsdn_null(tsdn) || !prof_active_get_unlocked()) {
|
|
return;
|
|
}
|
|
tsd = tsdn_tsd(tsdn);
|
|
if (tsd_reentrancy_level_get(tsd) > 0) {
|
|
return;
|
|
}
|
|
|
|
tdata = prof_tdata_get(tsd, false);
|
|
if (tdata == NULL) {
|
|
return;
|
|
}
|
|
if (tdata->enq) {
|
|
tdata->enq_gdump = true;
|
|
return;
|
|
}
|
|
|
|
malloc_mutex_lock(tsdn, &prof_dump_filename_mtx);
|
|
if (prof_dump_prefix_get(tsdn)[0] == '\0') {
|
|
malloc_mutex_unlock(tsdn, &prof_dump_filename_mtx);
|
|
return;
|
|
}
|
|
char filename[DUMP_FILENAME_BUFSIZE];
|
|
prof_dump_filename(tsd, filename, 'u', prof_dump_useq);
|
|
prof_dump_useq++;
|
|
malloc_mutex_unlock(tsdn, &prof_dump_filename_mtx);
|
|
prof_dump(tsd, false, filename, false);
|
|
}
|
|
|
|
static uint64_t
|
|
prof_thr_uid_alloc(tsdn_t *tsdn) {
|
|
uint64_t thr_uid;
|
|
|
|
malloc_mutex_lock(tsdn, &next_thr_uid_mtx);
|
|
thr_uid = next_thr_uid;
|
|
next_thr_uid++;
|
|
malloc_mutex_unlock(tsdn, &next_thr_uid_mtx);
|
|
|
|
return thr_uid;
|
|
}
|
|
|
|
prof_tdata_t *
|
|
prof_tdata_init(tsd_t *tsd) {
|
|
return prof_tdata_init_impl(tsd, prof_thr_uid_alloc(tsd_tsdn(tsd)), 0,
|
|
NULL, prof_thread_active_init_get(tsd_tsdn(tsd)));
|
|
}
|
|
|
|
prof_tdata_t *
|
|
prof_tdata_reinit(tsd_t *tsd, prof_tdata_t *tdata) {
|
|
uint64_t thr_uid = tdata->thr_uid;
|
|
uint64_t thr_discrim = tdata->thr_discrim + 1;
|
|
char *thread_name = (tdata->thread_name != NULL) ?
|
|
prof_thread_name_alloc(tsd, tdata->thread_name) : NULL;
|
|
bool active = tdata->active;
|
|
|
|
prof_tdata_detach(tsd, tdata);
|
|
return prof_tdata_init_impl(tsd, thr_uid, thr_discrim, thread_name,
|
|
active);
|
|
}
|
|
|
|
void
|
|
prof_tdata_cleanup(tsd_t *tsd) {
|
|
prof_tdata_t *tdata;
|
|
|
|
if (!config_prof) {
|
|
return;
|
|
}
|
|
|
|
tdata = tsd_prof_tdata_get(tsd);
|
|
if (tdata != NULL) {
|
|
prof_tdata_detach(tsd, tdata);
|
|
}
|
|
}
|
|
|
|
bool
|
|
prof_active_get(tsdn_t *tsdn) {
|
|
bool prof_active_current;
|
|
|
|
prof_active_assert();
|
|
malloc_mutex_lock(tsdn, &prof_active_mtx);
|
|
prof_active_current = prof_active;
|
|
malloc_mutex_unlock(tsdn, &prof_active_mtx);
|
|
return prof_active_current;
|
|
}
|
|
|
|
bool
|
|
prof_active_set(tsdn_t *tsdn, bool active) {
|
|
bool prof_active_old;
|
|
|
|
prof_active_assert();
|
|
malloc_mutex_lock(tsdn, &prof_active_mtx);
|
|
prof_active_old = prof_active;
|
|
prof_active = active;
|
|
malloc_mutex_unlock(tsdn, &prof_active_mtx);
|
|
prof_active_assert();
|
|
return prof_active_old;
|
|
}
|
|
|
|
const char *
|
|
prof_thread_name_get(tsd_t *tsd) {
|
|
assert(tsd_reentrancy_level_get(tsd) == 0);
|
|
|
|
prof_tdata_t *tdata;
|
|
|
|
tdata = prof_tdata_get(tsd, true);
|
|
if (tdata == NULL) {
|
|
return "";
|
|
}
|
|
return (tdata->thread_name != NULL ? tdata->thread_name : "");
|
|
}
|
|
|
|
int
|
|
prof_thread_name_set(tsd_t *tsd, const char *thread_name) {
|
|
if (opt_prof_sys_thread_name) {
|
|
return ENOENT;
|
|
} else {
|
|
return prof_thread_name_set_impl(tsd, thread_name);
|
|
}
|
|
}
|
|
|
|
bool
|
|
prof_thread_active_get(tsd_t *tsd) {
|
|
assert(tsd_reentrancy_level_get(tsd) == 0);
|
|
|
|
prof_tdata_t *tdata;
|
|
|
|
tdata = prof_tdata_get(tsd, true);
|
|
if (tdata == NULL) {
|
|
return false;
|
|
}
|
|
return tdata->active;
|
|
}
|
|
|
|
bool
|
|
prof_thread_active_set(tsd_t *tsd, bool active) {
|
|
assert(tsd_reentrancy_level_get(tsd) == 0);
|
|
|
|
prof_tdata_t *tdata;
|
|
|
|
tdata = prof_tdata_get(tsd, true);
|
|
if (tdata == NULL) {
|
|
return true;
|
|
}
|
|
tdata->active = active;
|
|
return false;
|
|
}
|
|
|
|
bool
|
|
prof_thread_active_init_get(tsdn_t *tsdn) {
|
|
bool active_init;
|
|
|
|
malloc_mutex_lock(tsdn, &prof_thread_active_init_mtx);
|
|
active_init = prof_thread_active_init;
|
|
malloc_mutex_unlock(tsdn, &prof_thread_active_init_mtx);
|
|
return active_init;
|
|
}
|
|
|
|
bool
|
|
prof_thread_active_init_set(tsdn_t *tsdn, bool active_init) {
|
|
bool active_init_old;
|
|
|
|
malloc_mutex_lock(tsdn, &prof_thread_active_init_mtx);
|
|
active_init_old = prof_thread_active_init;
|
|
prof_thread_active_init = active_init;
|
|
malloc_mutex_unlock(tsdn, &prof_thread_active_init_mtx);
|
|
return active_init_old;
|
|
}
|
|
|
|
bool
|
|
prof_gdump_get(tsdn_t *tsdn) {
|
|
bool prof_gdump_current;
|
|
|
|
malloc_mutex_lock(tsdn, &prof_gdump_mtx);
|
|
prof_gdump_current = prof_gdump_val;
|
|
malloc_mutex_unlock(tsdn, &prof_gdump_mtx);
|
|
return prof_gdump_current;
|
|
}
|
|
|
|
bool
|
|
prof_gdump_set(tsdn_t *tsdn, bool gdump) {
|
|
bool prof_gdump_old;
|
|
|
|
malloc_mutex_lock(tsdn, &prof_gdump_mtx);
|
|
prof_gdump_old = prof_gdump_val;
|
|
prof_gdump_val = gdump;
|
|
malloc_mutex_unlock(tsdn, &prof_gdump_mtx);
|
|
return prof_gdump_old;
|
|
}
|
|
|
|
void
|
|
prof_boot0(void) {
|
|
cassert(config_prof);
|
|
|
|
memcpy(opt_prof_prefix, PROF_PREFIX_DEFAULT,
|
|
sizeof(PROF_PREFIX_DEFAULT));
|
|
}
|
|
|
|
void
|
|
prof_boot1(void) {
|
|
cassert(config_prof);
|
|
|
|
/*
|
|
* opt_prof must be in its final state before any arenas are
|
|
* initialized, so this function must be executed early.
|
|
*/
|
|
|
|
if (opt_prof_leak && !opt_prof) {
|
|
/*
|
|
* Enable opt_prof, but in such a way that profiles are never
|
|
* automatically dumped.
|
|
*/
|
|
opt_prof = true;
|
|
opt_prof_gdump = false;
|
|
} else if (opt_prof) {
|
|
if (opt_lg_prof_interval >= 0) {
|
|
prof_interval = (((uint64_t)1U) <<
|
|
opt_lg_prof_interval);
|
|
}
|
|
}
|
|
}
|
|
|
|
bool
|
|
prof_boot2(tsd_t *tsd, base_t *base) {
|
|
cassert(config_prof);
|
|
|
|
if (opt_prof) {
|
|
unsigned i;
|
|
|
|
lg_prof_sample = opt_lg_prof_sample;
|
|
|
|
prof_active = opt_prof_active;
|
|
if (malloc_mutex_init(&prof_active_mtx, "prof_active",
|
|
WITNESS_RANK_PROF_ACTIVE, malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
|
|
prof_gdump_val = opt_prof_gdump;
|
|
if (malloc_mutex_init(&prof_gdump_mtx, "prof_gdump",
|
|
WITNESS_RANK_PROF_GDUMP, malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
|
|
prof_thread_active_init = opt_prof_thread_active_init;
|
|
if (malloc_mutex_init(&prof_thread_active_init_mtx,
|
|
"prof_thread_active_init",
|
|
WITNESS_RANK_PROF_THREAD_ACTIVE_INIT,
|
|
malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
|
|
if (prof_data_init(tsd)) {
|
|
return true;
|
|
}
|
|
|
|
if (malloc_mutex_init(&bt2gctx_mtx, "prof_bt2gctx",
|
|
WITNESS_RANK_PROF_BT2GCTX, malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
|
|
if (malloc_mutex_init(&tdatas_mtx, "prof_tdatas",
|
|
WITNESS_RANK_PROF_TDATAS, malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
|
|
next_thr_uid = 0;
|
|
if (malloc_mutex_init(&next_thr_uid_mtx, "prof_next_thr_uid",
|
|
WITNESS_RANK_PROF_NEXT_THR_UID, malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
|
|
if (prof_idump_accum_init()) {
|
|
return true;
|
|
}
|
|
|
|
if (malloc_mutex_init(&prof_dump_filename_mtx, "prof_dump_filename",
|
|
WITNESS_RANK_PROF_DUMP_FILENAME, malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
if (malloc_mutex_init(&prof_dump_mtx, "prof_dump",
|
|
WITNESS_RANK_PROF_DUMP, malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
|
|
if (opt_prof_final && opt_prof_prefix[0] != '\0' &&
|
|
atexit(prof_fdump) != 0) {
|
|
malloc_write("<jemalloc>: Error in atexit()\n");
|
|
if (opt_abort) {
|
|
abort();
|
|
}
|
|
}
|
|
|
|
if (prof_log_init(tsd)) {
|
|
return true;
|
|
}
|
|
|
|
if (prof_recent_init()) {
|
|
return true;
|
|
}
|
|
|
|
prof_base = base;
|
|
|
|
gctx_locks = (malloc_mutex_t *)base_alloc(tsd_tsdn(tsd), base,
|
|
PROF_NCTX_LOCKS * sizeof(malloc_mutex_t), CACHELINE);
|
|
if (gctx_locks == NULL) {
|
|
return true;
|
|
}
|
|
for (i = 0; i < PROF_NCTX_LOCKS; i++) {
|
|
if (malloc_mutex_init(&gctx_locks[i], "prof_gctx",
|
|
WITNESS_RANK_PROF_GCTX,
|
|
malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
}
|
|
|
|
tdata_locks = (malloc_mutex_t *)base_alloc(tsd_tsdn(tsd), base,
|
|
PROF_NTDATA_LOCKS * sizeof(malloc_mutex_t), CACHELINE);
|
|
if (tdata_locks == NULL) {
|
|
return true;
|
|
}
|
|
for (i = 0; i < PROF_NTDATA_LOCKS; i++) {
|
|
if (malloc_mutex_init(&tdata_locks[i], "prof_tdata",
|
|
WITNESS_RANK_PROF_TDATA,
|
|
malloc_mutex_rank_exclusive)) {
|
|
return true;
|
|
}
|
|
}
|
|
#ifdef JEMALLOC_PROF_LIBGCC
|
|
/*
|
|
* Cause the backtracing machinery to allocate its internal
|
|
* state before enabling profiling.
|
|
*/
|
|
_Unwind_Backtrace(prof_unwind_init_callback, NULL);
|
|
#endif
|
|
}
|
|
prof_booted = true;
|
|
|
|
return false;
|
|
}
|
|
|
|
void
|
|
prof_prefork0(tsdn_t *tsdn) {
|
|
if (config_prof && opt_prof) {
|
|
unsigned i;
|
|
|
|
malloc_mutex_prefork(tsdn, &prof_dump_mtx);
|
|
malloc_mutex_prefork(tsdn, &bt2gctx_mtx);
|
|
malloc_mutex_prefork(tsdn, &tdatas_mtx);
|
|
for (i = 0; i < PROF_NTDATA_LOCKS; i++) {
|
|
malloc_mutex_prefork(tsdn, &tdata_locks[i]);
|
|
}
|
|
malloc_mutex_prefork(tsdn, &log_mtx);
|
|
for (i = 0; i < PROF_NCTX_LOCKS; i++) {
|
|
malloc_mutex_prefork(tsdn, &gctx_locks[i]);
|
|
}
|
|
malloc_mutex_prefork(tsdn, &prof_recent_dump_mtx);
|
|
}
|
|
}
|
|
|
|
void
|
|
prof_prefork1(tsdn_t *tsdn) {
|
|
if (config_prof && opt_prof) {
|
|
counter_prefork(tsdn, &prof_idump_accumulated);
|
|
malloc_mutex_prefork(tsdn, &prof_active_mtx);
|
|
malloc_mutex_prefork(tsdn, &prof_dump_filename_mtx);
|
|
malloc_mutex_prefork(tsdn, &prof_gdump_mtx);
|
|
malloc_mutex_prefork(tsdn, &next_thr_uid_mtx);
|
|
malloc_mutex_prefork(tsdn, &prof_thread_active_init_mtx);
|
|
malloc_mutex_prefork(tsdn, &prof_recent_alloc_mtx);
|
|
}
|
|
}
|
|
|
|
void
|
|
prof_postfork_parent(tsdn_t *tsdn) {
|
|
if (config_prof && opt_prof) {
|
|
unsigned i;
|
|
|
|
malloc_mutex_postfork_parent(tsdn, &prof_recent_alloc_mtx);
|
|
malloc_mutex_postfork_parent(tsdn,
|
|
&prof_thread_active_init_mtx);
|
|
malloc_mutex_postfork_parent(tsdn, &next_thr_uid_mtx);
|
|
malloc_mutex_postfork_parent(tsdn, &prof_gdump_mtx);
|
|
malloc_mutex_postfork_parent(tsdn, &prof_dump_filename_mtx);
|
|
malloc_mutex_postfork_parent(tsdn, &prof_active_mtx);
|
|
counter_postfork_parent(tsdn, &prof_idump_accumulated);
|
|
malloc_mutex_postfork_parent(tsdn, &prof_recent_dump_mtx);
|
|
for (i = 0; i < PROF_NCTX_LOCKS; i++) {
|
|
malloc_mutex_postfork_parent(tsdn, &gctx_locks[i]);
|
|
}
|
|
malloc_mutex_postfork_parent(tsdn, &log_mtx);
|
|
for (i = 0; i < PROF_NTDATA_LOCKS; i++) {
|
|
malloc_mutex_postfork_parent(tsdn, &tdata_locks[i]);
|
|
}
|
|
malloc_mutex_postfork_parent(tsdn, &tdatas_mtx);
|
|
malloc_mutex_postfork_parent(tsdn, &bt2gctx_mtx);
|
|
malloc_mutex_postfork_parent(tsdn, &prof_dump_mtx);
|
|
}
|
|
}
|
|
|
|
void
|
|
prof_postfork_child(tsdn_t *tsdn) {
|
|
if (config_prof && opt_prof) {
|
|
unsigned i;
|
|
|
|
malloc_mutex_postfork_child(tsdn, &prof_recent_alloc_mtx);
|
|
malloc_mutex_postfork_child(tsdn, &prof_thread_active_init_mtx);
|
|
malloc_mutex_postfork_child(tsdn, &next_thr_uid_mtx);
|
|
malloc_mutex_postfork_child(tsdn, &prof_gdump_mtx);
|
|
malloc_mutex_postfork_child(tsdn, &prof_dump_filename_mtx);
|
|
malloc_mutex_postfork_child(tsdn, &prof_active_mtx);
|
|
counter_postfork_child(tsdn, &prof_idump_accumulated);
|
|
malloc_mutex_postfork_child(tsdn, &prof_recent_dump_mtx);
|
|
for (i = 0; i < PROF_NCTX_LOCKS; i++) {
|
|
malloc_mutex_postfork_child(tsdn, &gctx_locks[i]);
|
|
}
|
|
malloc_mutex_postfork_child(tsdn, &log_mtx);
|
|
for (i = 0; i < PROF_NTDATA_LOCKS; i++) {
|
|
malloc_mutex_postfork_child(tsdn, &tdata_locks[i]);
|
|
}
|
|
malloc_mutex_postfork_child(tsdn, &tdatas_mtx);
|
|
malloc_mutex_postfork_child(tsdn, &bt2gctx_mtx);
|
|
malloc_mutex_postfork_child(tsdn, &prof_dump_mtx);
|
|
}
|
|
}
|
|
|
|
/******************************************************************************/
|