server-skynet-source-3rd-je.../src/prof_recent.c

#define JEMALLOC_PROF_RECENT_C_
#include "jemalloc/internal/jemalloc_preamble.h"
#include "jemalloc/internal/jemalloc_internal_includes.h"

#include "jemalloc/internal/assert.h"
#include "jemalloc/internal/buf_writer.h"
#include "jemalloc/internal/emitter.h"
#include "jemalloc/internal/prof_data.h"
#include "jemalloc/internal/prof_recent.h"

#ifndef JEMALLOC_JET
#  define STATIC_INLINE_IF_NOT_TEST static inline
#else
#  define STATIC_INLINE_IF_NOT_TEST
#endif

ssize_t opt_prof_recent_alloc_max = PROF_RECENT_ALLOC_MAX_DEFAULT;
malloc_mutex_t prof_recent_alloc_mtx; /* Protects the fields below */
static atomic_zd_t prof_recent_alloc_max;
static ssize_t prof_recent_alloc_count = 0;
static prof_recent_t *prof_recent_alloc_dummy = NULL;

static void
prof_recent_alloc_max_init() {
	atomic_store_zd(&prof_recent_alloc_max, opt_prof_recent_alloc_max,
	    ATOMIC_RELAXED);
}

static inline ssize_t
prof_recent_alloc_max_get_no_lock() {
	return atomic_load_zd(&prof_recent_alloc_max, ATOMIC_RELAXED);
}

static inline ssize_t
prof_recent_alloc_max_get(tsd_t *tsd) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	return prof_recent_alloc_max_get_no_lock();
}

static inline ssize_t
prof_recent_alloc_max_update(tsd_t *tsd, ssize_t max) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	ssize_t old_max = prof_recent_alloc_max_get(tsd);
	atomic_store_zd(&prof_recent_alloc_max, max, ATOMIC_RELAXED);
	return old_max;
}

static inline void
increment_recent_count(tsd_t *tsd, prof_tctx_t *tctx) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), tctx->tdata->lock);
	++tctx->recent_count;
	assert(tctx->recent_count > 0);
}

bool
prof_recent_alloc_prepare(tsd_t *tsd, prof_tctx_t *tctx) {
	assert(opt_prof && prof_booted);
	malloc_mutex_assert_owner(tsd_tsdn(tsd), tctx->tdata->lock);
	malloc_mutex_assert_not_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);

	/*
	 * Check whether last-N mode is turned on without trying to acquire the
	 * lock, so as to optimize for the following two scenarios:
	 * (1) Last-N mode is switched off;
	 * (2) Dumping, during which last-N mode is temporarily turned off so
	 *     as not to block sampled allocations.
	 */
	if (prof_recent_alloc_max_get_no_lock() == 0) {
		return false;
	}

	/*
	 * Increment recent_count to hold the tctx so that it won't be gone
	 * even after tctx->tdata->lock is released.  This acts as a
	 * "placeholder"; the real recording of the allocation requires a lock
	 * on prof_recent_alloc_mtx and is done in prof_recent_alloc (when
	 * tctx->tdata->lock has been released).
	 */
	increment_recent_count(tsd, tctx);
	return true;
}

static void
decrement_recent_count(tsd_t *tsd, prof_tctx_t *tctx) {
	malloc_mutex_assert_not_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	assert(tctx != NULL);
	malloc_mutex_lock(tsd_tsdn(tsd), tctx->tdata->lock);
	assert(tctx->recent_count > 0);
	--tctx->recent_count;
	prof_tctx_try_destroy(tsd, tctx);
}

void
edata_prof_recent_alloc_init(edata_t *edata) {
	edata_prof_recent_alloc_set_dont_call_directly(edata, NULL);
}

static inline prof_recent_t *
edata_prof_recent_alloc_get_no_lock(const edata_t *edata) {
	return edata_prof_recent_alloc_get_dont_call_directly(edata);
}

STATIC_INLINE_IF_NOT_TEST prof_recent_t *
edata_prof_recent_alloc_get(tsd_t *tsd, const edata_t *edata) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	prof_recent_t *recent_alloc =
	    edata_prof_recent_alloc_get_no_lock(edata);
	assert(recent_alloc == NULL || recent_alloc->alloc_edata == edata);
	return recent_alloc;
}

static prof_recent_t *
edata_prof_recent_alloc_update_internal(tsd_t *tsd, edata_t *edata,
    prof_recent_t *recent_alloc) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	prof_recent_t *old_recent_alloc =
	    edata_prof_recent_alloc_get(tsd, edata);
	edata_prof_recent_alloc_set_dont_call_directly(edata, recent_alloc);
	return old_recent_alloc;
}

static void
edata_prof_recent_alloc_set(tsd_t *tsd, edata_t *edata,
    prof_recent_t *recent_alloc) {
	assert(recent_alloc != NULL);
	prof_recent_t *old_recent_alloc =
	    edata_prof_recent_alloc_update_internal(tsd, edata, recent_alloc);
	assert(old_recent_alloc == NULL);
	recent_alloc->alloc_edata = edata;
}

static void
edata_prof_recent_alloc_reset(tsd_t *tsd, edata_t *edata,
    prof_recent_t *recent_alloc) {
	assert(recent_alloc != NULL);
	prof_recent_t *old_recent_alloc =
	    edata_prof_recent_alloc_update_internal(tsd, edata, NULL);
	assert(old_recent_alloc == recent_alloc);
	assert(edata == recent_alloc->alloc_edata);
	recent_alloc->alloc_edata = NULL;
}

/*
 * This function should be called right before an allocation is released, so
 * that the associated recent allocation record can contain the following
 * information:
 * (1) The allocation is released;
 * (2) The time of the deallocation; and
 * (3) The prof_tctx associated with the deallocation.
 */
void
prof_recent_alloc_reset(tsd_t *tsd, edata_t *edata) {
	/*
	 * Check whether the recent allocation record still exists without
	 * trying to acquire the lock.
	 */
	if (edata_prof_recent_alloc_get_no_lock(edata) == NULL) {
		return;
	}

	prof_tctx_t *dalloc_tctx = prof_tctx_create(tsd);
	/*
	 * In case dalloc_tctx is NULL, e.g. due to OOM, we will not record the
	 * deallocation time / tctx, which is handled later, after we check
	 * again when holding the lock.
	 */

	if (dalloc_tctx != NULL) {
		malloc_mutex_lock(tsd_tsdn(tsd), dalloc_tctx->tdata->lock);
		increment_recent_count(tsd, dalloc_tctx);
		dalloc_tctx->prepared = false;
		malloc_mutex_unlock(tsd_tsdn(tsd), dalloc_tctx->tdata->lock);
	}

	malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	/* Check again after acquiring the lock.  */
	prof_recent_t *recent = edata_prof_recent_alloc_get(tsd, edata);
	if (recent != NULL) {
		edata_prof_recent_alloc_reset(tsd, edata, recent);
		assert(nstime_equals_zero(&recent->dalloc_time));
		assert(recent->dalloc_tctx == NULL);
		if (dalloc_tctx != NULL) {
			nstime_update(&recent->dalloc_time);
			recent->dalloc_tctx = dalloc_tctx;
		}
	} else if (dalloc_tctx != NULL) {
		/* We lost the rase - the allocation record was just gone. */
		decrement_recent_count(tsd, dalloc_tctx);
	}
	malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
}

static void
prof_recent_alloc_evict_edata(tsd_t *tsd, prof_recent_t *recent) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	if (recent->alloc_edata != NULL) {
		edata_prof_recent_alloc_reset(tsd, recent->alloc_edata, recent);
	}
}

STATIC_INLINE_IF_NOT_TEST prof_recent_t *
prof_recent_alloc_begin(tsd_t *tsd) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	assert(prof_recent_alloc_dummy != NULL);
	return prof_recent_alloc_dummy->next;
}

STATIC_INLINE_IF_NOT_TEST prof_recent_t *
prof_recent_alloc_end(tsd_t *tsd) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	assert(prof_recent_alloc_dummy != NULL);
	return prof_recent_alloc_dummy;
}

STATIC_INLINE_IF_NOT_TEST prof_recent_t *
prof_recent_alloc_next(tsd_t *tsd, prof_recent_t *node) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	assert(prof_recent_alloc_dummy != NULL);
	assert(node != NULL && node != prof_recent_alloc_dummy);
	return node->next;
}

static bool
prof_recent_alloc_is_empty(tsd_t *tsd) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	if (prof_recent_alloc_begin(tsd) == prof_recent_alloc_end(tsd)) {
		assert(prof_recent_alloc_count == 0);
		return true;
	} else {
		assert(prof_recent_alloc_count > 0);
		return false;
	}
}

static void
prof_recent_alloc_assert_count(tsd_t *tsd) {
	malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	if (config_debug) {
		ssize_t count = 0;
		prof_recent_t *n = prof_recent_alloc_begin(tsd);
		while (n != prof_recent_alloc_end(tsd)) {
			++count;
			n = prof_recent_alloc_next(tsd, n);
		}
		assert(count == prof_recent_alloc_count);
		assert(prof_recent_alloc_max_get(tsd) == -1 ||
		    count <= prof_recent_alloc_max_get(tsd));
	}
}

void
prof_recent_alloc(tsd_t *tsd, edata_t *edata, size_t usize) {
	assert(edata != NULL);
	prof_tctx_t *tctx = edata_prof_tctx_get(edata);

	malloc_mutex_assert_not_owner(tsd_tsdn(tsd), tctx->tdata->lock);
	malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	prof_recent_alloc_assert_count(tsd);

	/*
	 * Reserve a new prof_recent_t node if needed.  If needed, we release
	 * the prof_recent_alloc_mtx lock and allocate.  Then, rather than
	 * immediately checking for OOM, we regain the lock and try to make use
	 * of the reserve node if needed.  There are six scenarios:
	 *
	 *          \ now | no need | need but OOMed | need and allocated
	 *     later \    |         |                |
	 *    ------------------------------------------------------------
	 *     no need    |   (1)   |      (2)       |         (3)
	 *    ------------------------------------------------------------
	 *     need       |   (4)   |      (5)       |         (6)
	 *
	 * First, "(4)" never happens, because we don't release the lock in the
	 * middle if there's no need for a new node; in such cases "(1)" always
	 * takes place, which is trivial.
	 *
	 * Out of the remaining four scenarios, "(6)" is the common case and is
	 * trivial.  "(5)" is also trivial, in which case we'll rollback the
	 * effect of prof_recent_alloc_prepare() as expected.
	 *
	 * "(2)" / "(3)" occurs when the need for a new node is gone after we
	 * regain the lock.  If the new node is successfully allocated, i.e. in
	 * the case of "(3)", we'll release it in the end; otherwise, i.e. in
	 * the case of "(2)", we do nothing - we're lucky that the OOM ends up
	 * doing no harm at all.
	 *
	 * Therefore, the only performance cost of the "release lock" ->
	 * "allocate" -> "regain lock" design is the "(3)" case, but it happens
	 * very rarely, so the cost is relatively small compared to the gain of
	 * not having to have the lock order of prof_recent_alloc_mtx above all
	 * the allocation locks.
	 */
	prof_recent_t *reserve = NULL;
	if (prof_recent_alloc_max_get(tsd) == -1 ||
	    prof_recent_alloc_count < prof_recent_alloc_max_get(tsd)) {
		assert(prof_recent_alloc_max_get(tsd) != 0);
		malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
		reserve = (prof_recent_t *)iallocztm(tsd_tsdn(tsd),
		    sizeof(prof_recent_t), sz_size2index(sizeof(prof_recent_t)),
		    false, NULL, true, arena_get(tsd_tsdn(tsd), 0, false),
		    true);
		malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
		prof_recent_alloc_assert_count(tsd);
	}

	if (prof_recent_alloc_max_get(tsd) == 0) {
		assert(prof_recent_alloc_is_empty(tsd));
		goto label_rollback;
	}

	assert(prof_recent_alloc_dummy != NULL);
	{
		/* Fill content into the dummy node. */
		prof_recent_t *node = prof_recent_alloc_dummy;
		node->usize = usize;
		nstime_copy(&node->alloc_time,
		    edata_prof_alloc_time_get(edata));
		node->alloc_tctx = tctx;
		edata_prof_recent_alloc_set(tsd, edata, node);
		nstime_init_zero(&node->dalloc_time);
		node->dalloc_tctx = NULL;
	}

	prof_tctx_t *old_alloc_tctx, *old_dalloc_tctx;
	if (prof_recent_alloc_count == prof_recent_alloc_max_get(tsd)) {
		/* If upper limit is reached, simply shift the dummy. */
		assert(prof_recent_alloc_max_get(tsd) != -1);
		assert(!prof_recent_alloc_is_empty(tsd));
		prof_recent_alloc_dummy = prof_recent_alloc_dummy->next;
		old_alloc_tctx = prof_recent_alloc_dummy->alloc_tctx;
		assert(old_alloc_tctx != NULL);
		old_dalloc_tctx = prof_recent_alloc_dummy->dalloc_tctx;
		prof_recent_alloc_evict_edata(tsd, prof_recent_alloc_dummy);
	} else {
		/* Otherwise use the new node as the dummy. */
		assert(prof_recent_alloc_max_get(tsd) == -1 ||
		    prof_recent_alloc_count < prof_recent_alloc_max_get(tsd));
		if (reserve == NULL) {
			goto label_rollback;
		}
		reserve->next = prof_recent_alloc_dummy->next;
		prof_recent_alloc_dummy->next = reserve;
		prof_recent_alloc_dummy = reserve;
		reserve = NULL;
		old_alloc_tctx = NULL;
		old_dalloc_tctx = NULL;
		++prof_recent_alloc_count;
	}

	assert(!prof_recent_alloc_is_empty(tsd));
	prof_recent_alloc_assert_count(tsd);
	malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);

	if (reserve != NULL) {
		idalloctm(tsd_tsdn(tsd), reserve, NULL, NULL, true, true);
	}

	/*
	 * Asynchronously handle the tctx of the old node, so that there's no
	 * simultaneous holdings of prof_recent_alloc_mtx and tdata->lock.
	 * In the worst case this may delay the tctx release but it's better
	 * than holding prof_recent_alloc_mtx for longer.
	 */
	if (old_alloc_tctx != NULL) {
		decrement_recent_count(tsd, old_alloc_tctx);
	}
	if (old_dalloc_tctx != NULL) {
		decrement_recent_count(tsd, old_dalloc_tctx);
	}
	return;

label_rollback:
	assert(edata_prof_recent_alloc_get(tsd, edata) == NULL);
	prof_recent_alloc_assert_count(tsd);
	malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	if (reserve != NULL) {
		idalloctm(tsd_tsdn(tsd), reserve, NULL, NULL, true, true);
	}
	decrement_recent_count(tsd, tctx);
}

ssize_t
prof_recent_alloc_max_ctl_read() {
	/* Don't bother to acquire the lock. */
	return prof_recent_alloc_max_get_no_lock();
}

ssize_t
prof_recent_alloc_max_ctl_write(tsd_t *tsd, ssize_t max) {
	assert(max >= -1);

	malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	prof_recent_alloc_assert_count(tsd);

	const ssize_t old_max = prof_recent_alloc_max_update(tsd, max);

	if (max == -1 || prof_recent_alloc_count <= max) {
		/* Easy case - no need to alter the list. */
		malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
		return old_max;
	}

	prof_recent_t *begin = prof_recent_alloc_dummy->next;
	/* For verification purpose only. */
	ssize_t count = prof_recent_alloc_count - max;
	do {
		assert(!prof_recent_alloc_is_empty(tsd));
		prof_recent_t *node = prof_recent_alloc_dummy->next;
		assert(node != prof_recent_alloc_dummy);
		prof_recent_alloc_evict_edata(tsd, node);
		prof_recent_alloc_dummy->next = node->next;
		--prof_recent_alloc_count;
	} while (prof_recent_alloc_count > max);
	prof_recent_t *end = prof_recent_alloc_dummy->next;
	assert(begin != end);

	prof_recent_alloc_assert_count(tsd);
	malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);

	/*
	 * Asynchronously handle the tctx of the to-be-deleted nodes, so that
	 * there's no simultaneous holdings of prof_recent_alloc_mtx and
	 * tdata->lock.  In the worst case there can be slightly extra space
	 * overhead taken by these nodes, but the total number of nodes at any
	 * time is bounded by (max + sum(decreases)), where "max" means the
	 * most recent prof_recent_alloc_max and "sum(decreases)" means the
	 * sum of the deltas of all decreases in prof_recent_alloc_max in the
	 * past.  This (max + sum(decreases)) value is completely transparent
	 * to and controlled by application.
	 */
	do {
		prof_recent_t *node = begin;
		decrement_recent_count(tsd, node->alloc_tctx);
		if (node->dalloc_tctx != NULL) {
			decrement_recent_count(tsd, node->dalloc_tctx);
		}
		begin = node->next;
		idalloctm(tsd_tsdn(tsd), node, NULL, NULL, true, true);
		--count;
	} while (begin != end);
	assert(count == 0);

	return old_max;
}

static void
dump_bt(emitter_t *emitter, prof_tctx_t *tctx) {
	char bt_buf[2 * sizeof(intptr_t) + 3];
	char *s = bt_buf;
	assert(tctx != NULL);
	prof_bt_t *bt = &tctx->gctx->bt;
	for (size_t i = 0; i < bt->len; ++i) {
		malloc_snprintf(bt_buf, sizeof(bt_buf), "%p", bt->vec[i]);
		emitter_json_value(emitter, emitter_type_string, &s);
	}
}

#define PROF_RECENT_PRINT_BUFSIZE 4096
void
prof_recent_alloc_dump(tsd_t *tsd, void (*write_cb)(void *, const char *),
    void *cbopaque) {
	char *buf = (char *)iallocztm(tsd_tsdn(tsd), PROF_RECENT_PRINT_BUFSIZE,
	    sz_size2index(PROF_RECENT_PRINT_BUFSIZE), false, NULL, true,
	    arena_get(tsd_tsdn(tsd), 0, false), true);
	buf_write_arg_t buf_arg = {write_cb, cbopaque, buf,
	    PROF_RECENT_PRINT_BUFSIZE - 1, 0};
	emitter_t emitter;
	emitter_init(&emitter, emitter_output_json_compact, buf_write_cb,
	    &buf_arg);
	emitter_begin(&emitter);

	malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);
	prof_recent_alloc_assert_count(tsd);

	/*
	 * Set prof_recent_alloc_max to 0 so that dumping won't block sampled
	 * allocations: the allocations can complete but will not be recorded.
	 */
	ssize_t max = prof_recent_alloc_max_update(tsd, 0);

	emitter_json_kv(&emitter, "recent_alloc_max", emitter_type_ssize, &max);

	emitter_json_array_kv_begin(&emitter, "recent_alloc");
	for (prof_recent_t *n = prof_recent_alloc_begin(tsd);
	    n != prof_recent_alloc_end(tsd);
	    n = prof_recent_alloc_next(tsd, n)) {
		emitter_json_object_begin(&emitter);

		emitter_json_kv(&emitter, "usize", emitter_type_size,
		    &n->usize);
		bool released = n->alloc_edata == NULL;
		emitter_json_kv(&emitter, "released", emitter_type_bool,
		    &released);

		emitter_json_kv(&emitter, "alloc_thread_uid",
		    emitter_type_uint64, &n->alloc_tctx->thr_uid);
		uint64_t alloc_time_ns = nstime_ns(&n->alloc_time);
		emitter_json_kv(&emitter, "alloc_time", emitter_type_uint64,
		    &alloc_time_ns);
		emitter_json_array_kv_begin(&emitter, "alloc_trace");
		dump_bt(&emitter, n->alloc_tctx);
		emitter_json_array_end(&emitter);

		if (n->dalloc_tctx != NULL) {
			assert(released);
			emitter_json_kv(&emitter, "dalloc_thread_uid",
			    emitter_type_uint64, &n->dalloc_tctx->thr_uid);
			assert(!nstime_equals_zero(&n->dalloc_time));
			uint64_t dalloc_time_ns = nstime_ns(&n->dalloc_time);
			emitter_json_kv(&emitter, "dalloc_time",
			    emitter_type_uint64, &dalloc_time_ns);
			emitter_json_array_kv_begin(&emitter, "dalloc_trace");
			dump_bt(&emitter, n->dalloc_tctx);
			emitter_json_array_end(&emitter);
		} else {
			assert(nstime_equals_zero(&n->dalloc_time));
		}

		emitter_json_object_end(&emitter);
	}
	emitter_json_array_end(&emitter);

	max = prof_recent_alloc_max_update(tsd, max);
	assert(max == 0);
	malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);

	emitter_end(&emitter);
	buf_write_flush(&buf_arg);
	idalloctm(tsd_tsdn(tsd), buf, NULL, NULL, true, true);
}
#undef PROF_RECENT_PRINT_BUFSIZE

bool
prof_recent_init() {
	prof_recent_alloc_max_init();

	if (malloc_mutex_init(&prof_recent_alloc_mtx,
	    "prof_recent_alloc", WITNESS_RANK_PROF_RECENT_ALLOC,
	    malloc_mutex_rank_exclusive)) {
		return true;
	}

	assert(prof_recent_alloc_dummy == NULL);
	prof_recent_alloc_dummy = (prof_recent_t *)iallocztm(
	    TSDN_NULL, sizeof(prof_recent_t),
	    sz_size2index(sizeof(prof_recent_t)), false, NULL, true,
	    arena_get(TSDN_NULL, 0, true), true);
	if (prof_recent_alloc_dummy == NULL) {
		return true;
	}
	prof_recent_alloc_dummy->next = prof_recent_alloc_dummy;

	return false;
}
Last-N profiling mode 2019-12-19 05:38:14 +08:00			`#define JEMALLOC_PROF_RECENT_C_`
			`#include "jemalloc/internal/jemalloc_preamble.h"`
			`#include "jemalloc/internal/jemalloc_internal_includes.h"`

			`#include "jemalloc/internal/assert.h"`
Make buffered writer an independent module 2020-01-10 08:36:09 +08:00			`#include "jemalloc/internal/buf_writer.h"`
Last-N profiling mode 2019-12-19 05:38:14 +08:00			`#include "jemalloc/internal/emitter.h"`
			`#include "jemalloc/internal/prof_data.h"`
			`#include "jemalloc/internal/prof_recent.h"`

			`#ifndef JEMALLOC_JET`
			`# define STATIC_INLINE_IF_NOT_TEST static inline`
			`#else`
			`# define STATIC_INLINE_IF_NOT_TEST`
			`#endif`

			`ssize_t opt_prof_recent_alloc_max = PROF_RECENT_ALLOC_MAX_DEFAULT;`
			`malloc_mutex_t prof_recent_alloc_mtx; /* Protects the fields below */`
			`static atomic_zd_t prof_recent_alloc_max;`
			`static ssize_t prof_recent_alloc_count = 0;`
			`static prof_recent_t *prof_recent_alloc_dummy = NULL;`

			`static void`
			`prof_recent_alloc_max_init() {`
			`atomic_store_zd(&prof_recent_alloc_max, opt_prof_recent_alloc_max,`
			`ATOMIC_RELAXED);`
			`}`

			`static inline ssize_t`
			`prof_recent_alloc_max_get_no_lock() {`
			`return atomic_load_zd(&prof_recent_alloc_max, ATOMIC_RELAXED);`
			`}`

			`static inline ssize_t`
			`prof_recent_alloc_max_get(tsd_t *tsd) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`return prof_recent_alloc_max_get_no_lock();`
			`}`

			`static inline ssize_t`
			`prof_recent_alloc_max_update(tsd_t *tsd, ssize_t max) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`ssize_t old_max = prof_recent_alloc_max_get(tsd);`
			`atomic_store_zd(&prof_recent_alloc_max, max, ATOMIC_RELAXED);`
			`return old_max;`
			`}`

			`static inline void`
			`increment_recent_count(tsd_t tsd, prof_tctx_t tctx) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), tctx->tdata->lock);`
			`++tctx->recent_count;`
			`assert(tctx->recent_count > 0);`
			`}`

			`bool`
			`prof_recent_alloc_prepare(tsd_t tsd, prof_tctx_t tctx) {`
			`assert(opt_prof && prof_booted);`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), tctx->tdata->lock);`
			`malloc_mutex_assert_not_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`

			`/*`
			`* Check whether last-N mode is turned on without trying to acquire the`
			`* lock, so as to optimize for the following two scenarios:`
			`* (1) Last-N mode is switched off;`
			`* (2) Dumping, during which last-N mode is temporarily turned off so`
			`* as not to block sampled allocations.`
			`*/`
			`if (prof_recent_alloc_max_get_no_lock() == 0) {`
			`return false;`
			`}`

			`/*`
			`* Increment recent_count to hold the tctx so that it won't be gone`
			`* even after tctx->tdata->lock is released. This acts as a`
			`* "placeholder"; the real recording of the allocation requires a lock`
			`* on prof_recent_alloc_mtx and is done in prof_recent_alloc (when`
			`* tctx->tdata->lock has been released).`
			`*/`
			`increment_recent_count(tsd, tctx);`
			`return true;`
			`}`

			`static void`
			`decrement_recent_count(tsd_t tsd, prof_tctx_t tctx) {`
			`malloc_mutex_assert_not_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`assert(tctx != NULL);`
			`malloc_mutex_lock(tsd_tsdn(tsd), tctx->tdata->lock);`
			`assert(tctx->recent_count > 0);`
			`--tctx->recent_count;`
			`prof_tctx_try_destroy(tsd, tctx);`
			`}`

			`void`
			`edata_prof_recent_alloc_init(edata_t *edata) {`
			`edata_prof_recent_alloc_set_dont_call_directly(edata, NULL);`
			`}`

			`static inline prof_recent_t *`
			`edata_prof_recent_alloc_get_no_lock(const edata_t *edata) {`
			`return edata_prof_recent_alloc_get_dont_call_directly(edata);`
			`}`

			`STATIC_INLINE_IF_NOT_TEST prof_recent_t *`
			`edata_prof_recent_alloc_get(tsd_t tsd, const edata_t edata) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`prof_recent_t *recent_alloc =`
			`edata_prof_recent_alloc_get_no_lock(edata);`
			`assert(recent_alloc == NULL \|\| recent_alloc->alloc_edata == edata);`
			`return recent_alloc;`
			`}`

			`static prof_recent_t *`
			`edata_prof_recent_alloc_update_internal(tsd_t tsd, edata_t edata,`
			`prof_recent_t *recent_alloc) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`prof_recent_t *old_recent_alloc =`
			`edata_prof_recent_alloc_get(tsd, edata);`
			`edata_prof_recent_alloc_set_dont_call_directly(edata, recent_alloc);`
			`return old_recent_alloc;`
			`}`

			`static void`
			`edata_prof_recent_alloc_set(tsd_t tsd, edata_t edata,`
			`prof_recent_t *recent_alloc) {`
			`assert(recent_alloc != NULL);`
			`prof_recent_t *old_recent_alloc =`
			`edata_prof_recent_alloc_update_internal(tsd, edata, recent_alloc);`
			`assert(old_recent_alloc == NULL);`
			`recent_alloc->alloc_edata = edata;`
			`}`

			`static void`
			`edata_prof_recent_alloc_reset(tsd_t tsd, edata_t edata,`
			`prof_recent_t *recent_alloc) {`
			`assert(recent_alloc != NULL);`
			`prof_recent_t *old_recent_alloc =`
			`edata_prof_recent_alloc_update_internal(tsd, edata, NULL);`
			`assert(old_recent_alloc == recent_alloc);`
			`assert(edata == recent_alloc->alloc_edata);`
			`recent_alloc->alloc_edata = NULL;`
			`}`

			`/*`
			`* This function should be called right before an allocation is released, so`
			`* that the associated recent allocation record can contain the following`
			`* information:`
			`* (1) The allocation is released;`
			`* (2) The time of the deallocation; and`
			`* (3) The prof_tctx associated with the deallocation.`
			`*/`
			`void`
			`prof_recent_alloc_reset(tsd_t tsd, edata_t edata) {`
			`/*`
			`* Check whether the recent allocation record still exists without`
			`* trying to acquire the lock.`
			`*/`
			`if (edata_prof_recent_alloc_get_no_lock(edata) == NULL) {`
			`return;`
			`}`

			`prof_tctx_t *dalloc_tctx = prof_tctx_create(tsd);`
			`/*`
			`* In case dalloc_tctx is NULL, e.g. due to OOM, we will not record the`
			`* deallocation time / tctx, which is handled later, after we check`
			`* again when holding the lock.`
			`*/`

			`if (dalloc_tctx != NULL) {`
			`malloc_mutex_lock(tsd_tsdn(tsd), dalloc_tctx->tdata->lock);`
			`increment_recent_count(tsd, dalloc_tctx);`
			`dalloc_tctx->prepared = false;`
			`malloc_mutex_unlock(tsd_tsdn(tsd), dalloc_tctx->tdata->lock);`
			`}`

			`malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`/* Check again after acquiring the lock. */`
			`prof_recent_t *recent = edata_prof_recent_alloc_get(tsd, edata);`
			`if (recent != NULL) {`
			`edata_prof_recent_alloc_reset(tsd, edata, recent);`
			`assert(nstime_equals_zero(&recent->dalloc_time));`
			`assert(recent->dalloc_tctx == NULL);`
			`if (dalloc_tctx != NULL) {`
			`nstime_update(&recent->dalloc_time);`
			`recent->dalloc_tctx = dalloc_tctx;`
			`}`
			`} else if (dalloc_tctx != NULL) {`
			`/* We lost the rase - the allocation record was just gone. */`
			`decrement_recent_count(tsd, dalloc_tctx);`
			`}`
			`malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`}`

			`static void`
			`prof_recent_alloc_evict_edata(tsd_t tsd, prof_recent_t recent) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`if (recent->alloc_edata != NULL) {`
			`edata_prof_recent_alloc_reset(tsd, recent->alloc_edata, recent);`
			`}`
			`}`

			`STATIC_INLINE_IF_NOT_TEST prof_recent_t *`
			`prof_recent_alloc_begin(tsd_t *tsd) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`assert(prof_recent_alloc_dummy != NULL);`
			`return prof_recent_alloc_dummy->next;`
			`}`

			`STATIC_INLINE_IF_NOT_TEST prof_recent_t *`
			`prof_recent_alloc_end(tsd_t *tsd) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`assert(prof_recent_alloc_dummy != NULL);`
			`return prof_recent_alloc_dummy;`
			`}`

			`STATIC_INLINE_IF_NOT_TEST prof_recent_t *`
			`prof_recent_alloc_next(tsd_t tsd, prof_recent_t node) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`assert(prof_recent_alloc_dummy != NULL);`
			`assert(node != NULL && node != prof_recent_alloc_dummy);`
			`return node->next;`
			`}`

			`static bool`
			`prof_recent_alloc_is_empty(tsd_t *tsd) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`if (prof_recent_alloc_begin(tsd) == prof_recent_alloc_end(tsd)) {`
			`assert(prof_recent_alloc_count == 0);`
			`return true;`
			`} else {`
			`assert(prof_recent_alloc_count > 0);`
			`return false;`
			`}`
			`}`

			`static void`
			`prof_recent_alloc_assert_count(tsd_t *tsd) {`
			`malloc_mutex_assert_owner(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`if (config_debug) {`
			`ssize_t count = 0;`
			`prof_recent_t *n = prof_recent_alloc_begin(tsd);`
			`while (n != prof_recent_alloc_end(tsd)) {`
			`++count;`
			`n = prof_recent_alloc_next(tsd, n);`
			`}`
			`assert(count == prof_recent_alloc_count);`
			`assert(prof_recent_alloc_max_get(tsd) == -1 \|\|`
			`count <= prof_recent_alloc_max_get(tsd));`
			`}`
			`}`

			`void`
			`prof_recent_alloc(tsd_t tsd, edata_t edata, size_t usize) {`
			`assert(edata != NULL);`
			`prof_tctx_t *tctx = edata_prof_tctx_get(edata);`

			`malloc_mutex_assert_not_owner(tsd_tsdn(tsd), tctx->tdata->lock);`
			`malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`prof_recent_alloc_assert_count(tsd);`

			`/*`
			`* Reserve a new prof_recent_t node if needed. If needed, we release`
			`* the prof_recent_alloc_mtx lock and allocate. Then, rather than`
			`* immediately checking for OOM, we regain the lock and try to make use`
			`* of the reserve node if needed. There are six scenarios:`
			`*`
			`* \ now \| no need \| need but OOMed \| need and allocated`
			`* later \ \| \| \|`
			`* ------------------------------------------------------------`
			`* no need \| (1) \| (2) \| (3)`
			`* ------------------------------------------------------------`
			`* need \| (4) \| (5) \| (6)`
			`*`
			`* First, "(4)" never happens, because we don't release the lock in the`
			`* middle if there's no need for a new node; in such cases "(1)" always`
			`* takes place, which is trivial.`
			`*`
			`* Out of the remaining four scenarios, "(6)" is the common case and is`
			`* trivial. "(5)" is also trivial, in which case we'll rollback the`
			`* effect of prof_recent_alloc_prepare() as expected.`
			`*`
			`* "(2)" / "(3)" occurs when the need for a new node is gone after we`
			`* regain the lock. If the new node is successfully allocated, i.e. in`
			`* the case of "(3)", we'll release it in the end; otherwise, i.e. in`
			`* the case of "(2)", we do nothing - we're lucky that the OOM ends up`
			`* doing no harm at all.`
			`*`
			`* Therefore, the only performance cost of the "release lock" ->`
			`* "allocate" -> "regain lock" design is the "(3)" case, but it happens`
			`* very rarely, so the cost is relatively small compared to the gain of`
			`* not having to have the lock order of prof_recent_alloc_mtx above all`
			`* the allocation locks.`
			`*/`
			`prof_recent_t *reserve = NULL;`
			`if (prof_recent_alloc_max_get(tsd) == -1 \|\|`
			`prof_recent_alloc_count < prof_recent_alloc_max_get(tsd)) {`
			`assert(prof_recent_alloc_max_get(tsd) != 0);`
			`malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`reserve = (prof_recent_t *)iallocztm(tsd_tsdn(tsd),`
			`sizeof(prof_recent_t), sz_size2index(sizeof(prof_recent_t)),`
			`false, NULL, true, arena_get(tsd_tsdn(tsd), 0, false),`
			`true);`
			`malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`prof_recent_alloc_assert_count(tsd);`
			`}`

			`if (prof_recent_alloc_max_get(tsd) == 0) {`
			`assert(prof_recent_alloc_is_empty(tsd));`
			`goto label_rollback;`
			`}`

			`assert(prof_recent_alloc_dummy != NULL);`
			`{`
			`/* Fill content into the dummy node. */`
			`prof_recent_t *node = prof_recent_alloc_dummy;`
			`node->usize = usize;`
			`nstime_copy(&node->alloc_time,`
			`edata_prof_alloc_time_get(edata));`
			`node->alloc_tctx = tctx;`
			`edata_prof_recent_alloc_set(tsd, edata, node);`
			`nstime_init_zero(&node->dalloc_time);`
			`node->dalloc_tctx = NULL;`
			`}`

			`prof_tctx_t old_alloc_tctx, old_dalloc_tctx;`
			`if (prof_recent_alloc_count == prof_recent_alloc_max_get(tsd)) {`
			`/* If upper limit is reached, simply shift the dummy. */`
			`assert(prof_recent_alloc_max_get(tsd) != -1);`
			`assert(!prof_recent_alloc_is_empty(tsd));`
			`prof_recent_alloc_dummy = prof_recent_alloc_dummy->next;`
			`old_alloc_tctx = prof_recent_alloc_dummy->alloc_tctx;`
			`assert(old_alloc_tctx != NULL);`
			`old_dalloc_tctx = prof_recent_alloc_dummy->dalloc_tctx;`
			`prof_recent_alloc_evict_edata(tsd, prof_recent_alloc_dummy);`
			`} else {`
			`/* Otherwise use the new node as the dummy. */`
			`assert(prof_recent_alloc_max_get(tsd) == -1 \|\|`
			`prof_recent_alloc_count < prof_recent_alloc_max_get(tsd));`
			`if (reserve == NULL) {`
			`goto label_rollback;`
			`}`
			`reserve->next = prof_recent_alloc_dummy->next;`
			`prof_recent_alloc_dummy->next = reserve;`
			`prof_recent_alloc_dummy = reserve;`
			`reserve = NULL;`
			`old_alloc_tctx = NULL;`
			`old_dalloc_tctx = NULL;`
			`++prof_recent_alloc_count;`
			`}`

			`assert(!prof_recent_alloc_is_empty(tsd));`
			`prof_recent_alloc_assert_count(tsd);`
			`malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`

			`if (reserve != NULL) {`
			`idalloctm(tsd_tsdn(tsd), reserve, NULL, NULL, true, true);`
			`}`

			`/*`
			`* Asynchronously handle the tctx of the old node, so that there's no`
			`* simultaneous holdings of prof_recent_alloc_mtx and tdata->lock.`
			`* In the worst case this may delay the tctx release but it's better`
			`* than holding prof_recent_alloc_mtx for longer.`
			`*/`
			`if (old_alloc_tctx != NULL) {`
			`decrement_recent_count(tsd, old_alloc_tctx);`
			`}`
			`if (old_dalloc_tctx != NULL) {`
			`decrement_recent_count(tsd, old_dalloc_tctx);`
			`}`
			`return;`

			`label_rollback:`
			`assert(edata_prof_recent_alloc_get(tsd, edata) == NULL);`
			`prof_recent_alloc_assert_count(tsd);`
			`malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`if (reserve != NULL) {`
			`idalloctm(tsd_tsdn(tsd), reserve, NULL, NULL, true, true);`
			`}`
			`decrement_recent_count(tsd, tctx);`
			`}`

			`ssize_t`
			`prof_recent_alloc_max_ctl_read() {`
			`/* Don't bother to acquire the lock. */`
			`return prof_recent_alloc_max_get_no_lock();`
			`}`

			`ssize_t`
			`prof_recent_alloc_max_ctl_write(tsd_t *tsd, ssize_t max) {`
			`assert(max >= -1);`

			`malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`prof_recent_alloc_assert_count(tsd);`

			`const ssize_t old_max = prof_recent_alloc_max_update(tsd, max);`

			`if (max == -1 \|\| prof_recent_alloc_count <= max) {`
			`/* Easy case - no need to alter the list. */`
			`malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`return old_max;`
			`}`

			`prof_recent_t *begin = prof_recent_alloc_dummy->next;`
			`/* For verification purpose only. */`
			`ssize_t count = prof_recent_alloc_count - max;`
			`do {`
			`assert(!prof_recent_alloc_is_empty(tsd));`
			`prof_recent_t *node = prof_recent_alloc_dummy->next;`
			`assert(node != prof_recent_alloc_dummy);`
			`prof_recent_alloc_evict_edata(tsd, node);`
			`prof_recent_alloc_dummy->next = node->next;`
			`--prof_recent_alloc_count;`
			`} while (prof_recent_alloc_count > max);`
			`prof_recent_t *end = prof_recent_alloc_dummy->next;`
			`assert(begin != end);`

			`prof_recent_alloc_assert_count(tsd);`
			`malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`

			`/*`
			`* Asynchronously handle the tctx of the to-be-deleted nodes, so that`
			`* there's no simultaneous holdings of prof_recent_alloc_mtx and`
			`* tdata->lock. In the worst case there can be slightly extra space`
			`* overhead taken by these nodes, but the total number of nodes at any`
			`* time is bounded by (max + sum(decreases)), where "max" means the`
			`* most recent prof_recent_alloc_max and "sum(decreases)" means the`
			`* sum of the deltas of all decreases in prof_recent_alloc_max in the`
			`* past. This (max + sum(decreases)) value is completely transparent`
			`* to and controlled by application.`
			`*/`
			`do {`
			`prof_recent_t *node = begin;`
			`decrement_recent_count(tsd, node->alloc_tctx);`
			`if (node->dalloc_tctx != NULL) {`
			`decrement_recent_count(tsd, node->dalloc_tctx);`
			`}`
			`begin = node->next;`
			`idalloctm(tsd_tsdn(tsd), node, NULL, NULL, true, true);`
			`--count;`
			`} while (begin != end);`
			`assert(count == 0);`

			`return old_max;`
			`}`

			`static void`
			`dump_bt(emitter_t emitter, prof_tctx_t tctx) {`
			`char bt_buf[2 * sizeof(intptr_t) + 3];`
			`char *s = bt_buf;`
			`assert(tctx != NULL);`
			`prof_bt_t *bt = &tctx->gctx->bt;`
			`for (size_t i = 0; i < bt->len; ++i) {`
			`malloc_snprintf(bt_buf, sizeof(bt_buf), "%p", bt->vec[i]);`
			`emitter_json_value(emitter, emitter_type_string, &s);`
			`}`
			`}`

			`#define PROF_RECENT_PRINT_BUFSIZE 4096`
			`void`
			`prof_recent_alloc_dump(tsd_t tsd, void (write_cb)(void , const char ),`
			`void *cbopaque) {`
			`char buf = (char )iallocztm(tsd_tsdn(tsd), PROF_RECENT_PRINT_BUFSIZE,`
			`sz_size2index(PROF_RECENT_PRINT_BUFSIZE), false, NULL, true,`
			`arena_get(tsd_tsdn(tsd), 0, false), true);`
Unify buffered writer naming 2020-01-10 01:59:17 +08:00			`buf_write_arg_t buf_arg = {write_cb, cbopaque, buf,`
Last-N profiling mode 2019-12-19 05:38:14 +08:00			`PROF_RECENT_PRINT_BUFSIZE - 1, 0};`
			`emitter_t emitter;`
Unify buffered writer naming 2020-01-10 01:59:17 +08:00			`emitter_init(&emitter, emitter_output_json_compact, buf_write_cb,`
Last-N profiling mode 2019-12-19 05:38:14 +08:00			`&buf_arg);`
			`emitter_begin(&emitter);`

			`malloc_mutex_lock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`
			`prof_recent_alloc_assert_count(tsd);`

			`/*`
			`* Set prof_recent_alloc_max to 0 so that dumping won't block sampled`
			`* allocations: the allocations can complete but will not be recorded.`
			`*/`
			`ssize_t max = prof_recent_alloc_max_update(tsd, 0);`

			`emitter_json_kv(&emitter, "recent_alloc_max", emitter_type_ssize, &max);`

			`emitter_json_array_kv_begin(&emitter, "recent_alloc");`
			`for (prof_recent_t *n = prof_recent_alloc_begin(tsd);`
			`n != prof_recent_alloc_end(tsd);`
			`n = prof_recent_alloc_next(tsd, n)) {`
			`emitter_json_object_begin(&emitter);`

			`emitter_json_kv(&emitter, "usize", emitter_type_size,`
			`&n->usize);`
			`bool released = n->alloc_edata == NULL;`
			`emitter_json_kv(&emitter, "released", emitter_type_bool,`
			`&released);`

			`emitter_json_kv(&emitter, "alloc_thread_uid",`
			`emitter_type_uint64, &n->alloc_tctx->thr_uid);`
			`uint64_t alloc_time_ns = nstime_ns(&n->alloc_time);`
			`emitter_json_kv(&emitter, "alloc_time", emitter_type_uint64,`
			`&alloc_time_ns);`
			`emitter_json_array_kv_begin(&emitter, "alloc_trace");`
			`dump_bt(&emitter, n->alloc_tctx);`
			`emitter_json_array_end(&emitter);`

			`if (n->dalloc_tctx != NULL) {`
			`assert(released);`
			`emitter_json_kv(&emitter, "dalloc_thread_uid",`
			`emitter_type_uint64, &n->dalloc_tctx->thr_uid);`
			`assert(!nstime_equals_zero(&n->dalloc_time));`
			`uint64_t dalloc_time_ns = nstime_ns(&n->dalloc_time);`
			`emitter_json_kv(&emitter, "dalloc_time",`
			`emitter_type_uint64, &dalloc_time_ns);`
			`emitter_json_array_kv_begin(&emitter, "dalloc_trace");`
			`dump_bt(&emitter, n->dalloc_tctx);`
			`emitter_json_array_end(&emitter);`
			`} else {`
			`assert(nstime_equals_zero(&n->dalloc_time));`
			`}`

			`emitter_json_object_end(&emitter);`
			`}`
			`emitter_json_array_end(&emitter);`

			`max = prof_recent_alloc_max_update(tsd, max);`
			`assert(max == 0);`
			`malloc_mutex_unlock(tsd_tsdn(tsd), &prof_recent_alloc_mtx);`

			`emitter_end(&emitter);`
Unify buffered writer naming 2020-01-10 01:59:17 +08:00			`buf_write_flush(&buf_arg);`
Last-N profiling mode 2019-12-19 05:38:14 +08:00			`idalloctm(tsd_tsdn(tsd), buf, NULL, NULL, true, true);`
			`}`
			`#undef PROF_RECENT_PRINT_BUFSIZE`

			`bool`
			`prof_recent_init() {`
			`prof_recent_alloc_max_init();`

			`if (malloc_mutex_init(&prof_recent_alloc_mtx,`
			`"prof_recent_alloc", WITNESS_RANK_PROF_RECENT_ALLOC,`
			`malloc_mutex_rank_exclusive)) {`
			`return true;`
			`}`

			`assert(prof_recent_alloc_dummy == NULL);`
			`prof_recent_alloc_dummy = (prof_recent_t *)iallocztm(`
			`TSDN_NULL, sizeof(prof_recent_t),`
			`sz_size2index(sizeof(prof_recent_t)), false, NULL, true,`
			`arena_get(TSDN_NULL, 0, true), true);`
			`if (prof_recent_alloc_dummy == NULL) {`
			`return true;`
			`}`
			`prof_recent_alloc_dummy->next = prof_recent_alloc_dummy;`

			`return false;`
			`}`