Make ctl_arena_clear slightly more efficient

While this function isn't particularly hot, (accounting for just 0.27% of
time spent inside the allocator on average across the fleet), looking
at the generated assembly and performance profiles does show we're dispatching
to multiple different `memset`s when we could instead be just tail-calling
`memset` once, reducing code size and marginally improving performance.
This commit is contained in:
Kevin Svetlitski 2023-07-25 12:14:35 -07:00 committed by Qi Wang
parent 8ff7e7d6c3
commit 9ba1e1cb37

View File

@ -1042,23 +1042,7 @@ ctl_arena_clear(ctl_arena_t *ctl_arena) {
ctl_arena->pdirty = 0; ctl_arena->pdirty = 0;
ctl_arena->pmuzzy = 0; ctl_arena->pmuzzy = 0;
if (config_stats) { if (config_stats) {
memset(&ctl_arena->astats->astats, 0, sizeof(arena_stats_t)); memset(ctl_arena->astats, 0, sizeof(*(ctl_arena->astats)));
ctl_arena->astats->allocated_small = 0;
ctl_arena->astats->nmalloc_small = 0;
ctl_arena->astats->ndalloc_small = 0;
ctl_arena->astats->nrequests_small = 0;
ctl_arena->astats->nfills_small = 0;
ctl_arena->astats->nflushes_small = 0;
memset(ctl_arena->astats->bstats, 0, SC_NBINS *
sizeof(bin_stats_data_t));
memset(ctl_arena->astats->lstats, 0, (SC_NSIZES - SC_NBINS) *
sizeof(arena_stats_large_t));
memset(ctl_arena->astats->estats, 0, SC_NPSIZES *
sizeof(pac_estats_t));
memset(&ctl_arena->astats->hpastats, 0,
sizeof(hpa_shard_stats_t));
memset(&ctl_arena->astats->secstats, 0,
sizeof(sec_stats_t));
} }
} }