#include "jemalloc/internal/jemalloc_preamble.h"
#include "jemalloc/internal/jemalloc_internal_includes.h"

#include "jemalloc/internal/pac.h"
#include "jemalloc/internal/san.h"

static edata_t *pac_alloc_impl(tsdn_t *tsdn, pai_t *self, size_t size,
    size_t alignment, bool zero, bool guarded, bool frequent_reuse,
    bool *deferred_work_generated);
static bool pac_expand_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    size_t old_size, size_t new_size, bool zero, bool *deferred_work_generated);
static bool pac_shrink_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    size_t old_size, size_t new_size, bool *deferred_work_generated);
static void pac_dalloc_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    bool *deferred_work_generated);
static uint64_t pac_time_until_deferred_work(tsdn_t *tsdn, pai_t *self);

static inline void
pac_decay_data_get(pac_t *pac, extent_state_t state,
    decay_t **r_decay, pac_decay_stats_t **r_decay_stats, ecache_t **r_ecache) {
	switch (state) {
	case extent_state_dirty:
		*r_decay = &pac->decay_dirty;
		*r_decay_stats = &pac->stats->decay_dirty;
		*r_ecache = &pac->ecache_dirty;
		return;
	case extent_state_muzzy:
		*r_decay = &pac->decay_muzzy;
		*r_decay_stats = &pac->stats->decay_muzzy;
		*r_ecache = &pac->ecache_muzzy;
		return;
	default:
		unreachable();
	}
}

bool
pac_init(tsdn_t *tsdn, pac_t *pac, base_t *base, emap_t *emap,
    edata_cache_t *edata_cache, nstime_t *cur_time,
    size_t pac_oversize_threshold, ssize_t dirty_decay_ms,
    ssize_t muzzy_decay_ms, pac_stats_t *pac_stats, malloc_mutex_t *stats_mtx) {
	unsigned ind = base_ind_get(base);
	/*
	 * Delay coalescing for dirty extents despite the disruptive effect on
	 * memory layout for best-fit extent allocation, since cached extents
	 * are likely to be reused soon after deallocation, and the cost of
	 * merging/splitting extents is non-trivial.
	 */
	if (ecache_init(tsdn, &pac->ecache_dirty, extent_state_dirty, ind,
	    /* delay_coalesce */ true)) {
		return true;
	}
	/*
	 * Coalesce muzzy extents immediately, because operations on them are
	 * in the critical path much less often than for dirty extents.
	 */
	if (ecache_init(tsdn, &pac->ecache_muzzy, extent_state_muzzy, ind,
	    /* delay_coalesce */ false)) {
		return true;
	}
	/*
	 * Coalesce retained extents immediately, in part because they will
	 * never be evicted (and therefore there's no opportunity for delayed
	 * coalescing), but also because operations on retained extents are not
	 * in the critical path.
	 */
	if (ecache_init(tsdn, &pac->ecache_retained, extent_state_retained,
	    ind, /* delay_coalesce */ false)) {
		return true;
	}
	exp_grow_init(&pac->exp_grow);
	if (malloc_mutex_init(&pac->grow_mtx, "extent_grow",
	    WITNESS_RANK_EXTENT_GROW, malloc_mutex_rank_exclusive)) {
		return true;
	}
	atomic_store_zu(&pac->oversize_threshold, pac_oversize_threshold,
	    ATOMIC_RELAXED);
	if (decay_init(&pac->decay_dirty, cur_time, dirty_decay_ms)) {
		return true;
	}
	if (decay_init(&pac->decay_muzzy, cur_time, muzzy_decay_ms)) {
		return true;
	}
	if (san_bump_alloc_init(&pac->sba)) {
		return true;
	}

	pac->base = base;
	pac->emap = emap;
	pac->edata_cache = edata_cache;
	pac->stats = pac_stats;
	pac->stats_mtx = stats_mtx;
	atomic_store_zu(&pac->extent_sn_next, 0, ATOMIC_RELAXED);

	pac->pai.alloc = &pac_alloc_impl;
	pac->pai.alloc_batch = &pai_alloc_batch_default;
	pac->pai.expand = &pac_expand_impl;
	pac->pai.shrink = &pac_shrink_impl;
	pac->pai.dalloc = &pac_dalloc_impl;
	pac->pai.dalloc_batch = &pai_dalloc_batch_default;
	pac->pai.time_until_deferred_work = &pac_time_until_deferred_work;

	return false;
}

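/*
 * A muzzy decay time of zero disables the dirty -> muzzy transition (see
 * try_muzzy in pac_decay_stashed), so in that configuration the muzzy cache
 * stays empty and lookups in it can be skipped entirely.
 */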
static inline bool
pac_may_have_muzzy(pac_t *pac) {
	return pac_decay_ms_get(pac, extent_state_muzzy) != 0;
}

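/*
 * Allocation cascade: try the dirty cache first (cheapest to reuse), then the
 * muzzy cache, and finally fall back to retained extents, growing the mapping
 * if necessary. Only the retained path adds to the pac_mapped statistic.
 */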
static edata_t *
pac_alloc_real(tsdn_t *tsdn, pac_t *pac, ehooks_t *ehooks, size_t size,
    size_t alignment, bool zero, bool guarded) {
	assert(!guarded || alignment <= PAGE);

	edata_t *edata = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_dirty,
	    NULL, size, alignment, zero, guarded);

	if (edata == NULL && pac_may_have_muzzy(pac)) {
		edata = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_muzzy,
		    NULL, size, alignment, zero, guarded);
	}
	if (edata == NULL) {
		edata = ecache_alloc_grow(tsdn, pac, ehooks,
		    &pac->ecache_retained, NULL, size, alignment, zero,
		    guarded);
		if (config_stats && edata != NULL) {
			atomic_fetch_add_zu(&pac->stats->pac_mapped, size,
			    ATOMIC_RELAXED);
		}
	}

	return edata;
}

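/*
 * For a fresh guarded extent, either bump-allocate from the shared SAN region
 * (for frequently reused allocations), or allocate a regular extent large
 * enough for the request plus a guard page on each side and then install the
 * guards around it.
 */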
static edata_t *
pac_alloc_new_guarded(tsdn_t *tsdn, pac_t *pac, ehooks_t *ehooks, size_t size,
    size_t alignment, bool zero, bool frequent_reuse) {
	assert(alignment <= PAGE);

	edata_t *edata;
	if (san_bump_enabled() && frequent_reuse) {
		edata = san_bump_alloc(tsdn, &pac->sba, pac, ehooks, size,
		    zero);
	} else {
		size_t size_with_guards = san_two_side_guarded_sz(size);
		/* Alloc a non-guarded extent first. */
		edata = pac_alloc_real(tsdn, pac, ehooks, size_with_guards,
		    /* alignment */ PAGE, zero, /* guarded */ false);
		if (edata != NULL) {
			/* Add guards around it. */
			assert(edata_size_get(edata) == size_with_guards);
			san_guard_pages_two_sided(tsdn, ehooks, edata,
			    pac->emap, true);
		}
	}
	assert(edata == NULL || (edata_guarded_get(edata) &&
	    edata_size_get(edata) == size));

	return edata;
}

static edata_t *
pac_alloc_impl(tsdn_t *tsdn, pai_t *self, size_t size, size_t alignment,
    bool zero, bool guarded, bool frequent_reuse,
    bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	edata_t *edata = NULL;
	/*
	 * The condition is an optimization: guarded allocations that are not
	 * frequently reused are never put in the ecache, and pac_alloc_real
	 * doesn't grow retained for guarded allocations either, so calling
	 * pac_alloc_real for such allocations would always return NULL.
	 */
	if (!guarded || frequent_reuse) {
		edata = pac_alloc_real(tsdn, pac, ehooks, size, alignment,
		    zero, guarded);
	}
	if (edata == NULL && guarded) {
		/* No cached guarded extents; create a new one. */
		edata = pac_alloc_new_guarded(tsdn, pac, ehooks, size,
		    alignment, zero, frequent_reuse);
	}

	return edata;
}

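/*
 * In-place expansion: allocate a trail extent immediately following edata
 * (walking the same dirty -> muzzy -> retained cascade as allocation) and
 * merge it in. Returns true on failure, per the usual jemalloc convention.
 */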
static bool
pac_expand_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata, size_t old_size,
    size_t new_size, bool zero, bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	size_t mapped_add = 0;
	size_t expand_amount = new_size - old_size;

	if (ehooks_merge_will_fail(ehooks)) {
		return true;
	}
	edata_t *trail = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_dirty,
	    edata, expand_amount, PAGE, zero, /* guarded */ false);
	if (trail == NULL) {
		trail = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_muzzy,
		    edata, expand_amount, PAGE, zero, /* guarded */ false);
	}
	if (trail == NULL) {
		trail = ecache_alloc_grow(tsdn, pac, ehooks,
		    &pac->ecache_retained, edata, expand_amount, PAGE, zero,
		    /* guarded */ false);
		mapped_add = expand_amount;
	}
	if (trail == NULL) {
		return true;
	}
	if (extent_merge_wrapper(tsdn, pac, ehooks, edata, trail)) {
		extent_dalloc_wrapper(tsdn, pac, ehooks, trail);
		return true;
	}
	if (config_stats && mapped_add > 0) {
		atomic_fetch_add_zu(&pac->stats->pac_mapped, mapped_add,
		    ATOMIC_RELAXED);
	}
	return false;
}

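/*
 * In-place shrink: split a trail off the end of edata and return it to the
 * dirty cache. The trail's pages are purged later by decay, hence
 * *deferred_work_generated.
 */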
static bool
pac_shrink_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata, size_t old_size,
    size_t new_size, bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	size_t shrink_amount = old_size - new_size;

	if (ehooks_split_will_fail(ehooks)) {
		return true;
	}

	edata_t *trail = extent_split_wrapper(tsdn, pac, ehooks, edata,
	    new_size, shrink_amount, /* holding_core_locks */ false);
	if (trail == NULL) {
		return true;
	}
	ecache_dalloc(tsdn, pac, ehooks, &pac->ecache_dirty, trail);
	*deferred_work_generated = true;
	return false;
}

static void
pac_dalloc_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	if (edata_guarded_get(edata)) {
		/*
		 * Because cached guarded extents do exact fit only, large
		 * guarded extents are restored on dalloc eagerly (otherwise
		 * they will not be reused efficiently). Slab sizes have a
		 * limited number of size classes, and tend to cycle faster.
		 *
		 * In the case where coalesce is restrained (VirtualFree on
		 * Windows), guarded extents are also not cached -- otherwise
		 * during arena destroy / reset, the retained extents would not
		 * be whole regions (i.e. they are split between regular and
		 * guarded).
		 */
		if (!edata_slab_get(edata) || !maps_coalesce) {
			assert(edata_size_get(edata) >= SC_LARGE_MINCLASS ||
			    !maps_coalesce);
			san_unguard_pages_two_sided(tsdn, ehooks, edata,
			    pac->emap);
		}
	}

	ecache_dalloc(tsdn, pac, ehooks, &pac->ecache_dirty, edata);
	/* Purging of deallocated pages is deferred. */
	*deferred_work_generated = true;
}

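/*
 * Estimate how long until the next purge is due for this decay state. The
 * result is used to schedule deferred work (e.g. by background threads), so
 * contention on the decay mutex is resolved by assuming the earliest possible
 * deadline rather than blocking.
 */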
static inline uint64_t
pac_ns_until_purge(tsdn_t *tsdn, decay_t *decay, size_t npages) {
	if (malloc_mutex_trylock(tsdn, &decay->mtx)) {
		/* Use minimal interval if decay is contended. */
		return BACKGROUND_THREAD_DEFERRED_MIN;
	}
	uint64_t result = decay_ns_until_purge(decay, npages,
	    ARENA_DEFERRED_PURGE_NPAGES_THRESHOLD);

	malloc_mutex_unlock(tsdn, &decay->mtx);
	return result;
}

static uint64_t
pac_time_until_deferred_work(tsdn_t *tsdn, pai_t *self) {
	uint64_t time;
	pac_t *pac = (pac_t *)self;

	time = pac_ns_until_purge(tsdn,
	    &pac->decay_dirty,
	    ecache_npages_get(&pac->ecache_dirty));
	if (time == BACKGROUND_THREAD_DEFERRED_MIN) {
		return time;
	}

	uint64_t muzzy = pac_ns_until_purge(tsdn,
	    &pac->decay_muzzy,
	    ecache_npages_get(&pac->ecache_muzzy));
	if (muzzy < time) {
		time = muzzy;
	}
	return time;
}

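/*
 * Get and/or set the limit on how far a single retained-extent grow step may
 * go. sz_psz2ind(limit + 1) - 1 rounds the requested limit down to the
 * largest page size class that does not exceed it.
 */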
bool
pac_retain_grow_limit_get_set(tsdn_t *tsdn, pac_t *pac, size_t *old_limit,
    size_t *new_limit) {
	pszind_t new_ind JEMALLOC_CC_SILENCE_INIT(0);
	if (new_limit != NULL) {
		size_t limit = *new_limit;
		/* Grow no more than the new limit. */
		if ((new_ind = sz_psz2ind(limit + 1) - 1) >= SC_NPSIZES) {
			return true;
		}
	}

	malloc_mutex_lock(tsdn, &pac->grow_mtx);
	if (old_limit != NULL) {
		*old_limit = sz_pind2sz(pac->exp_grow.limit);
	}
	if (new_limit != NULL) {
		pac->exp_grow.limit = new_ind;
	}
	malloc_mutex_unlock(tsdn, &pac->grow_mtx);

	return false;
}

static size_t
pac_stash_decayed(tsdn_t *tsdn, pac_t *pac, ecache_t *ecache,
    size_t npages_limit, size_t npages_decay_max,
    edata_list_inactive_t *result) {
	witness_assert_depth_to_rank(tsdn_witness_tsdp_get(tsdn),
	    WITNESS_RANK_CORE, 0);
	ehooks_t *ehooks = pac_ehooks_get(pac);

	/* Stash extents according to npages_limit. */
	size_t nstashed = 0;
	while (nstashed < npages_decay_max) {
		edata_t *edata = ecache_evict(tsdn, pac, ehooks, ecache,
		    npages_limit);
		if (edata == NULL) {
			break;
		}
		edata_list_inactive_append(result, edata);
		nstashed += edata_size_get(edata) >> LG_PAGE;
	}
	return nstashed;
}

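/*
 * Purge the stashed extents. Dirty extents are lazily purged and demoted to
 * the muzzy cache when muzzy decay is enabled; otherwise (and for muzzy
 * extents) they are handed back via extent_dalloc_wrapper and leave
 * pac_mapped. Returns the number of pages purged.
 */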
static size_t
pac_decay_stashed(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache, bool fully_decay,
    edata_list_inactive_t *decay_extents) {
	bool err;

	size_t nmadvise = 0;
	size_t nunmapped = 0;
	size_t npurged = 0;

	ehooks_t *ehooks = pac_ehooks_get(pac);

	bool try_muzzy = !fully_decay
	    && pac_decay_ms_get(pac, extent_state_muzzy) != 0;

	for (edata_t *edata = edata_list_inactive_first(decay_extents); edata !=
	    NULL; edata = edata_list_inactive_first(decay_extents)) {
		edata_list_inactive_remove(decay_extents, edata);

		size_t size = edata_size_get(edata);
		size_t npages = size >> LG_PAGE;

		nmadvise++;
		npurged += npages;

		switch (ecache->state) {
		case extent_state_active:
			not_reached();
		case extent_state_dirty:
			if (try_muzzy) {
				err = extent_purge_lazy_wrapper(tsdn, ehooks,
				    edata, /* offset */ 0, size);
				if (!err) {
					ecache_dalloc(tsdn, pac, ehooks,
					    &pac->ecache_muzzy, edata);
					break;
				}
			}
			JEMALLOC_FALLTHROUGH;
		case extent_state_muzzy:
			extent_dalloc_wrapper(tsdn, pac, ehooks, edata);
			nunmapped += npages;
			break;
		case extent_state_retained:
		default:
			not_reached();
		}
	}

	if (config_stats) {
		LOCKEDINT_MTX_LOCK(tsdn, *pac->stats_mtx);
		locked_inc_u64(tsdn, LOCKEDINT_MTX(*pac->stats_mtx),
		    &decay_stats->npurge, 1);
		locked_inc_u64(tsdn, LOCKEDINT_MTX(*pac->stats_mtx),
		    &decay_stats->nmadvise, nmadvise);
		locked_inc_u64(tsdn, LOCKEDINT_MTX(*pac->stats_mtx),
		    &decay_stats->purged, npurged);
		LOCKEDINT_MTX_UNLOCK(tsdn, *pac->stats_mtx);

		atomic_fetch_sub_zu(&pac->stats->pac_mapped,
		    nunmapped << LG_PAGE, ATOMIC_RELAXED);
	}

	return npurged;
}

/*
 * npages_limit: Decay at most npages_decay_max pages without violating the
 * invariant: (ecache_npages_get(ecache) >= npages_limit). We need an upper
 * bound on number of pages in order to prevent unbounded growth (namely in
 * stashed), otherwise unbounded new pages could be added to extents during the
 * current decay run, so that the purging thread never finishes.
 */
static void
pac_decay_to_limit(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache, bool fully_decay,
    size_t npages_limit, size_t npages_decay_max) {
	witness_assert_depth_to_rank(tsdn_witness_tsdp_get(tsdn),
	    WITNESS_RANK_CORE, 1);

	if (decay->purging || npages_decay_max == 0) {
		return;
	}
	decay->purging = true;
	malloc_mutex_unlock(tsdn, &decay->mtx);

	edata_list_inactive_t decay_extents;
	edata_list_inactive_init(&decay_extents);
	size_t npurge = pac_stash_decayed(tsdn, pac, ecache, npages_limit,
	    npages_decay_max, &decay_extents);
	if (npurge != 0) {
		size_t npurged = pac_decay_stashed(tsdn, pac, decay,
		    decay_stats, ecache, fully_decay, &decay_extents);
		assert(npurged == npurge);
	}

	malloc_mutex_lock(tsdn, &decay->mtx);
	decay->purging = false;
}

void
pac_decay_all(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache, bool fully_decay) {
	malloc_mutex_assert_owner(tsdn, &decay->mtx);
	pac_decay_to_limit(tsdn, pac, decay, decay_stats, ecache, fully_decay,
	    /* npages_limit */ 0, ecache_npages_get(ecache));
}

static void
pac_decay_try_purge(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache,
    size_t current_npages, size_t npages_limit) {
	if (current_npages > npages_limit) {
		pac_decay_to_limit(tsdn, pac, decay, decay_stats, ecache,
		    /* fully_decay */ false, npages_limit,
		    current_npages - npages_limit);
	}
}

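/*
 * Called with decay->mtx held. Advances the decay epoch if its deadline has
 * passed, and purges down to the new page limit if the eagerness setting
 * calls for it. Returns whether the epoch advanced.
 */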
bool
pac_maybe_decay_purge(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache,
    pac_purge_eagerness_t eagerness) {
	malloc_mutex_assert_owner(tsdn, &decay->mtx);

	/* Purge all or nothing if the option is disabled. */
	ssize_t decay_ms = decay_ms_read(decay);
	if (decay_ms <= 0) {
		if (decay_ms == 0) {
			pac_decay_to_limit(tsdn, pac, decay, decay_stats,
			    ecache, /* fully_decay */ false,
			    /* npages_limit */ 0, ecache_npages_get(ecache));
		}
		return false;
	}

	/*
	 * If the deadline has been reached, advance to the current epoch and
	 * purge to the new limit if necessary. Note that dirty pages created
	 * during the current epoch are not subject to purge until a future
	 * epoch, so as a result purging only happens during epoch advances,
	 * or when triggered by background threads (as a scheduled event).
	 */
	nstime_t time;
	nstime_init_update(&time);
	size_t npages_current = ecache_npages_get(ecache);
	bool epoch_advanced = decay_maybe_advance_epoch(decay, &time,
	    npages_current);
	if (eagerness == PAC_PURGE_ALWAYS
	    || (epoch_advanced && eagerness == PAC_PURGE_ON_EPOCH_ADVANCE)) {
		size_t npages_limit = decay_npages_limit_get(decay);
		pac_decay_try_purge(tsdn, pac, decay, decay_stats, ecache,
		    npages_current, npages_limit);
	}

	return epoch_advanced;
}

bool
pac_decay_ms_set(tsdn_t *tsdn, pac_t *pac, extent_state_t state,
    ssize_t decay_ms, pac_purge_eagerness_t eagerness) {
	decay_t *decay;
	pac_decay_stats_t *decay_stats;
	ecache_t *ecache;
	pac_decay_data_get(pac, state, &decay, &decay_stats, &ecache);

	if (!decay_ms_valid(decay_ms)) {
		return true;
	}

	malloc_mutex_lock(tsdn, &decay->mtx);
	/*
	 * Restart decay backlog from scratch, which may cause many dirty pages
	 * to be immediately purged. It would conceptually be possible to map
	 * the old backlog onto the new backlog, but there is no justification
	 * for such complexity since decay_ms changes are intended to be
	 * infrequent, either between the {-1, 0, >0} states, or a one-time
	 * arbitrary change during initial arena configuration.
	 */
	nstime_t cur_time;
	nstime_init_update(&cur_time);
	decay_reinit(decay, &cur_time, decay_ms);
	pac_maybe_decay_purge(tsdn, pac, decay, decay_stats, ecache, eagerness);
	malloc_mutex_unlock(tsdn, &decay->mtx);

	return false;
}

ssize_t
pac_decay_ms_get(pac_t *pac, extent_state_t state) {
	decay_t *decay;
	pac_decay_stats_t *decay_stats;
	ecache_t *ecache;
	pac_decay_data_get(pac, state, &decay, &decay_stats, &ecache);
	return decay_ms_read(decay);
}

void
pac_reset(tsdn_t *tsdn, pac_t *pac) {
	/*
	 * No-op for now; purging is still done at the arena-level. It should
	 * get moved in here, though.
	 */
	(void)tsdn;
	(void)pac;
}

void
pac_destroy(tsdn_t *tsdn, pac_t *pac) {
	assert(ecache_npages_get(&pac->ecache_dirty) == 0);
	assert(ecache_npages_get(&pac->ecache_muzzy) == 0);
	/*
	 * Iterate over the retained extents and destroy them. This gives the
	 * extent allocator underlying the extent hooks an opportunity to unmap
	 * all retained memory without having to keep its own metadata
	 * structures. In practice, virtual memory for dss-allocated extents is
	 * leaked here, so best practice is to avoid dss for arenas to be
	 * destroyed, or provide custom extent hooks that track retained
	 * dss-based extents for later reuse.
	 */
	ehooks_t *ehooks = pac_ehooks_get(pac);
	edata_t *edata;
	while ((edata = ecache_evict(tsdn, pac, ehooks,
	    &pac->ecache_retained, 0)) != NULL) {
		extent_destroy_wrapper(tsdn, pac, ehooks, edata);
	}
}