#include "jemalloc/internal/jemalloc_preamble.h"
#include "jemalloc/internal/jemalloc_internal_includes.h"

#include "jemalloc/internal/pac.h"
#include "jemalloc/internal/san.h"

static edata_t *pac_alloc_impl(tsdn_t *tsdn, pai_t *self, size_t size,
    size_t alignment, bool zero, bool guarded, bool frequent_reuse,
    bool *deferred_work_generated);
static bool pac_expand_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    size_t old_size, size_t new_size, bool zero, bool *deferred_work_generated);
static bool pac_shrink_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    size_t old_size, size_t new_size, bool *deferred_work_generated);
static void pac_dalloc_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    bool *deferred_work_generated);
static uint64_t pac_time_until_deferred_work(tsdn_t *tsdn, pai_t *self);

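/*
 * Map an extent state (dirty or muzzy) to the decay state, decay stats, and
 * ecache that track it.
 */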
static inline void
pac_decay_data_get(pac_t *pac, extent_state_t state,
    decay_t **r_decay, pac_decay_stats_t **r_decay_stats, ecache_t **r_ecache) {
	switch (state) {
	case extent_state_dirty:
		*r_decay = &pac->decay_dirty;
		*r_decay_stats = &pac->stats->decay_dirty;
		*r_ecache = &pac->ecache_dirty;
		return;
	case extent_state_muzzy:
		*r_decay = &pac->decay_muzzy;
		*r_decay_stats = &pac->stats->decay_muzzy;
		*r_ecache = &pac->ecache_muzzy;
		return;
	default:
		unreachable();
	}
}

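/*
 * Initialize the pac's ecaches, decay state, and PAI hooks.  Returns true on
 * error (jemalloc's usual boolean error convention).
 */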
bool
pac_init(tsdn_t *tsdn, pac_t *pac, base_t *base, emap_t *emap,
    edata_cache_t *edata_cache, nstime_t *cur_time,
    size_t pac_oversize_threshold, ssize_t dirty_decay_ms,
    ssize_t muzzy_decay_ms, pac_stats_t *pac_stats, malloc_mutex_t *stats_mtx) {
	unsigned ind = base_ind_get(base);
	/*
	 * Delay coalescing for dirty extents despite the disruptive effect on
	 * memory layout for best-fit extent allocation, since cached extents
	 * are likely to be reused soon after deallocation, and the cost of
	 * merging/splitting extents is non-trivial.
	 */
	if (ecache_init(tsdn, &pac->ecache_dirty, extent_state_dirty, ind,
	    /* delay_coalesce */ true)) {
		return true;
	}
	/*
	 * Coalesce muzzy extents immediately, because operations on them are in
	 * the critical path much less often than for dirty extents.
	 */
	if (ecache_init(tsdn, &pac->ecache_muzzy, extent_state_muzzy, ind,
	    /* delay_coalesce */ false)) {
		return true;
	}
	/*
	 * Coalesce retained extents immediately, in part because they will
	 * never be evicted (and therefore there's no opportunity for delayed
	 * coalescing), but also because operations on retained extents are not
	 * in the critical path.
	 */
	if (ecache_init(tsdn, &pac->ecache_retained, extent_state_retained,
	    ind, /* delay_coalesce */ false)) {
		return true;
	}
	exp_grow_init(&pac->exp_grow);
	if (malloc_mutex_init(&pac->grow_mtx, "extent_grow",
	    WITNESS_RANK_EXTENT_GROW, malloc_mutex_rank_exclusive)) {
		return true;
	}
	atomic_store_zu(&pac->oversize_threshold, pac_oversize_threshold,
	    ATOMIC_RELAXED);
	if (decay_init(&pac->decay_dirty, cur_time, dirty_decay_ms)) {
		return true;
	}
	if (decay_init(&pac->decay_muzzy, cur_time, muzzy_decay_ms)) {
		return true;
	}
	if (san_bump_alloc_init(&pac->sba)) {
		return true;
	}

	pac->base = base;
	pac->emap = emap;
	pac->edata_cache = edata_cache;
	pac->stats = pac_stats;
	pac->stats_mtx = stats_mtx;
	atomic_store_zu(&pac->extent_sn_next, 0, ATOMIC_RELAXED);

	pac->pai.alloc = &pac_alloc_impl;
	pac->pai.alloc_batch = &pai_alloc_batch_default;
	pac->pai.expand = &pac_expand_impl;
	pac->pai.shrink = &pac_shrink_impl;
	pac->pai.dalloc = &pac_dalloc_impl;
	pac->pai.dalloc_batch = &pai_dalloc_batch_default;
	pac->pai.time_until_deferred_work = &pac_time_until_deferred_work;

	return false;
}

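/*
 * When muzzy decay is disabled (decay_ms == 0), pages never linger in the
 * muzzy state, so the muzzy ecache is guaranteed empty and the lookup can be
 * skipped.
 */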
static inline bool
pac_may_have_muzzy(pac_t *pac) {
	return pac_decay_ms_get(pac, extent_state_muzzy) != 0;
}

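/*
 * Try the caches in order of increasing cost: dirty first, then muzzy (if it
 * may be non-empty), and finally grow out of the retained extents, mapping
 * new memory if necessary.
 */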
static edata_t *
pac_alloc_real(tsdn_t *tsdn, pac_t *pac, ehooks_t *ehooks, size_t size,
    size_t alignment, bool zero, bool guarded) {
	assert(!guarded || alignment <= PAGE);

	edata_t *edata = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_dirty,
	    NULL, size, alignment, zero, guarded);

	if (edata == NULL && pac_may_have_muzzy(pac)) {
		edata = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_muzzy,
		    NULL, size, alignment, zero, guarded);
	}
	if (edata == NULL) {
		edata = ecache_alloc_grow(tsdn, pac, ehooks,
		    &pac->ecache_retained, NULL, size, alignment, zero,
		    guarded);
		if (config_stats && edata != NULL) {
			atomic_fetch_add_zu(&pac->stats->pac_mapped, size,
			    ATOMIC_RELAXED);
		}
	}

	return edata;
}

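/*
 * Create a fresh guarded extent: either via the san bump allocator (for
 * frequently reused allocations, when enabled), or by allocating a regular
 * extent large enough to dedicate guard pages on both sides.
 */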
static edata_t *
pac_alloc_new_guarded(tsdn_t *tsdn, pac_t *pac, ehooks_t *ehooks, size_t size,
    size_t alignment, bool zero, bool frequent_reuse) {
	assert(alignment <= PAGE);

	edata_t *edata;
	if (san_bump_enabled() && frequent_reuse) {
		edata = san_bump_alloc(tsdn, &pac->sba, pac, ehooks, size,
		    zero);
	} else {
		size_t size_with_guards = san_two_side_guarded_sz(size);
		/* Alloc a non-guarded extent first. */
		edata = pac_alloc_real(tsdn, pac, ehooks, size_with_guards,
		    /* alignment */ PAGE, zero, /* guarded */ false);
		if (edata != NULL) {
			/* Add guards around it. */
			assert(edata_size_get(edata) == size_with_guards);
			san_guard_pages_two_sided(tsdn, ehooks, edata,
			    pac->emap, true);
		}
	}
	assert(edata == NULL || (edata_guarded_get(edata) &&
	    edata_size_get(edata) == size));

	return edata;
}

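/*
 * The pai_t alloc hook.  Serve from the ecaches when possible; guarded
 * requests that miss fall through to pac_alloc_new_guarded.
 */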
static edata_t *
pac_alloc_impl(tsdn_t *tsdn, pai_t *self, size_t size, size_t alignment,
    bool zero, bool guarded, bool frequent_reuse,
    bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	edata_t *edata = NULL;
	/*
	 * The condition is an optimization: guarded allocations that are not
	 * frequently reused are never put in the ecache, and pac_alloc_real
	 * does not grow retained memory for guarded allocations, so it would
	 * always return NULL for them.
	 */
	if (!guarded || frequent_reuse) {
		edata = pac_alloc_real(tsdn, pac, ehooks, size, alignment,
		    zero, guarded);
	}
	if (edata == NULL && guarded) {
		/* No cached guarded extents; create a new one. */
		edata = pac_alloc_new_guarded(tsdn, pac, ehooks, size,
		    alignment, zero, frequent_reuse);
	}

	return edata;
}

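/*
 * Expand in place by allocating a trail extent contiguous with edata (using
 * the same dirty -> muzzy -> retained fallback as allocation) and merging it
 * in.  Returns true on failure.
 */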
static bool
pac_expand_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata, size_t old_size,
    size_t new_size, bool zero, bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	size_t mapped_add = 0;
	size_t expand_amount = new_size - old_size;

	if (ehooks_merge_will_fail(ehooks)) {
		return true;
	}
	edata_t *trail = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_dirty,
	    edata, expand_amount, PAGE, zero, /* guarded */ false);
	if (trail == NULL) {
		trail = ecache_alloc(tsdn, pac, ehooks, &pac->ecache_muzzy,
		    edata, expand_amount, PAGE, zero, /* guarded */ false);
	}
	if (trail == NULL) {
		trail = ecache_alloc_grow(tsdn, pac, ehooks,
		    &pac->ecache_retained, edata, expand_amount, PAGE, zero,
		    /* guarded */ false);
		mapped_add = expand_amount;
	}
	if (trail == NULL) {
		return true;
	}
	if (extent_merge_wrapper(tsdn, pac, ehooks, edata, trail)) {
		extent_dalloc_wrapper(tsdn, pac, ehooks, trail);
		return true;
	}
	if (config_stats && mapped_add > 0) {
		atomic_fetch_add_zu(&pac->stats->pac_mapped, mapped_add,
		    ATOMIC_RELAXED);
	}
	return false;
}

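/*
 * Shrink in place by splitting off the tail and returning it to the dirty
 * ecache; purging of the freed tail is deferred to decay.  Returns true on
 * failure.
 */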
static bool
pac_shrink_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata, size_t old_size,
    size_t new_size, bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	size_t shrink_amount = old_size - new_size;

	if (ehooks_split_will_fail(ehooks)) {
		return true;
	}

	edata_t *trail = extent_split_wrapper(tsdn, pac, ehooks, edata,
	    new_size, shrink_amount, /* holding_core_locks */ false);
	if (trail == NULL) {
		return true;
	}
	ecache_dalloc(tsdn, pac, ehooks, &pac->ecache_dirty, trail);
	*deferred_work_generated = true;
	return false;
}

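/*
 * The pai_t dalloc hook: return the extent to the dirty ecache, deferring
 * the actual purge to decay.  Guarded extents may first have their guard
 * pages removed; see below.
 */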
static void
pac_dalloc_impl(tsdn_t *tsdn, pai_t *self, edata_t *edata,
    bool *deferred_work_generated) {
	pac_t *pac = (pac_t *)self;
	ehooks_t *ehooks = pac_ehooks_get(pac);

	if (edata_guarded_get(edata)) {
		/*
		 * Because cached guarded extents do exact fit only, large
		 * guarded extents are restored on dalloc eagerly (otherwise
		 * they will not be reused efficiently).  Slab sizes have a
		 * limited number of size classes, and tend to cycle faster.
		 *
		 * In the case where coalesce is restrained (VirtualFree on
		 * Windows), guarded extents are also not cached -- otherwise
		 * during arena destroy / reset, the retained extents would not
		 * be whole regions (i.e. they are split between regular and
		 * guarded).
		 */
		if (!edata_slab_get(edata) || !maps_coalesce) {
			assert(edata_size_get(edata) >= SC_LARGE_MINCLASS ||
			    !maps_coalesce);
			san_unguard_pages_two_sided(tsdn, ehooks, edata,
			    pac->emap);
		}
	}

	ecache_dalloc(tsdn, pac, ehooks, &pac->ecache_dirty, edata);
	/* Purging of deallocated pages is deferred. */
	*deferred_work_generated = true;
}

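/*
 * Nanoseconds until the next deferred purge for one decay state.  If the
 * decay mutex is contended, report the minimum deferral interval rather than
 * blocking on it.
 */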
static inline uint64_t
pac_ns_until_purge(tsdn_t *tsdn, decay_t *decay, size_t npages) {
	if (malloc_mutex_trylock(tsdn, &decay->mtx)) {
		/* Use minimal interval if decay is contended. */
		return BACKGROUND_THREAD_DEFERRED_MIN;
	}
	uint64_t result = decay_ns_until_purge(decay, npages,
	    ARENA_DEFERRED_PURGE_NPAGES_THRESHOLD);

	malloc_mutex_unlock(tsdn, &decay->mtx);
	return result;
}

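/*
 * Deferred work is due at the earlier of the dirty and muzzy purge
 * deadlines; the muzzy check is skipped if dirty already reports the minimum
 * interval.
 */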
static uint64_t
pac_time_until_deferred_work(tsdn_t *tsdn, pai_t *self) {
	uint64_t time;
	pac_t *pac = (pac_t *)self;

	time = pac_ns_until_purge(tsdn,
	    &pac->decay_dirty,
	    ecache_npages_get(&pac->ecache_dirty));
	if (time == BACKGROUND_THREAD_DEFERRED_MIN) {
		return time;
	}

	uint64_t muzzy = pac_ns_until_purge(tsdn,
	    &pac->decay_muzzy,
	    ecache_npages_get(&pac->ecache_muzzy));
	if (muzzy < time) {
		time = muzzy;
	}
	return time;
}

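/*
 * Read and/or update the retained-extent grow limit; either pointer may be
 * NULL.  A new limit is rounded down to a page size class, and the call
 * fails (returns true) if it exceeds the largest class.
 */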
bool
pac_retain_grow_limit_get_set(tsdn_t *tsdn, pac_t *pac, size_t *old_limit,
    size_t *new_limit) {
	pszind_t new_ind JEMALLOC_CC_SILENCE_INIT(0);
	if (new_limit != NULL) {
		size_t limit = *new_limit;
		/* Grow no more than the new limit. */
		if ((new_ind = sz_psz2ind(limit + 1) - 1) >= SC_NPSIZES) {
			return true;
		}
	}

	malloc_mutex_lock(tsdn, &pac->grow_mtx);
	if (old_limit != NULL) {
		*old_limit = sz_pind2sz(pac->exp_grow.limit);
	}
	if (new_limit != NULL) {
		pac->exp_grow.limit = new_ind;
	}
	malloc_mutex_unlock(tsdn, &pac->grow_mtx);

	return false;
}

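/*
 * Evict extents from ecache until its page count drops to npages_limit,
 * stashing at most npages_decay_max pages onto result for later purging.
 * Returns the number of pages stashed.
 */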
static size_t
pac_stash_decayed(tsdn_t *tsdn, pac_t *pac, ecache_t *ecache,
    size_t npages_limit, size_t npages_decay_max,
    edata_list_inactive_t *result) {
	witness_assert_depth_to_rank(tsdn_witness_tsdp_get(tsdn),
	    WITNESS_RANK_CORE, 0);
	ehooks_t *ehooks = pac_ehooks_get(pac);

	/* Stash extents according to npages_limit. */
	size_t nstashed = 0;
	while (nstashed < npages_decay_max) {
		edata_t *edata = ecache_evict(tsdn, pac, ehooks, ecache,
		    npages_limit);
		if (edata == NULL) {
			break;
		}
		edata_list_inactive_append(result, edata);
		nstashed += edata_size_get(edata) >> LG_PAGE;
	}
	return nstashed;
}

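/*
 * Purge the stashed extents.  Dirty extents are lazily purged and demoted to
 * muzzy when muzzy decay is in use; otherwise (and for muzzy extents) they
 * are unmapped outright.  Returns the number of pages purged.
 */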
static size_t
pac_decay_stashed(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache, bool fully_decay,
    edata_list_inactive_t *decay_extents) {
	bool err;

	size_t nmadvise = 0;
	size_t nunmapped = 0;
	size_t npurged = 0;

	ehooks_t *ehooks = pac_ehooks_get(pac);

	bool try_muzzy = !fully_decay
	    && pac_decay_ms_get(pac, extent_state_muzzy) != 0;

	for (edata_t *edata = edata_list_inactive_first(decay_extents); edata !=
	    NULL; edata = edata_list_inactive_first(decay_extents)) {
		edata_list_inactive_remove(decay_extents, edata);

		size_t size = edata_size_get(edata);
		size_t npages = size >> LG_PAGE;

		nmadvise++;
		npurged += npages;

		switch (ecache->state) {
		case extent_state_active:
			not_reached();
		case extent_state_dirty:
			if (try_muzzy) {
				err = extent_purge_lazy_wrapper(tsdn, ehooks,
				    edata, /* offset */ 0, size);
				if (!err) {
					ecache_dalloc(tsdn, pac, ehooks,
					    &pac->ecache_muzzy, edata);
					break;
				}
			}
			JEMALLOC_FALLTHROUGH;
		case extent_state_muzzy:
			extent_dalloc_wrapper(tsdn, pac, ehooks, edata);
			nunmapped += npages;
			break;
		case extent_state_retained:
		default:
			not_reached();
		}
	}

	if (config_stats) {
		LOCKEDINT_MTX_LOCK(tsdn, *pac->stats_mtx);
		locked_inc_u64(tsdn, LOCKEDINT_MTX(*pac->stats_mtx),
		    &decay_stats->npurge, 1);
		locked_inc_u64(tsdn, LOCKEDINT_MTX(*pac->stats_mtx),
		    &decay_stats->nmadvise, nmadvise);
		locked_inc_u64(tsdn, LOCKEDINT_MTX(*pac->stats_mtx),
		    &decay_stats->purged, npurged);
		LOCKEDINT_MTX_UNLOCK(tsdn, *pac->stats_mtx);
		atomic_fetch_sub_zu(&pac->stats->pac_mapped,
		    nunmapped << LG_PAGE, ATOMIC_RELAXED);
	}

	return npurged;
}

/*
 * Decay at most npages_decay_max pages without violating the invariant
 * (ecache_npages_get(ecache) >= npages_limit).  The per-run upper bound is
 * needed to keep the amount of work bounded (namely in stashing): without
 * it, new pages could keep being added to the ecache during the current
 * decay run, so that the purging thread never finishes.
 */
static void
pac_decay_to_limit(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache, bool fully_decay,
    size_t npages_limit, size_t npages_decay_max) {
	witness_assert_depth_to_rank(tsdn_witness_tsdp_get(tsdn),
	    WITNESS_RANK_CORE, 1);

	if (decay->purging || npages_decay_max == 0) {
		return;
	}
	decay->purging = true;
	malloc_mutex_unlock(tsdn, &decay->mtx);

	edata_list_inactive_t decay_extents;
	edata_list_inactive_init(&decay_extents);
	size_t npurge = pac_stash_decayed(tsdn, pac, ecache, npages_limit,
	    npages_decay_max, &decay_extents);
	if (npurge != 0) {
		size_t npurged = pac_decay_stashed(tsdn, pac, decay,
		    decay_stats, ecache, fully_decay, &decay_extents);
		assert(npurged == npurge);
	}

	malloc_mutex_lock(tsdn, &decay->mtx);
	decay->purging = false;
}

void
pac_decay_all(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache, bool fully_decay) {
	malloc_mutex_assert_owner(tsdn, &decay->mtx);
	pac_decay_to_limit(tsdn, pac, decay, decay_stats, ecache, fully_decay,
	    /* npages_limit */ 0, ecache_npages_get(ecache));
}

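/* Purge only if the current page count exceeds the decay-curve limit. */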
static void
pac_decay_try_purge(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache,
    size_t current_npages, size_t npages_limit) {
	if (current_npages > npages_limit) {
		pac_decay_to_limit(tsdn, pac, decay, decay_stats, ecache,
		    /* fully_decay */ false, npages_limit,
		    current_npages - npages_limit);
	}
}

bool
pac_maybe_decay_purge(tsdn_t *tsdn, pac_t *pac, decay_t *decay,
    pac_decay_stats_t *decay_stats, ecache_t *ecache,
    pac_purge_eagerness_t eagerness) {
	malloc_mutex_assert_owner(tsdn, &decay->mtx);

	/* Purge all or nothing if the option is disabled. */
	ssize_t decay_ms = decay_ms_read(decay);
	if (decay_ms <= 0) {
		if (decay_ms == 0) {
			pac_decay_to_limit(tsdn, pac, decay, decay_stats,
			    ecache, /* fully_decay */ false,
			    /* npages_limit */ 0, ecache_npages_get(ecache));
		}
		return false;
	}

	/*
	 * If the deadline has been reached, advance to the current epoch and
	 * purge to the new limit if necessary.  Note that dirty pages created
	 * during the current epoch are not subject to purge until a future
	 * epoch, so purging only happens on epoch advances, or when triggered
	 * by background threads as a scheduled event.
	 */
	nstime_t time;
	nstime_init_update(&time);
	size_t npages_current = ecache_npages_get(ecache);
	bool epoch_advanced = decay_maybe_advance_epoch(decay, &time,
	    npages_current);
	if (eagerness == PAC_PURGE_ALWAYS
	    || (epoch_advanced && eagerness == PAC_PURGE_ON_EPOCH_ADVANCE)) {
		size_t npages_limit = decay_npages_limit_get(decay);
		pac_decay_try_purge(tsdn, pac, decay, decay_stats, ecache,
		    npages_current, npages_limit);
	}

	return epoch_advanced;
}

bool
pac_decay_ms_set(tsdn_t *tsdn, pac_t *pac, extent_state_t state,
    ssize_t decay_ms, pac_purge_eagerness_t eagerness) {
	decay_t *decay;
	pac_decay_stats_t *decay_stats;
	ecache_t *ecache;
	pac_decay_data_get(pac, state, &decay, &decay_stats, &ecache);

	if (!decay_ms_valid(decay_ms)) {
		return true;
	}

	malloc_mutex_lock(tsdn, &decay->mtx);
	/*
	 * Restart decay backlog from scratch, which may cause many dirty pages
	 * to be immediately purged.  It would conceptually be possible to map
	 * the old backlog onto the new backlog, but there is no justification
	 * for such complexity since decay_ms changes are intended to be
	 * infrequent, either between the {-1, 0, >0} states, or a one-time
	 * arbitrary change during initial arena configuration.
	 */
	nstime_t cur_time;
	nstime_init_update(&cur_time);
	decay_reinit(decay, &cur_time, decay_ms);
	pac_maybe_decay_purge(tsdn, pac, decay, decay_stats, ecache, eagerness);
	malloc_mutex_unlock(tsdn, &decay->mtx);

	return false;
}

ssize_t
pac_decay_ms_get(pac_t *pac, extent_state_t state) {
	decay_t *decay;
	pac_decay_stats_t *decay_stats;
	ecache_t *ecache;
	pac_decay_data_get(pac, state, &decay, &decay_stats, &ecache);
	return decay_ms_read(decay);
}

void
pac_reset(tsdn_t *tsdn, pac_t *pac) {
	/*
	 * No-op for now; purging is still done at the arena level.  It should
	 * get moved in here, though.
	 */
	(void)tsdn;
	(void)pac;
}

void
pac_destroy(tsdn_t *tsdn, pac_t *pac) {
	assert(ecache_npages_get(&pac->ecache_dirty) == 0);
	assert(ecache_npages_get(&pac->ecache_muzzy) == 0);
	/*
	 * Iterate over the retained extents and destroy them.  This gives the
	 * extent allocator underlying the extent hooks an opportunity to unmap
	 * all retained memory without having to keep its own metadata
	 * structures.  In practice, virtual memory for dss-allocated extents is
	 * leaked here, so best practice is to avoid dss for arenas to be
	 * destroyed, or provide custom extent hooks that track retained
	 * dss-based extents for later reuse.
	 */
	ehooks_t *ehooks = pac_ehooks_get(pac);
	edata_t *edata;
	while ((edata = ecache_evict(tsdn, pac, ehooks,
	    &pac->ecache_retained, 0)) != NULL) {
		extent_destroy_wrapper(tsdn, pac, ehooks, edata);
	}
}