1b7eaed25SJason Evans #define JEMALLOC_EXTENT_DSS_C_
2b7eaed25SJason Evans #include "jemalloc/internal/jemalloc_preamble.h"
3b7eaed25SJason Evans #include "jemalloc/internal/jemalloc_internal_includes.h"
4b7eaed25SJason Evans
5b7eaed25SJason Evans #include "jemalloc/internal/assert.h"
6b7eaed25SJason Evans #include "jemalloc/internal/extent_dss.h"
7b7eaed25SJason Evans #include "jemalloc/internal/spin.h"
8b7eaed25SJason Evans
9b7eaed25SJason Evans /******************************************************************************/
10b7eaed25SJason Evans /* Data. */
11b7eaed25SJason Evans
12b7eaed25SJason Evans const char *opt_dss = DSS_DEFAULT;
13b7eaed25SJason Evans
14b7eaed25SJason Evans const char *dss_prec_names[] = {
15b7eaed25SJason Evans "disabled",
16b7eaed25SJason Evans "primary",
17b7eaed25SJason Evans "secondary",
18b7eaed25SJason Evans "N/A"
19b7eaed25SJason Evans };
20b7eaed25SJason Evans
21b7eaed25SJason Evans /*
22b7eaed25SJason Evans * Current dss precedence default, used when creating new arenas. NB: This is
23b7eaed25SJason Evans * stored as unsigned rather than dss_prec_t because in principle there's no
24b7eaed25SJason Evans * guarantee that sizeof(dss_prec_t) is the same as sizeof(unsigned), and we use
25b7eaed25SJason Evans * atomic operations to synchronize the setting.
26b7eaed25SJason Evans */
27b7eaed25SJason Evans static atomic_u_t dss_prec_default = ATOMIC_INIT(
28b7eaed25SJason Evans (unsigned)DSS_PREC_DEFAULT);
29b7eaed25SJason Evans
30b7eaed25SJason Evans /* Base address of the DSS. */
31b7eaed25SJason Evans static void *dss_base;
32b7eaed25SJason Evans /* Atomic boolean indicating whether a thread is currently extending DSS. */
33b7eaed25SJason Evans static atomic_b_t dss_extending;
34b7eaed25SJason Evans /* Atomic boolean indicating whether the DSS is exhausted. */
35b7eaed25SJason Evans static atomic_b_t dss_exhausted;
36b7eaed25SJason Evans /* Atomic current upper limit on DSS addresses. */
37b7eaed25SJason Evans static atomic_p_t dss_max;
38b7eaed25SJason Evans
39b7eaed25SJason Evans /******************************************************************************/
40b7eaed25SJason Evans
/*
 * Forward to sbrk() when the build defines JEMALLOC_DSS.  In builds without
 * it, call not_implemented() and return NULL.
 */
static void *
extent_dss_sbrk(intptr_t increment) {
#ifndef JEMALLOC_DSS
	not_implemented();
	return NULL;
#else
	return sbrk(increment);
#endif
}
50b7eaed25SJason Evans
51b7eaed25SJason Evans dss_prec_t
extent_dss_prec_get(void)52b7eaed25SJason Evans extent_dss_prec_get(void) {
53b7eaed25SJason Evans dss_prec_t ret;
54b7eaed25SJason Evans
55b7eaed25SJason Evans if (!have_dss) {
56b7eaed25SJason Evans return dss_prec_disabled;
57b7eaed25SJason Evans }
58b7eaed25SJason Evans ret = (dss_prec_t)atomic_load_u(&dss_prec_default, ATOMIC_ACQUIRE);
59b7eaed25SJason Evans return ret;
60b7eaed25SJason Evans }
61b7eaed25SJason Evans
62b7eaed25SJason Evans bool
extent_dss_prec_set(dss_prec_t dss_prec)63b7eaed25SJason Evans extent_dss_prec_set(dss_prec_t dss_prec) {
64b7eaed25SJason Evans if (!have_dss) {
65b7eaed25SJason Evans return (dss_prec != dss_prec_disabled);
66b7eaed25SJason Evans }
67b7eaed25SJason Evans atomic_store_u(&dss_prec_default, (unsigned)dss_prec, ATOMIC_RELEASE);
68b7eaed25SJason Evans return false;
69b7eaed25SJason Evans }
70b7eaed25SJason Evans
71b7eaed25SJason Evans static void
extent_dss_extending_start(void)72b7eaed25SJason Evans extent_dss_extending_start(void) {
73b7eaed25SJason Evans spin_t spinner = SPIN_INITIALIZER;
74b7eaed25SJason Evans while (true) {
75b7eaed25SJason Evans bool expected = false;
76b7eaed25SJason Evans if (atomic_compare_exchange_weak_b(&dss_extending, &expected,
77b7eaed25SJason Evans true, ATOMIC_ACQ_REL, ATOMIC_RELAXED)) {
78b7eaed25SJason Evans break;
79b7eaed25SJason Evans }
80b7eaed25SJason Evans spin_adaptive(&spinner);
81b7eaed25SJason Evans }
82b7eaed25SJason Evans }
83b7eaed25SJason Evans
84b7eaed25SJason Evans static void
extent_dss_extending_finish(void)85b7eaed25SJason Evans extent_dss_extending_finish(void) {
86b7eaed25SJason Evans assert(atomic_load_b(&dss_extending, ATOMIC_RELAXED));
87b7eaed25SJason Evans
88b7eaed25SJason Evans atomic_store_b(&dss_extending, false, ATOMIC_RELEASE);
89b7eaed25SJason Evans }
90b7eaed25SJason Evans
91b7eaed25SJason Evans static void *
extent_dss_max_update(void * new_addr)92b7eaed25SJason Evans extent_dss_max_update(void *new_addr) {
93b7eaed25SJason Evans /*
94b7eaed25SJason Evans * Get the current end of the DSS as max_cur and assure that dss_max is
95b7eaed25SJason Evans * up to date.
96b7eaed25SJason Evans */
97b7eaed25SJason Evans void *max_cur = extent_dss_sbrk(0);
98b7eaed25SJason Evans if (max_cur == (void *)-1) {
99b7eaed25SJason Evans return NULL;
100b7eaed25SJason Evans }
101b7eaed25SJason Evans atomic_store_p(&dss_max, max_cur, ATOMIC_RELEASE);
102b7eaed25SJason Evans /* Fixed new_addr can only be supported if it is at the edge of DSS. */
103b7eaed25SJason Evans if (new_addr != NULL && max_cur != new_addr) {
104b7eaed25SJason Evans return NULL;
105b7eaed25SJason Evans }
106b7eaed25SJason Evans return max_cur;
107b7eaed25SJason Evans }
108b7eaed25SJason Evans
109b7eaed25SJason Evans void *
extent_alloc_dss(tsdn_t * tsdn,arena_t * arena,void * new_addr,size_t size,size_t alignment,bool * zero,bool * commit)110b7eaed25SJason Evans extent_alloc_dss(tsdn_t *tsdn, arena_t *arena, void *new_addr, size_t size,
111b7eaed25SJason Evans size_t alignment, bool *zero, bool *commit) {
112b7eaed25SJason Evans extent_t *gap;
113b7eaed25SJason Evans
114b7eaed25SJason Evans cassert(have_dss);
115b7eaed25SJason Evans assert(size > 0);
116*c5ad8142SEric van Gyzen assert(alignment == ALIGNMENT_CEILING(alignment, PAGE));
117b7eaed25SJason Evans
118b7eaed25SJason Evans /*
119b7eaed25SJason Evans * sbrk() uses a signed increment argument, so take care not to
120b7eaed25SJason Evans * interpret a large allocation request as a negative increment.
121b7eaed25SJason Evans */
122b7eaed25SJason Evans if ((intptr_t)size < 0) {
123b7eaed25SJason Evans return NULL;
124b7eaed25SJason Evans }
125b7eaed25SJason Evans
126b7eaed25SJason Evans gap = extent_alloc(tsdn, arena);
127b7eaed25SJason Evans if (gap == NULL) {
128b7eaed25SJason Evans return NULL;
129b7eaed25SJason Evans }
130b7eaed25SJason Evans
131b7eaed25SJason Evans extent_dss_extending_start();
132b7eaed25SJason Evans if (!atomic_load_b(&dss_exhausted, ATOMIC_ACQUIRE)) {
133b7eaed25SJason Evans /*
134b7eaed25SJason Evans * The loop is necessary to recover from races with other
135b7eaed25SJason Evans * threads that are using the DSS for something other than
136b7eaed25SJason Evans * malloc.
137b7eaed25SJason Evans */
138b7eaed25SJason Evans while (true) {
139b7eaed25SJason Evans void *max_cur = extent_dss_max_update(new_addr);
140b7eaed25SJason Evans if (max_cur == NULL) {
141b7eaed25SJason Evans goto label_oom;
142b7eaed25SJason Evans }
143b7eaed25SJason Evans
144b7eaed25SJason Evans /*
145b7eaed25SJason Evans * Compute how much page-aligned gap space (if any) is
146b7eaed25SJason Evans * necessary to satisfy alignment. This space can be
147b7eaed25SJason Evans * recycled for later use.
148b7eaed25SJason Evans */
149b7eaed25SJason Evans void *gap_addr_page = (void *)(PAGE_CEILING(
150b7eaed25SJason Evans (uintptr_t)max_cur));
151b7eaed25SJason Evans void *ret = (void *)ALIGNMENT_CEILING(
152b7eaed25SJason Evans (uintptr_t)gap_addr_page, alignment);
153b7eaed25SJason Evans size_t gap_size_page = (uintptr_t)ret -
154b7eaed25SJason Evans (uintptr_t)gap_addr_page;
155b7eaed25SJason Evans if (gap_size_page != 0) {
156b7eaed25SJason Evans extent_init(gap, arena, gap_addr_page,
157*c5ad8142SEric van Gyzen gap_size_page, false, SC_NSIZES,
158b7eaed25SJason Evans arena_extent_sn_next(arena),
159*c5ad8142SEric van Gyzen extent_state_active, false, true, true,
160*c5ad8142SEric van Gyzen EXTENT_NOT_HEAD);
161b7eaed25SJason Evans }
162b7eaed25SJason Evans /*
163b7eaed25SJason Evans * Compute the address just past the end of the desired
164b7eaed25SJason Evans * allocation space.
165b7eaed25SJason Evans */
166b7eaed25SJason Evans void *dss_next = (void *)((uintptr_t)ret + size);
167b7eaed25SJason Evans if ((uintptr_t)ret < (uintptr_t)max_cur ||
168b7eaed25SJason Evans (uintptr_t)dss_next < (uintptr_t)max_cur) {
169b7eaed25SJason Evans goto label_oom; /* Wrap-around. */
170b7eaed25SJason Evans }
171b7eaed25SJason Evans /* Compute the increment, including subpage bytes. */
172b7eaed25SJason Evans void *gap_addr_subpage = max_cur;
173b7eaed25SJason Evans size_t gap_size_subpage = (uintptr_t)ret -
174b7eaed25SJason Evans (uintptr_t)gap_addr_subpage;
175b7eaed25SJason Evans intptr_t incr = gap_size_subpage + size;
176b7eaed25SJason Evans
177b7eaed25SJason Evans assert((uintptr_t)max_cur + incr == (uintptr_t)ret +
178b7eaed25SJason Evans size);
179b7eaed25SJason Evans
180b7eaed25SJason Evans /* Try to allocate. */
181b7eaed25SJason Evans void *dss_prev = extent_dss_sbrk(incr);
182b7eaed25SJason Evans if (dss_prev == max_cur) {
183b7eaed25SJason Evans /* Success. */
184b7eaed25SJason Evans atomic_store_p(&dss_max, dss_next,
185b7eaed25SJason Evans ATOMIC_RELEASE);
186b7eaed25SJason Evans extent_dss_extending_finish();
187b7eaed25SJason Evans
188b7eaed25SJason Evans if (gap_size_page != 0) {
189b7eaed25SJason Evans extent_dalloc_gap(tsdn, arena, gap);
190b7eaed25SJason Evans } else {
191b7eaed25SJason Evans extent_dalloc(tsdn, arena, gap);
192b7eaed25SJason Evans }
193b7eaed25SJason Evans if (!*commit) {
194b7eaed25SJason Evans *commit = pages_decommit(ret, size);
195b7eaed25SJason Evans }
196b7eaed25SJason Evans if (*zero && *commit) {
197b7eaed25SJason Evans extent_hooks_t *extent_hooks =
198b7eaed25SJason Evans EXTENT_HOOKS_INITIALIZER;
199b7eaed25SJason Evans extent_t extent;
200b7eaed25SJason Evans
201b7eaed25SJason Evans extent_init(&extent, arena, ret, size,
202*c5ad8142SEric van Gyzen size, false, SC_NSIZES,
2030ef50b4eSJason Evans extent_state_active, false, true,
204*c5ad8142SEric van Gyzen true, EXTENT_NOT_HEAD);
205b7eaed25SJason Evans if (extent_purge_forced_wrapper(tsdn,
206b7eaed25SJason Evans arena, &extent_hooks, &extent, 0,
207b7eaed25SJason Evans size)) {
208b7eaed25SJason Evans memset(ret, 0, size);
209b7eaed25SJason Evans }
210b7eaed25SJason Evans }
211b7eaed25SJason Evans return ret;
212b7eaed25SJason Evans }
213b7eaed25SJason Evans /*
214b7eaed25SJason Evans * Failure, whether due to OOM or a race with a raw
215b7eaed25SJason Evans * sbrk() call from outside the allocator.
216b7eaed25SJason Evans */
217b7eaed25SJason Evans if (dss_prev == (void *)-1) {
218b7eaed25SJason Evans /* OOM. */
219b7eaed25SJason Evans atomic_store_b(&dss_exhausted, true,
220b7eaed25SJason Evans ATOMIC_RELEASE);
221b7eaed25SJason Evans goto label_oom;
222b7eaed25SJason Evans }
223b7eaed25SJason Evans }
224b7eaed25SJason Evans }
225b7eaed25SJason Evans label_oom:
226b7eaed25SJason Evans extent_dss_extending_finish();
227b7eaed25SJason Evans extent_dalloc(tsdn, arena, gap);
228b7eaed25SJason Evans return NULL;
229b7eaed25SJason Evans }
230b7eaed25SJason Evans
231b7eaed25SJason Evans static bool
extent_in_dss_helper(void * addr,void * max)232b7eaed25SJason Evans extent_in_dss_helper(void *addr, void *max) {
233b7eaed25SJason Evans return ((uintptr_t)addr >= (uintptr_t)dss_base && (uintptr_t)addr <
234b7eaed25SJason Evans (uintptr_t)max);
235b7eaed25SJason Evans }
236b7eaed25SJason Evans
237b7eaed25SJason Evans bool
extent_in_dss(void * addr)238b7eaed25SJason Evans extent_in_dss(void *addr) {
239b7eaed25SJason Evans cassert(have_dss);
240b7eaed25SJason Evans
241b7eaed25SJason Evans return extent_in_dss_helper(addr, atomic_load_p(&dss_max,
242b7eaed25SJason Evans ATOMIC_ACQUIRE));
243b7eaed25SJason Evans }
244b7eaed25SJason Evans
245b7eaed25SJason Evans bool
extent_dss_mergeable(void * addr_a,void * addr_b)246b7eaed25SJason Evans extent_dss_mergeable(void *addr_a, void *addr_b) {
247b7eaed25SJason Evans void *max;
248b7eaed25SJason Evans
249b7eaed25SJason Evans cassert(have_dss);
250b7eaed25SJason Evans
251b7eaed25SJason Evans if ((uintptr_t)addr_a < (uintptr_t)dss_base && (uintptr_t)addr_b <
252b7eaed25SJason Evans (uintptr_t)dss_base) {
253b7eaed25SJason Evans return true;
254b7eaed25SJason Evans }
255b7eaed25SJason Evans
256b7eaed25SJason Evans max = atomic_load_p(&dss_max, ATOMIC_ACQUIRE);
257b7eaed25SJason Evans return (extent_in_dss_helper(addr_a, max) ==
258b7eaed25SJason Evans extent_in_dss_helper(addr_b, max));
259b7eaed25SJason Evans }
260b7eaed25SJason Evans
261b7eaed25SJason Evans void
extent_dss_boot(void)262b7eaed25SJason Evans extent_dss_boot(void) {
263b7eaed25SJason Evans cassert(have_dss);
264b7eaed25SJason Evans
265b7eaed25SJason Evans dss_base = extent_dss_sbrk(0);
266b7eaed25SJason Evans atomic_store_b(&dss_extending, false, ATOMIC_RELAXED);
267b7eaed25SJason Evans atomic_store_b(&dss_exhausted, dss_base == (void *)-1, ATOMIC_RELAXED);
268b7eaed25SJason Evans atomic_store_p(&dss_max, dss_base, ATOMIC_RELAXED);
269b7eaed25SJason Evans }
270b7eaed25SJason Evans
271b7eaed25SJason Evans /******************************************************************************/
272