1a4bd5210SJason Evans #define JEMALLOC_RTREE_C_
2b7eaed25SJason Evans #include "jemalloc/internal/jemalloc_preamble.h"
3b7eaed25SJason Evans #include "jemalloc/internal/jemalloc_internal_includes.h"
4a4bd5210SJason Evans
5b7eaed25SJason Evans #include "jemalloc/internal/assert.h"
6b7eaed25SJason Evans #include "jemalloc/internal/mutex.h"
7d0e79aa3SJason Evans
/*
 * Only the most significant bits of keys passed to rtree_{read,write}() are
 * used.
 */
12d0e79aa3SJason Evans bool
rtree_new(rtree_t * rtree,bool zeroed)13b7eaed25SJason Evans rtree_new(rtree_t *rtree, bool zeroed) {
14b7eaed25SJason Evans #ifdef JEMALLOC_JET
15b7eaed25SJason Evans if (!zeroed) {
16b7eaed25SJason Evans memset(rtree, 0, sizeof(rtree_t)); /* Clear root. */
17a4bd5210SJason Evans }
18b7eaed25SJason Evans #else
19b7eaed25SJason Evans assert(zeroed);
20b7eaed25SJason Evans #endif
21b7eaed25SJason Evans
22b7eaed25SJason Evans if (malloc_mutex_init(&rtree->init_lock, "rtree", WITNESS_RANK_RTREE,
23b7eaed25SJason Evans malloc_mutex_rank_exclusive)) {
24b7eaed25SJason Evans return true;
25a4bd5210SJason Evans }
26a4bd5210SJason Evans
27b7eaed25SJason Evans return false;
28f921d10fSJason Evans }
29f921d10fSJason Evans
30d0e79aa3SJason Evans static rtree_node_elm_t *
rtree_node_alloc_impl(tsdn_t * tsdn,rtree_t * rtree,size_t nelms)31b7eaed25SJason Evans rtree_node_alloc_impl(tsdn_t *tsdn, rtree_t *rtree, size_t nelms) {
32b7eaed25SJason Evans return (rtree_node_elm_t *)base_alloc(tsdn, b0get(), nelms *
33b7eaed25SJason Evans sizeof(rtree_node_elm_t), CACHELINE);
34b7eaed25SJason Evans }
35b7eaed25SJason Evans rtree_node_alloc_t *JET_MUTABLE rtree_node_alloc = rtree_node_alloc_impl;
36b7eaed25SJason Evans
37b7eaed25SJason Evans static void
rtree_node_dalloc_impl(tsdn_t * tsdn,rtree_t * rtree,rtree_node_elm_t * node)38b7eaed25SJason Evans rtree_node_dalloc_impl(tsdn_t *tsdn, rtree_t *rtree, rtree_node_elm_t *node) {
39b7eaed25SJason Evans /* Nodes are never deleted during normal operation. */
40b7eaed25SJason Evans not_reached();
41b7eaed25SJason Evans }
42*c5ad8142SEric van Gyzen rtree_node_dalloc_t *JET_MUTABLE rtree_node_dalloc =
43b7eaed25SJason Evans rtree_node_dalloc_impl;
44b7eaed25SJason Evans
45b7eaed25SJason Evans static rtree_leaf_elm_t *
rtree_leaf_alloc_impl(tsdn_t * tsdn,rtree_t * rtree,size_t nelms)46b7eaed25SJason Evans rtree_leaf_alloc_impl(tsdn_t *tsdn, rtree_t *rtree, size_t nelms) {
47b7eaed25SJason Evans return (rtree_leaf_elm_t *)base_alloc(tsdn, b0get(), nelms *
48b7eaed25SJason Evans sizeof(rtree_leaf_elm_t), CACHELINE);
49b7eaed25SJason Evans }
50b7eaed25SJason Evans rtree_leaf_alloc_t *JET_MUTABLE rtree_leaf_alloc = rtree_leaf_alloc_impl;
51b7eaed25SJason Evans
52b7eaed25SJason Evans static void
rtree_leaf_dalloc_impl(tsdn_t * tsdn,rtree_t * rtree,rtree_leaf_elm_t * leaf)53b7eaed25SJason Evans rtree_leaf_dalloc_impl(tsdn_t *tsdn, rtree_t *rtree, rtree_leaf_elm_t *leaf) {
54b7eaed25SJason Evans /* Leaves are never deleted during normal operation. */
55b7eaed25SJason Evans not_reached();
56b7eaed25SJason Evans }
57*c5ad8142SEric van Gyzen rtree_leaf_dalloc_t *JET_MUTABLE rtree_leaf_dalloc =
58b7eaed25SJason Evans rtree_leaf_dalloc_impl;
59b7eaed25SJason Evans
#ifdef JEMALLOC_JET
#  if RTREE_HEIGHT > 1
/*
 * Release everything reachable from the interior node array `subtree`, which
 * sits at depth `level` of the tree.
 *
 * Each non-NULL child is either recursed into (when the children are
 * themselves interior nodes) or handed to rtree_leaf_dalloc() (when the
 * children are leaves).  Afterwards the node array itself is passed to
 * rtree_node_dalloc(), except for rtree->root, which is left in place.
 */
static void
rtree_delete_subtree(tsdn_t *tsdn, rtree_t *rtree, rtree_node_elm_t *subtree,
    unsigned level) {
	const size_t nslots = ZU(1) << rtree_levels[level].bits;
	/* Children are leaves once the next level is the last one. */
	const bool children_are_nodes = (level + 2 < RTREE_HEIGHT);

	for (size_t slot = 0; slot < nslots; slot++) {
		void *child = atomic_load_p(&subtree[slot].child,
		    ATOMIC_RELAXED);
		if (child == NULL) {
			continue;
		}
		if (children_are_nodes) {
			rtree_delete_subtree(tsdn, rtree,
			    (rtree_node_elm_t *)child, level + 1);
		} else {
			rtree_leaf_dalloc(tsdn, rtree,
			    (rtree_leaf_elm_t *)child);
		}
	}

	if (subtree != rtree->root) {
		rtree_node_dalloc(tsdn, rtree, subtree);
	}
}
#  endif

/*
 * Tear down an rtree (only compiled when JEMALLOC_JET is defined).
 *
 * With RTREE_HEIGHT > 1 this walks the tree from rtree->root at level 0 and
 * releases nodes and leaves through the rtree_{node,leaf}_dalloc hooks; with
 * a single-level tree it does nothing.  Note that the default hook
 * implementations in this file call not_reached(), so this presumably relies
 * on the hooks having been replaced beforehand.
 */
void
rtree_delete(tsdn_t *tsdn, rtree_t *rtree) {
#  if RTREE_HEIGHT > 1
	rtree_delete_subtree(tsdn, rtree, rtree->root, 0);
#  endif
}
#endif
100b7eaed25SJason Evans
101b7eaed25SJason Evans static rtree_node_elm_t *
rtree_node_init(tsdn_t * tsdn,rtree_t * rtree,unsigned level,atomic_p_t * elmp)102b7eaed25SJason Evans rtree_node_init(tsdn_t *tsdn, rtree_t *rtree, unsigned level,
103b7eaed25SJason Evans atomic_p_t *elmp) {
104b7eaed25SJason Evans malloc_mutex_lock(tsdn, &rtree->init_lock);
105b7eaed25SJason Evans /*
106b7eaed25SJason Evans * If *elmp is non-null, then it was initialized with the init lock
107b7eaed25SJason Evans * held, so we can get by with 'relaxed' here.
108b7eaed25SJason Evans */
109b7eaed25SJason Evans rtree_node_elm_t *node = atomic_load_p(elmp, ATOMIC_RELAXED);
110b7eaed25SJason Evans if (node == NULL) {
111b7eaed25SJason Evans node = rtree_node_alloc(tsdn, rtree, ZU(1) <<
112b7eaed25SJason Evans rtree_levels[level].bits);
113b7eaed25SJason Evans if (node == NULL) {
114b7eaed25SJason Evans malloc_mutex_unlock(tsdn, &rtree->init_lock);
115b7eaed25SJason Evans return NULL;
116b7eaed25SJason Evans }
117b7eaed25SJason Evans /*
118b7eaed25SJason Evans * Even though we hold the lock, a later reader might not; we
119b7eaed25SJason Evans * need release semantics.
120b7eaed25SJason Evans */
121b7eaed25SJason Evans atomic_store_p(elmp, node, ATOMIC_RELEASE);
122b7eaed25SJason Evans }
123b7eaed25SJason Evans malloc_mutex_unlock(tsdn, &rtree->init_lock);
124b7eaed25SJason Evans
125b7eaed25SJason Evans return node;
126b7eaed25SJason Evans }
127b7eaed25SJason Evans
128b7eaed25SJason Evans static rtree_leaf_elm_t *
rtree_leaf_init(tsdn_t * tsdn,rtree_t * rtree,atomic_p_t * elmp)129b7eaed25SJason Evans rtree_leaf_init(tsdn_t *tsdn, rtree_t *rtree, atomic_p_t *elmp) {
130b7eaed25SJason Evans malloc_mutex_lock(tsdn, &rtree->init_lock);
131b7eaed25SJason Evans /*
132b7eaed25SJason Evans * If *elmp is non-null, then it was initialized with the init lock
133b7eaed25SJason Evans * held, so we can get by with 'relaxed' here.
134b7eaed25SJason Evans */
135b7eaed25SJason Evans rtree_leaf_elm_t *leaf = atomic_load_p(elmp, ATOMIC_RELAXED);
136b7eaed25SJason Evans if (leaf == NULL) {
137b7eaed25SJason Evans leaf = rtree_leaf_alloc(tsdn, rtree, ZU(1) <<
138b7eaed25SJason Evans rtree_levels[RTREE_HEIGHT-1].bits);
139b7eaed25SJason Evans if (leaf == NULL) {
140b7eaed25SJason Evans malloc_mutex_unlock(tsdn, &rtree->init_lock);
141b7eaed25SJason Evans return NULL;
142b7eaed25SJason Evans }
143b7eaed25SJason Evans /*
144b7eaed25SJason Evans * Even though we hold the lock, a later reader might not; we
145b7eaed25SJason Evans * need release semantics.
146b7eaed25SJason Evans */
147b7eaed25SJason Evans atomic_store_p(elmp, leaf, ATOMIC_RELEASE);
148b7eaed25SJason Evans }
149b7eaed25SJason Evans malloc_mutex_unlock(tsdn, &rtree->init_lock);
150b7eaed25SJason Evans
151b7eaed25SJason Evans return leaf;
152b7eaed25SJason Evans }
153b7eaed25SJason Evans
154b7eaed25SJason Evans static bool
rtree_node_valid(rtree_node_elm_t * node)155b7eaed25SJason Evans rtree_node_valid(rtree_node_elm_t *node) {
156b7eaed25SJason Evans return ((uintptr_t)node != (uintptr_t)0);
157b7eaed25SJason Evans }
158b7eaed25SJason Evans
159b7eaed25SJason Evans static bool
rtree_leaf_valid(rtree_leaf_elm_t * leaf)160b7eaed25SJason Evans rtree_leaf_valid(rtree_leaf_elm_t *leaf) {
161b7eaed25SJason Evans return ((uintptr_t)leaf != (uintptr_t)0);
162b7eaed25SJason Evans }
163b7eaed25SJason Evans
164b7eaed25SJason Evans static rtree_node_elm_t *
rtree_child_node_tryread(rtree_node_elm_t * elm,bool dependent)165b7eaed25SJason Evans rtree_child_node_tryread(rtree_node_elm_t *elm, bool dependent) {
166d0e79aa3SJason Evans rtree_node_elm_t *node;
16782872ac0SJason Evans
168b7eaed25SJason Evans if (dependent) {
169b7eaed25SJason Evans node = (rtree_node_elm_t *)atomic_load_p(&elm->child,
170b7eaed25SJason Evans ATOMIC_RELAXED);
171d0e79aa3SJason Evans } else {
172b7eaed25SJason Evans node = (rtree_node_elm_t *)atomic_load_p(&elm->child,
173b7eaed25SJason Evans ATOMIC_ACQUIRE);
17482872ac0SJason Evans }
17582872ac0SJason Evans
176b7eaed25SJason Evans assert(!dependent || node != NULL);
177b7eaed25SJason Evans return node;
17882872ac0SJason Evans }
17982872ac0SJason Evans
180b7eaed25SJason Evans static rtree_node_elm_t *
rtree_child_node_read(tsdn_t * tsdn,rtree_t * rtree,rtree_node_elm_t * elm,unsigned level,bool dependent)181b7eaed25SJason Evans rtree_child_node_read(tsdn_t *tsdn, rtree_t *rtree, rtree_node_elm_t *elm,
182b7eaed25SJason Evans unsigned level, bool dependent) {
183b7eaed25SJason Evans rtree_node_elm_t *node;
18482872ac0SJason Evans
185b7eaed25SJason Evans node = rtree_child_node_tryread(elm, dependent);
186b7eaed25SJason Evans if (!dependent && unlikely(!rtree_node_valid(node))) {
187b7eaed25SJason Evans node = rtree_node_init(tsdn, rtree, level + 1, &elm->child);
188b7eaed25SJason Evans }
189b7eaed25SJason Evans assert(!dependent || node != NULL);
190b7eaed25SJason Evans return node;
191d0e79aa3SJason Evans }
192d0e79aa3SJason Evans
193b7eaed25SJason Evans static rtree_leaf_elm_t *
rtree_child_leaf_tryread(rtree_node_elm_t * elm,bool dependent)194b7eaed25SJason Evans rtree_child_leaf_tryread(rtree_node_elm_t *elm, bool dependent) {
195b7eaed25SJason Evans rtree_leaf_elm_t *leaf;
196d0e79aa3SJason Evans
197b7eaed25SJason Evans if (dependent) {
198b7eaed25SJason Evans leaf = (rtree_leaf_elm_t *)atomic_load_p(&elm->child,
199b7eaed25SJason Evans ATOMIC_RELAXED);
200b7eaed25SJason Evans } else {
201b7eaed25SJason Evans leaf = (rtree_leaf_elm_t *)atomic_load_p(&elm->child,
202b7eaed25SJason Evans ATOMIC_ACQUIRE);
203b7eaed25SJason Evans }
204b7eaed25SJason Evans
205b7eaed25SJason Evans assert(!dependent || leaf != NULL);
206b7eaed25SJason Evans return leaf;
207b7eaed25SJason Evans }
208b7eaed25SJason Evans
209b7eaed25SJason Evans static rtree_leaf_elm_t *
rtree_child_leaf_read(tsdn_t * tsdn,rtree_t * rtree,rtree_node_elm_t * elm,unsigned level,bool dependent)210b7eaed25SJason Evans rtree_child_leaf_read(tsdn_t *tsdn, rtree_t *rtree, rtree_node_elm_t *elm,
211b7eaed25SJason Evans unsigned level, bool dependent) {
212b7eaed25SJason Evans rtree_leaf_elm_t *leaf;
213b7eaed25SJason Evans
214b7eaed25SJason Evans leaf = rtree_child_leaf_tryread(elm, dependent);
215b7eaed25SJason Evans if (!dependent && unlikely(!rtree_leaf_valid(leaf))) {
216b7eaed25SJason Evans leaf = rtree_leaf_init(tsdn, rtree, &elm->child);
217b7eaed25SJason Evans }
218b7eaed25SJason Evans assert(!dependent || leaf != NULL);
219b7eaed25SJason Evans return leaf;
220b7eaed25SJason Evans }
221b7eaed25SJason Evans
222b7eaed25SJason Evans rtree_leaf_elm_t *
rtree_leaf_elm_lookup_hard(tsdn_t * tsdn,rtree_t * rtree,rtree_ctx_t * rtree_ctx,uintptr_t key,bool dependent,bool init_missing)223b7eaed25SJason Evans rtree_leaf_elm_lookup_hard(tsdn_t *tsdn, rtree_t *rtree, rtree_ctx_t *rtree_ctx,
224b7eaed25SJason Evans uintptr_t key, bool dependent, bool init_missing) {
225b7eaed25SJason Evans rtree_node_elm_t *node;
226b7eaed25SJason Evans rtree_leaf_elm_t *leaf;
227b7eaed25SJason Evans #if RTREE_HEIGHT > 1
228b7eaed25SJason Evans node = rtree->root;
229b7eaed25SJason Evans #else
230b7eaed25SJason Evans leaf = rtree->root;
231b7eaed25SJason Evans #endif
232b7eaed25SJason Evans
233b7eaed25SJason Evans if (config_debug) {
234b7eaed25SJason Evans uintptr_t leafkey = rtree_leafkey(key);
235b7eaed25SJason Evans for (unsigned i = 0; i < RTREE_CTX_NCACHE; i++) {
236b7eaed25SJason Evans assert(rtree_ctx->cache[i].leafkey != leafkey);
237b7eaed25SJason Evans }
238b7eaed25SJason Evans for (unsigned i = 0; i < RTREE_CTX_NCACHE_L2; i++) {
239b7eaed25SJason Evans assert(rtree_ctx->l2_cache[i].leafkey != leafkey);
240b7eaed25SJason Evans }
241b7eaed25SJason Evans }
242b7eaed25SJason Evans
243b7eaed25SJason Evans #define RTREE_GET_CHILD(level) { \
244b7eaed25SJason Evans assert(level < RTREE_HEIGHT-1); \
245b7eaed25SJason Evans if (level != 0 && !dependent && \
246b7eaed25SJason Evans unlikely(!rtree_node_valid(node))) { \
247b7eaed25SJason Evans return NULL; \
248b7eaed25SJason Evans } \
249b7eaed25SJason Evans uintptr_t subkey = rtree_subkey(key, level); \
250b7eaed25SJason Evans if (level + 2 < RTREE_HEIGHT) { \
251b7eaed25SJason Evans node = init_missing ? \
252b7eaed25SJason Evans rtree_child_node_read(tsdn, rtree, \
253b7eaed25SJason Evans &node[subkey], level, dependent) : \
254b7eaed25SJason Evans rtree_child_node_tryread(&node[subkey], \
255b7eaed25SJason Evans dependent); \
256b7eaed25SJason Evans } else { \
257b7eaed25SJason Evans leaf = init_missing ? \
258b7eaed25SJason Evans rtree_child_leaf_read(tsdn, rtree, \
259b7eaed25SJason Evans &node[subkey], level, dependent) : \
260b7eaed25SJason Evans rtree_child_leaf_tryread(&node[subkey], \
261b7eaed25SJason Evans dependent); \
262b7eaed25SJason Evans } \
263b7eaed25SJason Evans }
264b7eaed25SJason Evans /*
265b7eaed25SJason Evans * Cache replacement upon hard lookup (i.e. L1 & L2 rtree cache miss):
266b7eaed25SJason Evans * (1) evict last entry in L2 cache; (2) move the collision slot from L1
267b7eaed25SJason Evans * cache down to L2; and 3) fill L1.
268b7eaed25SJason Evans */
269b7eaed25SJason Evans #define RTREE_GET_LEAF(level) { \
270b7eaed25SJason Evans assert(level == RTREE_HEIGHT-1); \
271b7eaed25SJason Evans if (!dependent && unlikely(!rtree_leaf_valid(leaf))) { \
272b7eaed25SJason Evans return NULL; \
273b7eaed25SJason Evans } \
274b7eaed25SJason Evans if (RTREE_CTX_NCACHE_L2 > 1) { \
275b7eaed25SJason Evans memmove(&rtree_ctx->l2_cache[1], \
276b7eaed25SJason Evans &rtree_ctx->l2_cache[0], \
277b7eaed25SJason Evans sizeof(rtree_ctx_cache_elm_t) * \
278b7eaed25SJason Evans (RTREE_CTX_NCACHE_L2 - 1)); \
279b7eaed25SJason Evans } \
280b7eaed25SJason Evans size_t slot = rtree_cache_direct_map(key); \
281b7eaed25SJason Evans rtree_ctx->l2_cache[0].leafkey = \
282b7eaed25SJason Evans rtree_ctx->cache[slot].leafkey; \
283b7eaed25SJason Evans rtree_ctx->l2_cache[0].leaf = \
284b7eaed25SJason Evans rtree_ctx->cache[slot].leaf; \
285b7eaed25SJason Evans uintptr_t leafkey = rtree_leafkey(key); \
286b7eaed25SJason Evans rtree_ctx->cache[slot].leafkey = leafkey; \
287b7eaed25SJason Evans rtree_ctx->cache[slot].leaf = leaf; \
288b7eaed25SJason Evans uintptr_t subkey = rtree_subkey(key, level); \
289b7eaed25SJason Evans return &leaf[subkey]; \
290b7eaed25SJason Evans }
291b7eaed25SJason Evans if (RTREE_HEIGHT > 1) {
292b7eaed25SJason Evans RTREE_GET_CHILD(0)
293b7eaed25SJason Evans }
294b7eaed25SJason Evans if (RTREE_HEIGHT > 2) {
295b7eaed25SJason Evans RTREE_GET_CHILD(1)
296b7eaed25SJason Evans }
297b7eaed25SJason Evans if (RTREE_HEIGHT > 3) {
298b7eaed25SJason Evans for (unsigned i = 2; i < RTREE_HEIGHT-1; i++) {
299b7eaed25SJason Evans RTREE_GET_CHILD(i)
300b7eaed25SJason Evans }
301b7eaed25SJason Evans }
302b7eaed25SJason Evans RTREE_GET_LEAF(RTREE_HEIGHT-1)
303b7eaed25SJason Evans #undef RTREE_GET_CHILD
304b7eaed25SJason Evans #undef RTREE_GET_LEAF
305b7eaed25SJason Evans not_reached();
306b7eaed25SJason Evans }
307b7eaed25SJason Evans
308b7eaed25SJason Evans void
rtree_ctx_data_init(rtree_ctx_t * ctx)309b7eaed25SJason Evans rtree_ctx_data_init(rtree_ctx_t *ctx) {
310b7eaed25SJason Evans for (unsigned i = 0; i < RTREE_CTX_NCACHE; i++) {
311b7eaed25SJason Evans rtree_ctx_cache_elm_t *cache = &ctx->cache[i];
312b7eaed25SJason Evans cache->leafkey = RTREE_LEAFKEY_INVALID;
313b7eaed25SJason Evans cache->leaf = NULL;
314b7eaed25SJason Evans }
315b7eaed25SJason Evans for (unsigned i = 0; i < RTREE_CTX_NCACHE_L2; i++) {
316b7eaed25SJason Evans rtree_ctx_cache_elm_t *cache = &ctx->l2_cache[i];
317b7eaed25SJason Evans cache->leafkey = RTREE_LEAFKEY_INVALID;
318b7eaed25SJason Evans cache->leaf = NULL;
319b7eaed25SJason Evans }
32082872ac0SJason Evans }
321