xref: /linux/fs/xfs/libxfs/xfs_rtrefcount_btree.c (revision b477ff98d903618a1ab8247861f2ea6e70c0f0f8)
1 // SPDX-License-Identifier: GPL-2.0-or-later
2 /*
3  * Copyright (c) 2021-2024 Oracle.  All Rights Reserved.
4  * Author: Darrick J. Wong <djwong@kernel.org>
5  */
6 #include "xfs.h"
7 #include "xfs_fs.h"
8 #include "xfs_shared.h"
9 #include "xfs_format.h"
10 #include "xfs_log_format.h"
11 #include "xfs_trans_resv.h"
12 #include "xfs_bit.h"
13 #include "xfs_sb.h"
14 #include "xfs_mount.h"
15 #include "xfs_defer.h"
16 #include "xfs_inode.h"
17 #include "xfs_trans.h"
18 #include "xfs_alloc.h"
19 #include "xfs_btree.h"
20 #include "xfs_btree_staging.h"
21 #include "xfs_rtrefcount_btree.h"
22 #include "xfs_refcount.h"
23 #include "xfs_trace.h"
24 #include "xfs_cksum.h"
25 #include "xfs_error.h"
26 #include "xfs_extent_busy.h"
27 #include "xfs_rtgroup.h"
28 #include "xfs_rtbitmap.h"
29 #include "xfs_metafile.h"
30 #include "xfs_health.h"
31 
32 static struct kmem_cache	*xfs_rtrefcountbt_cur_cache;
33 
34 /*
35  * Realtime Reference Count btree.
36  *
37  * This is a btree used to track the owner(s) of a given extent in the realtime
38  * device.  See the comments in xfs_refcount_btree.c for more information.
39  *
40  * This tree is basically the same as the regular refcount btree except that
41  * it's rooted in an inode.
42  */
43 
44 static struct xfs_btree_cur *
xfs_rtrefcountbt_dup_cursor(struct xfs_btree_cur * cur)45 xfs_rtrefcountbt_dup_cursor(
46 	struct xfs_btree_cur	*cur)
47 {
48 	return xfs_rtrefcountbt_init_cursor(cur->bc_tp, to_rtg(cur->bc_group));
49 }
50 
51 STATIC int
xfs_rtrefcountbt_get_minrecs(struct xfs_btree_cur * cur,int level)52 xfs_rtrefcountbt_get_minrecs(
53 	struct xfs_btree_cur	*cur,
54 	int			level)
55 {
56 	if (level == cur->bc_nlevels - 1) {
57 		struct xfs_ifork	*ifp = xfs_btree_ifork_ptr(cur);
58 
59 		return xfs_rtrefcountbt_maxrecs(cur->bc_mp, ifp->if_broot_bytes,
60 				level == 0) / 2;
61 	}
62 
63 	return cur->bc_mp->m_rtrefc_mnr[level != 0];
64 }
65 
66 STATIC int
xfs_rtrefcountbt_get_maxrecs(struct xfs_btree_cur * cur,int level)67 xfs_rtrefcountbt_get_maxrecs(
68 	struct xfs_btree_cur	*cur,
69 	int			level)
70 {
71 	if (level == cur->bc_nlevels - 1) {
72 		struct xfs_ifork	*ifp = xfs_btree_ifork_ptr(cur);
73 
74 		return xfs_rtrefcountbt_maxrecs(cur->bc_mp, ifp->if_broot_bytes,
75 				level == 0);
76 	}
77 
78 	return cur->bc_mp->m_rtrefc_mxr[level != 0];
79 }
80 
81 /*
82  * Calculate number of records in a realtime refcount btree inode root.
83  */
84 unsigned int
xfs_rtrefcountbt_droot_maxrecs(unsigned int blocklen,bool leaf)85 xfs_rtrefcountbt_droot_maxrecs(
86 	unsigned int		blocklen,
87 	bool			leaf)
88 {
89 	blocklen -= sizeof(struct xfs_rtrefcount_root);
90 
91 	if (leaf)
92 		return blocklen / sizeof(struct xfs_refcount_rec);
93 	return blocklen / (2 * sizeof(struct xfs_refcount_key) +
94 			sizeof(xfs_rtrefcount_ptr_t));
95 }
96 
97 /*
98  * Get the maximum records we could store in the on-disk format.
99  *
100  * For non-root nodes this is equivalent to xfs_rtrefcountbt_get_maxrecs, but
101  * for the root node this checks the available space in the dinode fork so that
102  * we can resize the in-memory buffer to match it.  After a resize to the
103  * maximum size this function returns the same value as
104  * xfs_rtrefcountbt_get_maxrecs for the root node, too.
105  */
106 STATIC int
xfs_rtrefcountbt_get_dmaxrecs(struct xfs_btree_cur * cur,int level)107 xfs_rtrefcountbt_get_dmaxrecs(
108 	struct xfs_btree_cur	*cur,
109 	int			level)
110 {
111 	if (level != cur->bc_nlevels - 1)
112 		return cur->bc_mp->m_rtrefc_mxr[level != 0];
113 	return xfs_rtrefcountbt_droot_maxrecs(cur->bc_ino.forksize, level == 0);
114 }
115 
116 STATIC void
xfs_rtrefcountbt_init_key_from_rec(union xfs_btree_key * key,const union xfs_btree_rec * rec)117 xfs_rtrefcountbt_init_key_from_rec(
118 	union xfs_btree_key		*key,
119 	const union xfs_btree_rec	*rec)
120 {
121 	key->refc.rc_startblock = rec->refc.rc_startblock;
122 }
123 
124 STATIC void
xfs_rtrefcountbt_init_high_key_from_rec(union xfs_btree_key * key,const union xfs_btree_rec * rec)125 xfs_rtrefcountbt_init_high_key_from_rec(
126 	union xfs_btree_key		*key,
127 	const union xfs_btree_rec	*rec)
128 {
129 	__u32				x;
130 
131 	x = be32_to_cpu(rec->refc.rc_startblock);
132 	x += be32_to_cpu(rec->refc.rc_blockcount) - 1;
133 	key->refc.rc_startblock = cpu_to_be32(x);
134 }
135 
136 STATIC void
xfs_rtrefcountbt_init_rec_from_cur(struct xfs_btree_cur * cur,union xfs_btree_rec * rec)137 xfs_rtrefcountbt_init_rec_from_cur(
138 	struct xfs_btree_cur	*cur,
139 	union xfs_btree_rec	*rec)
140 {
141 	const struct xfs_refcount_irec *irec = &cur->bc_rec.rc;
142 	uint32_t		start;
143 
144 	start = xfs_refcount_encode_startblock(irec->rc_startblock,
145 			irec->rc_domain);
146 	rec->refc.rc_startblock = cpu_to_be32(start);
147 	rec->refc.rc_blockcount = cpu_to_be32(cur->bc_rec.rc.rc_blockcount);
148 	rec->refc.rc_refcount = cpu_to_be32(cur->bc_rec.rc.rc_refcount);
149 }
150 
151 STATIC void
xfs_rtrefcountbt_init_ptr_from_cur(struct xfs_btree_cur * cur,union xfs_btree_ptr * ptr)152 xfs_rtrefcountbt_init_ptr_from_cur(
153 	struct xfs_btree_cur	*cur,
154 	union xfs_btree_ptr	*ptr)
155 {
156 	ptr->l = 0;
157 }
158 
159 STATIC int64_t
xfs_rtrefcountbt_key_diff(struct xfs_btree_cur * cur,const union xfs_btree_key * key)160 xfs_rtrefcountbt_key_diff(
161 	struct xfs_btree_cur		*cur,
162 	const union xfs_btree_key	*key)
163 {
164 	const struct xfs_refcount_key	*kp = &key->refc;
165 	const struct xfs_refcount_irec	*irec = &cur->bc_rec.rc;
166 	uint32_t			start;
167 
168 	start = xfs_refcount_encode_startblock(irec->rc_startblock,
169 			irec->rc_domain);
170 	return (int64_t)be32_to_cpu(kp->rc_startblock) - start;
171 }
172 
173 STATIC int64_t
xfs_rtrefcountbt_diff_two_keys(struct xfs_btree_cur * cur,const union xfs_btree_key * k1,const union xfs_btree_key * k2,const union xfs_btree_key * mask)174 xfs_rtrefcountbt_diff_two_keys(
175 	struct xfs_btree_cur		*cur,
176 	const union xfs_btree_key	*k1,
177 	const union xfs_btree_key	*k2,
178 	const union xfs_btree_key	*mask)
179 {
180 	ASSERT(!mask || mask->refc.rc_startblock);
181 
182 	return (int64_t)be32_to_cpu(k1->refc.rc_startblock) -
183 			be32_to_cpu(k2->refc.rc_startblock);
184 }
185 
186 static xfs_failaddr_t
xfs_rtrefcountbt_verify(struct xfs_buf * bp)187 xfs_rtrefcountbt_verify(
188 	struct xfs_buf		*bp)
189 {
190 	struct xfs_mount	*mp = bp->b_target->bt_mount;
191 	struct xfs_btree_block	*block = XFS_BUF_TO_BLOCK(bp);
192 	xfs_failaddr_t		fa;
193 	int			level;
194 
195 	if (!xfs_verify_magic(bp, block->bb_magic))
196 		return __this_address;
197 
198 	if (!xfs_has_reflink(mp))
199 		return __this_address;
200 	fa = xfs_btree_fsblock_v5hdr_verify(bp, XFS_RMAP_OWN_UNKNOWN);
201 	if (fa)
202 		return fa;
203 	level = be16_to_cpu(block->bb_level);
204 	if (level > mp->m_rtrefc_maxlevels)
205 		return __this_address;
206 
207 	return xfs_btree_fsblock_verify(bp, mp->m_rtrefc_mxr[level != 0]);
208 }
209 
210 static void
xfs_rtrefcountbt_read_verify(struct xfs_buf * bp)211 xfs_rtrefcountbt_read_verify(
212 	struct xfs_buf	*bp)
213 {
214 	xfs_failaddr_t	fa;
215 
216 	if (!xfs_btree_fsblock_verify_crc(bp))
217 		xfs_verifier_error(bp, -EFSBADCRC, __this_address);
218 	else {
219 		fa = xfs_rtrefcountbt_verify(bp);
220 		if (fa)
221 			xfs_verifier_error(bp, -EFSCORRUPTED, fa);
222 	}
223 
224 	if (bp->b_error)
225 		trace_xfs_btree_corrupt(bp, _RET_IP_);
226 }
227 
228 static void
xfs_rtrefcountbt_write_verify(struct xfs_buf * bp)229 xfs_rtrefcountbt_write_verify(
230 	struct xfs_buf	*bp)
231 {
232 	xfs_failaddr_t	fa;
233 
234 	fa = xfs_rtrefcountbt_verify(bp);
235 	if (fa) {
236 		trace_xfs_btree_corrupt(bp, _RET_IP_);
237 		xfs_verifier_error(bp, -EFSCORRUPTED, fa);
238 		return;
239 	}
240 	xfs_btree_fsblock_calc_crc(bp);
241 
242 }
243 
244 const struct xfs_buf_ops xfs_rtrefcountbt_buf_ops = {
245 	.name			= "xfs_rtrefcountbt",
246 	.magic			= { 0, cpu_to_be32(XFS_RTREFC_CRC_MAGIC) },
247 	.verify_read		= xfs_rtrefcountbt_read_verify,
248 	.verify_write		= xfs_rtrefcountbt_write_verify,
249 	.verify_struct		= xfs_rtrefcountbt_verify,
250 };
251 
252 STATIC int
xfs_rtrefcountbt_keys_inorder(struct xfs_btree_cur * cur,const union xfs_btree_key * k1,const union xfs_btree_key * k2)253 xfs_rtrefcountbt_keys_inorder(
254 	struct xfs_btree_cur		*cur,
255 	const union xfs_btree_key	*k1,
256 	const union xfs_btree_key	*k2)
257 {
258 	return be32_to_cpu(k1->refc.rc_startblock) <
259 	       be32_to_cpu(k2->refc.rc_startblock);
260 }
261 
262 STATIC int
xfs_rtrefcountbt_recs_inorder(struct xfs_btree_cur * cur,const union xfs_btree_rec * r1,const union xfs_btree_rec * r2)263 xfs_rtrefcountbt_recs_inorder(
264 	struct xfs_btree_cur		*cur,
265 	const union xfs_btree_rec	*r1,
266 	const union xfs_btree_rec	*r2)
267 {
268 	return  be32_to_cpu(r1->refc.rc_startblock) +
269 		be32_to_cpu(r1->refc.rc_blockcount) <=
270 		be32_to_cpu(r2->refc.rc_startblock);
271 }
272 
273 STATIC enum xbtree_key_contig
xfs_rtrefcountbt_keys_contiguous(struct xfs_btree_cur * cur,const union xfs_btree_key * key1,const union xfs_btree_key * key2,const union xfs_btree_key * mask)274 xfs_rtrefcountbt_keys_contiguous(
275 	struct xfs_btree_cur		*cur,
276 	const union xfs_btree_key	*key1,
277 	const union xfs_btree_key	*key2,
278 	const union xfs_btree_key	*mask)
279 {
280 	ASSERT(!mask || mask->refc.rc_startblock);
281 
282 	return xbtree_key_contig(be32_to_cpu(key1->refc.rc_startblock),
283 				 be32_to_cpu(key2->refc.rc_startblock));
284 }
285 
286 static inline void
xfs_rtrefcountbt_move_ptrs(struct xfs_mount * mp,struct xfs_btree_block * broot,short old_size,size_t new_size,unsigned int numrecs)287 xfs_rtrefcountbt_move_ptrs(
288 	struct xfs_mount	*mp,
289 	struct xfs_btree_block	*broot,
290 	short			old_size,
291 	size_t			new_size,
292 	unsigned int		numrecs)
293 {
294 	void			*dptr;
295 	void			*sptr;
296 
297 	sptr = xfs_rtrefcount_broot_ptr_addr(mp, broot, 1, old_size);
298 	dptr = xfs_rtrefcount_broot_ptr_addr(mp, broot, 1, new_size);
299 	memmove(dptr, sptr, numrecs * sizeof(xfs_rtrefcount_ptr_t));
300 }
301 
302 static struct xfs_btree_block *
xfs_rtrefcountbt_broot_realloc(struct xfs_btree_cur * cur,unsigned int new_numrecs)303 xfs_rtrefcountbt_broot_realloc(
304 	struct xfs_btree_cur	*cur,
305 	unsigned int		new_numrecs)
306 {
307 	struct xfs_mount	*mp = cur->bc_mp;
308 	struct xfs_ifork	*ifp = xfs_btree_ifork_ptr(cur);
309 	struct xfs_btree_block	*broot;
310 	unsigned int		new_size;
311 	unsigned int		old_size = ifp->if_broot_bytes;
312 	const unsigned int	level = cur->bc_nlevels - 1;
313 
314 	new_size = xfs_rtrefcount_broot_space_calc(mp, level, new_numrecs);
315 
316 	/* Handle the nop case quietly. */
317 	if (new_size == old_size)
318 		return ifp->if_broot;
319 
320 	if (new_size > old_size) {
321 		unsigned int	old_numrecs;
322 
323 		/*
324 		 * If there wasn't any memory allocated before, just allocate
325 		 * it now and get out.
326 		 */
327 		if (old_size == 0)
328 			return xfs_broot_realloc(ifp, new_size);
329 
330 		/*
331 		 * If there is already an existing if_broot, then we need to
332 		 * realloc it and possibly move the node block pointers because
333 		 * those are not butted up against the btree block header.
334 		 */
335 		old_numrecs = xfs_rtrefcountbt_maxrecs(mp, old_size, level);
336 		broot = xfs_broot_realloc(ifp, new_size);
337 		if (level > 0)
338 			xfs_rtrefcountbt_move_ptrs(mp, broot, old_size,
339 					new_size, old_numrecs);
340 		goto out_broot;
341 	}
342 
343 	/*
344 	 * We're reducing numrecs.  If we're going all the way to zero, just
345 	 * free the block.
346 	 */
347 	ASSERT(ifp->if_broot != NULL && old_size > 0);
348 	if (new_size == 0)
349 		return xfs_broot_realloc(ifp, 0);
350 
351 	/*
352 	 * Shrink the btree root by possibly moving the rtrmapbt pointers,
353 	 * since they are not butted up against the btree block header.  Then
354 	 * reallocate broot.
355 	 */
356 	if (level > 0)
357 		xfs_rtrefcountbt_move_ptrs(mp, ifp->if_broot, old_size,
358 				new_size, new_numrecs);
359 	broot = xfs_broot_realloc(ifp, new_size);
360 
361 out_broot:
362 	ASSERT(xfs_rtrefcount_droot_space(broot) <=
363 	       xfs_inode_fork_size(cur->bc_ino.ip, cur->bc_ino.whichfork));
364 	return broot;
365 }
366 
367 const struct xfs_btree_ops xfs_rtrefcountbt_ops = {
368 	.name			= "rtrefcount",
369 	.type			= XFS_BTREE_TYPE_INODE,
370 	.geom_flags		= XFS_BTGEO_IROOT_RECORDS,
371 
372 	.rec_len		= sizeof(struct xfs_refcount_rec),
373 	.key_len		= sizeof(struct xfs_refcount_key),
374 	.ptr_len		= XFS_BTREE_LONG_PTR_LEN,
375 
376 	.lru_refs		= XFS_REFC_BTREE_REF,
377 	.statoff		= XFS_STATS_CALC_INDEX(xs_rtrefcbt_2),
378 	.sick_mask		= XFS_SICK_RG_REFCNTBT,
379 
380 	.dup_cursor		= xfs_rtrefcountbt_dup_cursor,
381 	.alloc_block		= xfs_btree_alloc_metafile_block,
382 	.free_block		= xfs_btree_free_metafile_block,
383 	.get_minrecs		= xfs_rtrefcountbt_get_minrecs,
384 	.get_maxrecs		= xfs_rtrefcountbt_get_maxrecs,
385 	.get_dmaxrecs		= xfs_rtrefcountbt_get_dmaxrecs,
386 	.init_key_from_rec	= xfs_rtrefcountbt_init_key_from_rec,
387 	.init_high_key_from_rec	= xfs_rtrefcountbt_init_high_key_from_rec,
388 	.init_rec_from_cur	= xfs_rtrefcountbt_init_rec_from_cur,
389 	.init_ptr_from_cur	= xfs_rtrefcountbt_init_ptr_from_cur,
390 	.key_diff		= xfs_rtrefcountbt_key_diff,
391 	.buf_ops		= &xfs_rtrefcountbt_buf_ops,
392 	.diff_two_keys		= xfs_rtrefcountbt_diff_two_keys,
393 	.keys_inorder		= xfs_rtrefcountbt_keys_inorder,
394 	.recs_inorder		= xfs_rtrefcountbt_recs_inorder,
395 	.keys_contiguous	= xfs_rtrefcountbt_keys_contiguous,
396 	.broot_realloc		= xfs_rtrefcountbt_broot_realloc,
397 };
398 
399 /* Allocate a new rt refcount btree cursor. */
400 struct xfs_btree_cur *
xfs_rtrefcountbt_init_cursor(struct xfs_trans * tp,struct xfs_rtgroup * rtg)401 xfs_rtrefcountbt_init_cursor(
402 	struct xfs_trans	*tp,
403 	struct xfs_rtgroup	*rtg)
404 {
405 	struct xfs_inode	*ip = rtg_refcount(rtg);
406 	struct xfs_mount	*mp = rtg_mount(rtg);
407 	struct xfs_btree_cur	*cur;
408 
409 	xfs_assert_ilocked(ip, XFS_ILOCK_SHARED | XFS_ILOCK_EXCL);
410 
411 	cur = xfs_btree_alloc_cursor(mp, tp, &xfs_rtrefcountbt_ops,
412 			mp->m_rtrefc_maxlevels, xfs_rtrefcountbt_cur_cache);
413 
414 	cur->bc_ino.ip = ip;
415 	cur->bc_refc.nr_ops = 0;
416 	cur->bc_refc.shape_changes = 0;
417 	cur->bc_group = xfs_group_hold(rtg_group(rtg));
418 	cur->bc_nlevels = be16_to_cpu(ip->i_df.if_broot->bb_level) + 1;
419 	cur->bc_ino.forksize = xfs_inode_fork_size(ip, XFS_DATA_FORK);
420 	cur->bc_ino.whichfork = XFS_DATA_FORK;
421 	return cur;
422 }
423 
424 /*
425  * Install a new rt reverse mapping btree root.  Caller is responsible for
426  * invalidating and freeing the old btree blocks.
427  */
428 void
xfs_rtrefcountbt_commit_staged_btree(struct xfs_btree_cur * cur,struct xfs_trans * tp)429 xfs_rtrefcountbt_commit_staged_btree(
430 	struct xfs_btree_cur	*cur,
431 	struct xfs_trans	*tp)
432 {
433 	struct xbtree_ifakeroot	*ifake = cur->bc_ino.ifake;
434 	struct xfs_ifork	*ifp;
435 	int			flags = XFS_ILOG_CORE | XFS_ILOG_DBROOT;
436 
437 	ASSERT(cur->bc_flags & XFS_BTREE_STAGING);
438 	ASSERT(ifake->if_fork->if_format == XFS_DINODE_FMT_META_BTREE);
439 
440 	/*
441 	 * Free any resources hanging off the real fork, then shallow-copy the
442 	 * staging fork's contents into the real fork to transfer everything
443 	 * we just built.
444 	 */
445 	ifp = xfs_ifork_ptr(cur->bc_ino.ip, XFS_DATA_FORK);
446 	xfs_idestroy_fork(ifp);
447 	memcpy(ifp, ifake->if_fork, sizeof(struct xfs_ifork));
448 
449 	cur->bc_ino.ip->i_projid = cur->bc_group->xg_gno;
450 	xfs_trans_log_inode(tp, cur->bc_ino.ip, flags);
451 	xfs_btree_commit_ifakeroot(cur, tp, XFS_DATA_FORK);
452 }
453 
454 /* Calculate number of records in a realtime refcount btree block. */
455 static inline unsigned int
xfs_rtrefcountbt_block_maxrecs(unsigned int blocklen,bool leaf)456 xfs_rtrefcountbt_block_maxrecs(
457 	unsigned int		blocklen,
458 	bool			leaf)
459 {
460 
461 	if (leaf)
462 		return blocklen / sizeof(struct xfs_refcount_rec);
463 	return blocklen / (sizeof(struct xfs_refcount_key) +
464 			   sizeof(xfs_rtrefcount_ptr_t));
465 }
466 
467 /*
468  * Calculate number of records in an refcount btree block.
469  */
470 unsigned int
xfs_rtrefcountbt_maxrecs(struct xfs_mount * mp,unsigned int blocklen,bool leaf)471 xfs_rtrefcountbt_maxrecs(
472 	struct xfs_mount	*mp,
473 	unsigned int		blocklen,
474 	bool			leaf)
475 {
476 	blocklen -= XFS_RTREFCOUNT_BLOCK_LEN;
477 	return xfs_rtrefcountbt_block_maxrecs(blocklen, leaf);
478 }
479 
480 /* Compute the max possible height for realtime refcount btrees. */
481 unsigned int
xfs_rtrefcountbt_maxlevels_ondisk(void)482 xfs_rtrefcountbt_maxlevels_ondisk(void)
483 {
484 	unsigned int		minrecs[2];
485 	unsigned int		blocklen;
486 
487 	blocklen = XFS_MIN_CRC_BLOCKSIZE - XFS_BTREE_LBLOCK_CRC_LEN;
488 
489 	minrecs[0] = xfs_rtrefcountbt_block_maxrecs(blocklen, true) / 2;
490 	minrecs[1] = xfs_rtrefcountbt_block_maxrecs(blocklen, false) / 2;
491 
492 	/* We need at most one record for every block in an rt group. */
493 	return xfs_btree_compute_maxlevels(minrecs, XFS_MAX_RGBLOCKS);
494 }
495 
496 int __init
xfs_rtrefcountbt_init_cur_cache(void)497 xfs_rtrefcountbt_init_cur_cache(void)
498 {
499 	xfs_rtrefcountbt_cur_cache = kmem_cache_create("xfs_rtrefcountbt_cur",
500 			xfs_btree_cur_sizeof(
501 					xfs_rtrefcountbt_maxlevels_ondisk()),
502 			0, 0, NULL);
503 
504 	if (!xfs_rtrefcountbt_cur_cache)
505 		return -ENOMEM;
506 	return 0;
507 }
508 
509 void
xfs_rtrefcountbt_destroy_cur_cache(void)510 xfs_rtrefcountbt_destroy_cur_cache(void)
511 {
512 	kmem_cache_destroy(xfs_rtrefcountbt_cur_cache);
513 	xfs_rtrefcountbt_cur_cache = NULL;
514 }
515 
516 /* Compute the maximum height of a realtime refcount btree. */
517 void
xfs_rtrefcountbt_compute_maxlevels(struct xfs_mount * mp)518 xfs_rtrefcountbt_compute_maxlevels(
519 	struct xfs_mount	*mp)
520 {
521 	unsigned int		d_maxlevels, r_maxlevels;
522 
523 	if (!xfs_has_rtreflink(mp)) {
524 		mp->m_rtrefc_maxlevels = 0;
525 		return;
526 	}
527 
528 	/*
529 	 * The realtime refcountbt lives on the data device, which means that
530 	 * its maximum height is constrained by the size of the data device and
531 	 * the height required to store one refcount record for each rtextent
532 	 * in an rt group.
533 	 */
534 	d_maxlevels = xfs_btree_space_to_height(mp->m_rtrefc_mnr,
535 				mp->m_sb.sb_dblocks);
536 	r_maxlevels = xfs_btree_compute_maxlevels(mp->m_rtrefc_mnr,
537 				mp->m_sb.sb_rgextents);
538 
539 	/* Add one level to handle the inode root level. */
540 	mp->m_rtrefc_maxlevels = min(d_maxlevels, r_maxlevels) + 1;
541 }
542 
543 /* Calculate the rtrefcount btree size for some records. */
544 unsigned long long
xfs_rtrefcountbt_calc_size(struct xfs_mount * mp,unsigned long long len)545 xfs_rtrefcountbt_calc_size(
546 	struct xfs_mount	*mp,
547 	unsigned long long	len)
548 {
549 	return xfs_btree_calc_size(mp->m_rtrefc_mnr, len);
550 }
551 
552 /*
553  * Calculate the maximum refcount btree size.
554  */
555 static unsigned long long
xfs_rtrefcountbt_max_size(struct xfs_mount * mp,xfs_rtblock_t rtblocks)556 xfs_rtrefcountbt_max_size(
557 	struct xfs_mount	*mp,
558 	xfs_rtblock_t		rtblocks)
559 {
560 	/* Bail out if we're uninitialized, which can happen in mkfs. */
561 	if (mp->m_rtrefc_mxr[0] == 0)
562 		return 0;
563 
564 	return xfs_rtrefcountbt_calc_size(mp, rtblocks);
565 }
566 
567 /*
568  * Figure out how many blocks to reserve and how many are used by this btree.
569  * We need enough space to hold one record for every rt extent in the rtgroup.
570  */
571 xfs_filblks_t
xfs_rtrefcountbt_calc_reserves(struct xfs_mount * mp)572 xfs_rtrefcountbt_calc_reserves(
573 	struct xfs_mount	*mp)
574 {
575 	if (!xfs_has_rtreflink(mp))
576 		return 0;
577 
578 	return xfs_rtrefcountbt_max_size(mp, mp->m_sb.sb_rgextents);
579 }
580 
581 /*
582  * Convert on-disk form of btree root to in-memory form.
583  */
584 STATIC void
xfs_rtrefcountbt_from_disk(struct xfs_inode * ip,struct xfs_rtrefcount_root * dblock,int dblocklen,struct xfs_btree_block * rblock)585 xfs_rtrefcountbt_from_disk(
586 	struct xfs_inode		*ip,
587 	struct xfs_rtrefcount_root	*dblock,
588 	int				dblocklen,
589 	struct xfs_btree_block		*rblock)
590 {
591 	struct xfs_mount		*mp = ip->i_mount;
592 	struct xfs_refcount_key	*fkp;
593 	__be64				*fpp;
594 	struct xfs_refcount_key	*tkp;
595 	__be64				*tpp;
596 	struct xfs_refcount_rec	*frp;
597 	struct xfs_refcount_rec	*trp;
598 	unsigned int			numrecs;
599 	unsigned int			maxrecs;
600 	unsigned int			rblocklen;
601 
602 	rblocklen = xfs_rtrefcount_broot_space(mp, dblock);
603 
604 	xfs_btree_init_block(mp, rblock, &xfs_rtrefcountbt_ops, 0, 0,
605 			ip->i_ino);
606 
607 	rblock->bb_level = dblock->bb_level;
608 	rblock->bb_numrecs = dblock->bb_numrecs;
609 
610 	if (be16_to_cpu(rblock->bb_level) > 0) {
611 		maxrecs = xfs_rtrefcountbt_droot_maxrecs(dblocklen, false);
612 		fkp = xfs_rtrefcount_droot_key_addr(dblock, 1);
613 		tkp = xfs_rtrefcount_key_addr(rblock, 1);
614 		fpp = xfs_rtrefcount_droot_ptr_addr(dblock, 1, maxrecs);
615 		tpp = xfs_rtrefcount_broot_ptr_addr(mp, rblock, 1, rblocklen);
616 		numrecs = be16_to_cpu(dblock->bb_numrecs);
617 		memcpy(tkp, fkp, 2 * sizeof(*fkp) * numrecs);
618 		memcpy(tpp, fpp, sizeof(*fpp) * numrecs);
619 	} else {
620 		frp = xfs_rtrefcount_droot_rec_addr(dblock, 1);
621 		trp = xfs_rtrefcount_rec_addr(rblock, 1);
622 		numrecs = be16_to_cpu(dblock->bb_numrecs);
623 		memcpy(trp, frp, sizeof(*frp) * numrecs);
624 	}
625 }
626 
627 /* Load a realtime reference count btree root in from disk. */
628 int
xfs_iformat_rtrefcount(struct xfs_inode * ip,struct xfs_dinode * dip)629 xfs_iformat_rtrefcount(
630 	struct xfs_inode	*ip,
631 	struct xfs_dinode	*dip)
632 {
633 	struct xfs_mount	*mp = ip->i_mount;
634 	struct xfs_rtrefcount_root *dfp = XFS_DFORK_PTR(dip, XFS_DATA_FORK);
635 	struct xfs_btree_block	*broot;
636 	unsigned int		numrecs;
637 	unsigned int		level;
638 	int			dsize;
639 
640 	/*
641 	 * growfs must create the rtrefcount inodes before adding a realtime
642 	 * volume to the filesystem, so we cannot use the rtrefcount predicate
643 	 * here.
644 	 */
645 	if (!xfs_has_reflink(ip->i_mount)) {
646 		xfs_inode_mark_sick(ip, XFS_SICK_INO_CORE);
647 		return -EFSCORRUPTED;
648 	}
649 
650 	dsize = XFS_DFORK_SIZE(dip, mp, XFS_DATA_FORK);
651 	numrecs = be16_to_cpu(dfp->bb_numrecs);
652 	level = be16_to_cpu(dfp->bb_level);
653 
654 	if (level > mp->m_rtrefc_maxlevels ||
655 	    xfs_rtrefcount_droot_space_calc(level, numrecs) > dsize) {
656 		xfs_inode_mark_sick(ip, XFS_SICK_INO_CORE);
657 		return -EFSCORRUPTED;
658 	}
659 
660 	broot = xfs_broot_alloc(xfs_ifork_ptr(ip, XFS_DATA_FORK),
661 			xfs_rtrefcount_broot_space_calc(mp, level, numrecs));
662 	if (broot)
663 		xfs_rtrefcountbt_from_disk(ip, dfp, dsize, broot);
664 	return 0;
665 }
666 
667 /*
668  * Convert in-memory form of btree root to on-disk form.
669  */
670 void
xfs_rtrefcountbt_to_disk(struct xfs_mount * mp,struct xfs_btree_block * rblock,int rblocklen,struct xfs_rtrefcount_root * dblock,int dblocklen)671 xfs_rtrefcountbt_to_disk(
672 	struct xfs_mount		*mp,
673 	struct xfs_btree_block		*rblock,
674 	int				rblocklen,
675 	struct xfs_rtrefcount_root	*dblock,
676 	int				dblocklen)
677 {
678 	struct xfs_refcount_key	*fkp;
679 	__be64				*fpp;
680 	struct xfs_refcount_key	*tkp;
681 	__be64				*tpp;
682 	struct xfs_refcount_rec	*frp;
683 	struct xfs_refcount_rec	*trp;
684 	unsigned int			maxrecs;
685 	unsigned int			numrecs;
686 
687 	ASSERT(rblock->bb_magic == cpu_to_be32(XFS_RTREFC_CRC_MAGIC));
688 	ASSERT(uuid_equal(&rblock->bb_u.l.bb_uuid, &mp->m_sb.sb_meta_uuid));
689 	ASSERT(rblock->bb_u.l.bb_blkno == cpu_to_be64(XFS_BUF_DADDR_NULL));
690 	ASSERT(rblock->bb_u.l.bb_leftsib == cpu_to_be64(NULLFSBLOCK));
691 	ASSERT(rblock->bb_u.l.bb_rightsib == cpu_to_be64(NULLFSBLOCK));
692 
693 	dblock->bb_level = rblock->bb_level;
694 	dblock->bb_numrecs = rblock->bb_numrecs;
695 
696 	if (be16_to_cpu(rblock->bb_level) > 0) {
697 		maxrecs = xfs_rtrefcountbt_droot_maxrecs(dblocklen, false);
698 		fkp = xfs_rtrefcount_key_addr(rblock, 1);
699 		tkp = xfs_rtrefcount_droot_key_addr(dblock, 1);
700 		fpp = xfs_rtrefcount_broot_ptr_addr(mp, rblock, 1, rblocklen);
701 		tpp = xfs_rtrefcount_droot_ptr_addr(dblock, 1, maxrecs);
702 		numrecs = be16_to_cpu(rblock->bb_numrecs);
703 		memcpy(tkp, fkp, 2 * sizeof(*fkp) * numrecs);
704 		memcpy(tpp, fpp, sizeof(*fpp) * numrecs);
705 	} else {
706 		frp = xfs_rtrefcount_rec_addr(rblock, 1);
707 		trp = xfs_rtrefcount_droot_rec_addr(dblock, 1);
708 		numrecs = be16_to_cpu(rblock->bb_numrecs);
709 		memcpy(trp, frp, sizeof(*frp) * numrecs);
710 	}
711 }
712 
713 /* Flush a realtime reference count btree root out to disk. */
714 void
xfs_iflush_rtrefcount(struct xfs_inode * ip,struct xfs_dinode * dip)715 xfs_iflush_rtrefcount(
716 	struct xfs_inode	*ip,
717 	struct xfs_dinode	*dip)
718 {
719 	struct xfs_ifork	*ifp = xfs_ifork_ptr(ip, XFS_DATA_FORK);
720 	struct xfs_rtrefcount_root *dfp = XFS_DFORK_PTR(dip, XFS_DATA_FORK);
721 
722 	ASSERT(ifp->if_broot != NULL);
723 	ASSERT(ifp->if_broot_bytes > 0);
724 	ASSERT(xfs_rtrefcount_droot_space(ifp->if_broot) <=
725 			xfs_inode_fork_size(ip, XFS_DATA_FORK));
726 	xfs_rtrefcountbt_to_disk(ip->i_mount, ifp->if_broot,
727 			ifp->if_broot_bytes, dfp,
728 			XFS_DFORK_SIZE(dip, ip->i_mount, XFS_DATA_FORK));
729 }
730 
731 /*
732  * Create a realtime refcount btree inode.
733  */
734 int
xfs_rtrefcountbt_create(struct xfs_rtgroup * rtg,struct xfs_inode * ip,struct xfs_trans * tp,bool init)735 xfs_rtrefcountbt_create(
736 	struct xfs_rtgroup	*rtg,
737 	struct xfs_inode	*ip,
738 	struct xfs_trans	*tp,
739 	bool			init)
740 {
741 	struct xfs_ifork	*ifp = xfs_ifork_ptr(ip, XFS_DATA_FORK);
742 	struct xfs_mount	*mp = ip->i_mount;
743 	struct xfs_btree_block	*broot;
744 
745 	ifp->if_format = XFS_DINODE_FMT_META_BTREE;
746 	ASSERT(ifp->if_broot_bytes == 0);
747 	ASSERT(ifp->if_bytes == 0);
748 
749 	/* Initialize the empty incore btree root. */
750 	broot = xfs_broot_realloc(ifp,
751 			xfs_rtrefcount_broot_space_calc(mp, 0, 0));
752 	if (broot)
753 		xfs_btree_init_block(mp, broot, &xfs_rtrefcountbt_ops, 0, 0,
754 				ip->i_ino);
755 	xfs_trans_log_inode(tp, ip, XFS_ILOG_CORE | XFS_ILOG_DBROOT);
756 	return 0;
757 }
758