xref: /freebsd/sys/fs/ext2fs/ext2_extents.c (revision 3fcbb8c0a9966ef9bd4fc7f5cdf85106427c29c5)
1d7511a40SPedro F. Giffuni /*-
2d7511a40SPedro F. Giffuni  * Copyright (c) 2010 Zheng Liu <lz@freebsd.org>
3d7511a40SPedro F. Giffuni  * All rights reserved.
4d7511a40SPedro F. Giffuni  *
5d7511a40SPedro F. Giffuni  * Redistribution and use in source and binary forms, with or without
6d7511a40SPedro F. Giffuni  * modification, are permitted provided that the following conditions
7d7511a40SPedro F. Giffuni  * are met:
8d7511a40SPedro F. Giffuni  * 1. Redistributions of source code must retain the above copyright
9d7511a40SPedro F. Giffuni  *    notice, this list of conditions and the following disclaimer.
10d7511a40SPedro F. Giffuni  * 2. Redistributions in binary form must reproduce the above copyright
11d7511a40SPedro F. Giffuni  *    notice, this list of conditions and the following disclaimer in the
12d7511a40SPedro F. Giffuni  *    documentation and/or other materials provided with the distribution.
13d7511a40SPedro F. Giffuni  *
14d7511a40SPedro F. Giffuni  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15d7511a40SPedro F. Giffuni  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16d7511a40SPedro F. Giffuni  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17d7511a40SPedro F. Giffuni  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18d7511a40SPedro F. Giffuni  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19d7511a40SPedro F. Giffuni  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20d7511a40SPedro F. Giffuni  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21d7511a40SPedro F. Giffuni  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22d7511a40SPedro F. Giffuni  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23d7511a40SPedro F. Giffuni  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24d7511a40SPedro F. Giffuni  * SUCH DAMAGE.
25d7511a40SPedro F. Giffuni  *
26d7511a40SPedro F. Giffuni  * $FreeBSD$
27d7511a40SPedro F. Giffuni  */
28d7511a40SPedro F. Giffuni 
29d7511a40SPedro F. Giffuni #include <sys/param.h>
30d7511a40SPedro F. Giffuni #include <sys/systm.h>
31d7511a40SPedro F. Giffuni #include <sys/types.h>
32d7511a40SPedro F. Giffuni #include <sys/kernel.h>
33d7511a40SPedro F. Giffuni #include <sys/malloc.h>
34d7511a40SPedro F. Giffuni #include <sys/vnode.h>
35d7511a40SPedro F. Giffuni #include <sys/bio.h>
36d7511a40SPedro F. Giffuni #include <sys/buf.h>
37d7511a40SPedro F. Giffuni #include <sys/conf.h>
38b394cd1eSFedor Uporov #include <sys/stat.h>
39d7511a40SPedro F. Giffuni 
40d7511a40SPedro F. Giffuni #include <fs/ext2fs/ext2_mount.h>
41d7511a40SPedro F. Giffuni #include <fs/ext2fs/fs.h>
42d7511a40SPedro F. Giffuni #include <fs/ext2fs/inode.h>
43d7511a40SPedro F. Giffuni #include <fs/ext2fs/ext2fs.h>
44d7511a40SPedro F. Giffuni #include <fs/ext2fs/ext2_extents.h>
45d7511a40SPedro F. Giffuni #include <fs/ext2fs/ext2_extern.h>
46d7511a40SPedro F. Giffuni 
47b394cd1eSFedor Uporov static MALLOC_DEFINE(M_EXT2EXTENTS, "ext2_extents", "EXT2 extents");
48d7511a40SPedro F. Giffuni 
49b394cd1eSFedor Uporov #ifdef EXT2FS_DEBUG
50b394cd1eSFedor Uporov static void
51b394cd1eSFedor Uporov ext4_ext_print_extent(struct ext4_extent *ep)
52b394cd1eSFedor Uporov {
53b394cd1eSFedor Uporov 
54b394cd1eSFedor Uporov 	printf("    ext %p => (blk %u len %u start %lu)\n",
55b394cd1eSFedor Uporov 	    ep, ep->e_blk, ep->e_len,
56b394cd1eSFedor Uporov 	    (uint64_t)ep->e_start_hi << 32 | ep->e_start_lo);
57d7511a40SPedro F. Giffuni }
58d7511a40SPedro F. Giffuni 
59b394cd1eSFedor Uporov static void ext4_ext_print_header(struct inode *ip, struct ext4_extent_header *ehp);
60b394cd1eSFedor Uporov 
61b394cd1eSFedor Uporov static void
62b394cd1eSFedor Uporov ext4_ext_print_index(struct inode *ip, struct ext4_extent_index *ex, int do_walk)
63b394cd1eSFedor Uporov {
64b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
65b394cd1eSFedor Uporov 	struct buf *bp;
66b394cd1eSFedor Uporov 	int error;
67b394cd1eSFedor Uporov 
68b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
69b394cd1eSFedor Uporov 
70b394cd1eSFedor Uporov 	printf("    index %p => (blk %u pblk %lu)\n",
71b394cd1eSFedor Uporov 	    ex, ex->ei_blk, (uint64_t)ex->ei_leaf_hi << 32 | ex->ei_leaf_lo);
72b394cd1eSFedor Uporov 
73b394cd1eSFedor Uporov 	if(!do_walk)
74b394cd1eSFedor Uporov 		return;
75b394cd1eSFedor Uporov 
76b394cd1eSFedor Uporov 	if ((error = bread(ip->i_devvp,
77b394cd1eSFedor Uporov 	    fsbtodb(fs, ((uint64_t)ex->ei_leaf_hi << 32 | ex->ei_leaf_lo)),
78b394cd1eSFedor Uporov 	    (int)fs->e2fs_bsize, NOCRED, &bp)) != 0) {
79b394cd1eSFedor Uporov 		brelse(bp);
80b394cd1eSFedor Uporov 		return;
8178f6ea54SPedro F. Giffuni 	}
82b394cd1eSFedor Uporov 
83b394cd1eSFedor Uporov 	ext4_ext_print_header(ip, (struct ext4_extent_header *)bp->b_data);
84b394cd1eSFedor Uporov 
85b394cd1eSFedor Uporov 	brelse(bp);
86b394cd1eSFedor Uporov 
87d7511a40SPedro F. Giffuni }
88d7511a40SPedro F. Giffuni 
89d7511a40SPedro F. Giffuni static void
90b394cd1eSFedor Uporov ext4_ext_print_header(struct inode *ip, struct ext4_extent_header *ehp)
91d7511a40SPedro F. Giffuni {
92b394cd1eSFedor Uporov 	int i;
93d7511a40SPedro F. Giffuni 
94b394cd1eSFedor Uporov 	printf("header %p => (magic 0x%x entries %d max %d depth %d gen %d)\n",
95b394cd1eSFedor Uporov 	    ehp, ehp->eh_magic, ehp->eh_ecount, ehp->eh_max, ehp->eh_depth,
96b394cd1eSFedor Uporov 	    ehp->eh_gen);
97b394cd1eSFedor Uporov 
98b394cd1eSFedor Uporov 	for (i = 0; i < ehp->eh_ecount; i++)
99b394cd1eSFedor Uporov 		if (ehp->eh_depth != 0)
100b394cd1eSFedor Uporov 			ext4_ext_print_index(ip,
101b394cd1eSFedor Uporov 			    (struct ext4_extent_index *)(ehp + 1 + i), 1);
102b394cd1eSFedor Uporov 		else
103b394cd1eSFedor Uporov 			ext4_ext_print_extent((struct ext4_extent *)(ehp + 1 + i));
104b394cd1eSFedor Uporov }
105b394cd1eSFedor Uporov 
106b394cd1eSFedor Uporov static void
107b394cd1eSFedor Uporov ext4_ext_print_path(struct inode *ip, struct ext4_extent_path *path)
108b394cd1eSFedor Uporov {
109b394cd1eSFedor Uporov 	int k, l;
110b394cd1eSFedor Uporov 
111b394cd1eSFedor Uporov 	l = path->ep_depth
112b394cd1eSFedor Uporov 
113b394cd1eSFedor Uporov 	printf("ip=%d, Path:\n", ip->i_number);
114b394cd1eSFedor Uporov 	for (k = 0; k <= l; k++, path++) {
115b394cd1eSFedor Uporov 		if (path->ep_index) {
116b394cd1eSFedor Uporov 			ext4_ext_print_index(ip, path->ep_index, 0);
117b394cd1eSFedor Uporov 		} else if (path->ep_ext) {
118b394cd1eSFedor Uporov 			ext4_ext_print_extent(path->ep_ext);
119b394cd1eSFedor Uporov 		}
120b394cd1eSFedor Uporov 	}
121b394cd1eSFedor Uporov }
122b394cd1eSFedor Uporov 
123b394cd1eSFedor Uporov void
124b394cd1eSFedor Uporov ext4_ext_print_extent_tree_status(struct inode * ip)
125b394cd1eSFedor Uporov {
126b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
127b394cd1eSFedor Uporov 	struct ext4_extent_header *ehp;
128b394cd1eSFedor Uporov 
129b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
130b394cd1eSFedor Uporov 	ehp = (struct ext4_extent_header *)(char *)ip->i_db;
131b394cd1eSFedor Uporov 
132b394cd1eSFedor Uporov 	printf("Extent status:ip=%d\n", ip->i_number);
133b394cd1eSFedor Uporov 	if (!(ip->i_flag & IN_E4EXTENTS))
134d7511a40SPedro F. Giffuni 		return;
135d7511a40SPedro F. Giffuni 
136b394cd1eSFedor Uporov 	ext4_ext_print_header(ip, ehp);
137d7511a40SPedro F. Giffuni 
138e813d9d7SPedro F. Giffuni 	return;
139e813d9d7SPedro F. Giffuni }
140b394cd1eSFedor Uporov #endif
141b394cd1eSFedor Uporov 
142b394cd1eSFedor Uporov static inline struct ext4_extent_header *
143b394cd1eSFedor Uporov ext4_ext_inode_header(struct inode *ip)
144b394cd1eSFedor Uporov {
145b394cd1eSFedor Uporov 
146b394cd1eSFedor Uporov 	return ((struct ext4_extent_header *)ip->i_db);
147d7511a40SPedro F. Giffuni }
148d7511a40SPedro F. Giffuni 
/*
 * Return the extent header of a tree node, i.e. the start of the given
 * block data viewed as a struct ext4_extent_header.
 */
static inline struct ext4_extent_header *
ext4_ext_block_header(char *bdata)
{
	struct ext4_extent_header *node;

	node = (struct ext4_extent_header *)bdata;
	return (node);
}
155b394cd1eSFedor Uporov 
156b394cd1eSFedor Uporov static inline unsigned short
157b394cd1eSFedor Uporov ext4_ext_inode_depth(struct inode *ip)
158b394cd1eSFedor Uporov {
159b394cd1eSFedor Uporov 	struct ext4_extent_header *ehp;
160b394cd1eSFedor Uporov 
161b394cd1eSFedor Uporov 	ehp = (struct ext4_extent_header *)ip->i_data;
162b394cd1eSFedor Uporov 	return (ehp->eh_depth);
163b394cd1eSFedor Uporov }
164b394cd1eSFedor Uporov 
165b394cd1eSFedor Uporov static inline e4fs_daddr_t
166b394cd1eSFedor Uporov ext4_ext_index_pblock(struct ext4_extent_index *index)
167b394cd1eSFedor Uporov {
168b394cd1eSFedor Uporov 	e4fs_daddr_t blk;
169b394cd1eSFedor Uporov 
170b394cd1eSFedor Uporov 	blk = index->ei_leaf_lo;
171b394cd1eSFedor Uporov 	blk |= (e4fs_daddr_t)index->ei_leaf_hi << 32;
172b394cd1eSFedor Uporov 
173b394cd1eSFedor Uporov 	return (blk);
174b394cd1eSFedor Uporov }
175b394cd1eSFedor Uporov 
176b394cd1eSFedor Uporov static inline void
177b394cd1eSFedor Uporov ext4_index_store_pblock(struct ext4_extent_index *index, e4fs_daddr_t pb)
178b394cd1eSFedor Uporov {
179b394cd1eSFedor Uporov 
180b394cd1eSFedor Uporov 	index->ei_leaf_lo = pb & 0xffffffff;
181b394cd1eSFedor Uporov 	index->ei_leaf_hi = (pb >> 32) & 0xffff;
182b394cd1eSFedor Uporov }
183b394cd1eSFedor Uporov 
184b394cd1eSFedor Uporov 
185b394cd1eSFedor Uporov static inline e4fs_daddr_t
186b394cd1eSFedor Uporov ext4_ext_extent_pblock(struct ext4_extent *extent)
187b394cd1eSFedor Uporov {
188b394cd1eSFedor Uporov 	e4fs_daddr_t blk;
189b394cd1eSFedor Uporov 
190b394cd1eSFedor Uporov 	blk = extent->e_start_lo;
191b394cd1eSFedor Uporov 	blk |= (e4fs_daddr_t)extent->e_start_hi << 32;
192b394cd1eSFedor Uporov 
193b394cd1eSFedor Uporov 	return (blk);
194b394cd1eSFedor Uporov }
195b394cd1eSFedor Uporov 
196b394cd1eSFedor Uporov static inline void
197b394cd1eSFedor Uporov ext4_ext_store_pblock(struct ext4_extent *ex, e4fs_daddr_t pb)
198b394cd1eSFedor Uporov {
199b394cd1eSFedor Uporov 
200b394cd1eSFedor Uporov 	ex->e_start_lo = pb & 0xffffffff;
201b394cd1eSFedor Uporov 	ex->e_start_hi = (pb >> 32) & 0xffff;
202b394cd1eSFedor Uporov }
203b394cd1eSFedor Uporov 
204d7511a40SPedro F. Giffuni int
205d7511a40SPedro F. Giffuni ext4_ext_in_cache(struct inode *ip, daddr_t lbn, struct ext4_extent *ep)
206d7511a40SPedro F. Giffuni {
207d7511a40SPedro F. Giffuni 	struct ext4_extent_cache *ecp;
208d7511a40SPedro F. Giffuni 	int ret = EXT4_EXT_CACHE_NO;
209d7511a40SPedro F. Giffuni 
210d7511a40SPedro F. Giffuni 	ecp = &ip->i_ext_cache;
211d7511a40SPedro F. Giffuni 	if (ecp->ec_type == EXT4_EXT_CACHE_NO)
212d7511a40SPedro F. Giffuni 		return (ret);
213d7511a40SPedro F. Giffuni 
214d7511a40SPedro F. Giffuni 	if (lbn >= ecp->ec_blk && lbn < ecp->ec_blk + ecp->ec_len) {
215d7511a40SPedro F. Giffuni 		ep->e_blk = ecp->ec_blk;
216d7511a40SPedro F. Giffuni 		ep->e_start_lo = ecp->ec_start & 0xffffffff;
217d7511a40SPedro F. Giffuni 		ep->e_start_hi = ecp->ec_start >> 32 & 0xffff;
218d7511a40SPedro F. Giffuni 		ep->e_len = ecp->ec_len;
219d7511a40SPedro F. Giffuni 		ret = ecp->ec_type;
220d7511a40SPedro F. Giffuni 	}
221d7511a40SPedro F. Giffuni 	return (ret);
222d7511a40SPedro F. Giffuni }
223d7511a40SPedro F. Giffuni 
224b394cd1eSFedor Uporov static int
225b394cd1eSFedor Uporov ext4_ext_check_header(struct inode *ip, struct ext4_extent_header *eh)
226d7511a40SPedro F. Giffuni {
227b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
228b394cd1eSFedor Uporov 	char *error_msg;
229d7511a40SPedro F. Giffuni 
230b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
231b394cd1eSFedor Uporov 
232b394cd1eSFedor Uporov 	if (eh->eh_magic != EXT4_EXT_MAGIC) {
233b394cd1eSFedor Uporov 		error_msg = "invalid magic";
234b394cd1eSFedor Uporov 		goto corrupted;
235b394cd1eSFedor Uporov 	}
236b394cd1eSFedor Uporov 	if (eh->eh_max == 0) {
237b394cd1eSFedor Uporov 		error_msg = "invalid eh_max";
238b394cd1eSFedor Uporov 		goto corrupted;
239b394cd1eSFedor Uporov 	}
240b394cd1eSFedor Uporov 	if (eh->eh_ecount > eh->eh_max) {
241b394cd1eSFedor Uporov 		error_msg = "invalid eh_entries";
242b394cd1eSFedor Uporov 		goto corrupted;
243d7511a40SPedro F. Giffuni 	}
244d7511a40SPedro F. Giffuni 
245b394cd1eSFedor Uporov 	return (0);
246b394cd1eSFedor Uporov 
247b394cd1eSFedor Uporov corrupted:
248b394cd1eSFedor Uporov 	ext2_fserr(fs, ip->i_uid, error_msg);
249b394cd1eSFedor Uporov 	return (EIO);
250b394cd1eSFedor Uporov }
251b394cd1eSFedor Uporov 
252b394cd1eSFedor Uporov static void
253b394cd1eSFedor Uporov ext4_ext_binsearch_index(struct ext4_extent_path *path, int blk)
254b394cd1eSFedor Uporov {
255b394cd1eSFedor Uporov 	struct ext4_extent_header *eh;
256b394cd1eSFedor Uporov 	struct ext4_extent_index *r, *l, *m;
257b394cd1eSFedor Uporov 
258b394cd1eSFedor Uporov 	eh = path->ep_header;
259b394cd1eSFedor Uporov 
260b394cd1eSFedor Uporov 	KASSERT(eh->eh_ecount <= eh->eh_max && eh->eh_ecount > 0,
261b394cd1eSFedor Uporov 	    ("ext4_ext_binsearch_index: bad args"));
262b394cd1eSFedor Uporov 
263b394cd1eSFedor Uporov 	l = EXT_FIRST_INDEX(eh) + 1;
264b394cd1eSFedor Uporov 	r = EXT_FIRST_INDEX(eh) + eh->eh_ecount - 1;
265b394cd1eSFedor Uporov 	while (l <= r) {
266b394cd1eSFedor Uporov 		m = l + (r - l) / 2;
267b394cd1eSFedor Uporov 		if (blk < m->ei_blk)
268b394cd1eSFedor Uporov 			r = m - 1;
269b394cd1eSFedor Uporov 		else
270b394cd1eSFedor Uporov 			l = m + 1;
271b394cd1eSFedor Uporov 	}
272b394cd1eSFedor Uporov 
273b394cd1eSFedor Uporov 	path->ep_index = l - 1;
274b394cd1eSFedor Uporov }
275b394cd1eSFedor Uporov 
276b394cd1eSFedor Uporov static void
277b394cd1eSFedor Uporov ext4_ext_binsearch_ext(struct ext4_extent_path *path, int blk)
278b394cd1eSFedor Uporov {
279b394cd1eSFedor Uporov 	struct ext4_extent_header *eh;
280b394cd1eSFedor Uporov 	struct ext4_extent *r, *l, *m;
281b394cd1eSFedor Uporov 
282b394cd1eSFedor Uporov 	eh = path->ep_header;
283b394cd1eSFedor Uporov 
284b394cd1eSFedor Uporov 	KASSERT(eh->eh_ecount <= eh->eh_max,
285b394cd1eSFedor Uporov 	    ("ext4_ext_binsearch_ext: bad args"));
286b394cd1eSFedor Uporov 
287b394cd1eSFedor Uporov 	if (eh->eh_ecount == 0)
288b394cd1eSFedor Uporov 		return;
289b394cd1eSFedor Uporov 
290b394cd1eSFedor Uporov 	l = EXT_FIRST_EXTENT(eh) + 1;
291b394cd1eSFedor Uporov 	r = EXT_FIRST_EXTENT(eh) + eh->eh_ecount - 1;
292b394cd1eSFedor Uporov 
293b394cd1eSFedor Uporov 	while (l <= r) {
294b394cd1eSFedor Uporov 		m = l + (r - l) / 2;
295b394cd1eSFedor Uporov 		if (blk < m->e_blk)
296b394cd1eSFedor Uporov 			r = m - 1;
297b394cd1eSFedor Uporov 		else
298b394cd1eSFedor Uporov 			l = m + 1;
299b394cd1eSFedor Uporov 	}
300b394cd1eSFedor Uporov 
301b394cd1eSFedor Uporov 	path->ep_ext = l - 1;
302b394cd1eSFedor Uporov }
303b394cd1eSFedor Uporov 
304b394cd1eSFedor Uporov static int
305b394cd1eSFedor Uporov ext4_ext_fill_path_bdata(struct ext4_extent_path *path,
306b394cd1eSFedor Uporov     struct buf *bp, uint64_t blk)
307b394cd1eSFedor Uporov {
308b394cd1eSFedor Uporov 
309b394cd1eSFedor Uporov 	KASSERT(path->ep_data == NULL,
310b394cd1eSFedor Uporov 	    ("ext4_ext_fill_path_bdata: bad ep_data"));
311b394cd1eSFedor Uporov 
312b394cd1eSFedor Uporov 	path->ep_data = malloc(bp->b_bufsize, M_EXT2EXTENTS, M_WAITOK);
313b394cd1eSFedor Uporov 	if (!path->ep_data)
314b394cd1eSFedor Uporov 		return (ENOMEM);
315b394cd1eSFedor Uporov 
316b394cd1eSFedor Uporov 	memcpy(path->ep_data, bp->b_data, bp->b_bufsize);
317b394cd1eSFedor Uporov 	path->ep_blk = blk;
318b394cd1eSFedor Uporov 
319b394cd1eSFedor Uporov 	return (0);
320b394cd1eSFedor Uporov }
321b394cd1eSFedor Uporov 
322b394cd1eSFedor Uporov static void
323b394cd1eSFedor Uporov ext4_ext_fill_path_buf(struct ext4_extent_path *path, struct buf *bp)
324b394cd1eSFedor Uporov {
325b394cd1eSFedor Uporov 
326b394cd1eSFedor Uporov 	KASSERT(path->ep_data != NULL,
327b394cd1eSFedor Uporov 	    ("ext4_ext_fill_path_buf: bad ep_data"));
328b394cd1eSFedor Uporov 
329b394cd1eSFedor Uporov 	memcpy(bp->b_data, path->ep_data, bp->b_bufsize);
330b394cd1eSFedor Uporov }
331b394cd1eSFedor Uporov 
332b394cd1eSFedor Uporov static void
333b394cd1eSFedor Uporov ext4_ext_drop_refs(struct ext4_extent_path *path)
334b394cd1eSFedor Uporov {
335b394cd1eSFedor Uporov 	int depth, i;
336b394cd1eSFedor Uporov 
337b394cd1eSFedor Uporov 	if (!path)
338b394cd1eSFedor Uporov 		return;
339b394cd1eSFedor Uporov 
340b394cd1eSFedor Uporov 	depth = path->ep_depth;
341b394cd1eSFedor Uporov 	for (i = 0; i <= depth; i++, path++)
342b394cd1eSFedor Uporov 		if (path->ep_data) {
343b394cd1eSFedor Uporov 			free(path->ep_data, M_EXT2EXTENTS);
344b394cd1eSFedor Uporov 			path->ep_data = NULL;
345b394cd1eSFedor Uporov 		}
346b394cd1eSFedor Uporov }
347b394cd1eSFedor Uporov 
348b394cd1eSFedor Uporov void
349b394cd1eSFedor Uporov ext4_ext_path_free(struct ext4_extent_path *path)
350b394cd1eSFedor Uporov {
351b394cd1eSFedor Uporov 
352b394cd1eSFedor Uporov 	if (!path)
353b394cd1eSFedor Uporov 		return;
354b394cd1eSFedor Uporov 
355b394cd1eSFedor Uporov 	ext4_ext_drop_refs(path);
356b394cd1eSFedor Uporov 	free(path, M_EXT2EXTENTS);
357b394cd1eSFedor Uporov }
358b394cd1eSFedor Uporov 
359b394cd1eSFedor Uporov int
360b394cd1eSFedor Uporov ext4_ext_find_extent(struct inode *ip, daddr_t block,
361b394cd1eSFedor Uporov     struct ext4_extent_path **ppath)
362b394cd1eSFedor Uporov {
363b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
364b394cd1eSFedor Uporov 	struct ext4_extent_header *eh;
365b394cd1eSFedor Uporov 	struct ext4_extent_path *path;
366b394cd1eSFedor Uporov 	struct buf *bp;
367b394cd1eSFedor Uporov 	uint64_t blk;
368b394cd1eSFedor Uporov 	int error, depth, i, ppos, alloc;
369b394cd1eSFedor Uporov 
370b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
371b394cd1eSFedor Uporov 	eh = ext4_ext_inode_header(ip);
372b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
373b394cd1eSFedor Uporov 	ppos = 0;
374b394cd1eSFedor Uporov 	alloc = 0;
375b394cd1eSFedor Uporov 
376b394cd1eSFedor Uporov 	error = ext4_ext_check_header(ip, eh);
377b394cd1eSFedor Uporov 	if (error)
378b394cd1eSFedor Uporov 		return (error);
379b394cd1eSFedor Uporov 
380*3fcbb8c0SFedor Uporov 	if (ppath == NULL)
381b394cd1eSFedor Uporov 		return (EINVAL);
382b394cd1eSFedor Uporov 
383b394cd1eSFedor Uporov 	path = *ppath;
384*3fcbb8c0SFedor Uporov 	if (path == NULL) {
385b394cd1eSFedor Uporov 		path = malloc(EXT4_EXT_DEPTH_MAX *
386b394cd1eSFedor Uporov 		    sizeof(struct ext4_extent_path),
387b394cd1eSFedor Uporov 		    M_EXT2EXTENTS, M_WAITOK | M_ZERO);
388b394cd1eSFedor Uporov 		if (!path)
389b394cd1eSFedor Uporov 			return (ENOMEM);
390b394cd1eSFedor Uporov 
391b394cd1eSFedor Uporov 		*ppath = path;
392b394cd1eSFedor Uporov 		alloc = 1;
393b394cd1eSFedor Uporov 	}
394b394cd1eSFedor Uporov 
395b394cd1eSFedor Uporov 	path[0].ep_header = eh;
396b394cd1eSFedor Uporov 	path[0].ep_data = NULL;
397b394cd1eSFedor Uporov 
398b394cd1eSFedor Uporov 	/* Walk through the tree. */
399b394cd1eSFedor Uporov 	i = depth;
400b394cd1eSFedor Uporov 	while (i) {
401b394cd1eSFedor Uporov 		ext4_ext_binsearch_index(&path[ppos], block);
402b394cd1eSFedor Uporov 		blk = ext4_ext_index_pblock(path[ppos].ep_index);
403b394cd1eSFedor Uporov 		path[ppos].ep_depth = i;
404b394cd1eSFedor Uporov 		path[ppos].ep_ext = NULL;
405b394cd1eSFedor Uporov 
406b394cd1eSFedor Uporov 		error = bread(ip->i_devvp, fsbtodb(ip->i_e2fs, blk),
407b394cd1eSFedor Uporov 		    ip->i_e2fs->e2fs_bsize, NOCRED, &bp);
408b394cd1eSFedor Uporov 		if (error) {
409b394cd1eSFedor Uporov 			brelse(bp);
410b394cd1eSFedor Uporov 			goto error;
411b394cd1eSFedor Uporov 		}
412b394cd1eSFedor Uporov 
413b394cd1eSFedor Uporov 		ppos++;
414b394cd1eSFedor Uporov 		if (ppos > depth) {
415b394cd1eSFedor Uporov 			ext2_fserr(fs, ip->i_uid,
416b394cd1eSFedor Uporov 			    "ppos > depth => extent corrupted");
417b394cd1eSFedor Uporov 			error = EIO;
418b394cd1eSFedor Uporov 			brelse(bp);
419b394cd1eSFedor Uporov 			goto error;
420b394cd1eSFedor Uporov 		}
421b394cd1eSFedor Uporov 
422b394cd1eSFedor Uporov 		ext4_ext_fill_path_bdata(&path[ppos], bp, blk);
423b394cd1eSFedor Uporov 		brelse(bp);
424b394cd1eSFedor Uporov 
425b394cd1eSFedor Uporov 		eh = ext4_ext_block_header(path[ppos].ep_data);
426b394cd1eSFedor Uporov 		error = ext4_ext_check_header(ip, eh);
427b394cd1eSFedor Uporov 		if (error)
428b394cd1eSFedor Uporov 			goto error;
429b394cd1eSFedor Uporov 
430b394cd1eSFedor Uporov 		path[ppos].ep_header = eh;
431b394cd1eSFedor Uporov 
432b394cd1eSFedor Uporov 		i--;
433b394cd1eSFedor Uporov 	}
434b394cd1eSFedor Uporov 
435b394cd1eSFedor Uporov 	error = ext4_ext_check_header(ip, eh);
436b394cd1eSFedor Uporov 	if (error)
437b394cd1eSFedor Uporov 		goto error;
438b394cd1eSFedor Uporov 
439b394cd1eSFedor Uporov 	/* Find extent. */
440b394cd1eSFedor Uporov 	path[ppos].ep_depth = i;
441b394cd1eSFedor Uporov 	path[ppos].ep_header = eh;
442b394cd1eSFedor Uporov 	path[ppos].ep_ext = NULL;
443b394cd1eSFedor Uporov 	path[ppos].ep_index = NULL;
444b394cd1eSFedor Uporov 	ext4_ext_binsearch_ext(&path[ppos], block);
445b394cd1eSFedor Uporov 	return (0);
446b394cd1eSFedor Uporov 
447b394cd1eSFedor Uporov error:
448b394cd1eSFedor Uporov 	ext4_ext_drop_refs(path);
449b394cd1eSFedor Uporov 	if (alloc)
450b394cd1eSFedor Uporov 		free(path, M_EXT2EXTENTS);
451b394cd1eSFedor Uporov 
452b394cd1eSFedor Uporov 	*ppath = NULL;
453b394cd1eSFedor Uporov 
454b394cd1eSFedor Uporov 	return (error);
455b394cd1eSFedor Uporov }
456b394cd1eSFedor Uporov 
457b394cd1eSFedor Uporov static inline int
458b394cd1eSFedor Uporov ext4_ext_space_root(struct inode *ip)
459b394cd1eSFedor Uporov {
460b394cd1eSFedor Uporov 	int size;
461b394cd1eSFedor Uporov 
462b394cd1eSFedor Uporov 	size = sizeof(ip->i_data);
463b394cd1eSFedor Uporov 	size -= sizeof(struct ext4_extent_header);
464b394cd1eSFedor Uporov 	size /= sizeof(struct ext4_extent);
465b394cd1eSFedor Uporov 
466b394cd1eSFedor Uporov 	return (size);
467b394cd1eSFedor Uporov }
468b394cd1eSFedor Uporov 
469b394cd1eSFedor Uporov static inline int
470b394cd1eSFedor Uporov ext4_ext_space_block(struct inode *ip)
471b394cd1eSFedor Uporov {
472b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
473b394cd1eSFedor Uporov 	int size;
474b394cd1eSFedor Uporov 
475b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
476b394cd1eSFedor Uporov 
477b394cd1eSFedor Uporov 	size = (fs->e2fs_bsize - sizeof(struct ext4_extent_header)) /
478b394cd1eSFedor Uporov 	    sizeof(struct ext4_extent);
479b394cd1eSFedor Uporov 
480b394cd1eSFedor Uporov 	return (size);
481b394cd1eSFedor Uporov }
482b394cd1eSFedor Uporov 
483b394cd1eSFedor Uporov static inline int
484b394cd1eSFedor Uporov ext4_ext_space_block_index(struct inode *ip)
485b394cd1eSFedor Uporov {
486b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
487b394cd1eSFedor Uporov 	int size;
488b394cd1eSFedor Uporov 
489b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
490b394cd1eSFedor Uporov 
491b394cd1eSFedor Uporov 	size = (fs->e2fs_bsize - sizeof(struct ext4_extent_header)) /
492b394cd1eSFedor Uporov 	    sizeof(struct ext4_extent_index);
493b394cd1eSFedor Uporov 
494b394cd1eSFedor Uporov 	return (size);
495b394cd1eSFedor Uporov }
496b394cd1eSFedor Uporov 
497b394cd1eSFedor Uporov void
498b394cd1eSFedor Uporov ext4_ext_tree_init(struct inode *ip)
499d7511a40SPedro F. Giffuni {
500d7511a40SPedro F. Giffuni 	struct ext4_extent_header *ehp;
501d7511a40SPedro F. Giffuni 
502b394cd1eSFedor Uporov 	ip->i_flag |= IN_E4EXTENTS;
503d7511a40SPedro F. Giffuni 
504b394cd1eSFedor Uporov 	memset(ip->i_data, 0, EXT2_NDADDR + EXT2_NIADDR);
505b394cd1eSFedor Uporov 	ehp = (struct ext4_extent_header *)ip->i_data;
506b394cd1eSFedor Uporov 	ehp->eh_magic = EXT4_EXT_MAGIC;
507b394cd1eSFedor Uporov 	ehp->eh_max = ext4_ext_space_root(ip);
508b394cd1eSFedor Uporov 	ip->i_ext_cache.ec_type = EXT4_EXT_CACHE_NO;
509b394cd1eSFedor Uporov 	ip->i_flag |= IN_CHANGE | IN_UPDATE;
510b394cd1eSFedor Uporov 	ext2_update(ip->i_vnode, 1);
51178f6ea54SPedro F. Giffuni }
512d7511a40SPedro F. Giffuni 
513b394cd1eSFedor Uporov static inline void
514b394cd1eSFedor Uporov ext4_ext_put_in_cache(struct inode *ip, uint32_t blk,
515b394cd1eSFedor Uporov 			uint32_t len, uint32_t start, int type)
516b394cd1eSFedor Uporov {
517b394cd1eSFedor Uporov 
518b394cd1eSFedor Uporov 	KASSERT(len != 0, ("ext4_ext_put_in_cache: bad input"));
519b394cd1eSFedor Uporov 
520b394cd1eSFedor Uporov 	ip->i_ext_cache.ec_type = type;
521b394cd1eSFedor Uporov 	ip->i_ext_cache.ec_blk = blk;
522b394cd1eSFedor Uporov 	ip->i_ext_cache.ec_len = len;
523b394cd1eSFedor Uporov 	ip->i_ext_cache.ec_start = start;
524d7511a40SPedro F. Giffuni }
525b394cd1eSFedor Uporov 
526b394cd1eSFedor Uporov static e4fs_daddr_t
527b394cd1eSFedor Uporov ext4_ext_blkpref(struct inode *ip, struct ext4_extent_path *path,
528b394cd1eSFedor Uporov     e4fs_daddr_t block)
529b394cd1eSFedor Uporov {
530b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
531b394cd1eSFedor Uporov 	struct ext4_extent *ex;
532b394cd1eSFedor Uporov 	e4fs_daddr_t bg_start;
533b394cd1eSFedor Uporov 	int depth;
534b394cd1eSFedor Uporov 
535b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
536b394cd1eSFedor Uporov 
537b394cd1eSFedor Uporov 	if (path) {
538b394cd1eSFedor Uporov 		depth = path->ep_depth;
539b394cd1eSFedor Uporov 		ex = path[depth].ep_ext;
540b394cd1eSFedor Uporov 		if (ex) {
541b394cd1eSFedor Uporov 			e4fs_daddr_t pblk = ext4_ext_extent_pblock(ex);
542b394cd1eSFedor Uporov 			e2fs_daddr_t blk = ex->e_blk;
543b394cd1eSFedor Uporov 
544b394cd1eSFedor Uporov 			if (block > blk)
545b394cd1eSFedor Uporov 				return (pblk + (block - blk));
546b394cd1eSFedor Uporov 			else
547b394cd1eSFedor Uporov 				return (pblk - (blk - block));
548b394cd1eSFedor Uporov 		}
549b394cd1eSFedor Uporov 
550b394cd1eSFedor Uporov 		/* Try to get block from index itself. */
551b394cd1eSFedor Uporov 		if (path[depth].ep_data)
552b394cd1eSFedor Uporov 			return (path[depth].ep_blk);
553b394cd1eSFedor Uporov 	}
554b394cd1eSFedor Uporov 
555b394cd1eSFedor Uporov 	/* Use inode's group. */
556b394cd1eSFedor Uporov 	bg_start = (ip->i_block_group * EXT2_BLOCKS_PER_GROUP(ip->i_e2fs)) +
557b394cd1eSFedor Uporov 	    fs->e2fs->e2fs_first_dblock;
558b394cd1eSFedor Uporov 
559b394cd1eSFedor Uporov 	return (bg_start + block);
560b394cd1eSFedor Uporov }
561b394cd1eSFedor Uporov 
562b394cd1eSFedor Uporov static int inline
563b394cd1eSFedor Uporov ext4_can_extents_be_merged(struct ext4_extent *ex1,
564b394cd1eSFedor Uporov     struct ext4_extent *ex2)
565b394cd1eSFedor Uporov {
566b394cd1eSFedor Uporov 
567b394cd1eSFedor Uporov 	if (ex1->e_blk + ex1->e_len != ex2->e_blk)
568b394cd1eSFedor Uporov 		return (0);
569b394cd1eSFedor Uporov 
570b394cd1eSFedor Uporov 	if (ex1->e_len + ex2->e_len > EXT4_MAX_LEN)
571b394cd1eSFedor Uporov 		return (0);
572b394cd1eSFedor Uporov 
573b394cd1eSFedor Uporov 	if (ext4_ext_extent_pblock(ex1) + ex1->e_len ==
574b394cd1eSFedor Uporov 	    ext4_ext_extent_pblock(ex2))
575b394cd1eSFedor Uporov 		return (1);
576b394cd1eSFedor Uporov 
577b394cd1eSFedor Uporov 	return (0);
578b394cd1eSFedor Uporov }
579b394cd1eSFedor Uporov 
580b394cd1eSFedor Uporov static unsigned
581b394cd1eSFedor Uporov ext4_ext_next_leaf_block(struct inode *ip, struct ext4_extent_path *path)
582b394cd1eSFedor Uporov {
583b394cd1eSFedor Uporov 	int depth = path->ep_depth;
584b394cd1eSFedor Uporov 
585b394cd1eSFedor Uporov 	/* Empty tree */
586b394cd1eSFedor Uporov 	if (depth == 0)
587b394cd1eSFedor Uporov 		return (EXT4_MAX_BLOCKS);
588b394cd1eSFedor Uporov 
589b394cd1eSFedor Uporov 	/* Go to indexes. */
590b394cd1eSFedor Uporov 	depth--;
591b394cd1eSFedor Uporov 
592b394cd1eSFedor Uporov 	while (depth >= 0) {
593b394cd1eSFedor Uporov 		if (path[depth].ep_index !=
594b394cd1eSFedor Uporov 		    EXT_LAST_INDEX(path[depth].ep_header))
595b394cd1eSFedor Uporov 			return (path[depth].ep_index[1].ei_blk);
596b394cd1eSFedor Uporov 
597b394cd1eSFedor Uporov 		depth--;
598b394cd1eSFedor Uporov 	}
599b394cd1eSFedor Uporov 
600b394cd1eSFedor Uporov 	return (EXT4_MAX_BLOCKS);
601b394cd1eSFedor Uporov }
602b394cd1eSFedor Uporov 
603b394cd1eSFedor Uporov static int
604b394cd1eSFedor Uporov ext4_ext_dirty(struct inode *ip, struct ext4_extent_path *path)
605b394cd1eSFedor Uporov {
606b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
607b394cd1eSFedor Uporov 	struct buf *bp;
608b394cd1eSFedor Uporov 	uint64_t blk;
609b394cd1eSFedor Uporov 	int error;
610b394cd1eSFedor Uporov 
611b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
612b394cd1eSFedor Uporov 
613b394cd1eSFedor Uporov 	if (!path)
614b394cd1eSFedor Uporov 		return (EINVAL);
615b394cd1eSFedor Uporov 
616b394cd1eSFedor Uporov 	if (path->ep_data) {
617b394cd1eSFedor Uporov 		blk = path->ep_blk;
618b394cd1eSFedor Uporov 		bp = getblk(ip->i_devvp, fsbtodb(fs, blk),
619b394cd1eSFedor Uporov 		    fs->e2fs_bsize, 0, 0, 0);
620b394cd1eSFedor Uporov 		if (!bp)
621b394cd1eSFedor Uporov 			return (EIO);
622b394cd1eSFedor Uporov 		ext4_ext_fill_path_buf(path, bp);
623b394cd1eSFedor Uporov 		error = bwrite(bp);
624b394cd1eSFedor Uporov 	} else {
625b394cd1eSFedor Uporov 		ip->i_flag |= IN_CHANGE | IN_UPDATE;
626b394cd1eSFedor Uporov 		error = ext2_update(ip->i_vnode, 1);
627b394cd1eSFedor Uporov 	}
628b394cd1eSFedor Uporov 
629b394cd1eSFedor Uporov 	return (error);
630b394cd1eSFedor Uporov }
631b394cd1eSFedor Uporov 
632b394cd1eSFedor Uporov static int
633b394cd1eSFedor Uporov ext4_ext_insert_index(struct inode *ip, struct ext4_extent_path *path,
634b394cd1eSFedor Uporov     uint32_t lblk, e4fs_daddr_t blk)
635b394cd1eSFedor Uporov {
636b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
637b394cd1eSFedor Uporov 	struct ext4_extent_index *idx;
638b394cd1eSFedor Uporov 	int len;
639b394cd1eSFedor Uporov 
640b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
641b394cd1eSFedor Uporov 
642b394cd1eSFedor Uporov 	if (lblk == path->ep_index->ei_blk) {
643b394cd1eSFedor Uporov 		ext2_fserr(fs, ip->i_uid,
644b394cd1eSFedor Uporov 		    "lblk == index blk => extent corrupted");
645b394cd1eSFedor Uporov 		return (EIO);
646b394cd1eSFedor Uporov 	}
647b394cd1eSFedor Uporov 
648b394cd1eSFedor Uporov 	if (path->ep_header->eh_ecount >= path->ep_header->eh_max) {
649b394cd1eSFedor Uporov 		ext2_fserr(fs, ip->i_uid,
650b394cd1eSFedor Uporov 		    "ecout > maxcount => extent corrupted");
651b394cd1eSFedor Uporov 		return (EIO);
652b394cd1eSFedor Uporov 	}
653b394cd1eSFedor Uporov 
654b394cd1eSFedor Uporov 	if (lblk > path->ep_index->ei_blk) {
655b394cd1eSFedor Uporov 		/* Insert after. */
656b394cd1eSFedor Uporov 		idx = path->ep_index + 1;
657b394cd1eSFedor Uporov 	} else {
658b394cd1eSFedor Uporov 		/* Insert before. */
659b394cd1eSFedor Uporov 		idx = path->ep_index;
660b394cd1eSFedor Uporov 	}
661b394cd1eSFedor Uporov 
662b394cd1eSFedor Uporov 	len = EXT_LAST_INDEX(path->ep_header) - idx + 1;
663b394cd1eSFedor Uporov 	if (len > 0)
664b394cd1eSFedor Uporov 		memmove(idx + 1, idx, len * sizeof(struct ext4_extent_index));
665b394cd1eSFedor Uporov 
666b394cd1eSFedor Uporov 	if (idx > EXT_MAX_INDEX(path->ep_header)) {
667b394cd1eSFedor Uporov 		ext2_fserr(fs, ip->i_uid,
668b394cd1eSFedor Uporov 		    "index is out of range => extent corrupted");
669b394cd1eSFedor Uporov 		return (EIO);
670b394cd1eSFedor Uporov 	}
671b394cd1eSFedor Uporov 
672b394cd1eSFedor Uporov 	idx->ei_blk = lblk;
673b394cd1eSFedor Uporov 	ext4_index_store_pblock(idx, blk);
674b394cd1eSFedor Uporov 	path->ep_header->eh_ecount++;
675b394cd1eSFedor Uporov 
676b394cd1eSFedor Uporov 	return (ext4_ext_dirty(ip, path));
677b394cd1eSFedor Uporov }
678b394cd1eSFedor Uporov 
679b394cd1eSFedor Uporov static e4fs_daddr_t
680b394cd1eSFedor Uporov ext4_ext_alloc_meta(struct inode *ip)
681b394cd1eSFedor Uporov {
682b394cd1eSFedor Uporov 	e4fs_daddr_t blk = ext2_alloc_meta(ip);
683b394cd1eSFedor Uporov 	if (blk) {
684b394cd1eSFedor Uporov 		ip->i_blocks += btodb(ip->i_e2fs->e2fs_bsize);
685b394cd1eSFedor Uporov 		ip->i_flag |= IN_CHANGE | IN_UPDATE;
686b394cd1eSFedor Uporov 		ext2_update(ip->i_vnode, 1);
687b394cd1eSFedor Uporov 	}
688b394cd1eSFedor Uporov 
689b394cd1eSFedor Uporov 	return (blk);
690b394cd1eSFedor Uporov }
691b394cd1eSFedor Uporov 
692b394cd1eSFedor Uporov static void
693b394cd1eSFedor Uporov ext4_ext_blkfree(struct inode *ip, uint64_t blk, int count, int flags)
694b394cd1eSFedor Uporov {
695b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
696b394cd1eSFedor Uporov 	int i, blocksreleased;
697b394cd1eSFedor Uporov 
698b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
699b394cd1eSFedor Uporov 	blocksreleased = count;
700b394cd1eSFedor Uporov 
701b394cd1eSFedor Uporov 	for(i = 0; i < count; i++)
702b394cd1eSFedor Uporov 		ext2_blkfree(ip, blk + i, fs->e2fs_bsize);
703b394cd1eSFedor Uporov 
704b394cd1eSFedor Uporov 	if (ip->i_blocks >= blocksreleased)
705b394cd1eSFedor Uporov 		ip->i_blocks -= (btodb(fs->e2fs_bsize)*blocksreleased);
706b394cd1eSFedor Uporov 	else
707b394cd1eSFedor Uporov 		ip->i_blocks = 0;
708b394cd1eSFedor Uporov 
709b394cd1eSFedor Uporov 	ip->i_flag |= IN_CHANGE | IN_UPDATE;
710b394cd1eSFedor Uporov 	ext2_update(ip->i_vnode, 1);
711b394cd1eSFedor Uporov }
712b394cd1eSFedor Uporov 
713b394cd1eSFedor Uporov static int
714b394cd1eSFedor Uporov ext4_ext_split(struct inode *ip, struct ext4_extent_path *path,
715b394cd1eSFedor Uporov     struct ext4_extent *newext, int at)
716b394cd1eSFedor Uporov {
717b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
718b394cd1eSFedor Uporov 	struct  buf *bp;
719b394cd1eSFedor Uporov 	int depth = ext4_ext_inode_depth(ip);
720b394cd1eSFedor Uporov 	struct ext4_extent_header *neh;
721b394cd1eSFedor Uporov 	struct ext4_extent_index *fidx;
722b394cd1eSFedor Uporov 	struct ext4_extent *ex;
723b394cd1eSFedor Uporov 	int i = at, k, m, a;
724b394cd1eSFedor Uporov 	e4fs_daddr_t newblk, oldblk;
725b394cd1eSFedor Uporov 	uint32_t border;
726b394cd1eSFedor Uporov 	e4fs_daddr_t *ablks = NULL;
727b394cd1eSFedor Uporov 	int error = 0;
728b394cd1eSFedor Uporov 
729b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
730b394cd1eSFedor Uporov 	bp = NULL;
731b394cd1eSFedor Uporov 
732b394cd1eSFedor Uporov 	/*
733b394cd1eSFedor Uporov 	 * We will split at current extent for now.
734b394cd1eSFedor Uporov 	 */
735b394cd1eSFedor Uporov 	if (path[depth].ep_ext > EXT_MAX_EXTENT(path[depth].ep_header)) {
736b394cd1eSFedor Uporov 		ext2_fserr(fs, ip->i_uid,
737b394cd1eSFedor Uporov 		    "extent is out of range => extent corrupted");
738b394cd1eSFedor Uporov 		return (EIO);
739b394cd1eSFedor Uporov 	}
740b394cd1eSFedor Uporov 
741b394cd1eSFedor Uporov 	if (path[depth].ep_ext != EXT_MAX_EXTENT(path[depth].ep_header))
742b394cd1eSFedor Uporov 		border = path[depth].ep_ext[1].e_blk;
743b394cd1eSFedor Uporov 	else
744b394cd1eSFedor Uporov 		border = newext->e_blk;
745b394cd1eSFedor Uporov 
746b394cd1eSFedor Uporov 	/* Allocate new blocks. */
747b394cd1eSFedor Uporov 	ablks = malloc(sizeof(e4fs_daddr_t) * depth,
748b394cd1eSFedor Uporov 	    M_EXT2EXTENTS, M_WAITOK | M_ZERO);
749b394cd1eSFedor Uporov 	if (!ablks)
750b394cd1eSFedor Uporov 		return (ENOMEM);
751b394cd1eSFedor Uporov 	for (a = 0; a < depth - at; a++) {
752b394cd1eSFedor Uporov 		newblk = ext4_ext_alloc_meta(ip);
753b394cd1eSFedor Uporov 		if (newblk == 0)
754b394cd1eSFedor Uporov 			goto cleanup;
755b394cd1eSFedor Uporov 		ablks[a] = newblk;
756b394cd1eSFedor Uporov 	}
757b394cd1eSFedor Uporov 
758b394cd1eSFedor Uporov 	newblk = ablks[--a];
759b394cd1eSFedor Uporov 	bp = getblk(ip->i_devvp, fsbtodb(fs, newblk), fs->e2fs_bsize, 0, 0, 0);
760b394cd1eSFedor Uporov 	if (!bp) {
761b394cd1eSFedor Uporov 		error = EIO;
762b394cd1eSFedor Uporov 		goto cleanup;
763b394cd1eSFedor Uporov 	}
764b394cd1eSFedor Uporov 
765b394cd1eSFedor Uporov 	neh = ext4_ext_block_header(bp->b_data);
766b394cd1eSFedor Uporov 	neh->eh_ecount = 0;
767b394cd1eSFedor Uporov 	neh->eh_max = ext4_ext_space_block(ip);
768b394cd1eSFedor Uporov 	neh->eh_magic = EXT4_EXT_MAGIC;
769b394cd1eSFedor Uporov 	neh->eh_depth = 0;
770b394cd1eSFedor Uporov 	ex = EXT_FIRST_EXTENT(neh);
771b394cd1eSFedor Uporov 
772b394cd1eSFedor Uporov 	if (path[depth].ep_header->eh_ecount != path[depth].ep_header->eh_max) {
773b394cd1eSFedor Uporov 		ext2_fserr(fs, ip->i_uid,
774b394cd1eSFedor Uporov 		    "extents count out of range => extent corrupted");
775b394cd1eSFedor Uporov 		error = EIO;
776b394cd1eSFedor Uporov 		goto cleanup;
777b394cd1eSFedor Uporov 	}
778b394cd1eSFedor Uporov 
779b394cd1eSFedor Uporov 	/* Start copy from next extent. */
780b394cd1eSFedor Uporov 	m = 0;
781b394cd1eSFedor Uporov 	path[depth].ep_ext++;
782b394cd1eSFedor Uporov 	while (path[depth].ep_ext <= EXT_MAX_EXTENT(path[depth].ep_header)) {
783b394cd1eSFedor Uporov 		path[depth].ep_ext++;
784b394cd1eSFedor Uporov 		m++;
785b394cd1eSFedor Uporov 	}
786b394cd1eSFedor Uporov 	if (m) {
787b394cd1eSFedor Uporov 		memmove(ex, path[depth].ep_ext - m,
788b394cd1eSFedor Uporov 		    sizeof(struct ext4_extent) * m);
789b394cd1eSFedor Uporov 		neh->eh_ecount = neh->eh_ecount + m;
790b394cd1eSFedor Uporov 	}
791b394cd1eSFedor Uporov 
792b394cd1eSFedor Uporov 	bwrite(bp);
793b394cd1eSFedor Uporov 	bp = NULL;
794b394cd1eSFedor Uporov 
795b394cd1eSFedor Uporov 	/* Fix old leaf. */
796b394cd1eSFedor Uporov 	if (m) {
797b394cd1eSFedor Uporov 		path[depth].ep_header->eh_ecount =
798b394cd1eSFedor Uporov 		    path[depth].ep_header->eh_ecount - m;
799b394cd1eSFedor Uporov 		ext4_ext_dirty(ip, path + depth);
800b394cd1eSFedor Uporov 	}
801b394cd1eSFedor Uporov 
802b394cd1eSFedor Uporov 	/* Create intermediate indexes. */
803b394cd1eSFedor Uporov 	k = depth - at - 1;
804b394cd1eSFedor Uporov 	KASSERT(k >= 0, ("ext4_ext_split: negative k"));
805b394cd1eSFedor Uporov 
806b394cd1eSFedor Uporov 	/* Insert new index into current index block. */
807b394cd1eSFedor Uporov 	i = depth - 1;
808b394cd1eSFedor Uporov 	while (k--) {
809b394cd1eSFedor Uporov 		oldblk = newblk;
810b394cd1eSFedor Uporov 		newblk = ablks[--a];
811b394cd1eSFedor Uporov 		error = bread(ip->i_devvp, fsbtodb(fs, newblk),
812b394cd1eSFedor Uporov 		    (int)fs->e2fs_bsize, NOCRED, &bp);
813d7511a40SPedro F. Giffuni 		if (error) {
814b394cd1eSFedor Uporov 			brelse(bp);
815b394cd1eSFedor Uporov 			goto cleanup;
816b394cd1eSFedor Uporov 		}
817b394cd1eSFedor Uporov 
818b394cd1eSFedor Uporov 		neh = (struct ext4_extent_header *)bp->b_data;
819b394cd1eSFedor Uporov 		neh->eh_ecount = 1;
820b394cd1eSFedor Uporov 		neh->eh_magic = EXT4_EXT_MAGIC;
821b394cd1eSFedor Uporov 		neh->eh_max = ext4_ext_space_block_index(ip);
822b394cd1eSFedor Uporov 		neh->eh_depth = depth - i;
823b394cd1eSFedor Uporov 		fidx = EXT_FIRST_INDEX(neh);
824b394cd1eSFedor Uporov 		fidx->ei_blk = border;
825b394cd1eSFedor Uporov 		ext4_index_store_pblock(fidx, oldblk);
826b394cd1eSFedor Uporov 
827b394cd1eSFedor Uporov 		m = 0;
828b394cd1eSFedor Uporov 		path[i].ep_index++;
829b394cd1eSFedor Uporov 		while (path[i].ep_index <= EXT_MAX_INDEX(path[i].ep_header)) {
830b394cd1eSFedor Uporov 			path[i].ep_index++;
831b394cd1eSFedor Uporov 			m++;
832b394cd1eSFedor Uporov 		}
833b394cd1eSFedor Uporov 		if (m) {
834b394cd1eSFedor Uporov 			memmove(++fidx, path[i].ep_index - m,
835b394cd1eSFedor Uporov 			    sizeof(struct ext4_extent_index) * m);
836b394cd1eSFedor Uporov 			neh->eh_ecount = neh->eh_ecount + m;
837b394cd1eSFedor Uporov 		}
838b394cd1eSFedor Uporov 
839b394cd1eSFedor Uporov 		bwrite(bp);
840b394cd1eSFedor Uporov 		bp = NULL;
841b394cd1eSFedor Uporov 
842b394cd1eSFedor Uporov 		/* Fix old index. */
843b394cd1eSFedor Uporov 		if (m) {
844b394cd1eSFedor Uporov 			path[i].ep_header->eh_ecount =
845b394cd1eSFedor Uporov 			    path[i].ep_header->eh_ecount - m;
846b394cd1eSFedor Uporov 			ext4_ext_dirty(ip, path + i);
847b394cd1eSFedor Uporov 		}
848b394cd1eSFedor Uporov 
849b394cd1eSFedor Uporov 		i--;
850b394cd1eSFedor Uporov 	}
851b394cd1eSFedor Uporov 
852b394cd1eSFedor Uporov 	error = ext4_ext_insert_index(ip, path + at, border, newblk);
853b394cd1eSFedor Uporov 
854b394cd1eSFedor Uporov cleanup:
855b394cd1eSFedor Uporov 	if (bp)
856b394cd1eSFedor Uporov 		brelse(bp);
857b394cd1eSFedor Uporov 
858b394cd1eSFedor Uporov 	if (error) {
859b394cd1eSFedor Uporov 		for (i = 0; i < depth; i++) {
860b394cd1eSFedor Uporov 			if (!ablks[i])
861b394cd1eSFedor Uporov 				continue;
862b394cd1eSFedor Uporov 			ext4_ext_blkfree(ip, ablks[i], 1, 0);
863b394cd1eSFedor Uporov 		}
864b394cd1eSFedor Uporov 	}
865b394cd1eSFedor Uporov 
866b394cd1eSFedor Uporov 	free(ablks, M_EXT2EXTENTS);
867b394cd1eSFedor Uporov 
868b394cd1eSFedor Uporov 	return (error);
869b394cd1eSFedor Uporov }
870b394cd1eSFedor Uporov 
871b394cd1eSFedor Uporov static int
872b394cd1eSFedor Uporov ext4_ext_grow_indepth(struct inode *ip, struct ext4_extent_path *path,
873b394cd1eSFedor Uporov     struct ext4_extent *newext)
874b394cd1eSFedor Uporov {
875b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
876b394cd1eSFedor Uporov 	struct ext4_extent_path *curpath;
877b394cd1eSFedor Uporov 	struct ext4_extent_header *neh;
878b394cd1eSFedor Uporov 	struct ext4_extent_index *fidx;
879b394cd1eSFedor Uporov 	struct buf *bp;
880b394cd1eSFedor Uporov 	e4fs_daddr_t newblk;
881b394cd1eSFedor Uporov 	int error = 0;
882b394cd1eSFedor Uporov 
883b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
884b394cd1eSFedor Uporov 	curpath = path;
885b394cd1eSFedor Uporov 
886b394cd1eSFedor Uporov 	newblk = ext4_ext_alloc_meta(ip);
887b394cd1eSFedor Uporov 	if (newblk == 0)
888b394cd1eSFedor Uporov 		return (error);
889b394cd1eSFedor Uporov 
890b394cd1eSFedor Uporov 	bp = getblk(ip->i_devvp, fsbtodb(fs, newblk), fs->e2fs_bsize, 0, 0, 0);
891b394cd1eSFedor Uporov 	if (!bp)
892b394cd1eSFedor Uporov 		return (EIO);
893b394cd1eSFedor Uporov 
894b394cd1eSFedor Uporov 	/* Move top-level index/leaf into new block. */
895b394cd1eSFedor Uporov 	memmove(bp->b_data, curpath->ep_header, sizeof(ip->i_data));
896b394cd1eSFedor Uporov 
897b394cd1eSFedor Uporov 	/* Set size of new block */
898b394cd1eSFedor Uporov 	neh = ext4_ext_block_header(bp->b_data);
899b394cd1eSFedor Uporov 	neh->eh_magic = EXT4_EXT_MAGIC;
900b394cd1eSFedor Uporov 
901b394cd1eSFedor Uporov 	if (ext4_ext_inode_depth(ip))
902b394cd1eSFedor Uporov 		neh->eh_max = ext4_ext_space_block_index(ip);
903b394cd1eSFedor Uporov 	else
904b394cd1eSFedor Uporov 		neh->eh_max = ext4_ext_space_block(ip);
905b394cd1eSFedor Uporov 
906b394cd1eSFedor Uporov 	error = bwrite(bp);
907b394cd1eSFedor Uporov 	if (error)
908b394cd1eSFedor Uporov 		goto out;
909b394cd1eSFedor Uporov 
910b394cd1eSFedor Uporov 	bp = NULL;
911b394cd1eSFedor Uporov 
912b394cd1eSFedor Uporov 	curpath->ep_header->eh_magic = EXT4_EXT_MAGIC;
913b394cd1eSFedor Uporov 	curpath->ep_header->eh_max = ext4_ext_space_root(ip);
914b394cd1eSFedor Uporov 	curpath->ep_header->eh_ecount = 1;
915b394cd1eSFedor Uporov 	curpath->ep_index = EXT_FIRST_INDEX(curpath->ep_header);
916b394cd1eSFedor Uporov 	curpath->ep_index->ei_blk = EXT_FIRST_EXTENT(path[0].ep_header)->e_blk;
917b394cd1eSFedor Uporov 	ext4_index_store_pblock(curpath->ep_index, newblk);
918b394cd1eSFedor Uporov 
919b394cd1eSFedor Uporov 	neh = ext4_ext_inode_header(ip);
920b394cd1eSFedor Uporov 	fidx = EXT_FIRST_INDEX(neh);
921b394cd1eSFedor Uporov 	neh->eh_depth = path->ep_depth + 1;
922b394cd1eSFedor Uporov 	ext4_ext_dirty(ip, curpath);
923b394cd1eSFedor Uporov out:
924b394cd1eSFedor Uporov 	brelse(bp);
925b394cd1eSFedor Uporov 
926b394cd1eSFedor Uporov 	return (error);
927b394cd1eSFedor Uporov }
928b394cd1eSFedor Uporov 
929b394cd1eSFedor Uporov static int
930b394cd1eSFedor Uporov ext4_ext_create_new_leaf(struct inode *ip, struct ext4_extent_path *path,
931b394cd1eSFedor Uporov     struct ext4_extent *newext)
932b394cd1eSFedor Uporov {
933b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
934b394cd1eSFedor Uporov 	struct ext4_extent_path *curpath;
935b394cd1eSFedor Uporov 	int depth, i, error;
936b394cd1eSFedor Uporov 
937b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
938b394cd1eSFedor Uporov 
939b394cd1eSFedor Uporov repeat:
940b394cd1eSFedor Uporov 	i = depth = ext4_ext_inode_depth(ip);
941b394cd1eSFedor Uporov 
942b394cd1eSFedor Uporov 	/* Look for free index entry int the tree */
943b394cd1eSFedor Uporov 	curpath = path + depth;
944b394cd1eSFedor Uporov 	while (i > 0 && !EXT_HAS_FREE_INDEX(curpath)) {
945b394cd1eSFedor Uporov 		i--;
946b394cd1eSFedor Uporov 		curpath--;
947b394cd1eSFedor Uporov 	}
948b394cd1eSFedor Uporov 
949b394cd1eSFedor Uporov 	/*
950b394cd1eSFedor Uporov 	 * We use already allocated block for index block,
951b394cd1eSFedor Uporov 	 * so subsequent data blocks should be contiguous.
952b394cd1eSFedor Uporov 	 */
953b394cd1eSFedor Uporov 	if (EXT_HAS_FREE_INDEX(curpath)) {
954b394cd1eSFedor Uporov 		error = ext4_ext_split(ip, path, newext, i);
955b394cd1eSFedor Uporov 		if (error)
956b394cd1eSFedor Uporov 			goto out;
957b394cd1eSFedor Uporov 
958b394cd1eSFedor Uporov 		/* Refill path. */
959b394cd1eSFedor Uporov 		ext4_ext_drop_refs(path);
960b394cd1eSFedor Uporov 		error = ext4_ext_find_extent(ip, newext->e_blk, &path);
961b394cd1eSFedor Uporov 		if (error)
962b394cd1eSFedor Uporov 			goto out;
963b394cd1eSFedor Uporov 	} else {
964b394cd1eSFedor Uporov 		/* Tree is full, do grow in depth. */
965b394cd1eSFedor Uporov 		error = ext4_ext_grow_indepth(ip, path, newext);
966b394cd1eSFedor Uporov 		if (error)
967b394cd1eSFedor Uporov 			goto out;
968b394cd1eSFedor Uporov 
969b394cd1eSFedor Uporov 		/* Refill path. */
970b394cd1eSFedor Uporov 		ext4_ext_drop_refs(path);
971b394cd1eSFedor Uporov 		error = ext4_ext_find_extent(ip, newext->e_blk, &path);
972b394cd1eSFedor Uporov 		if (error)
973b394cd1eSFedor Uporov 			goto out;
974b394cd1eSFedor Uporov 
975b394cd1eSFedor Uporov 		/* Check and split tree if required. */
976b394cd1eSFedor Uporov 		depth = ext4_ext_inode_depth(ip);
977b394cd1eSFedor Uporov 		if (path[depth].ep_header->eh_ecount ==
978b394cd1eSFedor Uporov 		    path[depth].ep_header->eh_max)
979b394cd1eSFedor Uporov 			goto repeat;
980b394cd1eSFedor Uporov 	}
981b394cd1eSFedor Uporov 
982b394cd1eSFedor Uporov out:
983b394cd1eSFedor Uporov 	return (error);
984b394cd1eSFedor Uporov }
985b394cd1eSFedor Uporov 
986b394cd1eSFedor Uporov static int
987b394cd1eSFedor Uporov ext4_ext_correct_indexes(struct inode *ip, struct ext4_extent_path *path)
988b394cd1eSFedor Uporov {
989b394cd1eSFedor Uporov 	struct ext4_extent_header *eh;
990b394cd1eSFedor Uporov 	struct ext4_extent *ex;
991b394cd1eSFedor Uporov 	int32_t border;
992b394cd1eSFedor Uporov 	int depth, k;
993b394cd1eSFedor Uporov 
994b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
995b394cd1eSFedor Uporov 	eh = path[depth].ep_header;
996b394cd1eSFedor Uporov 	ex = path[depth].ep_ext;
997b394cd1eSFedor Uporov 
998b394cd1eSFedor Uporov 	if (ex == NULL || eh == NULL)
999b394cd1eSFedor Uporov 		return (EIO);
1000b394cd1eSFedor Uporov 
1001b394cd1eSFedor Uporov 	if (!depth)
1002b394cd1eSFedor Uporov 		return (0);
1003b394cd1eSFedor Uporov 
1004b394cd1eSFedor Uporov 	/* We will correct tree if first leaf got modified only. */
1005b394cd1eSFedor Uporov 	if (ex != EXT_FIRST_EXTENT(eh))
1006b394cd1eSFedor Uporov 		return (0);
1007b394cd1eSFedor Uporov 
1008b394cd1eSFedor Uporov 	k = depth - 1;
1009b394cd1eSFedor Uporov 	border = path[depth].ep_ext->e_blk;
1010b394cd1eSFedor Uporov 	path[k].ep_index->ei_blk = border;
1011b394cd1eSFedor Uporov 	ext4_ext_dirty(ip, path + k);
1012b394cd1eSFedor Uporov 	while (k--) {
1013b394cd1eSFedor Uporov 		/* Change all left-side indexes. */
1014b394cd1eSFedor Uporov 		if (path[k+1].ep_index != EXT_FIRST_INDEX(path[k+1].ep_header))
1015b394cd1eSFedor Uporov 			break;
1016b394cd1eSFedor Uporov 
1017b394cd1eSFedor Uporov 		path[k].ep_index->ei_blk = border;
1018b394cd1eSFedor Uporov 		ext4_ext_dirty(ip, path + k);
1019b394cd1eSFedor Uporov 	}
1020b394cd1eSFedor Uporov 
1021b394cd1eSFedor Uporov 	return (0);
1022b394cd1eSFedor Uporov }
1023b394cd1eSFedor Uporov 
1024b394cd1eSFedor Uporov static int
1025b394cd1eSFedor Uporov ext4_ext_insert_extent(struct inode *ip, struct ext4_extent_path *path,
1026b394cd1eSFedor Uporov     struct ext4_extent *newext)
1027b394cd1eSFedor Uporov {
1028b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
1029b394cd1eSFedor Uporov 	struct ext4_extent_header * eh;
1030b394cd1eSFedor Uporov 	struct ext4_extent *ex, *nex, *nearex;
1031b394cd1eSFedor Uporov 	struct ext4_extent_path *npath;
1032b394cd1eSFedor Uporov 	int depth, len, error, next;
1033b394cd1eSFedor Uporov 
1034b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
1035b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
1036b394cd1eSFedor Uporov 	ex = path[depth].ep_ext;
1037b394cd1eSFedor Uporov 	npath = NULL;
1038b394cd1eSFedor Uporov 
1039b394cd1eSFedor Uporov 	if (newext->e_len == 0 || path[depth].ep_header == NULL)
1040b394cd1eSFedor Uporov 		return (EINVAL);
1041b394cd1eSFedor Uporov 
1042b394cd1eSFedor Uporov 	/* Insert block into found extent. */
1043b394cd1eSFedor Uporov 	if (ex && ext4_can_extents_be_merged(ex, newext)) {
1044b394cd1eSFedor Uporov 		ex->e_len = ex->e_len + newext->e_len;
1045b394cd1eSFedor Uporov 		eh = path[depth].ep_header;
1046b394cd1eSFedor Uporov 		nearex = ex;
1047b394cd1eSFedor Uporov 		goto merge;
1048b394cd1eSFedor Uporov 	}
1049b394cd1eSFedor Uporov 
1050b394cd1eSFedor Uporov repeat:
1051b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
1052b394cd1eSFedor Uporov 	eh = path[depth].ep_header;
1053b394cd1eSFedor Uporov 	if (eh->eh_ecount < eh->eh_max)
1054b394cd1eSFedor Uporov 		goto has_space;
1055b394cd1eSFedor Uporov 
1056b394cd1eSFedor Uporov 	/* Try next leaf */
1057b394cd1eSFedor Uporov 	nex = EXT_LAST_EXTENT(eh);
1058b394cd1eSFedor Uporov 	next = ext4_ext_next_leaf_block(ip, path);
1059b394cd1eSFedor Uporov 	if (newext->e_blk > nex->e_blk && next != EXT4_MAX_BLOCKS) {
1060b394cd1eSFedor Uporov 		KASSERT(npath == NULL,
1061b394cd1eSFedor Uporov 		    ("ext4_ext_insert_extent: bad path"));
1062b394cd1eSFedor Uporov 
1063b394cd1eSFedor Uporov 		error = ext4_ext_find_extent(ip, next, &npath);
1064b394cd1eSFedor Uporov 		if (error)
1065b394cd1eSFedor Uporov 			goto cleanup;
1066b394cd1eSFedor Uporov 
1067b394cd1eSFedor Uporov 		if (npath->ep_depth != path->ep_depth) {
1068b394cd1eSFedor Uporov 			error = EIO;
1069b394cd1eSFedor Uporov 			goto cleanup;
1070b394cd1eSFedor Uporov 		}
1071b394cd1eSFedor Uporov 
1072b394cd1eSFedor Uporov 		eh = npath[depth].ep_header;
1073b394cd1eSFedor Uporov 		if (eh->eh_ecount < eh->eh_max) {
1074b394cd1eSFedor Uporov 			path = npath;
1075b394cd1eSFedor Uporov 			goto repeat;
1076b394cd1eSFedor Uporov 		}
1077b394cd1eSFedor Uporov 	}
1078b394cd1eSFedor Uporov 
1079b394cd1eSFedor Uporov 	/*
1080b394cd1eSFedor Uporov 	 * There is no free space in the found leaf,
1081b394cd1eSFedor Uporov 	 * try to add a new leaf to the tree.
1082b394cd1eSFedor Uporov 	 */
1083b394cd1eSFedor Uporov 	error = ext4_ext_create_new_leaf(ip, path, newext);
1084b394cd1eSFedor Uporov 	if (error)
1085b394cd1eSFedor Uporov 		goto cleanup;
1086b394cd1eSFedor Uporov 
1087b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
1088b394cd1eSFedor Uporov 	eh = path[depth].ep_header;
1089b394cd1eSFedor Uporov 
1090b394cd1eSFedor Uporov has_space:
1091b394cd1eSFedor Uporov 	nearex = path[depth].ep_ext;
1092b394cd1eSFedor Uporov 	if (!nearex) {
1093b394cd1eSFedor Uporov 		/* Create new extent in the leaf. */
1094b394cd1eSFedor Uporov 		path[depth].ep_ext = EXT_FIRST_EXTENT(eh);
1095b394cd1eSFedor Uporov 	} else if (newext->e_blk > nearex->e_blk) {
1096b394cd1eSFedor Uporov 		if (nearex != EXT_LAST_EXTENT(eh)) {
1097b394cd1eSFedor Uporov 			len = EXT_MAX_EXTENT(eh) - nearex;
1098b394cd1eSFedor Uporov 			len = (len - 1) * sizeof(struct ext4_extent);
1099b394cd1eSFedor Uporov 			len = len < 0 ? 0 : len;
1100b394cd1eSFedor Uporov 			memmove(nearex + 2, nearex + 1, len);
1101b394cd1eSFedor Uporov 		}
1102b394cd1eSFedor Uporov 		path[depth].ep_ext = nearex + 1;
1103b394cd1eSFedor Uporov 	} else {
1104b394cd1eSFedor Uporov 		len = (EXT_MAX_EXTENT(eh) - nearex) * sizeof(struct ext4_extent);
1105b394cd1eSFedor Uporov 		len = len < 0 ? 0 : len;
1106b394cd1eSFedor Uporov 		memmove(nearex + 1, nearex, len);
1107b394cd1eSFedor Uporov 		path[depth].ep_ext = nearex;
1108b394cd1eSFedor Uporov 	}
1109b394cd1eSFedor Uporov 
1110b394cd1eSFedor Uporov 	eh->eh_ecount = eh->eh_ecount + 1;
1111b394cd1eSFedor Uporov 	nearex = path[depth].ep_ext;
1112b394cd1eSFedor Uporov 	nearex->e_blk = newext->e_blk;
1113b394cd1eSFedor Uporov 	nearex->e_start_lo = newext->e_start_lo;
1114b394cd1eSFedor Uporov 	nearex->e_start_hi = newext->e_start_hi;
1115b394cd1eSFedor Uporov 	nearex->e_len = newext->e_len;
1116b394cd1eSFedor Uporov 
1117b394cd1eSFedor Uporov merge:
1118b394cd1eSFedor Uporov 	/* Try to merge extents to the right. */
1119b394cd1eSFedor Uporov 	while (nearex < EXT_LAST_EXTENT(eh)) {
1120b394cd1eSFedor Uporov 		if (!ext4_can_extents_be_merged(nearex, nearex + 1))
1121b394cd1eSFedor Uporov 			break;
1122b394cd1eSFedor Uporov 
1123b394cd1eSFedor Uporov 		/* Merge with next extent. */
1124b394cd1eSFedor Uporov 		nearex->e_len = nearex->e_len + nearex[1].e_len;
1125b394cd1eSFedor Uporov 		if (nearex + 1 < EXT_LAST_EXTENT(eh)) {
1126b394cd1eSFedor Uporov 			len = (EXT_LAST_EXTENT(eh) - nearex - 1) *
1127b394cd1eSFedor Uporov 			    sizeof(struct ext4_extent);
1128b394cd1eSFedor Uporov 			memmove(nearex + 1, nearex + 2, len);
1129b394cd1eSFedor Uporov 		}
1130b394cd1eSFedor Uporov 
1131b394cd1eSFedor Uporov 		eh->eh_ecount = eh->eh_ecount - 1;
1132b394cd1eSFedor Uporov 		KASSERT(eh->eh_ecount != 0,
1133b394cd1eSFedor Uporov 		    ("ext4_ext_insert_extent: bad ecount"));
1134b394cd1eSFedor Uporov 	}
1135b394cd1eSFedor Uporov 
1136b394cd1eSFedor Uporov 	/*
1137b394cd1eSFedor Uporov 	 * Try to merge extents to the left,
1138b394cd1eSFedor Uporov 	 * start from inexes correction.
1139b394cd1eSFedor Uporov 	 */
1140b394cd1eSFedor Uporov 	error = ext4_ext_correct_indexes(ip, path);
1141b394cd1eSFedor Uporov 	if (error)
1142b394cd1eSFedor Uporov 		goto cleanup;
1143b394cd1eSFedor Uporov 
1144b394cd1eSFedor Uporov 	ext4_ext_dirty(ip, path + depth);
1145b394cd1eSFedor Uporov 
1146b394cd1eSFedor Uporov cleanup:
1147b394cd1eSFedor Uporov 	if (npath) {
1148b394cd1eSFedor Uporov 		ext4_ext_drop_refs(npath);
1149b394cd1eSFedor Uporov 		free(npath, M_EXT2EXTENTS);
1150b394cd1eSFedor Uporov 	}
1151b394cd1eSFedor Uporov 
1152b394cd1eSFedor Uporov 	ip->i_ext_cache.ec_type = EXT4_EXT_CACHE_NO;
1153b394cd1eSFedor Uporov 	return (error);
1154b394cd1eSFedor Uporov }
1155b394cd1eSFedor Uporov 
1156b394cd1eSFedor Uporov static e4fs_daddr_t
1157b394cd1eSFedor Uporov ext4_new_blocks(struct inode *ip, daddr_t lbn, e4fs_daddr_t pref,
1158b394cd1eSFedor Uporov     struct ucred *cred, unsigned long *count, int *perror)
1159b394cd1eSFedor Uporov {
1160b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
1161b394cd1eSFedor Uporov 	struct ext2mount *ump;
1162b394cd1eSFedor Uporov 	e4fs_daddr_t newblk;
1163b394cd1eSFedor Uporov 
1164b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
1165b394cd1eSFedor Uporov 	ump = ip->i_ump;
1166b394cd1eSFedor Uporov 
1167b394cd1eSFedor Uporov 	/*
1168b394cd1eSFedor Uporov 	 * We will allocate only single block for now.
1169b394cd1eSFedor Uporov 	 */
1170b394cd1eSFedor Uporov 	if (*count > 1)
1171b394cd1eSFedor Uporov 		return (0);
1172b394cd1eSFedor Uporov 
1173b394cd1eSFedor Uporov 	EXT2_LOCK(ip->i_ump);
1174b394cd1eSFedor Uporov 	*perror = ext2_alloc(ip, lbn, pref, (int)fs->e2fs_bsize, cred, &newblk);
1175b394cd1eSFedor Uporov 	if (*perror)
1176b394cd1eSFedor Uporov 		return (0);
1177b394cd1eSFedor Uporov 
1178b394cd1eSFedor Uporov 	if (newblk) {
1179b394cd1eSFedor Uporov 		ip->i_flag |= IN_CHANGE | IN_UPDATE;
1180b394cd1eSFedor Uporov 		ext2_update(ip->i_vnode, 1);
1181b394cd1eSFedor Uporov 	}
1182b394cd1eSFedor Uporov 
1183b394cd1eSFedor Uporov 	return (newblk);
1184b394cd1eSFedor Uporov }
1185b394cd1eSFedor Uporov 
1186b394cd1eSFedor Uporov int
1187b394cd1eSFedor Uporov ext4_ext_get_blocks(struct inode *ip, e4fs_daddr_t iblk,
1188b394cd1eSFedor Uporov     unsigned long max_blocks, struct ucred *cred, struct buf **bpp,
1189b394cd1eSFedor Uporov     int *pallocated, uint32_t *nb)
1190b394cd1eSFedor Uporov {
1191b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
1192b394cd1eSFedor Uporov 	struct buf *bp = NULL;
1193b394cd1eSFedor Uporov 	struct ext4_extent_path *path;
1194b394cd1eSFedor Uporov 	struct ext4_extent newex, *ex;
1195b394cd1eSFedor Uporov 	e4fs_daddr_t bpref, newblk = 0;
1196b394cd1eSFedor Uporov 	unsigned long allocated = 0;
1197b394cd1eSFedor Uporov 	int error = 0, depth;
1198b394cd1eSFedor Uporov 
1199b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
1200b394cd1eSFedor Uporov 	*pallocated = 0;
1201b394cd1eSFedor Uporov 	path = NULL;
1202b394cd1eSFedor Uporov 	if(bpp)
1203b394cd1eSFedor Uporov 		*bpp = NULL;
1204b394cd1eSFedor Uporov 
1205b394cd1eSFedor Uporov 	/* Check cache. */
1206b394cd1eSFedor Uporov 	if ((bpref = ext4_ext_in_cache(ip, iblk, &newex))) {
1207b394cd1eSFedor Uporov 		if (bpref == EXT4_EXT_CACHE_IN) {
1208b394cd1eSFedor Uporov 			/* Block is already allocated. */
1209b394cd1eSFedor Uporov 			newblk = iblk - newex.e_blk +
1210b394cd1eSFedor Uporov 			    ext4_ext_extent_pblock(&newex);
1211b394cd1eSFedor Uporov 			allocated = newex.e_len - (iblk - newex.e_blk);
1212b394cd1eSFedor Uporov 			goto out;
1213b394cd1eSFedor Uporov 		} else {
1214b394cd1eSFedor Uporov 			error = EIO;
1215b394cd1eSFedor Uporov 			goto out2;
1216b394cd1eSFedor Uporov 		}
1217b394cd1eSFedor Uporov 	}
1218b394cd1eSFedor Uporov 
1219b394cd1eSFedor Uporov 	error = ext4_ext_find_extent(ip, iblk, &path);
1220b394cd1eSFedor Uporov 	if (error) {
1221b394cd1eSFedor Uporov 		goto out2;
1222b394cd1eSFedor Uporov 	}
1223b394cd1eSFedor Uporov 
1224b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
1225b394cd1eSFedor Uporov 	if (path[depth].ep_ext == NULL && depth != 0) {
1226b394cd1eSFedor Uporov 		error = EIO;
1227b394cd1eSFedor Uporov 		goto out2;
1228b394cd1eSFedor Uporov 	}
1229b394cd1eSFedor Uporov 
1230b394cd1eSFedor Uporov 	if ((ex = path[depth].ep_ext)) {
1231b394cd1eSFedor Uporov 	        uint64_t lblk = ex->e_blk;
1232b394cd1eSFedor Uporov 		uint16_t e_len  = ex->e_len;
1233b394cd1eSFedor Uporov 		e4fs_daddr_t e_start = ext4_ext_extent_pblock(ex);
1234b394cd1eSFedor Uporov 
1235b394cd1eSFedor Uporov 		if (e_len > EXT4_MAX_LEN)
1236b394cd1eSFedor Uporov 			goto out2;
1237b394cd1eSFedor Uporov 
1238b394cd1eSFedor Uporov 		/* If we found extent covers block, simply return it. */
1239b394cd1eSFedor Uporov 		if (iblk >= lblk && iblk < lblk + e_len) {
1240b394cd1eSFedor Uporov 			newblk = iblk - lblk + e_start;
1241b394cd1eSFedor Uporov 			allocated = e_len - (iblk - lblk);
1242b394cd1eSFedor Uporov 			ext4_ext_put_in_cache(ip, lblk, e_len,
1243b394cd1eSFedor Uporov 			    e_start, EXT4_EXT_CACHE_IN);
1244b394cd1eSFedor Uporov 			goto out;
1245b394cd1eSFedor Uporov 		}
1246b394cd1eSFedor Uporov 	}
1247b394cd1eSFedor Uporov 
1248b394cd1eSFedor Uporov 	/* Allocate the new block. */
1249b394cd1eSFedor Uporov 	if (S_ISREG(ip->i_mode) && (!ip->i_next_alloc_block)) {
1250b394cd1eSFedor Uporov 		ip->i_next_alloc_goal = 0;
1251b394cd1eSFedor Uporov 	}
1252b394cd1eSFedor Uporov 
1253b394cd1eSFedor Uporov 	bpref = ext4_ext_blkpref(ip, path, iblk);
1254b394cd1eSFedor Uporov 	allocated = max_blocks;
1255b394cd1eSFedor Uporov 	newblk = ext4_new_blocks(ip, iblk, bpref, cred, &allocated, &error);
1256b394cd1eSFedor Uporov 	if (!newblk)
1257b394cd1eSFedor Uporov 		goto out2;
1258b394cd1eSFedor Uporov 
1259b394cd1eSFedor Uporov 	/* Try to insert new extent into found leaf and return. */
1260b394cd1eSFedor Uporov 	newex.e_blk = iblk;
1261b394cd1eSFedor Uporov 	ext4_ext_store_pblock(&newex, newblk);
1262b394cd1eSFedor Uporov 	newex.e_len = allocated;
1263b394cd1eSFedor Uporov 	error = ext4_ext_insert_extent(ip, path, &newex);
1264b394cd1eSFedor Uporov 	if (error)
1265b394cd1eSFedor Uporov 		goto out2;
1266b394cd1eSFedor Uporov 
1267b394cd1eSFedor Uporov 	newblk = ext4_ext_extent_pblock(&newex);
1268b394cd1eSFedor Uporov 	ext4_ext_put_in_cache(ip, iblk, allocated, newblk, EXT4_EXT_CACHE_IN);
1269b394cd1eSFedor Uporov 	*pallocated = 1;
1270b394cd1eSFedor Uporov 
1271b394cd1eSFedor Uporov out:
1272b394cd1eSFedor Uporov 	if (allocated > max_blocks)
1273b394cd1eSFedor Uporov 		allocated = max_blocks;
1274b394cd1eSFedor Uporov 
1275b394cd1eSFedor Uporov 	if (bpp)
1276b394cd1eSFedor Uporov 	{
1277b394cd1eSFedor Uporov 		error = bread(ip->i_devvp, fsbtodb(fs, newblk),
1278b394cd1eSFedor Uporov 		    fs->e2fs_bsize, cred, &bp);
1279b394cd1eSFedor Uporov 		if (error) {
1280b394cd1eSFedor Uporov 			brelse(bp);
1281b394cd1eSFedor Uporov 		} else {
1282b394cd1eSFedor Uporov 			*bpp = bp;
1283b394cd1eSFedor Uporov 		}
1284b394cd1eSFedor Uporov 	}
1285b394cd1eSFedor Uporov 
1286b394cd1eSFedor Uporov out2:
1287b394cd1eSFedor Uporov 	if (path) {
1288b394cd1eSFedor Uporov 		ext4_ext_drop_refs(path);
1289b394cd1eSFedor Uporov 		free(path, M_EXT2EXTENTS);
1290b394cd1eSFedor Uporov 	}
1291b394cd1eSFedor Uporov 
1292b394cd1eSFedor Uporov 	if (nb)
1293b394cd1eSFedor Uporov 		*nb = newblk;
1294b394cd1eSFedor Uporov 
1295b394cd1eSFedor Uporov 	return (error);
1296b394cd1eSFedor Uporov }
1297b394cd1eSFedor Uporov 
1298b394cd1eSFedor Uporov static inline uint16_t
1299b394cd1eSFedor Uporov ext4_ext_get_actual_len(struct ext4_extent *ext)
1300b394cd1eSFedor Uporov {
1301b394cd1eSFedor Uporov 
1302b394cd1eSFedor Uporov 	return (ext->e_len <= EXT_INIT_MAX_LEN ?
1303b394cd1eSFedor Uporov 	    ext->e_len : (ext->e_len - EXT_INIT_MAX_LEN));
1304b394cd1eSFedor Uporov }
1305b394cd1eSFedor Uporov 
1306b394cd1eSFedor Uporov static inline struct ext4_extent_header *
1307b394cd1eSFedor Uporov ext4_ext_header(struct inode *ip)
1308b394cd1eSFedor Uporov {
1309b394cd1eSFedor Uporov 
1310b394cd1eSFedor Uporov 	return (struct ext4_extent_header *)ip->i_db;
1311b394cd1eSFedor Uporov }
1312b394cd1eSFedor Uporov 
1313b394cd1eSFedor Uporov static int
1314b394cd1eSFedor Uporov ext4_remove_blocks(struct inode *ip, struct ext4_extent *ex,
1315b394cd1eSFedor Uporov     unsigned long from, unsigned long to)
1316b394cd1eSFedor Uporov {
1317b394cd1eSFedor Uporov 	unsigned long num, start;
1318b394cd1eSFedor Uporov 
1319b394cd1eSFedor Uporov 	if (from >= ex->e_blk &&
1320b394cd1eSFedor Uporov 	    to == ex->e_blk + ext4_ext_get_actual_len(ex) - 1) {
1321b394cd1eSFedor Uporov 		/* Tail cleanup. */
1322b394cd1eSFedor Uporov 		num = ex->e_blk + ext4_ext_get_actual_len(ex) - from;
1323b394cd1eSFedor Uporov 		start = ext4_ext_extent_pblock(ex) +
1324b394cd1eSFedor Uporov 		    ext4_ext_get_actual_len(ex) - num;
1325b394cd1eSFedor Uporov 		ext4_ext_blkfree(ip, start, num, 0);
1326b394cd1eSFedor Uporov 	}
1327b394cd1eSFedor Uporov 
1328b394cd1eSFedor Uporov 	return (0);
1329b394cd1eSFedor Uporov }
1330b394cd1eSFedor Uporov 
1331b394cd1eSFedor Uporov static int
1332b394cd1eSFedor Uporov ext4_ext_rm_index(struct inode *ip, struct ext4_extent_path *path)
1333b394cd1eSFedor Uporov {
1334b394cd1eSFedor Uporov 	e4fs_daddr_t leaf;
1335b394cd1eSFedor Uporov 
1336b394cd1eSFedor Uporov 	/* Free index block. */
1337b394cd1eSFedor Uporov 	path--;
1338b394cd1eSFedor Uporov 	leaf = ext4_ext_index_pblock(path->ep_index);
1339b394cd1eSFedor Uporov 	KASSERT(path->ep_header->eh_ecount != 0,
1340b394cd1eSFedor Uporov 	    ("ext4_ext_rm_index: bad ecount"));
1341b394cd1eSFedor Uporov 	path->ep_header->eh_ecount--;
1342b394cd1eSFedor Uporov 	ext4_ext_dirty(ip, path);
1343b394cd1eSFedor Uporov 	ext4_ext_blkfree(ip, leaf, 1, 0);
1344b394cd1eSFedor Uporov 	return (0);
1345b394cd1eSFedor Uporov }
1346b394cd1eSFedor Uporov 
1347b394cd1eSFedor Uporov static int
1348b394cd1eSFedor Uporov ext4_ext_rm_leaf(struct inode *ip, struct ext4_extent_path *path,
1349b394cd1eSFedor Uporov     uint64_t start)
1350b394cd1eSFedor Uporov {
1351b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
1352*3fcbb8c0SFedor Uporov 	int depth;
1353b394cd1eSFedor Uporov 	struct ext4_extent_header *eh;
1354b394cd1eSFedor Uporov 	unsigned int a, b, block, num;
1355b394cd1eSFedor Uporov 	unsigned long ex_blk;
1356b394cd1eSFedor Uporov 	unsigned short ex_len;
1357b394cd1eSFedor Uporov 	struct ext4_extent *ex;
1358b394cd1eSFedor Uporov 	int error, correct_index;
1359b394cd1eSFedor Uporov 
1360b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
1361b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
1362b394cd1eSFedor Uporov 	correct_index = 0;
1363b394cd1eSFedor Uporov 
1364b394cd1eSFedor Uporov 	if (!path[depth].ep_header) {
1365b394cd1eSFedor Uporov 		if (path[depth].ep_data == NULL)
1366b394cd1eSFedor Uporov 			return (EINVAL);
1367b394cd1eSFedor Uporov 		path[depth].ep_header =
1368b394cd1eSFedor Uporov 		    (struct ext4_extent_header* )path[depth].ep_data;
1369b394cd1eSFedor Uporov 	}
1370b394cd1eSFedor Uporov 
1371b394cd1eSFedor Uporov 	eh = path[depth].ep_header;
1372b394cd1eSFedor Uporov 	if (!eh) {
1373b394cd1eSFedor Uporov 		ext2_fserr(fs, ip->i_uid, "bad header => extent corrupted");
1374b394cd1eSFedor Uporov 		return (EIO);
1375b394cd1eSFedor Uporov 	}
1376b394cd1eSFedor Uporov 
1377b394cd1eSFedor Uporov 	ex = EXT_LAST_EXTENT(eh);
1378b394cd1eSFedor Uporov 	ex_blk = ex->e_blk;
1379b394cd1eSFedor Uporov 	ex_len = ext4_ext_get_actual_len(ex);
1380b394cd1eSFedor Uporov 
1381b394cd1eSFedor Uporov 	while (ex >= EXT_FIRST_EXTENT(eh) && ex_blk + ex_len > start) {
1382b394cd1eSFedor Uporov 		path[depth].ep_ext = ex;
1383b394cd1eSFedor Uporov 		a = ex_blk > start ? ex_blk : start;
1384b394cd1eSFedor Uporov 		b = (uint64_t)ex_blk + ex_len - 1 <
1385b394cd1eSFedor Uporov 		    EXT4_MAX_BLOCKS ? ex_blk + ex_len - 1 : EXT4_MAX_BLOCKS;
1386b394cd1eSFedor Uporov 
1387b394cd1eSFedor Uporov 		if (a != ex_blk && b != ex_blk + ex_len - 1)
1388b394cd1eSFedor Uporov 			return (EINVAL);
1389b394cd1eSFedor Uporov 		else if (a != ex_blk) {
1390b394cd1eSFedor Uporov 			/* Remove tail of the extent. */
1391b394cd1eSFedor Uporov 			block = ex_blk;
1392b394cd1eSFedor Uporov 			num = a - block;
1393b394cd1eSFedor Uporov 		} else if (b != ex_blk + ex_len - 1) {
1394b394cd1eSFedor Uporov 			/* Remove head of the extent, not implemented. */
1395b394cd1eSFedor Uporov 			return (EINVAL);
1396b394cd1eSFedor Uporov 		} else {
1397b394cd1eSFedor Uporov 			/* Remove whole extent. */
1398b394cd1eSFedor Uporov 			block = ex_blk;
1399b394cd1eSFedor Uporov 			num = 0;
1400b394cd1eSFedor Uporov 			KASSERT(a == ex_blk, ("ext4_ext_rm_leaf: bad a"));
1401b394cd1eSFedor Uporov 			KASSERT(b != ex_blk + ex_len - 1,
1402b394cd1eSFedor Uporov 			    ("ext4_ext_rm_leaf: bad b"));
1403b394cd1eSFedor Uporov 		}
1404b394cd1eSFedor Uporov 
1405*3fcbb8c0SFedor Uporov 		if (ex == EXT_FIRST_EXTENT(eh))
1406b394cd1eSFedor Uporov 			correct_index = 1;
1407b394cd1eSFedor Uporov 
1408b394cd1eSFedor Uporov 		error = ext4_remove_blocks(ip, ex, a, b);
1409b394cd1eSFedor Uporov 		if (error)
1410b394cd1eSFedor Uporov 			goto out;
1411b394cd1eSFedor Uporov 
1412b394cd1eSFedor Uporov 		if (num == 0) {
1413b394cd1eSFedor Uporov 			ext4_ext_store_pblock(ex, 0);
1414b394cd1eSFedor Uporov 			eh->eh_ecount--;
1415b394cd1eSFedor Uporov 		}
1416b394cd1eSFedor Uporov 
1417b394cd1eSFedor Uporov 		ex->e_blk = block;
1418b394cd1eSFedor Uporov 		ex->e_len = num;
1419b394cd1eSFedor Uporov 
1420b394cd1eSFedor Uporov 		ext4_ext_dirty(ip, path + depth);
1421b394cd1eSFedor Uporov 
1422b394cd1eSFedor Uporov 		ex--;
1423b394cd1eSFedor Uporov 		ex_blk = ex->e_blk;
1424b394cd1eSFedor Uporov 		ex_len = ext4_ext_get_actual_len(ex);
1425b394cd1eSFedor Uporov 	};
1426b394cd1eSFedor Uporov 
1427b394cd1eSFedor Uporov 	if (correct_index && eh->eh_ecount)
1428b394cd1eSFedor Uporov 		error = ext4_ext_correct_indexes(ip, path);
1429b394cd1eSFedor Uporov 
1430b394cd1eSFedor Uporov 	/*
1431b394cd1eSFedor Uporov 	 * If this leaf is free, we should
1432b394cd1eSFedor Uporov 	 * remove it from index block above.
1433b394cd1eSFedor Uporov 	 */
1434b394cd1eSFedor Uporov 	if (error == 0 && eh->eh_ecount == 0 && path[depth].ep_data != NULL)
1435b394cd1eSFedor Uporov 		error = ext4_ext_rm_index(ip, path + depth);
1436b394cd1eSFedor Uporov 
1437b394cd1eSFedor Uporov out:
1438b394cd1eSFedor Uporov 	return (error);
1439b394cd1eSFedor Uporov }
1440b394cd1eSFedor Uporov 
1441b394cd1eSFedor Uporov static struct buf *
1442b394cd1eSFedor Uporov ext4_read_extent_tree_block(struct inode *ip, e4fs_daddr_t pblk,
1443b394cd1eSFedor Uporov     int depth, int flags)
1444b394cd1eSFedor Uporov {
1445b394cd1eSFedor Uporov 	struct m_ext2fs *fs;
1446b394cd1eSFedor Uporov 	struct ext4_extent_header *eh;
1447b394cd1eSFedor Uporov 	struct buf *bp;
1448b394cd1eSFedor Uporov 	int error;
1449b394cd1eSFedor Uporov 
1450b394cd1eSFedor Uporov 	fs = ip->i_e2fs;
1451b394cd1eSFedor Uporov 
1452b394cd1eSFedor Uporov 	error = bread(ip->i_devvp, fsbtodb(fs, pblk),
1453b394cd1eSFedor Uporov 	    fs->e2fs_bsize, NOCRED, &bp);
1454b394cd1eSFedor Uporov 	if (error) {
1455b394cd1eSFedor Uporov 		brelse(bp);
1456d7511a40SPedro F. Giffuni 		return (NULL);
1457d7511a40SPedro F. Giffuni 	}
1458b394cd1eSFedor Uporov 
1459b394cd1eSFedor Uporov 	eh = ext4_ext_block_header(bp->b_data);
1460b394cd1eSFedor Uporov 	if (eh->eh_depth != depth) {
1461b394cd1eSFedor Uporov 		ext2_fserr(fs, ip->i_uid, "unexpected eh_depth");
1462b394cd1eSFedor Uporov 		goto err;
1463d7511a40SPedro F. Giffuni 	}
1464d7511a40SPedro F. Giffuni 
1465b394cd1eSFedor Uporov 	error = ext4_ext_check_header(ip, eh);
1466b394cd1eSFedor Uporov 	if (error)
1467b394cd1eSFedor Uporov 		goto err;
1468d7511a40SPedro F. Giffuni 
1469b394cd1eSFedor Uporov 	return (bp);
1470b394cd1eSFedor Uporov 
1471b394cd1eSFedor Uporov err:
1472b394cd1eSFedor Uporov 	brelse(bp);
1473b394cd1eSFedor Uporov 	return (NULL);
1474b394cd1eSFedor Uporov 
1475b394cd1eSFedor Uporov }
1476b394cd1eSFedor Uporov 
1477b394cd1eSFedor Uporov static int inline
1478b394cd1eSFedor Uporov ext4_ext_more_to_rm(struct ext4_extent_path *path)
1479b394cd1eSFedor Uporov {
1480b394cd1eSFedor Uporov 
1481b394cd1eSFedor Uporov 	KASSERT(path->ep_index != NULL,
1482b394cd1eSFedor Uporov 	    ("ext4_ext_more_to_rm: bad index from path"));
1483b394cd1eSFedor Uporov 
1484b394cd1eSFedor Uporov 	if (path->ep_index < EXT_FIRST_INDEX(path->ep_header))
1485b394cd1eSFedor Uporov 		return (0);
1486b394cd1eSFedor Uporov 
1487b394cd1eSFedor Uporov 	if (path->ep_header->eh_ecount == path->index_count)
1488b394cd1eSFedor Uporov 		return (0);
1489b394cd1eSFedor Uporov 
1490b394cd1eSFedor Uporov 	return (1);
1491b394cd1eSFedor Uporov }
1492b394cd1eSFedor Uporov 
1493b394cd1eSFedor Uporov int
1494b394cd1eSFedor Uporov ext4_ext_remove_space(struct inode *ip, off_t length, int flags,
1495b394cd1eSFedor Uporov     struct ucred *cred, struct thread *td)
1496b394cd1eSFedor Uporov {
1497b394cd1eSFedor Uporov 	struct buf *bp;
1498b394cd1eSFedor Uporov 	struct ext4_extent_header *ehp;
1499b394cd1eSFedor Uporov 	struct ext4_extent_path *path;
1500b394cd1eSFedor Uporov 	int depth;
1501b394cd1eSFedor Uporov 	int i, error;
1502b394cd1eSFedor Uporov 
1503b394cd1eSFedor Uporov 	ehp = (struct ext4_extent_header *)ip->i_db;
1504b394cd1eSFedor Uporov 	depth = ext4_ext_inode_depth(ip);
1505b394cd1eSFedor Uporov 
1506b394cd1eSFedor Uporov 	error = ext4_ext_check_header(ip, ehp);
1507b394cd1eSFedor Uporov 	if(error)
1508b394cd1eSFedor Uporov 		return (error);
1509b394cd1eSFedor Uporov 
1510b394cd1eSFedor Uporov 	path = malloc(sizeof(struct ext4_extent_path) * (depth + 1),
1511b394cd1eSFedor Uporov 		      M_EXT2EXTENTS, M_WAITOK | M_ZERO);
1512b394cd1eSFedor Uporov 	if (!path)
1513b394cd1eSFedor Uporov 		return (ENOMEM);
1514b394cd1eSFedor Uporov 
1515b394cd1eSFedor Uporov 	i = 0;
1516b394cd1eSFedor Uporov 	path[0].ep_header = ehp;
1517b394cd1eSFedor Uporov 	path[0].ep_depth = depth;
1518b394cd1eSFedor Uporov 	while (i >= 0 && error == 0) {
1519b394cd1eSFedor Uporov 		if (i == depth) {
1520b394cd1eSFedor Uporov 			/* This is leaf. */
1521b394cd1eSFedor Uporov 			error = ext4_ext_rm_leaf(ip, path, length);
1522b394cd1eSFedor Uporov 			if (error)
1523b394cd1eSFedor Uporov 				break;
1524b394cd1eSFedor Uporov 			free(path[i].ep_data, M_EXT2EXTENTS);
1525b394cd1eSFedor Uporov 			path[i].ep_data = NULL;
1526b394cd1eSFedor Uporov 			i--;
1527b394cd1eSFedor Uporov 			continue;
1528b394cd1eSFedor Uporov 		}
1529b394cd1eSFedor Uporov 
1530b394cd1eSFedor Uporov 		/* This is index. */
1531b394cd1eSFedor Uporov 		if (!path[i].ep_header)
1532b394cd1eSFedor Uporov 			path[i].ep_header =
1533b394cd1eSFedor Uporov 			    (struct ext4_extent_header *)path[i].ep_data;
1534b394cd1eSFedor Uporov 
1535b394cd1eSFedor Uporov 		if (!path[i].ep_index) {
1536b394cd1eSFedor Uporov 			/* This level hasn't touched yet. */
1537b394cd1eSFedor Uporov 			path[i].ep_index = EXT_LAST_INDEX(path[i].ep_header);
1538b394cd1eSFedor Uporov 			path[i].index_count = path[i].ep_header->eh_ecount + 1;
1539b394cd1eSFedor Uporov 		} else {
1540b394cd1eSFedor Uporov 			/* We've already was here, see at next index. */
1541b394cd1eSFedor Uporov 			path[i].ep_index--;
1542b394cd1eSFedor Uporov 		}
1543b394cd1eSFedor Uporov 
1544b394cd1eSFedor Uporov 		if (ext4_ext_more_to_rm(path + i)) {
1545b394cd1eSFedor Uporov 			memset(path + i + 1, 0, sizeof(*path));
1546b394cd1eSFedor Uporov 			bp = ext4_read_extent_tree_block(ip,
1547b394cd1eSFedor Uporov 			    ext4_ext_index_pblock(path[i].ep_index),
1548b394cd1eSFedor Uporov 			    path[0].ep_depth - (i + 1), 0);
1549b394cd1eSFedor Uporov 			if (!bp) {
1550b394cd1eSFedor Uporov 				error = EIO;
1551b394cd1eSFedor Uporov 				break;
1552b394cd1eSFedor Uporov 			}
1553b394cd1eSFedor Uporov 
1554b394cd1eSFedor Uporov 			ext4_ext_fill_path_bdata(&path[i+1], bp,
1555b394cd1eSFedor Uporov 			    ext4_ext_index_pblock(path[i].ep_index));
1556b394cd1eSFedor Uporov 			brelse(bp);
1557b394cd1eSFedor Uporov 			path[i].index_count = path[i].ep_header->eh_ecount;
1558b394cd1eSFedor Uporov 			i++;
1559b394cd1eSFedor Uporov 		} else {
1560b394cd1eSFedor Uporov 			if (path[i].ep_header->eh_ecount == 0 && i > 0) {
1561b394cd1eSFedor Uporov 				/* Index is empty, remove it. */
1562b394cd1eSFedor Uporov 				error = ext4_ext_rm_index(ip, path + i);
1563b394cd1eSFedor Uporov 			}
1564b394cd1eSFedor Uporov 			free(path[i].ep_data, M_EXT2EXTENTS);
1565b394cd1eSFedor Uporov 			path[i].ep_data = NULL;
1566b394cd1eSFedor Uporov 			i--;
1567b394cd1eSFedor Uporov 		}
1568b394cd1eSFedor Uporov 	}
1569b394cd1eSFedor Uporov 
1570b394cd1eSFedor Uporov 	if (path->ep_header->eh_ecount == 0) {
1571b394cd1eSFedor Uporov 		/*
1572b394cd1eSFedor Uporov 		 * Truncate the tree to zero.
1573b394cd1eSFedor Uporov 		 */
1574b394cd1eSFedor Uporov 		 ext4_ext_header(ip)->eh_depth = 0;
1575b394cd1eSFedor Uporov 		 ext4_ext_header(ip)->eh_max = ext4_ext_space_root(ip);
1576b394cd1eSFedor Uporov 		 ext4_ext_dirty(ip, path);
1577b394cd1eSFedor Uporov 
1578b394cd1eSFedor Uporov 	}
1579b394cd1eSFedor Uporov 
1580b394cd1eSFedor Uporov 	ext4_ext_drop_refs(path);
1581b394cd1eSFedor Uporov 	free(path, M_EXT2EXTENTS);
1582b394cd1eSFedor Uporov 
1583b394cd1eSFedor Uporov 	return (error);
1584d7511a40SPedro F. Giffuni }
1585