xref: /linux/fs/nilfs2/alloc.c (revision e0e53dee69e07e9446eb16ceabd55a1116611696)
1 /*
2  * alloc.c - NILFS dat/inode allocator
3  *
4  * Copyright (C) 2006-2008 Nippon Telegraph and Telephone Corporation.
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License as published by
8  * the Free Software Foundation; either version 2 of the License, or
9  * (at your option) any later version.
10  *
11  * This program is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  * GNU General Public License for more details.
15  *
16  * You should have received a copy of the GNU General Public License
17  * along with this program; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301  USA
19  *
20  * Original code was written by Koji Sato <koji@osrg.net>.
21  * Two allocators were unified by Ryusuke Konishi <ryusuke@osrg.net>,
22  *                                Amagai Yoshiji <amagai@osrg.net>.
23  */
24 
25 #include <linux/types.h>
26 #include <linux/buffer_head.h>
27 #include <linux/fs.h>
28 #include <linux/bitops.h>
29 #include "mdt.h"
30 #include "alloc.h"
31 
32 
33 static inline unsigned long
34 nilfs_palloc_groups_per_desc_block(const struct inode *inode)
35 {
36 	return (1UL << inode->i_blkbits) /
37 		sizeof(struct nilfs_palloc_group_desc);
38 }
39 
40 static inline unsigned long
41 nilfs_palloc_groups_count(const struct inode *inode)
42 {
43 	return 1UL << (BITS_PER_LONG - (inode->i_blkbits + 3 /* log2(8) */));
44 }
45 
46 int nilfs_palloc_init_blockgroup(struct inode *inode, unsigned entry_size)
47 {
48 	struct nilfs_mdt_info *mi = NILFS_MDT(inode);
49 
50 	mi->mi_bgl = kmalloc(sizeof(*mi->mi_bgl), GFP_NOFS);
51 	if (!mi->mi_bgl)
52 		return -ENOMEM;
53 
54 	bgl_lock_init(mi->mi_bgl);
55 
56 	nilfs_mdt_set_entry_size(inode, entry_size, 0);
57 
58 	mi->mi_blocks_per_group =
59 		DIV_ROUND_UP(nilfs_palloc_entries_per_group(inode),
60 			     mi->mi_entries_per_block) + 1;
61 		/* Number of blocks in a group including entry blocks and
62 		   a bitmap block */
63 	mi->mi_blocks_per_desc_block =
64 		nilfs_palloc_groups_per_desc_block(inode) *
65 		mi->mi_blocks_per_group + 1;
66 		/* Number of blocks per descriptor including the
67 		   descriptor block */
68 	return 0;
69 }
70 
71 static unsigned long nilfs_palloc_group(const struct inode *inode, __u64 nr,
72 					unsigned long *offset)
73 {
74 	__u64 group = nr;
75 
76 	*offset = do_div(group, nilfs_palloc_entries_per_group(inode));
77 	return group;
78 }
79 
80 static unsigned long
81 nilfs_palloc_desc_blkoff(const struct inode *inode, unsigned long group)
82 {
83 	unsigned long desc_block =
84 		group / nilfs_palloc_groups_per_desc_block(inode);
85 	return desc_block * NILFS_MDT(inode)->mi_blocks_per_desc_block;
86 }
87 
88 static unsigned long
89 nilfs_palloc_bitmap_blkoff(const struct inode *inode, unsigned long group)
90 {
91 	unsigned long desc_offset =
92 		group % nilfs_palloc_groups_per_desc_block(inode);
93 	return nilfs_palloc_desc_blkoff(inode, group) + 1 +
94 		desc_offset * NILFS_MDT(inode)->mi_blocks_per_group;
95 }
96 
97 static unsigned long
98 nilfs_palloc_group_desc_nfrees(struct inode *inode, unsigned long group,
99 			       const struct nilfs_palloc_group_desc *desc)
100 {
101 	unsigned long nfree;
102 
103 	spin_lock(nilfs_mdt_bgl_lock(inode, group));
104 	nfree = le32_to_cpu(desc->pg_nfrees);
105 	spin_unlock(nilfs_mdt_bgl_lock(inode, group));
106 	return nfree;
107 }
108 
109 static void
110 nilfs_palloc_group_desc_add_entries(struct inode *inode,
111 				    unsigned long group,
112 				    struct nilfs_palloc_group_desc *desc,
113 				    u32 n)
114 {
115 	spin_lock(nilfs_mdt_bgl_lock(inode, group));
116 	le32_add_cpu(&desc->pg_nfrees, n);
117 	spin_unlock(nilfs_mdt_bgl_lock(inode, group));
118 }
119 
120 static unsigned long
121 nilfs_palloc_entry_blkoff(const struct inode *inode, __u64 nr)
122 {
123 	unsigned long group, group_offset;
124 
125 	group = nilfs_palloc_group(inode, nr, &group_offset);
126 
127 	return nilfs_palloc_bitmap_blkoff(inode, group) + 1 +
128 		group_offset / NILFS_MDT(inode)->mi_entries_per_block;
129 }
130 
131 static void nilfs_palloc_desc_block_init(struct inode *inode,
132 					 struct buffer_head *bh, void *kaddr)
133 {
134 	struct nilfs_palloc_group_desc *desc = kaddr + bh_offset(bh);
135 	unsigned long n = nilfs_palloc_groups_per_desc_block(inode);
136 	__le32 nfrees;
137 
138 	nfrees = cpu_to_le32(nilfs_palloc_entries_per_group(inode));
139 	while (n-- > 0) {
140 		desc->pg_nfrees = nfrees;
141 		desc++;
142 	}
143 }
144 
145 static int nilfs_palloc_get_block(struct inode *inode, unsigned long blkoff,
146 				  int create,
147 				  void (*init_block)(struct inode *,
148 						     struct buffer_head *,
149 						     void *),
150 				  struct buffer_head **bhp,
151 				  struct nilfs_bh_assoc *prev,
152 				  spinlock_t *lock)
153 {
154 	int ret;
155 
156 	spin_lock(lock);
157 	if (prev->bh && blkoff == prev->blkoff) {
158 		get_bh(prev->bh);
159 		*bhp = prev->bh;
160 		spin_unlock(lock);
161 		return 0;
162 	}
163 	spin_unlock(lock);
164 
165 	ret = nilfs_mdt_get_block(inode, blkoff, create, init_block, bhp);
166 	if (!ret) {
167 		spin_lock(lock);
168 		/*
169 		 * The following code must be safe for change of the
170 		 * cache contents during the get block call.
171 		 */
172 		brelse(prev->bh);
173 		get_bh(*bhp);
174 		prev->bh = *bhp;
175 		prev->blkoff = blkoff;
176 		spin_unlock(lock);
177 	}
178 	return ret;
179 }
180 
181 static int nilfs_palloc_get_desc_block(struct inode *inode,
182 				       unsigned long group,
183 				       int create, struct buffer_head **bhp)
184 {
185 	struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache;
186 
187 	return nilfs_palloc_get_block(inode,
188 				      nilfs_palloc_desc_blkoff(inode, group),
189 				      create, nilfs_palloc_desc_block_init,
190 				      bhp, &cache->prev_desc, &cache->lock);
191 }
192 
193 static int nilfs_palloc_get_bitmap_block(struct inode *inode,
194 					 unsigned long group,
195 					 int create, struct buffer_head **bhp)
196 {
197 	struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache;
198 
199 	return nilfs_palloc_get_block(inode,
200 				      nilfs_palloc_bitmap_blkoff(inode, group),
201 				      create, NULL, bhp,
202 				      &cache->prev_bitmap, &cache->lock);
203 }
204 
205 int nilfs_palloc_get_entry_block(struct inode *inode, __u64 nr,
206 				 int create, struct buffer_head **bhp)
207 {
208 	struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache;
209 
210 	return nilfs_palloc_get_block(inode,
211 				      nilfs_palloc_entry_blkoff(inode, nr),
212 				      create, NULL, bhp,
213 				      &cache->prev_entry, &cache->lock);
214 }
215 
216 static struct nilfs_palloc_group_desc *
217 nilfs_palloc_block_get_group_desc(const struct inode *inode,
218 				  unsigned long group,
219 				  const struct buffer_head *bh, void *kaddr)
220 {
221 	return (struct nilfs_palloc_group_desc *)(kaddr + bh_offset(bh)) +
222 		group % nilfs_palloc_groups_per_desc_block(inode);
223 }
224 
225 void *nilfs_palloc_block_get_entry(const struct inode *inode, __u64 nr,
226 				   const struct buffer_head *bh, void *kaddr)
227 {
228 	unsigned long entry_offset, group_offset;
229 
230 	nilfs_palloc_group(inode, nr, &group_offset);
231 	entry_offset = group_offset % NILFS_MDT(inode)->mi_entries_per_block;
232 
233 	return kaddr + bh_offset(bh) +
234 		entry_offset * NILFS_MDT(inode)->mi_entry_size;
235 }
236 
/*
 * nilfs_palloc_find_available_slot - find a clear bit in a bitmap and set it
 * @inode: inode of the metadata file (selects the block-group lock)
 * @group: group number (selects the block-group lock)
 * @target: bit position at which the search starts
 * @bitmap: bitmap to search
 * @bsize: size of the bitmap in bits
 *
 * Returns the position of the bit that was set, or -ENOSPC if no clear
 * bit could be taken after visiting every long word of the bitmap.
 */
static int nilfs_palloc_find_available_slot(struct inode *inode,
					    unsigned long group,
					    unsigned long target,
					    unsigned char *bitmap,
					    int bsize)  /* size in bits */
{
	int curr, pos, end, i;

	if (target > 0) {
		/*
		 * First try the bits from target up to the next
		 * BITS_PER_LONG boundary (clamped to bsize).
		 */
		end = (target + BITS_PER_LONG - 1) & ~(BITS_PER_LONG - 1);
		if (end > bsize)
			end = bsize;
		pos = nilfs_find_next_zero_bit(bitmap, end, target);
		/* a zero return from the atomic set is treated as success */
		if (pos < end &&
		    !nilfs_set_bit_atomic(
			    nilfs_mdt_bgl_lock(inode, group), pos, bitmap))
			return pos;
	} else
		end = 0;

	/*
	 * Then walk the bitmap one long word at a time, starting at the
	 * word boundary computed above; i counts the bits covered so the
	 * walk stops after bsize bits' worth of words.
	 */
	for (i = 0, curr = end;
	     i < bsize;
	     i += BITS_PER_LONG, curr += BITS_PER_LONG) {
		/* wrap around */
		if (curr >= bsize)
			curr = 0;
		/*
		 * Keep retrying within this word while it is not all ones;
		 * a failed atomic set (presumably the bit was taken in the
		 * meantime - confirm against nilfs_set_bit_atomic) simply
		 * leads to another search of the same word.
		 */
		while (*((unsigned long *)bitmap + curr / BITS_PER_LONG)
		       != ~0UL) {
			end = curr + BITS_PER_LONG;
			if (end > bsize)
				end = bsize;
			pos = nilfs_find_next_zero_bit(bitmap, end, curr);
			if ((pos < end) &&
			    !nilfs_set_bit_atomic(
				    nilfs_mdt_bgl_lock(inode, group), pos,
				    bitmap))
				return pos;
		}
	}
	return -ENOSPC;
}
278 
279 static unsigned long
280 nilfs_palloc_rest_groups_in_desc_block(const struct inode *inode,
281 				       unsigned long curr, unsigned long max)
282 {
283 	return min_t(unsigned long,
284 		     nilfs_palloc_groups_per_desc_block(inode) -
285 		     curr % nilfs_palloc_groups_per_desc_block(inode),
286 		     max - curr + 1);
287 }
288 
289 int nilfs_palloc_prepare_alloc_entry(struct inode *inode,
290 				     struct nilfs_palloc_req *req)
291 {
292 	struct buffer_head *desc_bh, *bitmap_bh;
293 	struct nilfs_palloc_group_desc *desc;
294 	unsigned char *bitmap;
295 	void *desc_kaddr, *bitmap_kaddr;
296 	unsigned long group, maxgroup, ngroups;
297 	unsigned long group_offset, maxgroup_offset;
298 	unsigned long n, entries_per_group, groups_per_desc_block;
299 	unsigned long i, j;
300 	int pos, ret;
301 
302 	ngroups = nilfs_palloc_groups_count(inode);
303 	maxgroup = ngroups - 1;
304 	group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset);
305 	entries_per_group = nilfs_palloc_entries_per_group(inode);
306 	groups_per_desc_block = nilfs_palloc_groups_per_desc_block(inode);
307 
308 	for (i = 0; i < ngroups; i += n) {
309 		if (group >= ngroups) {
310 			/* wrap around */
311 			group = 0;
312 			maxgroup = nilfs_palloc_group(inode, req->pr_entry_nr,
313 						      &maxgroup_offset) - 1;
314 		}
315 		ret = nilfs_palloc_get_desc_block(inode, group, 1, &desc_bh);
316 		if (ret < 0)
317 			return ret;
318 		desc_kaddr = kmap(desc_bh->b_page);
319 		desc = nilfs_palloc_block_get_group_desc(
320 			inode, group, desc_bh, desc_kaddr);
321 		n = nilfs_palloc_rest_groups_in_desc_block(inode, group,
322 							   maxgroup);
323 		for (j = 0; j < n; j++, desc++, group++) {
324 			if (nilfs_palloc_group_desc_nfrees(inode, group, desc)
325 			    > 0) {
326 				ret = nilfs_palloc_get_bitmap_block(
327 					inode, group, 1, &bitmap_bh);
328 				if (ret < 0)
329 					goto out_desc;
330 				bitmap_kaddr = kmap(bitmap_bh->b_page);
331 				bitmap = bitmap_kaddr + bh_offset(bitmap_bh);
332 				pos = nilfs_palloc_find_available_slot(
333 					inode, group, group_offset, bitmap,
334 					entries_per_group);
335 				if (pos >= 0) {
336 					/* found a free entry */
337 					nilfs_palloc_group_desc_add_entries(
338 						inode, group, desc, -1);
339 					req->pr_entry_nr =
340 						entries_per_group * group + pos;
341 					kunmap(desc_bh->b_page);
342 					kunmap(bitmap_bh->b_page);
343 
344 					req->pr_desc_bh = desc_bh;
345 					req->pr_bitmap_bh = bitmap_bh;
346 					return 0;
347 				}
348 				kunmap(bitmap_bh->b_page);
349 				brelse(bitmap_bh);
350 			}
351 
352 			group_offset = 0;
353 		}
354 
355 		kunmap(desc_bh->b_page);
356 		brelse(desc_bh);
357 	}
358 
359 	/* no entries left */
360 	return -ENOSPC;
361 
362  out_desc:
363 	kunmap(desc_bh->b_page);
364 	brelse(desc_bh);
365 	return ret;
366 }
367 
368 void nilfs_palloc_commit_alloc_entry(struct inode *inode,
369 				     struct nilfs_palloc_req *req)
370 {
371 	nilfs_mdt_mark_buffer_dirty(req->pr_bitmap_bh);
372 	nilfs_mdt_mark_buffer_dirty(req->pr_desc_bh);
373 	nilfs_mdt_mark_dirty(inode);
374 
375 	brelse(req->pr_bitmap_bh);
376 	brelse(req->pr_desc_bh);
377 }
378 
379 void nilfs_palloc_commit_free_entry(struct inode *inode,
380 				    struct nilfs_palloc_req *req)
381 {
382 	struct nilfs_palloc_group_desc *desc;
383 	unsigned long group, group_offset;
384 	unsigned char *bitmap;
385 	void *desc_kaddr, *bitmap_kaddr;
386 
387 	group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset);
388 	desc_kaddr = kmap(req->pr_desc_bh->b_page);
389 	desc = nilfs_palloc_block_get_group_desc(inode, group,
390 						 req->pr_desc_bh, desc_kaddr);
391 	bitmap_kaddr = kmap(req->pr_bitmap_bh->b_page);
392 	bitmap = bitmap_kaddr + bh_offset(req->pr_bitmap_bh);
393 
394 	if (!nilfs_clear_bit_atomic(nilfs_mdt_bgl_lock(inode, group),
395 				    group_offset, bitmap))
396 		printk(KERN_WARNING "%s: entry number %llu already freed\n",
397 		       __func__, (unsigned long long)req->pr_entry_nr);
398 
399 	nilfs_palloc_group_desc_add_entries(inode, group, desc, 1);
400 
401 	kunmap(req->pr_bitmap_bh->b_page);
402 	kunmap(req->pr_desc_bh->b_page);
403 
404 	nilfs_mdt_mark_buffer_dirty(req->pr_desc_bh);
405 	nilfs_mdt_mark_buffer_dirty(req->pr_bitmap_bh);
406 	nilfs_mdt_mark_dirty(inode);
407 
408 	brelse(req->pr_bitmap_bh);
409 	brelse(req->pr_desc_bh);
410 }
411 
412 void nilfs_palloc_abort_alloc_entry(struct inode *inode,
413 				    struct nilfs_palloc_req *req)
414 {
415 	struct nilfs_palloc_group_desc *desc;
416 	void *desc_kaddr, *bitmap_kaddr;
417 	unsigned char *bitmap;
418 	unsigned long group, group_offset;
419 
420 	group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset);
421 	desc_kaddr = kmap(req->pr_desc_bh->b_page);
422 	desc = nilfs_palloc_block_get_group_desc(inode, group,
423 						 req->pr_desc_bh, desc_kaddr);
424 	bitmap_kaddr = kmap(req->pr_bitmap_bh->b_page);
425 	bitmap = bitmap_kaddr + bh_offset(req->pr_bitmap_bh);
426 	if (!nilfs_clear_bit_atomic(nilfs_mdt_bgl_lock(inode, group),
427 				    group_offset, bitmap))
428 		printk(KERN_WARNING "%s: entry numer %llu already freed\n",
429 		       __func__, (unsigned long long)req->pr_entry_nr);
430 
431 	nilfs_palloc_group_desc_add_entries(inode, group, desc, 1);
432 
433 	kunmap(req->pr_bitmap_bh->b_page);
434 	kunmap(req->pr_desc_bh->b_page);
435 
436 	brelse(req->pr_bitmap_bh);
437 	brelse(req->pr_desc_bh);
438 
439 	req->pr_entry_nr = 0;
440 	req->pr_bitmap_bh = NULL;
441 	req->pr_desc_bh = NULL;
442 }
443 
444 int nilfs_palloc_prepare_free_entry(struct inode *inode,
445 				    struct nilfs_palloc_req *req)
446 {
447 	struct buffer_head *desc_bh, *bitmap_bh;
448 	unsigned long group, group_offset;
449 	int ret;
450 
451 	group = nilfs_palloc_group(inode, req->pr_entry_nr, &group_offset);
452 	ret = nilfs_palloc_get_desc_block(inode, group, 1, &desc_bh);
453 	if (ret < 0)
454 		return ret;
455 	ret = nilfs_palloc_get_bitmap_block(inode, group, 1, &bitmap_bh);
456 	if (ret < 0) {
457 		brelse(desc_bh);
458 		return ret;
459 	}
460 
461 	req->pr_desc_bh = desc_bh;
462 	req->pr_bitmap_bh = bitmap_bh;
463 	return 0;
464 }
465 
466 void nilfs_palloc_abort_free_entry(struct inode *inode,
467 				   struct nilfs_palloc_req *req)
468 {
469 	brelse(req->pr_bitmap_bh);
470 	brelse(req->pr_desc_bh);
471 
472 	req->pr_entry_nr = 0;
473 	req->pr_bitmap_bh = NULL;
474 	req->pr_desc_bh = NULL;
475 }
476 
477 static int
478 nilfs_palloc_group_is_in(struct inode *inode, unsigned long group, __u64 nr)
479 {
480 	__u64 first, last;
481 
482 	first = group * nilfs_palloc_entries_per_group(inode);
483 	last = first + nilfs_palloc_entries_per_group(inode) - 1;
484 	return (nr >= first) && (nr <= last);
485 }
486 
487 int nilfs_palloc_freev(struct inode *inode, __u64 *entry_nrs, size_t nitems)
488 {
489 	struct buffer_head *desc_bh, *bitmap_bh;
490 	struct nilfs_palloc_group_desc *desc;
491 	unsigned char *bitmap;
492 	void *desc_kaddr, *bitmap_kaddr;
493 	unsigned long group, group_offset;
494 	int i, j, n, ret;
495 
496 	for (i = 0; i < nitems; i += n) {
497 		group = nilfs_palloc_group(inode, entry_nrs[i], &group_offset);
498 		ret = nilfs_palloc_get_desc_block(inode, group, 0, &desc_bh);
499 		if (ret < 0)
500 			return ret;
501 		ret = nilfs_palloc_get_bitmap_block(inode, group, 0,
502 						    &bitmap_bh);
503 		if (ret < 0) {
504 			brelse(desc_bh);
505 			return ret;
506 		}
507 		desc_kaddr = kmap(desc_bh->b_page);
508 		desc = nilfs_palloc_block_get_group_desc(
509 			inode, group, desc_bh, desc_kaddr);
510 		bitmap_kaddr = kmap(bitmap_bh->b_page);
511 		bitmap = bitmap_kaddr + bh_offset(bitmap_bh);
512 		for (j = i, n = 0;
513 		     (j < nitems) && nilfs_palloc_group_is_in(inode, group,
514 							      entry_nrs[j]);
515 		     j++, n++) {
516 			nilfs_palloc_group(inode, entry_nrs[j], &group_offset);
517 			if (!nilfs_clear_bit_atomic(
518 				    nilfs_mdt_bgl_lock(inode, group),
519 				    group_offset, bitmap)) {
520 				printk(KERN_WARNING
521 				       "%s: entry number %llu already freed\n",
522 				       __func__,
523 				       (unsigned long long)entry_nrs[j]);
524 			}
525 		}
526 		nilfs_palloc_group_desc_add_entries(inode, group, desc, n);
527 
528 		kunmap(bitmap_bh->b_page);
529 		kunmap(desc_bh->b_page);
530 
531 		nilfs_mdt_mark_buffer_dirty(desc_bh);
532 		nilfs_mdt_mark_buffer_dirty(bitmap_bh);
533 		nilfs_mdt_mark_dirty(inode);
534 
535 		brelse(bitmap_bh);
536 		brelse(desc_bh);
537 	}
538 	return 0;
539 }
540 
541 void nilfs_palloc_setup_cache(struct inode *inode,
542 			      struct nilfs_palloc_cache *cache)
543 {
544 	NILFS_MDT(inode)->mi_palloc_cache = cache;
545 	spin_lock_init(&cache->lock);
546 }
547 
548 void nilfs_palloc_clear_cache(struct inode *inode)
549 {
550 	struct nilfs_palloc_cache *cache = NILFS_MDT(inode)->mi_palloc_cache;
551 
552 	spin_lock(&cache->lock);
553 	brelse(cache->prev_desc.bh);
554 	brelse(cache->prev_bitmap.bh);
555 	brelse(cache->prev_entry.bh);
556 	cache->prev_desc.bh = NULL;
557 	cache->prev_bitmap.bh = NULL;
558 	cache->prev_entry.bh = NULL;
559 	spin_unlock(&cache->lock);
560 }
561 
562 void nilfs_palloc_destroy_cache(struct inode *inode)
563 {
564 	nilfs_palloc_clear_cache(inode);
565 	NILFS_MDT(inode)->mi_palloc_cache = NULL;
566 }
567