xref: /freebsd/sys/kern/vfs_hash.c (revision cd85d599d83f202202e03c0bdf49ac613b640831)
16c325a2aSPoul-Henning Kamp /*-
26c325a2aSPoul-Henning Kamp  * Copyright (c) 2005 Poul-Henning Kamp
36c325a2aSPoul-Henning Kamp  * All rights reserved.
46c325a2aSPoul-Henning Kamp  *
56c325a2aSPoul-Henning Kamp  * Redistribution and use in source and binary forms, with or without
66c325a2aSPoul-Henning Kamp  * modification, are permitted provided that the following conditions
76c325a2aSPoul-Henning Kamp  * are met:
86c325a2aSPoul-Henning Kamp  * 1. Redistributions of source code must retain the above copyright
96c325a2aSPoul-Henning Kamp  *    notice, this list of conditions and the following disclaimer.
106c325a2aSPoul-Henning Kamp  * 2. Redistributions in binary form must reproduce the above copyright
116c325a2aSPoul-Henning Kamp  *    notice, this list of conditions and the following disclaimer in the
126c325a2aSPoul-Henning Kamp  *    documentation and/or other materials provided with the distribution.
136c325a2aSPoul-Henning Kamp  *
146c325a2aSPoul-Henning Kamp  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
156c325a2aSPoul-Henning Kamp  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
166c325a2aSPoul-Henning Kamp  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
176c325a2aSPoul-Henning Kamp  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
186c325a2aSPoul-Henning Kamp  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
196c325a2aSPoul-Henning Kamp  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
206c325a2aSPoul-Henning Kamp  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
216c325a2aSPoul-Henning Kamp  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
226c325a2aSPoul-Henning Kamp  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
236c325a2aSPoul-Henning Kamp  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
246c325a2aSPoul-Henning Kamp  * SUCH DAMAGE.
256c325a2aSPoul-Henning Kamp  *
266c325a2aSPoul-Henning Kamp  */
276c325a2aSPoul-Henning Kamp 
286c325a2aSPoul-Henning Kamp #include <sys/cdefs.h>
296c325a2aSPoul-Henning Kamp __FBSDID("$FreeBSD$");
306c325a2aSPoul-Henning Kamp 
316c325a2aSPoul-Henning Kamp #include <sys/param.h>
326c325a2aSPoul-Henning Kamp #include <sys/systm.h>
336c325a2aSPoul-Henning Kamp #include <sys/kernel.h>
346c325a2aSPoul-Henning Kamp #include <sys/malloc.h>
3578bb3c21SPoul-Henning Kamp #include <sys/mount.h>
36af77c1a6SMateusz Guzik #include <sys/rwlock.h>
376c325a2aSPoul-Henning Kamp #include <sys/vnode.h>
386c325a2aSPoul-Henning Kamp 
395bb84bc8SRobert Watson static MALLOC_DEFINE(M_VFS_HASH, "vfs_hash", "VFS hash table");
406c325a2aSPoul-Henning Kamp 
4178bb3c21SPoul-Henning Kamp static LIST_HEAD(vfs_hash_head, vnode)	*vfs_hash_tbl;
4278bb3c21SPoul-Henning Kamp static LIST_HEAD(,vnode)		vfs_hash_side;
436c325a2aSPoul-Henning Kamp static u_long				vfs_hash_mask;
44af77c1a6SMateusz Guzik static struct rwlock			vfs_hash_lock;
456c325a2aSPoul-Henning Kamp 
466c325a2aSPoul-Henning Kamp static void
476c325a2aSPoul-Henning Kamp vfs_hashinit(void *dummy __unused)
486c325a2aSPoul-Henning Kamp {
496c325a2aSPoul-Henning Kamp 
506c325a2aSPoul-Henning Kamp 	vfs_hash_tbl = hashinit(desiredvnodes, M_VFS_HASH, &vfs_hash_mask);
51af77c1a6SMateusz Guzik 	rw_init(&vfs_hash_lock, "vfs hash");
5278bb3c21SPoul-Henning Kamp 	LIST_INIT(&vfs_hash_side);
536c325a2aSPoul-Henning Kamp }
546c325a2aSPoul-Henning Kamp 
556c325a2aSPoul-Henning Kamp /* Must be SI_ORDER_SECOND so desiredvnodes is available */
56237fdd78SRobert Watson SYSINIT(vfs_hash, SI_SUB_VFS, SI_ORDER_SECOND, vfs_hashinit, NULL);
576c325a2aSPoul-Henning Kamp 
58f6af8e37SKonstantin Belousov u_int
59f6af8e37SKonstantin Belousov vfs_hash_index(struct vnode *vp)
60f6af8e37SKonstantin Belousov {
61f6af8e37SKonstantin Belousov 
62f6af8e37SKonstantin Belousov 	return (vp->v_hash + vp->v_mount->mnt_hashseed);
63f6af8e37SKonstantin Belousov }
64f6af8e37SKonstantin Belousov 
6578bb3c21SPoul-Henning Kamp static struct vfs_hash_head *
667b982bc8SKonstantin Belousov vfs_hash_bucket(const struct mount *mp, u_int hash)
6778bb3c21SPoul-Henning Kamp {
6878bb3c21SPoul-Henning Kamp 
6978bb3c21SPoul-Henning Kamp 	return (&vfs_hash_tbl[(hash + mp->mnt_hashseed) & vfs_hash_mask]);
7078bb3c21SPoul-Henning Kamp }
7178bb3c21SPoul-Henning Kamp 
726c325a2aSPoul-Henning Kamp int
73*cd85d599SKonstantin Belousov vfs_hash_get(const struct mount *mp, u_int hash, int flags, struct thread *td,
74*cd85d599SKonstantin Belousov     struct vnode **vpp, vfs_hash_cmp_t *fn, void *arg)
756c325a2aSPoul-Henning Kamp {
766c325a2aSPoul-Henning Kamp 	struct vnode *vp;
776c325a2aSPoul-Henning Kamp 	int error;
786c325a2aSPoul-Henning Kamp 
796c325a2aSPoul-Henning Kamp 	while (1) {
80af77c1a6SMateusz Guzik 		rw_rlock(&vfs_hash_lock);
817b982bc8SKonstantin Belousov 		LIST_FOREACH(vp, vfs_hash_bucket(mp, hash), v_hashlist) {
826c325a2aSPoul-Henning Kamp 			if (vp->v_hash != hash)
836c325a2aSPoul-Henning Kamp 				continue;
846c325a2aSPoul-Henning Kamp 			if (vp->v_mount != mp)
856c325a2aSPoul-Henning Kamp 				continue;
8651f5ce0cSPoul-Henning Kamp 			if (fn != NULL && fn(vp, arg))
8751f5ce0cSPoul-Henning Kamp 				continue;
88752fc07dSMateusz Guzik 			vhold(vp);
89af77c1a6SMateusz Guzik 			rw_runlock(&vfs_hash_lock);
90752fc07dSMateusz Guzik 			error = vget(vp, flags | LK_VNHELD, td);
916ff5e2dbSTor Egge 			if (error == ENOENT && (flags & LK_NOWAIT) == 0)
926c325a2aSPoul-Henning Kamp 				break;
936c325a2aSPoul-Henning Kamp 			if (error)
946c325a2aSPoul-Henning Kamp 				return (error);
956c325a2aSPoul-Henning Kamp 			*vpp = vp;
966c325a2aSPoul-Henning Kamp 			return (0);
976c325a2aSPoul-Henning Kamp 		}
986c325a2aSPoul-Henning Kamp 		if (vp == NULL) {
99af77c1a6SMateusz Guzik 			rw_runlock(&vfs_hash_lock);
1006c325a2aSPoul-Henning Kamp 			*vpp = NULL;
1016c325a2aSPoul-Henning Kamp 			return (0);
1026c325a2aSPoul-Henning Kamp 		}
1036c325a2aSPoul-Henning Kamp 	}
1046c325a2aSPoul-Henning Kamp }
1056c325a2aSPoul-Henning Kamp 
1066c325a2aSPoul-Henning Kamp void
1076c325a2aSPoul-Henning Kamp vfs_hash_remove(struct vnode *vp)
1086c325a2aSPoul-Henning Kamp {
1096c325a2aSPoul-Henning Kamp 
110af77c1a6SMateusz Guzik 	rw_wlock(&vfs_hash_lock);
1116c325a2aSPoul-Henning Kamp 	LIST_REMOVE(vp, v_hashlist);
112af77c1a6SMateusz Guzik 	rw_wunlock(&vfs_hash_lock);
1136c325a2aSPoul-Henning Kamp }
1146c325a2aSPoul-Henning Kamp 
1156c325a2aSPoul-Henning Kamp int
116*cd85d599SKonstantin Belousov vfs_hash_insert(struct vnode *vp, u_int hash, int flags, struct thread *td,
117*cd85d599SKonstantin Belousov     struct vnode **vpp, vfs_hash_cmp_t *fn, void *arg)
1186c325a2aSPoul-Henning Kamp {
1196c325a2aSPoul-Henning Kamp 	struct vnode *vp2;
1206c325a2aSPoul-Henning Kamp 	int error;
1216c325a2aSPoul-Henning Kamp 
122e82ef95cSPoul-Henning Kamp 	*vpp = NULL;
1236c325a2aSPoul-Henning Kamp 	while (1) {
124af77c1a6SMateusz Guzik 		rw_wlock(&vfs_hash_lock);
1256c325a2aSPoul-Henning Kamp 		LIST_FOREACH(vp2,
1267b982bc8SKonstantin Belousov 		    vfs_hash_bucket(vp->v_mount, hash), v_hashlist) {
1276c325a2aSPoul-Henning Kamp 			if (vp2->v_hash != hash)
1286c325a2aSPoul-Henning Kamp 				continue;
1296c325a2aSPoul-Henning Kamp 			if (vp2->v_mount != vp->v_mount)
1306c325a2aSPoul-Henning Kamp 				continue;
131a1e1d551SPoul-Henning Kamp 			if (fn != NULL && fn(vp2, arg))
13251f5ce0cSPoul-Henning Kamp 				continue;
133752fc07dSMateusz Guzik 			vhold(vp2);
134af77c1a6SMateusz Guzik 			rw_wunlock(&vfs_hash_lock);
135752fc07dSMateusz Guzik 			error = vget(vp2, flags | LK_VNHELD, td);
1366ff5e2dbSTor Egge 			if (error == ENOENT && (flags & LK_NOWAIT) == 0)
1376c325a2aSPoul-Henning Kamp 				break;
138af77c1a6SMateusz Guzik 			rw_wlock(&vfs_hash_lock);
13978bb3c21SPoul-Henning Kamp 			LIST_INSERT_HEAD(&vfs_hash_side, vp, v_hashlist);
140af77c1a6SMateusz Guzik 			rw_wunlock(&vfs_hash_lock);
14145c26fa2SPoul-Henning Kamp 			vput(vp);
14245c26fa2SPoul-Henning Kamp 			if (!error)
1436c325a2aSPoul-Henning Kamp 				*vpp = vp2;
14445c26fa2SPoul-Henning Kamp 			return (error);
1456c325a2aSPoul-Henning Kamp 		}
1466c325a2aSPoul-Henning Kamp 		if (vp2 == NULL)
1476c325a2aSPoul-Henning Kamp 			break;
1486c325a2aSPoul-Henning Kamp 
1496c325a2aSPoul-Henning Kamp 	}
1506c325a2aSPoul-Henning Kamp 	vp->v_hash = hash;
1517b982bc8SKonstantin Belousov 	LIST_INSERT_HEAD(vfs_hash_bucket(vp->v_mount, hash), vp, v_hashlist);
152af77c1a6SMateusz Guzik 	rw_wunlock(&vfs_hash_lock);
1536c325a2aSPoul-Henning Kamp 	return (0);
1546c325a2aSPoul-Henning Kamp }
1556c325a2aSPoul-Henning Kamp 
1566c325a2aSPoul-Henning Kamp void
1576c325a2aSPoul-Henning Kamp vfs_hash_rehash(struct vnode *vp, u_int hash)
1586c325a2aSPoul-Henning Kamp {
1596c325a2aSPoul-Henning Kamp 
160af77c1a6SMateusz Guzik 	rw_wlock(&vfs_hash_lock);
1616c325a2aSPoul-Henning Kamp 	LIST_REMOVE(vp, v_hashlist);
1627b982bc8SKonstantin Belousov 	LIST_INSERT_HEAD(vfs_hash_bucket(vp->v_mount, hash), vp, v_hashlist);
1636c325a2aSPoul-Henning Kamp 	vp->v_hash = hash;
164af77c1a6SMateusz Guzik 	rw_wunlock(&vfs_hash_lock);
1656c325a2aSPoul-Henning Kamp }
16617518b1aSKirk McKusick 
16717518b1aSKirk McKusick void
16817518b1aSKirk McKusick vfs_hash_changesize(int newmaxvnodes)
16917518b1aSKirk McKusick {
17017518b1aSKirk McKusick 	struct vfs_hash_head *vfs_hash_newtbl, *vfs_hash_oldtbl;
17117518b1aSKirk McKusick 	u_long vfs_hash_newmask, vfs_hash_oldmask;
17217518b1aSKirk McKusick 	struct vnode *vp;
17317518b1aSKirk McKusick 	int i;
17417518b1aSKirk McKusick 
17517518b1aSKirk McKusick 	vfs_hash_newtbl = hashinit(newmaxvnodes, M_VFS_HASH,
17617518b1aSKirk McKusick 		&vfs_hash_newmask);
17717518b1aSKirk McKusick 	/* If same hash table size, nothing to do */
17817518b1aSKirk McKusick 	if (vfs_hash_mask == vfs_hash_newmask) {
17917518b1aSKirk McKusick 		free(vfs_hash_newtbl, M_VFS_HASH);
18017518b1aSKirk McKusick 		return;
18117518b1aSKirk McKusick 	}
18217518b1aSKirk McKusick 	/*
18317518b1aSKirk McKusick 	 * Move everything from the old hash table to the new table.
18417518b1aSKirk McKusick 	 * None of the vnodes in the table can be recycled because to
18517518b1aSKirk McKusick 	 * do so, they have to be removed from the hash table.
18617518b1aSKirk McKusick 	 */
18717518b1aSKirk McKusick 	rw_wlock(&vfs_hash_lock);
18817518b1aSKirk McKusick 	vfs_hash_oldtbl = vfs_hash_tbl;
18917518b1aSKirk McKusick 	vfs_hash_oldmask = vfs_hash_mask;
19017518b1aSKirk McKusick 	vfs_hash_tbl = vfs_hash_newtbl;
19117518b1aSKirk McKusick 	vfs_hash_mask = vfs_hash_newmask;
19217518b1aSKirk McKusick 	for (i = 0; i <= vfs_hash_oldmask; i++) {
19317518b1aSKirk McKusick 		while ((vp = LIST_FIRST(&vfs_hash_oldtbl[i])) != NULL) {
19417518b1aSKirk McKusick 			LIST_REMOVE(vp, v_hashlist);
19517518b1aSKirk McKusick 			LIST_INSERT_HEAD(
19617518b1aSKirk McKusick 			    vfs_hash_bucket(vp->v_mount, vp->v_hash),
19717518b1aSKirk McKusick 			    vp, v_hashlist);
19817518b1aSKirk McKusick 		}
19917518b1aSKirk McKusick 	}
20017518b1aSKirk McKusick 	rw_wunlock(&vfs_hash_lock);
20117518b1aSKirk McKusick 	free(vfs_hash_oldtbl, M_VFS_HASH);
20217518b1aSKirk McKusick }
203