xref: /freebsd/sys/kern/vfs_hash.c (revision 4d846d260e2b9a3d4d0a701462568268cbfe7a5b)
/*-
 * SPDX-License-Identifier: BSD-2-Clause
 *
 * Copyright (c) 2005 Poul-Henning Kamp
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 */
296c325a2aSPoul-Henning Kamp 
306c325a2aSPoul-Henning Kamp #include <sys/cdefs.h>
316c325a2aSPoul-Henning Kamp __FBSDID("$FreeBSD$");
326c325a2aSPoul-Henning Kamp 
336c325a2aSPoul-Henning Kamp #include <sys/param.h>
346c325a2aSPoul-Henning Kamp #include <sys/systm.h>
356c325a2aSPoul-Henning Kamp #include <sys/kernel.h>
366c325a2aSPoul-Henning Kamp #include <sys/malloc.h>
3778bb3c21SPoul-Henning Kamp #include <sys/mount.h>
38af77c1a6SMateusz Guzik #include <sys/rwlock.h>
396c325a2aSPoul-Henning Kamp #include <sys/vnode.h>
406c325a2aSPoul-Henning Kamp 
415bb84bc8SRobert Watson static MALLOC_DEFINE(M_VFS_HASH, "vfs_hash", "VFS hash table");
426c325a2aSPoul-Henning Kamp 
4378bb3c21SPoul-Henning Kamp static LIST_HEAD(vfs_hash_head, vnode)	*vfs_hash_tbl;
4478bb3c21SPoul-Henning Kamp static LIST_HEAD(,vnode)		vfs_hash_side;
456c325a2aSPoul-Henning Kamp static u_long				vfs_hash_mask;
46bb62c418SMateusz Guzik static struct rwlock __exclusive_cache_line vfs_hash_lock;
476c325a2aSPoul-Henning Kamp 
486c325a2aSPoul-Henning Kamp static void
496c325a2aSPoul-Henning Kamp vfs_hashinit(void *dummy __unused)
506c325a2aSPoul-Henning Kamp {
516c325a2aSPoul-Henning Kamp 
526c325a2aSPoul-Henning Kamp 	vfs_hash_tbl = hashinit(desiredvnodes, M_VFS_HASH, &vfs_hash_mask);
53af77c1a6SMateusz Guzik 	rw_init(&vfs_hash_lock, "vfs hash");
5478bb3c21SPoul-Henning Kamp 	LIST_INIT(&vfs_hash_side);
556c325a2aSPoul-Henning Kamp }
566c325a2aSPoul-Henning Kamp 
576c325a2aSPoul-Henning Kamp /* Must be SI_ORDER_SECOND so desiredvnodes is available */
58237fdd78SRobert Watson SYSINIT(vfs_hash, SI_SUB_VFS, SI_ORDER_SECOND, vfs_hashinit, NULL);
596c325a2aSPoul-Henning Kamp 
60f6af8e37SKonstantin Belousov u_int
61f6af8e37SKonstantin Belousov vfs_hash_index(struct vnode *vp)
62f6af8e37SKonstantin Belousov {
63f6af8e37SKonstantin Belousov 
64f6af8e37SKonstantin Belousov 	return (vp->v_hash + vp->v_mount->mnt_hashseed);
65f6af8e37SKonstantin Belousov }
66f6af8e37SKonstantin Belousov 
6778bb3c21SPoul-Henning Kamp static struct vfs_hash_head *
687b982bc8SKonstantin Belousov vfs_hash_bucket(const struct mount *mp, u_int hash)
6978bb3c21SPoul-Henning Kamp {
7078bb3c21SPoul-Henning Kamp 
7178bb3c21SPoul-Henning Kamp 	return (&vfs_hash_tbl[(hash + mp->mnt_hashseed) & vfs_hash_mask]);
7278bb3c21SPoul-Henning Kamp }
7378bb3c21SPoul-Henning Kamp 
746c325a2aSPoul-Henning Kamp int
75cd85d599SKonstantin Belousov vfs_hash_get(const struct mount *mp, u_int hash, int flags, struct thread *td,
76cd85d599SKonstantin Belousov     struct vnode **vpp, vfs_hash_cmp_t *fn, void *arg)
776c325a2aSPoul-Henning Kamp {
786c325a2aSPoul-Henning Kamp 	struct vnode *vp;
79e3c3248cSMateusz Guzik 	enum vgetstate vs;
806c325a2aSPoul-Henning Kamp 	int error;
816c325a2aSPoul-Henning Kamp 
826c325a2aSPoul-Henning Kamp 	while (1) {
83af77c1a6SMateusz Guzik 		rw_rlock(&vfs_hash_lock);
847b982bc8SKonstantin Belousov 		LIST_FOREACH(vp, vfs_hash_bucket(mp, hash), v_hashlist) {
856c325a2aSPoul-Henning Kamp 			if (vp->v_hash != hash)
866c325a2aSPoul-Henning Kamp 				continue;
876c325a2aSPoul-Henning Kamp 			if (vp->v_mount != mp)
886c325a2aSPoul-Henning Kamp 				continue;
8951f5ce0cSPoul-Henning Kamp 			if (fn != NULL && fn(vp, arg))
9051f5ce0cSPoul-Henning Kamp 				continue;
91e3c3248cSMateusz Guzik 			vs = vget_prep(vp);
92af77c1a6SMateusz Guzik 			rw_runlock(&vfs_hash_lock);
93e3c3248cSMateusz Guzik 			error = vget_finish(vp, flags, vs);
946ff5e2dbSTor Egge 			if (error == ENOENT && (flags & LK_NOWAIT) == 0)
956c325a2aSPoul-Henning Kamp 				break;
967c1e4aabSKonstantin Belousov 			if (error != 0)
976c325a2aSPoul-Henning Kamp 				return (error);
987c1e4aabSKonstantin Belousov 			if (vp->v_hash != hash ||
997c1e4aabSKonstantin Belousov 			    (fn != NULL && fn(vp, arg))) {
1007c1e4aabSKonstantin Belousov 				vput(vp);
1017c1e4aabSKonstantin Belousov 				/* Restart the bucket walk. */
1027c1e4aabSKonstantin Belousov 				break;
1037c1e4aabSKonstantin Belousov 			}
1046c325a2aSPoul-Henning Kamp 			*vpp = vp;
1056c325a2aSPoul-Henning Kamp 			return (0);
1066c325a2aSPoul-Henning Kamp 		}
1076c325a2aSPoul-Henning Kamp 		if (vp == NULL) {
108af77c1a6SMateusz Guzik 			rw_runlock(&vfs_hash_lock);
1096c325a2aSPoul-Henning Kamp 			*vpp = NULL;
1106c325a2aSPoul-Henning Kamp 			return (0);
1116c325a2aSPoul-Henning Kamp 		}
1126c325a2aSPoul-Henning Kamp 	}
1136c325a2aSPoul-Henning Kamp }
1146c325a2aSPoul-Henning Kamp 
1156c325a2aSPoul-Henning Kamp void
11654a33d2fSKonstantin Belousov vfs_hash_ref(const struct mount *mp, u_int hash, struct thread *td,
11754a33d2fSKonstantin Belousov     struct vnode **vpp, vfs_hash_cmp_t *fn, void *arg)
11854a33d2fSKonstantin Belousov {
11954a33d2fSKonstantin Belousov 	struct vnode *vp;
12054a33d2fSKonstantin Belousov 
12154a33d2fSKonstantin Belousov 	while (1) {
12254a33d2fSKonstantin Belousov 		rw_rlock(&vfs_hash_lock);
12354a33d2fSKonstantin Belousov 		LIST_FOREACH(vp, vfs_hash_bucket(mp, hash), v_hashlist) {
12454a33d2fSKonstantin Belousov 			if (vp->v_hash != hash)
12554a33d2fSKonstantin Belousov 				continue;
12654a33d2fSKonstantin Belousov 			if (vp->v_mount != mp)
12754a33d2fSKonstantin Belousov 				continue;
12854a33d2fSKonstantin Belousov 			if (fn != NULL && fn(vp, arg))
12954a33d2fSKonstantin Belousov 				continue;
13054a33d2fSKonstantin Belousov 			vhold(vp);
13154a33d2fSKonstantin Belousov 			rw_runlock(&vfs_hash_lock);
13254a33d2fSKonstantin Belousov 			vref(vp);
13354a33d2fSKonstantin Belousov 			vdrop(vp);
13454a33d2fSKonstantin Belousov 			*vpp = vp;
13554a33d2fSKonstantin Belousov 			return;
13654a33d2fSKonstantin Belousov 		}
13754a33d2fSKonstantin Belousov 		if (vp == NULL) {
13854a33d2fSKonstantin Belousov 			rw_runlock(&vfs_hash_lock);
13954a33d2fSKonstantin Belousov 			*vpp = NULL;
14054a33d2fSKonstantin Belousov 			return;
14154a33d2fSKonstantin Belousov 		}
14254a33d2fSKonstantin Belousov 	}
14354a33d2fSKonstantin Belousov }
14454a33d2fSKonstantin Belousov 
14554a33d2fSKonstantin Belousov void
1466c325a2aSPoul-Henning Kamp vfs_hash_remove(struct vnode *vp)
1476c325a2aSPoul-Henning Kamp {
1486c325a2aSPoul-Henning Kamp 
149af77c1a6SMateusz Guzik 	rw_wlock(&vfs_hash_lock);
1506c325a2aSPoul-Henning Kamp 	LIST_REMOVE(vp, v_hashlist);
151af77c1a6SMateusz Guzik 	rw_wunlock(&vfs_hash_lock);
1526c325a2aSPoul-Henning Kamp }
1536c325a2aSPoul-Henning Kamp 
1546c325a2aSPoul-Henning Kamp int
155cd85d599SKonstantin Belousov vfs_hash_insert(struct vnode *vp, u_int hash, int flags, struct thread *td,
156cd85d599SKonstantin Belousov     struct vnode **vpp, vfs_hash_cmp_t *fn, void *arg)
1576c325a2aSPoul-Henning Kamp {
1586c325a2aSPoul-Henning Kamp 	struct vnode *vp2;
159e3c3248cSMateusz Guzik 	enum vgetstate vs;
1606c325a2aSPoul-Henning Kamp 	int error;
1616c325a2aSPoul-Henning Kamp 
162e82ef95cSPoul-Henning Kamp 	*vpp = NULL;
1636c325a2aSPoul-Henning Kamp 	while (1) {
164af77c1a6SMateusz Guzik 		rw_wlock(&vfs_hash_lock);
1656c325a2aSPoul-Henning Kamp 		LIST_FOREACH(vp2,
1667b982bc8SKonstantin Belousov 		    vfs_hash_bucket(vp->v_mount, hash), v_hashlist) {
1676c325a2aSPoul-Henning Kamp 			if (vp2->v_hash != hash)
1686c325a2aSPoul-Henning Kamp 				continue;
1696c325a2aSPoul-Henning Kamp 			if (vp2->v_mount != vp->v_mount)
1706c325a2aSPoul-Henning Kamp 				continue;
171a1e1d551SPoul-Henning Kamp 			if (fn != NULL && fn(vp2, arg))
17251f5ce0cSPoul-Henning Kamp 				continue;
173e3c3248cSMateusz Guzik 			vs = vget_prep(vp2);
174af77c1a6SMateusz Guzik 			rw_wunlock(&vfs_hash_lock);
175e3c3248cSMateusz Guzik 			error = vget_finish(vp2, flags, vs);
1766ff5e2dbSTor Egge 			if (error == ENOENT && (flags & LK_NOWAIT) == 0)
1776c325a2aSPoul-Henning Kamp 				break;
178af77c1a6SMateusz Guzik 			rw_wlock(&vfs_hash_lock);
17978bb3c21SPoul-Henning Kamp 			LIST_INSERT_HEAD(&vfs_hash_side, vp, v_hashlist);
180af77c1a6SMateusz Guzik 			rw_wunlock(&vfs_hash_lock);
181a0a36d48SChuck Silvers 			vgone(vp);
18245c26fa2SPoul-Henning Kamp 			vput(vp);
18345c26fa2SPoul-Henning Kamp 			if (!error)
1846c325a2aSPoul-Henning Kamp 				*vpp = vp2;
18545c26fa2SPoul-Henning Kamp 			return (error);
1866c325a2aSPoul-Henning Kamp 		}
1876c325a2aSPoul-Henning Kamp 		if (vp2 == NULL)
1886c325a2aSPoul-Henning Kamp 			break;
1896c325a2aSPoul-Henning Kamp 	}
1906c325a2aSPoul-Henning Kamp 	vp->v_hash = hash;
1917b982bc8SKonstantin Belousov 	LIST_INSERT_HEAD(vfs_hash_bucket(vp->v_mount, hash), vp, v_hashlist);
192af77c1a6SMateusz Guzik 	rw_wunlock(&vfs_hash_lock);
1936c325a2aSPoul-Henning Kamp 	return (0);
1946c325a2aSPoul-Henning Kamp }
1956c325a2aSPoul-Henning Kamp 
1966c325a2aSPoul-Henning Kamp void
1976c325a2aSPoul-Henning Kamp vfs_hash_rehash(struct vnode *vp, u_int hash)
1986c325a2aSPoul-Henning Kamp {
199f19063abSKonstantin Belousov 	ASSERT_VOP_ELOCKED(vp, "rehash requires excl lock");
2006c325a2aSPoul-Henning Kamp 
201af77c1a6SMateusz Guzik 	rw_wlock(&vfs_hash_lock);
2026c325a2aSPoul-Henning Kamp 	LIST_REMOVE(vp, v_hashlist);
2037b982bc8SKonstantin Belousov 	LIST_INSERT_HEAD(vfs_hash_bucket(vp->v_mount, hash), vp, v_hashlist);
2046c325a2aSPoul-Henning Kamp 	vp->v_hash = hash;
205af77c1a6SMateusz Guzik 	rw_wunlock(&vfs_hash_lock);
2066c325a2aSPoul-Henning Kamp }
20717518b1aSKirk McKusick 
20817518b1aSKirk McKusick void
20969283067SMateusz Guzik vfs_hash_changesize(u_long newmaxvnodes)
21017518b1aSKirk McKusick {
21117518b1aSKirk McKusick 	struct vfs_hash_head *vfs_hash_newtbl, *vfs_hash_oldtbl;
21217518b1aSKirk McKusick 	u_long vfs_hash_newmask, vfs_hash_oldmask;
21317518b1aSKirk McKusick 	struct vnode *vp;
21417518b1aSKirk McKusick 	int i;
21517518b1aSKirk McKusick 
21617518b1aSKirk McKusick 	vfs_hash_newtbl = hashinit(newmaxvnodes, M_VFS_HASH,
21717518b1aSKirk McKusick 		&vfs_hash_newmask);
21817518b1aSKirk McKusick 	/* If same hash table size, nothing to do */
21917518b1aSKirk McKusick 	if (vfs_hash_mask == vfs_hash_newmask) {
22017518b1aSKirk McKusick 		free(vfs_hash_newtbl, M_VFS_HASH);
22117518b1aSKirk McKusick 		return;
22217518b1aSKirk McKusick 	}
22317518b1aSKirk McKusick 	/*
22417518b1aSKirk McKusick 	 * Move everything from the old hash table to the new table.
22517518b1aSKirk McKusick 	 * None of the vnodes in the table can be recycled because to
22617518b1aSKirk McKusick 	 * do so, they have to be removed from the hash table.
22717518b1aSKirk McKusick 	 */
22817518b1aSKirk McKusick 	rw_wlock(&vfs_hash_lock);
22917518b1aSKirk McKusick 	vfs_hash_oldtbl = vfs_hash_tbl;
23017518b1aSKirk McKusick 	vfs_hash_oldmask = vfs_hash_mask;
23117518b1aSKirk McKusick 	vfs_hash_tbl = vfs_hash_newtbl;
23217518b1aSKirk McKusick 	vfs_hash_mask = vfs_hash_newmask;
23317518b1aSKirk McKusick 	for (i = 0; i <= vfs_hash_oldmask; i++) {
23417518b1aSKirk McKusick 		while ((vp = LIST_FIRST(&vfs_hash_oldtbl[i])) != NULL) {
23517518b1aSKirk McKusick 			LIST_REMOVE(vp, v_hashlist);
23617518b1aSKirk McKusick 			LIST_INSERT_HEAD(
23717518b1aSKirk McKusick 			    vfs_hash_bucket(vp->v_mount, vp->v_hash),
23817518b1aSKirk McKusick 			    vp, v_hashlist);
23917518b1aSKirk McKusick 		}
24017518b1aSKirk McKusick 	}
24117518b1aSKirk McKusick 	rw_wunlock(&vfs_hash_lock);
24217518b1aSKirk McKusick 	free(vfs_hash_oldtbl, M_VFS_HASH);
24317518b1aSKirk McKusick }
244