xref: /freebsd/sys/vm/vm_pagequeue.h (revision 30fbfdda6cb85c3d66ce6f10a30c0e87a510f1ab)
1e2068d0bSJeff Roberson /*-
2e2068d0bSJeff Roberson  * SPDX-License-Identifier: (BSD-3-Clause AND MIT-CMU)
3e2068d0bSJeff Roberson  *
4e2068d0bSJeff Roberson  * Copyright (c) 1991, 1993
5e2068d0bSJeff Roberson  *	The Regents of the University of California.  All rights reserved.
6e2068d0bSJeff Roberson  *
7e2068d0bSJeff Roberson  * This code is derived from software contributed to Berkeley by
8e2068d0bSJeff Roberson  * The Mach Operating System project at Carnegie-Mellon University.
9e2068d0bSJeff Roberson  *
10e2068d0bSJeff Roberson  * Redistribution and use in source and binary forms, with or without
11e2068d0bSJeff Roberson  * modification, are permitted provided that the following conditions
12e2068d0bSJeff Roberson  * are met:
13e2068d0bSJeff Roberson  * 1. Redistributions of source code must retain the above copyright
14e2068d0bSJeff Roberson  *    notice, this list of conditions and the following disclaimer.
15e2068d0bSJeff Roberson  * 2. Redistributions in binary form must reproduce the above copyright
16e2068d0bSJeff Roberson  *    notice, this list of conditions and the following disclaimer in the
17e2068d0bSJeff Roberson  *    documentation and/or other materials provided with the distribution.
18e2068d0bSJeff Roberson  * 3. Neither the name of the University nor the names of its contributors
19e2068d0bSJeff Roberson  *    may be used to endorse or promote products derived from this software
20e2068d0bSJeff Roberson  *    without specific prior written permission.
21e2068d0bSJeff Roberson  *
22e2068d0bSJeff Roberson  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23e2068d0bSJeff Roberson  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24e2068d0bSJeff Roberson  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25e2068d0bSJeff Roberson  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26e2068d0bSJeff Roberson  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27e2068d0bSJeff Roberson  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28e2068d0bSJeff Roberson  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29e2068d0bSJeff Roberson  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30e2068d0bSJeff Roberson  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31e2068d0bSJeff Roberson  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32e2068d0bSJeff Roberson  * SUCH DAMAGE.
33e2068d0bSJeff Roberson  *
34e2068d0bSJeff Roberson  *	from: @(#)vm_page.h	8.2 (Berkeley) 12/13/93
35e2068d0bSJeff Roberson  *
36e2068d0bSJeff Roberson  *
37e2068d0bSJeff Roberson  * Copyright (c) 1987, 1990 Carnegie-Mellon University.
38e2068d0bSJeff Roberson  * All rights reserved.
39e2068d0bSJeff Roberson  *
40e2068d0bSJeff Roberson  * Authors: Avadis Tevanian, Jr., Michael Wayne Young
41e2068d0bSJeff Roberson  *
42e2068d0bSJeff Roberson  * Permission to use, copy, modify and distribute this software and
43e2068d0bSJeff Roberson  * its documentation is hereby granted, provided that both the copyright
44e2068d0bSJeff Roberson  * notice and this permission notice appear in all copies of the
45e2068d0bSJeff Roberson  * software, derivative works or modified versions, and any portions
46e2068d0bSJeff Roberson  * thereof, and that both notices appear in supporting documentation.
47e2068d0bSJeff Roberson  *
48e2068d0bSJeff Roberson  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
49e2068d0bSJeff Roberson  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
50e2068d0bSJeff Roberson  * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
51e2068d0bSJeff Roberson  *
52e2068d0bSJeff Roberson  * Carnegie Mellon requests users of this software to return to
53e2068d0bSJeff Roberson  *
54e2068d0bSJeff Roberson  *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
55e2068d0bSJeff Roberson  *  School of Computer Science
56e2068d0bSJeff Roberson  *  Carnegie Mellon University
57e2068d0bSJeff Roberson  *  Pittsburgh PA 15213-3890
58e2068d0bSJeff Roberson  *
59e2068d0bSJeff Roberson  * any improvements or extensions that they make and grant Carnegie the
60e2068d0bSJeff Roberson  * rights to redistribute these changes.
61e2068d0bSJeff Roberson  *
62e2068d0bSJeff Roberson  * $FreeBSD$
63e2068d0bSJeff Roberson  */
64e2068d0bSJeff Roberson 
65e2068d0bSJeff Roberson #ifndef	_VM_PAGEQUEUE_
66e2068d0bSJeff Roberson #define	_VM_PAGEQUEUE_
67e2068d0bSJeff Roberson 
68e2068d0bSJeff Roberson #ifdef _KERNEL
69e2068d0bSJeff Roberson struct vm_pagequeue {
70e2068d0bSJeff Roberson 	struct mtx	pq_mutex;
71e2068d0bSJeff Roberson 	struct pglist	pq_pl;
72e2068d0bSJeff Roberson 	int		pq_cnt;
73e2068d0bSJeff Roberson 	const char	* const pq_name;
74e2068d0bSJeff Roberson } __aligned(CACHE_LINE_SIZE);
75e2068d0bSJeff Roberson 
765f8cd1c0SJeff Roberson #include <sys/pidctrl.h>
775f8cd1c0SJeff Roberson struct sysctl_oid;
78e2068d0bSJeff Roberson 
79*30fbfddaSJeff Roberson /*
80*30fbfddaSJeff Roberson  * One vm_domain per-numa domain.  Contains pagequeues, free page structures,
81*30fbfddaSJeff Roberson  * and accounting.
82*30fbfddaSJeff Roberson  *
83*30fbfddaSJeff Roberson  * Lock Key:
84*30fbfddaSJeff Roberson  * f   vmd_free_mtx
85*30fbfddaSJeff Roberson  * p   vmd_pageout_mtx
86*30fbfddaSJeff Roberson  * d   vm_domainset_lock
87*30fbfddaSJeff Roberson  * a   atomic
88*30fbfddaSJeff Roberson  * c   const after boot
89*30fbfddaSJeff Roberson */
90e2068d0bSJeff Roberson struct vm_domain {
91e2068d0bSJeff Roberson 	struct vm_pagequeue vmd_pagequeues[PQ_COUNT];
92e2068d0bSJeff Roberson 	struct mtx_padalign vmd_free_mtx;
93*30fbfddaSJeff Roberson 	struct mtx_padalign vmd_pageout_mtx;
94*30fbfddaSJeff Roberson 	struct vmem *vmd_kernel_arena;	/* (c) per-domain kva arena. */
95*30fbfddaSJeff Roberson 	u_int vmd_domain;		/* (c) Domain number. */
96*30fbfddaSJeff Roberson 	u_int vmd_page_count;		/* (c) Total page count. */
97*30fbfddaSJeff Roberson 	long vmd_segs;			/* (c) bitmask of the segments */
98*30fbfddaSJeff Roberson 	u_int __aligned(CACHE_LINE_SIZE) vmd_free_count; /* (a,f) free page count */
99*30fbfddaSJeff Roberson 	u_int vmd_pageout_deficit;	/* (a) Estimated number of pages deficit */
100*30fbfddaSJeff Roberson 	uint8_t vmd_pad[CACHE_LINE_SIZE - (sizeof(u_int) * 2)];
101e2068d0bSJeff Roberson 
102*30fbfddaSJeff Roberson 	/* Paging control variables, used within single threaded page daemon. */
1035f8cd1c0SJeff Roberson 	struct pidctrl vmd_pid;		/* Pageout controller. */
104e2068d0bSJeff Roberson 	boolean_t vmd_oom;
105e2068d0bSJeff Roberson 	int vmd_oom_seq;
106e2068d0bSJeff Roberson 	int vmd_last_active_scan;
107e2068d0bSJeff Roberson 	struct vm_page vmd_laundry_marker;
108e2068d0bSJeff Roberson 	struct vm_page vmd_marker; /* marker for pagedaemon private use */
109e2068d0bSJeff Roberson 	struct vm_page vmd_inacthead; /* marker for LRU-defeating insertions */
110e2068d0bSJeff Roberson 
111*30fbfddaSJeff Roberson 	int vmd_pageout_wanted;		/* (a, p) pageout daemon wait channel */
112*30fbfddaSJeff Roberson 	int vmd_pageout_pages_needed;	/* (d) page daemon waiting for pages? */
113*30fbfddaSJeff Roberson 	bool vmd_minset;		/* (d) Are we in vm_min_domains? */
114*30fbfddaSJeff Roberson 	bool vmd_severeset;		/* (d) Are we in vm_severe_domains? */
115e2068d0bSJeff Roberson 	int vmd_inactq_scans;
116e2068d0bSJeff Roberson 	enum {
117e2068d0bSJeff Roberson 		VM_LAUNDRY_IDLE = 0,
118e2068d0bSJeff Roberson 		VM_LAUNDRY_BACKGROUND,
119e2068d0bSJeff Roberson 		VM_LAUNDRY_SHORTFALL
120e2068d0bSJeff Roberson 	} vmd_laundry_request;
121e2068d0bSJeff Roberson 
122e2068d0bSJeff Roberson 	/* Paging thresholds. */
123e2068d0bSJeff Roberson 	u_int vmd_background_launder_target;
124e2068d0bSJeff Roberson 	u_int vmd_free_reserved;	/* (c) pages reserved for deadlock */
125e2068d0bSJeff Roberson 	u_int vmd_free_target;		/* (c) pages desired free */
126e2068d0bSJeff Roberson 	u_int vmd_free_min;		/* (c) pages desired free */
127e2068d0bSJeff Roberson 	u_int vmd_inactive_target;	/* (c) pages desired inactive */
128e2068d0bSJeff Roberson 	u_int vmd_pageout_free_min;	/* (c) min pages reserved for kernel */
129e2068d0bSJeff Roberson 	u_int vmd_pageout_wakeup_thresh;/* (c) min pages to wake pagedaemon */
130e2068d0bSJeff Roberson 	u_int vmd_interrupt_free_min;	/* (c) reserved pages for int code */
131e2068d0bSJeff Roberson 	u_int vmd_free_severe;		/* (c) severe page depletion point */
1325f8cd1c0SJeff Roberson 
1335f8cd1c0SJeff Roberson 	/* Name for sysctl etc. */
1345f8cd1c0SJeff Roberson 	struct sysctl_oid *vmd_oid;
1355f8cd1c0SJeff Roberson 	char vmd_name[sizeof(__XSTRING(MAXMEMDOM))];
136e2068d0bSJeff Roberson } __aligned(CACHE_LINE_SIZE);
137e2068d0bSJeff Roberson 
138e2068d0bSJeff Roberson extern struct vm_domain vm_dom[MAXMEMDOM];
139e2068d0bSJeff Roberson 
/* Translate a domain index into a pointer to its vm_dom[] entry. */
#define	VM_DOMAIN(d)	(&vm_dom[(d)])
141e2068d0bSJeff Roberson 
/*
 * Page queue locking.  Every operation acts on the queue's pq_mutex,
 * reached through vm_pagequeue_lockptr().
 */
#define	vm_pagequeue_lockptr(q)		(&(q)->pq_mutex)
#define	vm_pagequeue_lock(q)		mtx_lock(vm_pagequeue_lockptr((q)))
#define	vm_pagequeue_unlock(q)		mtx_unlock(vm_pagequeue_lockptr((q)))
#define	vm_pagequeue_assert_locked(q)					\
	    mtx_assert(vm_pagequeue_lockptr((q)), MA_OWNED)
146e2068d0bSJeff Roberson 
/*
 * Free-page lock of a domain.  "d" is a struct vm_domain pointer; all
 * operations go through vm_domain_free_lockptr(), which yields the
 * address of vmd_free_mtx.
 */
#define	vm_domain_free_lockptr(d)					\
	    (&(d)->vmd_free_mtx)
#define	vm_domain_free_lock(d)						\
	    mtx_lock(vm_domain_free_lockptr((d)))
#define	vm_domain_free_unlock(d)					\
	    mtx_unlock(vm_domain_free_lockptr((d)))
#define	vm_domain_free_assert_locked(d)					\
	    mtx_assert(vm_domain_free_lockptr((d)), MA_OWNED)
#define	vm_domain_free_assert_unlocked(d)				\
	    mtx_assert(vm_domain_free_lockptr((d)), MA_NOTOWNED)
157e2068d0bSJeff Roberson 
/*
 * Pageout lock of a domain.  "d" is a struct vm_domain pointer; all
 * operations go through vm_domain_pageout_lockptr(), which yields the
 * address of vmd_pageout_mtx.
 */
#define	vm_domain_pageout_lockptr(d)					\
	    (&(d)->vmd_pageout_mtx)
#define	vm_domain_pageout_lock(d)					\
	    mtx_lock(vm_domain_pageout_lockptr((d)))
#define	vm_domain_pageout_unlock(d)					\
	    mtx_unlock(vm_domain_pageout_lockptr((d)))
#define	vm_domain_pageout_assert_locked(d)				\
	    mtx_assert(vm_domain_pageout_lockptr((d)), MA_OWNED)
#define	vm_domain_pageout_assert_unlocked(d)				\
	    mtx_assert(vm_domain_pageout_lockptr((d)), MA_NOTOWNED)
168*30fbfddaSJeff Roberson 
169e2068d0bSJeff Roberson static __inline void
170e2068d0bSJeff Roberson vm_pagequeue_cnt_add(struct vm_pagequeue *pq, int addend)
171e2068d0bSJeff Roberson {
172e2068d0bSJeff Roberson 
173e2068d0bSJeff Roberson #ifdef notyet
174e2068d0bSJeff Roberson 	vm_pagequeue_assert_locked(pq);
175e2068d0bSJeff Roberson #endif
176e2068d0bSJeff Roberson 	pq->pq_cnt += addend;
177e2068d0bSJeff Roberson }
178e2068d0bSJeff Roberson #define	vm_pagequeue_cnt_inc(pq)	vm_pagequeue_cnt_add((pq), 1)
179e2068d0bSJeff Roberson #define	vm_pagequeue_cnt_dec(pq)	vm_pagequeue_cnt_add((pq), -1)
180e2068d0bSJeff Roberson 
181e2068d0bSJeff Roberson void vm_domain_set(struct vm_domain *vmd);
182*30fbfddaSJeff Roberson void vm_domain_clear(struct vm_domain *vmd);
183e2068d0bSJeff Roberson int vm_domain_available(struct vm_domain *vmd, int req, int npages);
184e2068d0bSJeff Roberson 
185e2068d0bSJeff Roberson /*
186e2068d0bSJeff Roberson  *      vm_pagequeue_domain:
187e2068d0bSJeff Roberson  *
188e2068d0bSJeff Roberson  *      Return the memory domain the page belongs to.
189e2068d0bSJeff Roberson  */
190e2068d0bSJeff Roberson static inline struct vm_domain *
191e2068d0bSJeff Roberson vm_pagequeue_domain(vm_page_t m)
192e2068d0bSJeff Roberson {
193e2068d0bSJeff Roberson 
194e2068d0bSJeff Roberson 	return (VM_DOMAIN(vm_phys_domain(m)));
195e2068d0bSJeff Roberson }
196e2068d0bSJeff Roberson 
197e2068d0bSJeff Roberson /*
198e2068d0bSJeff Roberson  * Return the number of pages we need to free-up or cache
199e2068d0bSJeff Roberson  * A positive number indicates that we do not have enough free pages.
200e2068d0bSJeff Roberson  */
201e2068d0bSJeff Roberson static inline int
202e2068d0bSJeff Roberson vm_paging_target(struct vm_domain *vmd)
203e2068d0bSJeff Roberson {
204e2068d0bSJeff Roberson 
205e2068d0bSJeff Roberson 	return (vmd->vmd_free_target - vmd->vmd_free_count);
206e2068d0bSJeff Roberson }
207e2068d0bSJeff Roberson 
208e2068d0bSJeff Roberson /*
209e2068d0bSJeff Roberson  * Returns TRUE if the pagedaemon needs to be woken up.
210e2068d0bSJeff Roberson  */
211e2068d0bSJeff Roberson static inline int
212e2068d0bSJeff Roberson vm_paging_needed(struct vm_domain *vmd, u_int free_count)
213e2068d0bSJeff Roberson {
214e2068d0bSJeff Roberson 
215e2068d0bSJeff Roberson 	return (free_count < vmd->vmd_pageout_wakeup_thresh);
216e2068d0bSJeff Roberson }
217e2068d0bSJeff Roberson 
218e2068d0bSJeff Roberson /*
219e2068d0bSJeff Roberson  * Returns TRUE if the domain is below the min paging target.
220e2068d0bSJeff Roberson  */
221e2068d0bSJeff Roberson static inline int
222e2068d0bSJeff Roberson vm_paging_min(struct vm_domain *vmd)
223e2068d0bSJeff Roberson {
224e2068d0bSJeff Roberson 
225e2068d0bSJeff Roberson         return (vmd->vmd_free_min > vmd->vmd_free_count);
226e2068d0bSJeff Roberson }
227e2068d0bSJeff Roberson 
228e2068d0bSJeff Roberson /*
229e2068d0bSJeff Roberson  * Returns TRUE if the domain is below the severe paging target.
230e2068d0bSJeff Roberson  */
231e2068d0bSJeff Roberson static inline int
232e2068d0bSJeff Roberson vm_paging_severe(struct vm_domain *vmd)
233e2068d0bSJeff Roberson {
234e2068d0bSJeff Roberson 
235e2068d0bSJeff Roberson         return (vmd->vmd_free_severe > vmd->vmd_free_count);
236e2068d0bSJeff Roberson }
237e2068d0bSJeff Roberson 
/*
 * Number of pages that need to be laundered; a positive value indicates a
 * shortfall of clean pages.  The value is simply vm_paging_target().
 */
static inline int
vm_laundry_target(struct vm_domain *vmd)
{
	int target;

	target = vm_paging_target(vmd);
	return (target);
}
248e2068d0bSJeff Roberson 
249*30fbfddaSJeff Roberson void pagedaemon_wakeup(int domain);
250*30fbfddaSJeff Roberson 
251*30fbfddaSJeff Roberson static inline void
252*30fbfddaSJeff Roberson vm_domain_freecnt_inc(struct vm_domain *vmd, int adj)
253e2068d0bSJeff Roberson {
254*30fbfddaSJeff Roberson 	u_int old, new;
255e2068d0bSJeff Roberson 
256*30fbfddaSJeff Roberson 	old = atomic_fetchadd_int(&vmd->vmd_free_count, adj);
257*30fbfddaSJeff Roberson 	new = old + adj;
258*30fbfddaSJeff Roberson 	/*
259*30fbfddaSJeff Roberson 	 * Only update bitsets on transitions.  Notice we short-circuit the
260*30fbfddaSJeff Roberson 	 * rest of the checks if we're above min already.
261*30fbfddaSJeff Roberson 	 */
262*30fbfddaSJeff Roberson 	if (old < vmd->vmd_free_min && (new >= vmd->vmd_free_min ||
263*30fbfddaSJeff Roberson 	    (old < vmd->vmd_free_severe && new >= vmd->vmd_free_severe) ||
264*30fbfddaSJeff Roberson 	    (old < vmd->vmd_pageout_free_min &&
265*30fbfddaSJeff Roberson 	    new >= vmd->vmd_pageout_free_min)))
266*30fbfddaSJeff Roberson 		vm_domain_clear(vmd);
267*30fbfddaSJeff Roberson }
268*30fbfddaSJeff Roberson 
269*30fbfddaSJeff Roberson static inline void
270*30fbfddaSJeff Roberson vm_domain_freecnt_dec(struct vm_domain *vmd, int adj)
271*30fbfddaSJeff Roberson {
272*30fbfddaSJeff Roberson 	u_int old, new;
273*30fbfddaSJeff Roberson 
274*30fbfddaSJeff Roberson 	old = atomic_fetchadd_int(&vmd->vmd_free_count, -adj);
275*30fbfddaSJeff Roberson 	new = old - adj;
276*30fbfddaSJeff Roberson 	KASSERT(new >= 0, ("vm_domain_freecnt_dec: free count underflow"));
277*30fbfddaSJeff Roberson 	if (vm_paging_needed(vmd, new) && !vm_paging_needed(vmd, old))
278*30fbfddaSJeff Roberson 		pagedaemon_wakeup(vmd->vmd_domain);
279*30fbfddaSJeff Roberson 	/* Only update bitsets on transitions. */
280*30fbfddaSJeff Roberson 	if ((old >= vmd->vmd_free_min && new < vmd->vmd_free_min) ||
281*30fbfddaSJeff Roberson 	    (old >= vmd->vmd_free_severe && new < vmd->vmd_free_severe))
282e2068d0bSJeff Roberson 		vm_domain_set(vmd);
283e2068d0bSJeff Roberson }
284e2068d0bSJeff Roberson 
285e2068d0bSJeff Roberson 
286e2068d0bSJeff Roberson #endif	/* _KERNEL */
287e2068d0bSJeff Roberson #endif				/* !_VM_PAGEQUEUE_ */
288