xref: /freebsd/sys/vm/vm_pagequeue.h (revision 0766f278d88b93e81e8b81cac6258cf75cde3e35)
1e2068d0bSJeff Roberson /*-
2e2068d0bSJeff Roberson  * SPDX-License-Identifier: (BSD-3-Clause AND MIT-CMU)
3e2068d0bSJeff Roberson  *
4e2068d0bSJeff Roberson  * Copyright (c) 1991, 1993
5e2068d0bSJeff Roberson  *	The Regents of the University of California.  All rights reserved.
6e2068d0bSJeff Roberson  *
7e2068d0bSJeff Roberson  * This code is derived from software contributed to Berkeley by
8e2068d0bSJeff Roberson  * The Mach Operating System project at Carnegie-Mellon University.
9e2068d0bSJeff Roberson  *
10e2068d0bSJeff Roberson  * Redistribution and use in source and binary forms, with or without
11e2068d0bSJeff Roberson  * modification, are permitted provided that the following conditions
12e2068d0bSJeff Roberson  * are met:
13e2068d0bSJeff Roberson  * 1. Redistributions of source code must retain the above copyright
14e2068d0bSJeff Roberson  *    notice, this list of conditions and the following disclaimer.
15e2068d0bSJeff Roberson  * 2. Redistributions in binary form must reproduce the above copyright
16e2068d0bSJeff Roberson  *    notice, this list of conditions and the following disclaimer in the
17e2068d0bSJeff Roberson  *    documentation and/or other materials provided with the distribution.
18e2068d0bSJeff Roberson  * 3. Neither the name of the University nor the names of its contributors
19e2068d0bSJeff Roberson  *    may be used to endorse or promote products derived from this software
20e2068d0bSJeff Roberson  *    without specific prior written permission.
21e2068d0bSJeff Roberson  *
22e2068d0bSJeff Roberson  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
23e2068d0bSJeff Roberson  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
24e2068d0bSJeff Roberson  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
25e2068d0bSJeff Roberson  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
26e2068d0bSJeff Roberson  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
27e2068d0bSJeff Roberson  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
28e2068d0bSJeff Roberson  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
29e2068d0bSJeff Roberson  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
30e2068d0bSJeff Roberson  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
31e2068d0bSJeff Roberson  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
32e2068d0bSJeff Roberson  * SUCH DAMAGE.
33e2068d0bSJeff Roberson  *
34e2068d0bSJeff Roberson  *	from: @(#)vm_page.h	8.2 (Berkeley) 12/13/93
35e2068d0bSJeff Roberson  *
36e2068d0bSJeff Roberson  *
37e2068d0bSJeff Roberson  * Copyright (c) 1987, 1990 Carnegie-Mellon University.
38e2068d0bSJeff Roberson  * All rights reserved.
39e2068d0bSJeff Roberson  *
40e2068d0bSJeff Roberson  * Authors: Avadis Tevanian, Jr., Michael Wayne Young
41e2068d0bSJeff Roberson  *
42e2068d0bSJeff Roberson  * Permission to use, copy, modify and distribute this software and
43e2068d0bSJeff Roberson  * its documentation is hereby granted, provided that both the copyright
44e2068d0bSJeff Roberson  * notice and this permission notice appear in all copies of the
45e2068d0bSJeff Roberson  * software, derivative works or modified versions, and any portions
46e2068d0bSJeff Roberson  * thereof, and that both notices appear in supporting documentation.
47e2068d0bSJeff Roberson  *
48e2068d0bSJeff Roberson  * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS"
49e2068d0bSJeff Roberson  * CONDITION.  CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND
50e2068d0bSJeff Roberson  * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE.
51e2068d0bSJeff Roberson  *
52e2068d0bSJeff Roberson  * Carnegie Mellon requests users of this software to return to
53e2068d0bSJeff Roberson  *
54e2068d0bSJeff Roberson  *  Software Distribution Coordinator  or  Software.Distribution@CS.CMU.EDU
55e2068d0bSJeff Roberson  *  School of Computer Science
56e2068d0bSJeff Roberson  *  Carnegie Mellon University
57e2068d0bSJeff Roberson  *  Pittsburgh PA 15213-3890
58e2068d0bSJeff Roberson  *
59e2068d0bSJeff Roberson  * any improvements or extensions that they make and grant Carnegie the
60e2068d0bSJeff Roberson  * rights to redistribute these changes.
61e2068d0bSJeff Roberson  *
62e2068d0bSJeff Roberson  * $FreeBSD$
63e2068d0bSJeff Roberson  */
64e2068d0bSJeff Roberson 
65e2068d0bSJeff Roberson #ifndef	_VM_PAGEQUEUE_
66e2068d0bSJeff Roberson #define	_VM_PAGEQUEUE_
67e2068d0bSJeff Roberson 
68e2068d0bSJeff Roberson #ifdef _KERNEL
69e2068d0bSJeff Roberson struct vm_pagequeue {
70e2068d0bSJeff Roberson 	struct mtx	pq_mutex;
71e2068d0bSJeff Roberson 	struct pglist	pq_pl;
72e2068d0bSJeff Roberson 	int		pq_cnt;
73e2068d0bSJeff Roberson 	const char	* const pq_name;
74e2068d0bSJeff Roberson } __aligned(CACHE_LINE_SIZE);
75e2068d0bSJeff Roberson 
765cd29d0fSMark Johnston #ifndef VM_BATCHQUEUE_SIZE
775cd29d0fSMark Johnston #define	VM_BATCHQUEUE_SIZE	7
785cd29d0fSMark Johnston #endif
795cd29d0fSMark Johnston 
805cd29d0fSMark Johnston struct vm_batchqueue {
815cd29d0fSMark Johnston 	vm_page_t	bq_pa[VM_BATCHQUEUE_SIZE];
825cd29d0fSMark Johnston 	int		bq_cnt;
835cd29d0fSMark Johnston } __aligned(CACHE_LINE_SIZE);
845cd29d0fSMark Johnston 
85c33e3a64SJeff Roberson #include <vm/uma.h>
865cd29d0fSMark Johnston #include <sys/pidctrl.h>
875f8cd1c0SJeff Roberson struct sysctl_oid;
88e2068d0bSJeff Roberson 
8930fbfddaSJeff Roberson /*
9030fbfddaSJeff Roberson  * One vm_domain per-numa domain.  Contains pagequeues, free page structures,
9130fbfddaSJeff Roberson  * and accounting.
9230fbfddaSJeff Roberson  *
9330fbfddaSJeff Roberson  * Lock Key:
9430fbfddaSJeff Roberson  * f	vmd_free_mtx
9530fbfddaSJeff Roberson  * p	vmd_pageout_mtx
9630fbfddaSJeff Roberson  * d	vm_domainset_lock
9730fbfddaSJeff Roberson  * a	atomic
9830fbfddaSJeff Roberson  * c	const after boot
9960684862SMark Johnston  * q	page queue lock
10030fbfddaSJeff Roberson */
101e2068d0bSJeff Roberson struct vm_domain {
102e2068d0bSJeff Roberson 	struct vm_pagequeue vmd_pagequeues[PQ_COUNT];
103e2068d0bSJeff Roberson 	struct mtx_padalign vmd_free_mtx;
10430fbfddaSJeff Roberson 	struct mtx_padalign vmd_pageout_mtx;
105c33e3a64SJeff Roberson 	uma_zone_t vmd_pgcache;		/* (c) page free cache. */
106*0766f278SJonathan T. Looney 	struct vmem *vmd_kernel_arena;	/* (c) per-domain kva R/W arena. */
107*0766f278SJonathan T. Looney 	struct vmem *vmd_kernel_rwx_arena; /* (c) per-domain kva R/W/X arena. */
10830fbfddaSJeff Roberson 	u_int vmd_domain;		/* (c) Domain number. */
10930fbfddaSJeff Roberson 	u_int vmd_page_count;		/* (c) Total page count. */
11030fbfddaSJeff Roberson 	long vmd_segs;			/* (c) bitmask of the segments */
11130fbfddaSJeff Roberson 	u_int __aligned(CACHE_LINE_SIZE) vmd_free_count; /* (a,f) free page count */
11230fbfddaSJeff Roberson 	u_int vmd_pageout_deficit;	/* (a) Estimated number of pages deficit */
11330fbfddaSJeff Roberson 	uint8_t vmd_pad[CACHE_LINE_SIZE - (sizeof(u_int) * 2)];
114e2068d0bSJeff Roberson 
11530fbfddaSJeff Roberson 	/* Paging control variables, used within single threaded page daemon. */
1165f8cd1c0SJeff Roberson 	struct pidctrl vmd_pid;		/* Pageout controller. */
117e2068d0bSJeff Roberson 	boolean_t vmd_oom;
118e2068d0bSJeff Roberson 	int vmd_oom_seq;
119e2068d0bSJeff Roberson 	int vmd_last_active_scan;
1205cd29d0fSMark Johnston 	struct vm_page vmd_markers[PQ_COUNT]; /* (q) markers for queue scans */
121e2068d0bSJeff Roberson 	struct vm_page vmd_inacthead; /* marker for LRU-defeating insertions */
1225cd29d0fSMark Johnston 	struct vm_page vmd_clock[2]; /* markers for active queue scan */
123e2068d0bSJeff Roberson 
12430fbfddaSJeff Roberson 	int vmd_pageout_wanted;		/* (a, p) pageout daemon wait channel */
12530fbfddaSJeff Roberson 	int vmd_pageout_pages_needed;	/* (d) page daemon waiting for pages? */
12630fbfddaSJeff Roberson 	bool vmd_minset;		/* (d) Are we in vm_min_domains? */
12730fbfddaSJeff Roberson 	bool vmd_severeset;		/* (d) Are we in vm_severe_domains? */
128e2068d0bSJeff Roberson 	enum {
129e2068d0bSJeff Roberson 		VM_LAUNDRY_IDLE = 0,
130e2068d0bSJeff Roberson 		VM_LAUNDRY_BACKGROUND,
131e2068d0bSJeff Roberson 		VM_LAUNDRY_SHORTFALL
132e2068d0bSJeff Roberson 	} vmd_laundry_request;
133e2068d0bSJeff Roberson 
13460684862SMark Johnston 	/* Paging thresholds and targets. */
13560684862SMark Johnston 	u_int vmd_clean_pages_freed;	/* (q) accumulator for laundry thread */
13660684862SMark Johnston 	u_int vmd_background_launder_target; /* (c) */
137e2068d0bSJeff Roberson 	u_int vmd_free_reserved;	/* (c) pages reserved for deadlock */
138e2068d0bSJeff Roberson 	u_int vmd_free_target;		/* (c) pages desired free */
139e2068d0bSJeff Roberson 	u_int vmd_free_min;		/* (c) pages desired free */
140e2068d0bSJeff Roberson 	u_int vmd_inactive_target;	/* (c) pages desired inactive */
141e2068d0bSJeff Roberson 	u_int vmd_pageout_free_min;	/* (c) min pages reserved for kernel */
142e2068d0bSJeff Roberson 	u_int vmd_pageout_wakeup_thresh;/* (c) min pages to wake pagedaemon */
143e2068d0bSJeff Roberson 	u_int vmd_interrupt_free_min;	/* (c) reserved pages for int code */
144e2068d0bSJeff Roberson 	u_int vmd_free_severe;		/* (c) severe page depletion point */
1455f8cd1c0SJeff Roberson 
1465f8cd1c0SJeff Roberson 	/* Name for sysctl etc. */
1475f8cd1c0SJeff Roberson 	struct sysctl_oid *vmd_oid;
1485f8cd1c0SJeff Roberson 	char vmd_name[sizeof(__XSTRING(MAXMEMDOM))];
149e2068d0bSJeff Roberson } __aligned(CACHE_LINE_SIZE);
150e2068d0bSJeff Roberson 
151e2068d0bSJeff Roberson extern struct vm_domain vm_dom[MAXMEMDOM];
152e2068d0bSJeff Roberson 
153e2068d0bSJeff Roberson #define	VM_DOMAIN(n)	(&vm_dom[(n)])
154e2068d0bSJeff Roberson 
/*
 * Page queue locking.  Each macro takes a pointer to a struct vm_pagequeue
 * and operates on the pq_mutex embedded in it.
 */
#define	vm_pagequeue_lockptr(pq)	(&(pq)->pq_mutex)
#define	vm_pagequeue_lock(pq)		mtx_lock(&(pq)->pq_mutex)
#define	vm_pagequeue_trylock(pq)	mtx_trylock(&(pq)->pq_mutex)
#define	vm_pagequeue_unlock(pq)		mtx_unlock(&(pq)->pq_mutex)
#define	vm_pagequeue_assert_locked(pq)	mtx_assert(&(pq)->pq_mutex, MA_OWNED)
160e2068d0bSJeff Roberson 
/*
 * Locking for a domain's vmd_free_mtx.  Each macro takes a pointer to a
 * struct vm_domain; everything is built on vm_domain_free_lockptr().
 */
#define	vm_domain_free_lockptr(d)					\
	    (&(d)->vmd_free_mtx)
#define	vm_domain_free_lock(d)						\
	    mtx_lock(vm_domain_free_lockptr(d))
#define	vm_domain_free_trylock(d)					\
	    mtx_trylock(vm_domain_free_lockptr(d))
#define	vm_domain_free_unlock(d)					\
	    mtx_unlock(vm_domain_free_lockptr(d))
#define	vm_domain_free_assert_locked(d)					\
	    mtx_assert(vm_domain_free_lockptr(d), MA_OWNED)
#define	vm_domain_free_assert_unlocked(d)				\
	    mtx_assert(vm_domain_free_lockptr(d), MA_NOTOWNED)
173e2068d0bSJeff Roberson 
/*
 * Locking for a domain's vmd_pageout_mtx.  Each macro takes a pointer to a
 * struct vm_domain; everything is built on vm_domain_pageout_lockptr().
 */
#define	vm_domain_pageout_lockptr(d)					\
	    (&(d)->vmd_pageout_mtx)
#define	vm_domain_pageout_lock(d)					\
	    mtx_lock(vm_domain_pageout_lockptr(d))
#define	vm_domain_pageout_unlock(d)					\
	    mtx_unlock(vm_domain_pageout_lockptr(d))
#define	vm_domain_pageout_assert_locked(d)				\
	    mtx_assert(vm_domain_pageout_lockptr(d), MA_OWNED)
#define	vm_domain_pageout_assert_unlocked(d)				\
	    mtx_assert(vm_domain_pageout_lockptr(d), MA_NOTOWNED)
18430fbfddaSJeff Roberson 
185e2068d0bSJeff Roberson static __inline void
186e2068d0bSJeff Roberson vm_pagequeue_cnt_add(struct vm_pagequeue *pq, int addend)
187e2068d0bSJeff Roberson {
188e2068d0bSJeff Roberson 
189e2068d0bSJeff Roberson 	vm_pagequeue_assert_locked(pq);
190e2068d0bSJeff Roberson 	pq->pq_cnt += addend;
191e2068d0bSJeff Roberson }
192e2068d0bSJeff Roberson #define	vm_pagequeue_cnt_inc(pq)	vm_pagequeue_cnt_add((pq), 1)
193e2068d0bSJeff Roberson #define	vm_pagequeue_cnt_dec(pq)	vm_pagequeue_cnt_add((pq), -1)
194e2068d0bSJeff Roberson 
1955cd29d0fSMark Johnston static inline void
1965cd29d0fSMark Johnston vm_batchqueue_init(struct vm_batchqueue *bq)
1975cd29d0fSMark Johnston {
1985cd29d0fSMark Johnston 
1995cd29d0fSMark Johnston 	bq->bq_cnt = 0;
2005cd29d0fSMark Johnston }
2015cd29d0fSMark Johnston 
2025cd29d0fSMark Johnston static inline bool
2035cd29d0fSMark Johnston vm_batchqueue_insert(struct vm_batchqueue *bq, vm_page_t m)
2045cd29d0fSMark Johnston {
2055cd29d0fSMark Johnston 
2065cd29d0fSMark Johnston 	if (bq->bq_cnt < nitems(bq->bq_pa)) {
2075cd29d0fSMark Johnston 		bq->bq_pa[bq->bq_cnt++] = m;
2085cd29d0fSMark Johnston 		return (true);
2095cd29d0fSMark Johnston 	}
2105cd29d0fSMark Johnston 	return (false);
2115cd29d0fSMark Johnston }
2125cd29d0fSMark Johnston 
2135cd29d0fSMark Johnston static inline vm_page_t
2145cd29d0fSMark Johnston vm_batchqueue_pop(struct vm_batchqueue *bq)
2155cd29d0fSMark Johnston {
2165cd29d0fSMark Johnston 
2175cd29d0fSMark Johnston 	if (bq->bq_cnt == 0)
2185cd29d0fSMark Johnston 		return (NULL);
2195cd29d0fSMark Johnston 	return (bq->bq_pa[--bq->bq_cnt]);
2205cd29d0fSMark Johnston }
2215cd29d0fSMark Johnston 
/*
 * Domain state routines implemented outside this header.
 * vm_domain_clear() is the one called by vm_domain_freecnt_inc() when the
 * free count climbs back over a threshold; vm_domain_set() is presumably
 * its counterpart (NOTE(review): confirm against the implementation).
 */
void vm_domain_set(struct vm_domain *vmd);
void vm_domain_clear(struct vm_domain *vmd);
int vm_domain_allocate(struct vm_domain *vmd, int req, int npages);
225e2068d0bSJeff Roberson 
226e2068d0bSJeff Roberson /*
227e2068d0bSJeff Roberson  *      vm_pagequeue_domain:
228e2068d0bSJeff Roberson  *
229e2068d0bSJeff Roberson  *      Return the memory domain the page belongs to.
230e2068d0bSJeff Roberson  */
231e2068d0bSJeff Roberson static inline struct vm_domain *
232e2068d0bSJeff Roberson vm_pagequeue_domain(vm_page_t m)
233e2068d0bSJeff Roberson {
234e2068d0bSJeff Roberson 
235e2068d0bSJeff Roberson 	return (VM_DOMAIN(vm_phys_domain(m)));
236e2068d0bSJeff Roberson }
237e2068d0bSJeff Roberson 
238e2068d0bSJeff Roberson /*
239e2068d0bSJeff Roberson  * Return the number of pages we need to free-up or cache
240e2068d0bSJeff Roberson  * A positive number indicates that we do not have enough free pages.
241e2068d0bSJeff Roberson  */
242e2068d0bSJeff Roberson static inline int
243e2068d0bSJeff Roberson vm_paging_target(struct vm_domain *vmd)
244e2068d0bSJeff Roberson {
245e2068d0bSJeff Roberson 
246e2068d0bSJeff Roberson 	return (vmd->vmd_free_target - vmd->vmd_free_count);
247e2068d0bSJeff Roberson }
248e2068d0bSJeff Roberson 
249e2068d0bSJeff Roberson /*
250e2068d0bSJeff Roberson  * Returns TRUE if the pagedaemon needs to be woken up.
251e2068d0bSJeff Roberson  */
252e2068d0bSJeff Roberson static inline int
253e2068d0bSJeff Roberson vm_paging_needed(struct vm_domain *vmd, u_int free_count)
254e2068d0bSJeff Roberson {
255e2068d0bSJeff Roberson 
256e2068d0bSJeff Roberson 	return (free_count < vmd->vmd_pageout_wakeup_thresh);
257e2068d0bSJeff Roberson }
258e2068d0bSJeff Roberson 
259e2068d0bSJeff Roberson /*
260e2068d0bSJeff Roberson  * Returns TRUE if the domain is below the min paging target.
261e2068d0bSJeff Roberson  */
262e2068d0bSJeff Roberson static inline int
263e2068d0bSJeff Roberson vm_paging_min(struct vm_domain *vmd)
264e2068d0bSJeff Roberson {
265e2068d0bSJeff Roberson 
266e2068d0bSJeff Roberson         return (vmd->vmd_free_min > vmd->vmd_free_count);
267e2068d0bSJeff Roberson }
268e2068d0bSJeff Roberson 
269e2068d0bSJeff Roberson /*
270e2068d0bSJeff Roberson  * Returns TRUE if the domain is below the severe paging target.
271e2068d0bSJeff Roberson  */
272e2068d0bSJeff Roberson static inline int
273e2068d0bSJeff Roberson vm_paging_severe(struct vm_domain *vmd)
274e2068d0bSJeff Roberson {
275e2068d0bSJeff Roberson 
276e2068d0bSJeff Roberson         return (vmd->vmd_free_severe > vmd->vmd_free_count);
277e2068d0bSJeff Roberson }
278e2068d0bSJeff Roberson 
/*
 * Return the number of pages that need to be laundered.  A positive value
 * means there is a shortfall of clean pages.  This is the same quantity
 * that vm_paging_target() reports.
 */
static inline int
vm_laundry_target(struct vm_domain *vmd)
{
	int shortfall;

	shortfall = vm_paging_target(vmd);
	return (shortfall);
}
289e2068d0bSJeff Roberson 
29030fbfddaSJeff Roberson void pagedaemon_wakeup(int domain);
29130fbfddaSJeff Roberson 
29230fbfddaSJeff Roberson static inline void
29330fbfddaSJeff Roberson vm_domain_freecnt_inc(struct vm_domain *vmd, int adj)
294e2068d0bSJeff Roberson {
29530fbfddaSJeff Roberson 	u_int old, new;
296e2068d0bSJeff Roberson 
29730fbfddaSJeff Roberson 	old = atomic_fetchadd_int(&vmd->vmd_free_count, adj);
29830fbfddaSJeff Roberson 	new = old + adj;
29930fbfddaSJeff Roberson 	/*
30030fbfddaSJeff Roberson 	 * Only update bitsets on transitions.  Notice we short-circuit the
30130fbfddaSJeff Roberson 	 * rest of the checks if we're above min already.
30230fbfddaSJeff Roberson 	 */
30330fbfddaSJeff Roberson 	if (old < vmd->vmd_free_min && (new >= vmd->vmd_free_min ||
30430fbfddaSJeff Roberson 	    (old < vmd->vmd_free_severe && new >= vmd->vmd_free_severe) ||
30530fbfddaSJeff Roberson 	    (old < vmd->vmd_pageout_free_min &&
30630fbfddaSJeff Roberson 	    new >= vmd->vmd_pageout_free_min)))
30730fbfddaSJeff Roberson 		vm_domain_clear(vmd);
30830fbfddaSJeff Roberson }
30930fbfddaSJeff Roberson 
310e2068d0bSJeff Roberson #endif	/* _KERNEL */
311e2068d0bSJeff Roberson #endif				/* !_VM_PAGEQUEUE_ */
312