160727d8bSWarner Losh /*- 2796df753SPedro F. Giffuni * SPDX-License-Identifier: (BSD-3-Clause AND MIT-CMU) 351369649SPedro F. Giffuni * 4df8bae1dSRodney W. Grimes * Copyright (c) 1991, 1993 5df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * This code is derived from software contributed to Berkeley by 8df8bae1dSRodney W. Grimes * The Mach Operating System project at Carnegie-Mellon University. 9df8bae1dSRodney W. Grimes * 10df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 11df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 12df8bae1dSRodney W. Grimes * are met: 13df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 14df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 15df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 16df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 17df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 18fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 19df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 20df8bae1dSRodney W. Grimes * without specific prior written permission. 21df8bae1dSRodney W. Grimes * 22df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32df8bae1dSRodney W. Grimes * SUCH DAMAGE. 33df8bae1dSRodney W. Grimes * 343c4dd356SDavid Greenman * from: @(#)vm_init.c 8.1 (Berkeley) 6/11/93 35df8bae1dSRodney W. Grimes * 36df8bae1dSRodney W. Grimes * 37df8bae1dSRodney W. Grimes * Copyright (c) 1987, 1990 Carnegie-Mellon University. 38df8bae1dSRodney W. Grimes * All rights reserved. 39df8bae1dSRodney W. Grimes * 40df8bae1dSRodney W. Grimes * Authors: Avadis Tevanian, Jr., Michael Wayne Young 41df8bae1dSRodney W. Grimes * 42df8bae1dSRodney W. Grimes * Permission to use, copy, modify and distribute this software and 43df8bae1dSRodney W. Grimes * its documentation is hereby granted, provided that both the copyright 44df8bae1dSRodney W. Grimes * notice and this permission notice appear in all copies of the 45df8bae1dSRodney W. Grimes * software, derivative works or modified versions, and any portions 46df8bae1dSRodney W. Grimes * thereof, and that both notices appear in supporting documentation. 47df8bae1dSRodney W. Grimes * 48df8bae1dSRodney W. Grimes * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS" 49df8bae1dSRodney W. Grimes * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND 50df8bae1dSRodney W. Grimes * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE. 51df8bae1dSRodney W. Grimes * 52df8bae1dSRodney W. Grimes * Carnegie Mellon requests users of this software to return to 53df8bae1dSRodney W. Grimes * 54df8bae1dSRodney W. Grimes * Software Distribution Coordinator or Software.Distribution@CS.CMU.EDU 55df8bae1dSRodney W. Grimes * School of Computer Science 56df8bae1dSRodney W. Grimes * Carnegie Mellon University 57df8bae1dSRodney W. Grimes * Pittsburgh PA 15213-3890 58df8bae1dSRodney W. Grimes * 59df8bae1dSRodney W. Grimes * any improvements or extensions that they make and grant Carnegie the 60df8bae1dSRodney W. Grimes * rights to redistribute these changes. 61df8bae1dSRodney W. Grimes */ 62df8bae1dSRodney W. Grimes 63df8bae1dSRodney W. Grimes /* 64df8bae1dSRodney W. Grimes * Initialize the Virtual Memory subsystem. 65df8bae1dSRodney W. Grimes */ 66df8bae1dSRodney W. Grimes 67874651b1SDavid E. O'Brien #include <sys/cdefs.h> 68874651b1SDavid E. O'Brien __FBSDID("$FreeBSD$"); 69874651b1SDavid E. O'Brien 70df8bae1dSRodney W. Grimes #include <sys/param.h> 712b14f991SJulian Elischer #include <sys/kernel.h> 72fb919e4dSMark Murray #include <sys/lock.h> 73fb919e4dSMark Murray #include <sys/proc.h> 7489f6b863SAttilio Rao #include <sys/rwlock.h> 755df87b21SJeff Roberson #include <sys/malloc.h> 76f5fca0d8SKris Kennaway #include <sys/sysctl.h> 7705f0fdd2SPoul-Henning Kamp #include <sys/systm.h> 78cebde069SMike Silbersack #include <sys/selinfo.h> 7921fae961SJeff Roberson #include <sys/smp.h> 80cebde069SMike Silbersack #include <sys/pipe.h> 81219d632cSMatthew Dillon #include <sys/bio.h> 82219d632cSMatthew Dillon #include <sys/buf.h> 835f518366SJeff Roberson #include <sys/vmem.h> 847a469c8eSJeff Roberson #include <sys/vmmeter.h> 85df8bae1dSRodney W. Grimes 86df8bae1dSRodney W. Grimes #include <vm/vm.h> 87219d632cSMatthew Dillon #include <vm/vm_param.h> 88219d632cSMatthew Dillon #include <vm/vm_kern.h> 89efeaf95aSDavid Greenman #include <vm/vm_object.h> 90df8bae1dSRodney W. Grimes #include <vm/vm_page.h> 917a469c8eSJeff Roberson #include <vm/vm_phys.h> 92e2068d0bSJeff Roberson #include <vm/vm_pagequeue.h> 93efeaf95aSDavid Greenman #include <vm/vm_map.h> 9424a1cce3SDavid Greenman #include <vm/vm_pager.h> 95efeaf95aSDavid Greenman #include <vm/vm_extern.h> 96df8bae1dSRodney W. Grimes 97ae941b1bSGleb Smirnoff extern void uma_startup1(void); 98f7d35785SGleb Smirnoff extern void uma_startup2(void); 99ae941b1bSGleb Smirnoff extern void vm_radix_reserve_kva(void); 1007a469c8eSJeff Roberson 1010fca57b8SThomas Moestl long physmem; 1020fca57b8SThomas Moestl 103df8bae1dSRodney W. Grimes /* 1042b14f991SJulian Elischer * System initialization 1052b14f991SJulian Elischer */ 10611caded3SAlfred Perlstein static void vm_mem_init(void *); 107237fdd78SRobert Watson SYSINIT(vm_mem, SI_SUB_VM, SI_ORDER_FIRST, vm_mem_init, NULL); 1082b14f991SJulian Elischer 1092b14f991SJulian Elischer /* 110df8bae1dSRodney W. Grimes * vm_init initializes the virtual memory system. 111df8bae1dSRodney W. Grimes * This is done only by the first cpu up. 112df8bae1dSRodney W. Grimes * 113df8bae1dSRodney W. Grimes * The start and end address of physical memory is passed in. 114df8bae1dSRodney W. Grimes */ 1152b14f991SJulian Elischer static void 116*1aed6d48SMark Johnston vm_mem_init(void *dummy) 117df8bae1dSRodney W. Grimes { 1185df87b21SJeff Roberson 119df8bae1dSRodney W. Grimes /* 1200d94caffSDavid Greenman * Initializes resident memory structures. From here on, all physical 1210d94caffSDavid Greenman * memory is accounted for, and we use only virtual addresses. 122df8bae1dSRodney W. Grimes */ 12326f9a767SRodney W. Grimes vm_set_page_size(); 124889eb0fcSAlan Cox virtual_avail = vm_page_startup(virtual_avail); 125e7841165SDag-Erling Smørgrav 126ae941b1bSGleb Smirnoff #ifdef UMA_MD_SMALL_ALLOC 127ae941b1bSGleb Smirnoff /* Announce page availability to UMA. */ 128ae941b1bSGleb Smirnoff uma_startup1(); 129ae941b1bSGleb Smirnoff #endif 130df8bae1dSRodney W. Grimes /* 131df8bae1dSRodney W. Grimes * Initialize other VM packages 132df8bae1dSRodney W. Grimes */ 1335f518366SJeff Roberson vmem_startup(); 134a316d390SJohn Dyson vm_object_init(); 135df8bae1dSRodney W. Grimes vm_map_startup(); 136df8bae1dSRodney W. Grimes kmem_init(virtual_avail, virtual_end); 1375df87b21SJeff Roberson 138ae941b1bSGleb Smirnoff #ifndef UMA_MD_SMALL_ALLOC 139ae941b1bSGleb Smirnoff /* Set up radix zone to use noobj_alloc. */ 140ae941b1bSGleb Smirnoff vm_radix_reserve_kva(); 141ae941b1bSGleb Smirnoff #endif 142f7d35785SGleb Smirnoff /* Announce full page availability to UMA. */ 143f7d35785SGleb Smirnoff uma_startup2(); 1445df87b21SJeff Roberson kmem_init_zero_region(); 145bdb93eb2SAlan Cox pmap_init(); 146df8bae1dSRodney W. Grimes vm_pager_init(); 147df8bae1dSRodney W. Grimes } 148219d632cSMatthew Dillon 149219d632cSMatthew Dillon void 150219d632cSMatthew Dillon vm_ksubmap_init(struct kva_md_info *kmi) 151219d632cSMatthew Dillon { 152219d632cSMatthew Dillon vm_offset_t firstaddr; 153219d632cSMatthew Dillon caddr_t v; 154219d632cSMatthew Dillon vm_size_t size = 0; 155447b3772SPeter Wemm long physmem_est; 156219d632cSMatthew Dillon vm_offset_t minaddr; 157219d632cSMatthew Dillon vm_offset_t maxaddr; 158219d632cSMatthew Dillon 159219d632cSMatthew Dillon /* 160219d632cSMatthew Dillon * Allocate space for system data structures. 161219d632cSMatthew Dillon * The first available kernel virtual address is in "v". 162219d632cSMatthew Dillon * As pages of kernel virtual memory are allocated, "v" is incremented. 163219d632cSMatthew Dillon * As pages of memory are allocated and cleared, 164219d632cSMatthew Dillon * "firstaddr" is incremented. 165219d632cSMatthew Dillon */ 166219d632cSMatthew Dillon 167219d632cSMatthew Dillon /* 168219d632cSMatthew Dillon * Make two passes. The first pass calculates how much memory is 169219d632cSMatthew Dillon * needed and allocates it. The second pass assigns virtual 170219d632cSMatthew Dillon * addresses to the various data structures. 171219d632cSMatthew Dillon */ 172219d632cSMatthew Dillon firstaddr = 0; 173219d632cSMatthew Dillon again: 174219d632cSMatthew Dillon v = (caddr_t)firstaddr; 175219d632cSMatthew Dillon 176219d632cSMatthew Dillon /* 177219d632cSMatthew Dillon * Discount the physical memory larger than the size of kernel_map 178219d632cSMatthew Dillon * to avoid eating up all of KVA space. 179219d632cSMatthew Dillon */ 180f0165b1cSKonstantin Belousov physmem_est = lmin(physmem, btoc(vm_map_max(kernel_map) - 181f0165b1cSKonstantin Belousov vm_map_min(kernel_map))); 182219d632cSMatthew Dillon 183219d632cSMatthew Dillon v = kern_vfs_bio_buffer_alloc(v, physmem_est); 184219d632cSMatthew Dillon 185219d632cSMatthew Dillon /* 186219d632cSMatthew Dillon * End of first pass, size has been calculated so allocate memory 187219d632cSMatthew Dillon */ 188219d632cSMatthew Dillon if (firstaddr == 0) { 189857961d9SRobert Drehmel size = (vm_size_t)v; 190edb2994aSAndrew Gallatin #ifdef VM_FREELIST_DMA32 191edb2994aSAndrew Gallatin /* 192edb2994aSAndrew Gallatin * Try to protect 32-bit DMAable memory from the largest 193edb2994aSAndrew Gallatin * early alloc of wired mem. 194edb2994aSAndrew Gallatin */ 195db7c2a48SAlan Cox firstaddr = kmem_alloc_attr(size, M_ZERO | M_NOWAIT, 196db7c2a48SAlan Cox (vm_paddr_t)1 << 32, ~(vm_paddr_t)0, VM_MEMATTR_DEFAULT); 197edb2994aSAndrew Gallatin if (firstaddr == 0) 198edb2994aSAndrew Gallatin #endif 19983a90bffSAlan Cox firstaddr = kmem_malloc(size, M_ZERO | M_WAITOK); 200219d632cSMatthew Dillon if (firstaddr == 0) 201219d632cSMatthew Dillon panic("startup: no room for tables"); 202219d632cSMatthew Dillon goto again; 203219d632cSMatthew Dillon } 204219d632cSMatthew Dillon 205219d632cSMatthew Dillon /* 206219d632cSMatthew Dillon * End of second pass, addresses have been assigned 207219d632cSMatthew Dillon */ 208219d632cSMatthew Dillon if ((vm_size_t)((char *)v - firstaddr) != size) 209219d632cSMatthew Dillon panic("startup: table size inconsistency"); 210219d632cSMatthew Dillon 2115df87b21SJeff Roberson /* 2125df87b21SJeff Roberson * Allocate the clean map to hold all of the paging and I/O virtual 2135df87b21SJeff Roberson * memory. 2145df87b21SJeff Roberson */ 2155f518366SJeff Roberson size = (long)nbuf * BKVASIZE + (long)nswbuf * MAXPHYS + 2165f518366SJeff Roberson (long)bio_transient_maxcnt * MAXPHYS; 2175df87b21SJeff Roberson kmi->clean_sva = firstaddr = kva_alloc(size); 2185df87b21SJeff Roberson kmi->clean_eva = firstaddr + size; 2195f518366SJeff Roberson 2205df87b21SJeff Roberson /* 2215df87b21SJeff Roberson * Allocate the buffer arena. 22221fae961SJeff Roberson * 22321fae961SJeff Roberson * Enable the quantum cache if we have more than 4 cpus. This 22421fae961SJeff Roberson * avoids lock contention at the expense of some fragmentation. 2255df87b21SJeff Roberson */ 2265f518366SJeff Roberson size = (long)nbuf * BKVASIZE; 2275df87b21SJeff Roberson kmi->buffer_sva = firstaddr; 2285f518366SJeff Roberson kmi->buffer_eva = kmi->buffer_sva + size; 2295f518366SJeff Roberson vmem_init(buffer_arena, "buffer arena", kmi->buffer_sva, size, 23021fae961SJeff Roberson PAGE_SIZE, (mp_ncpus > 4) ? BKVASIZE * 8 : 0, 0); 2315df87b21SJeff Roberson firstaddr += size; 2325f518366SJeff Roberson 2335df87b21SJeff Roberson /* 2345df87b21SJeff Roberson * Now swap kva. 2355df87b21SJeff Roberson */ 2365df87b21SJeff Roberson swapbkva = firstaddr; 2375f518366SJeff Roberson size = (long)nswbuf * MAXPHYS; 2385df87b21SJeff Roberson firstaddr += size; 2395f518366SJeff Roberson 2405df87b21SJeff Roberson /* 2415df87b21SJeff Roberson * And optionally transient bio space. 2425df87b21SJeff Roberson */ 2437db07e1cSKonstantin Belousov if (bio_transient_maxcnt != 0) { 2445f518366SJeff Roberson size = (long)bio_transient_maxcnt * MAXPHYS; 2455f518366SJeff Roberson vmem_init(transient_arena, "transient arena", 2465df87b21SJeff Roberson firstaddr, size, PAGE_SIZE, 0, 0); 2475df87b21SJeff Roberson firstaddr += size; 2487db07e1cSKonstantin Belousov } 2495df87b21SJeff Roberson if (firstaddr != kmi->clean_eva) 2505df87b21SJeff Roberson panic("Clean map calculation incorrect"); 2515df87b21SJeff Roberson 2525df87b21SJeff Roberson /* 253ec492b13SMark Johnston * Allocate the pageable submaps. We may cache an exec map entry per 254ec492b13SMark Johnston * CPU, so we therefore need to reserve space for at least ncpu+1 255ec492b13SMark Johnston * entries to avoid deadlock. The exec map is also used by some image 256ec492b13SMark Johnston * activators, so we leave a fixed number of pages for their use. 2575df87b21SJeff Roberson */ 258ec492b13SMark Johnston #ifdef __LP64__ 259ec492b13SMark Johnston exec_map_entries = 8 * mp_ncpus; 260ec492b13SMark Johnston #else 2618d65cba2SMark Johnston exec_map_entries = 2 * mp_ncpus + 4; 262ec492b13SMark Johnston #endif 263ec492b13SMark Johnston exec_map_entry_size = round_page(PATH_MAX + ARG_MAX); 264219d632cSMatthew Dillon exec_map = kmem_suballoc(kernel_map, &minaddr, &maxaddr, 265ec492b13SMark Johnston exec_map_entries * exec_map_entry_size + 64 * PAGE_SIZE, FALSE); 2663202ed75SAlan Cox pipe_map = kmem_suballoc(kernel_map, &minaddr, &maxaddr, maxpipekva, 2673202ed75SAlan Cox FALSE); 268219d632cSMatthew Dillon } 269