160727d8bSWarner Losh /*- 2796df753SPedro F. Giffuni * SPDX-License-Identifier: (BSD-3-Clause AND MIT-CMU) 351369649SPedro F. Giffuni * 4df8bae1dSRodney W. Grimes * Copyright (c) 1991, 1993 5df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 6df8bae1dSRodney W. Grimes * 7df8bae1dSRodney W. Grimes * This code is derived from software contributed to Berkeley by 8df8bae1dSRodney W. Grimes * The Mach Operating System project at Carnegie-Mellon University. 9df8bae1dSRodney W. Grimes * 10df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 11df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 12df8bae1dSRodney W. Grimes * are met: 13df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 14df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 15df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 16df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 17df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 18fbbd9655SWarner Losh * 3. Neither the name of the University nor the names of its contributors 19df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 20df8bae1dSRodney W. Grimes * without specific prior written permission. 21df8bae1dSRodney W. Grimes * 22df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29df8bae1dSRodney W. Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32df8bae1dSRodney W. Grimes * SUCH DAMAGE. 33df8bae1dSRodney W. Grimes * 343c4dd356SDavid Greenman * from: @(#)vm_init.c 8.1 (Berkeley) 6/11/93 35df8bae1dSRodney W. Grimes * 36df8bae1dSRodney W. Grimes * 37df8bae1dSRodney W. Grimes * Copyright (c) 1987, 1990 Carnegie-Mellon University. 38df8bae1dSRodney W. Grimes * All rights reserved. 39df8bae1dSRodney W. Grimes * 40df8bae1dSRodney W. Grimes * Authors: Avadis Tevanian, Jr., Michael Wayne Young 41df8bae1dSRodney W. Grimes * 42df8bae1dSRodney W. Grimes * Permission to use, copy, modify and distribute this software and 43df8bae1dSRodney W. Grimes * its documentation is hereby granted, provided that both the copyright 44df8bae1dSRodney W. Grimes * notice and this permission notice appear in all copies of the 45df8bae1dSRodney W. Grimes * software, derivative works or modified versions, and any portions 46df8bae1dSRodney W. Grimes * thereof, and that both notices appear in supporting documentation. 47df8bae1dSRodney W. Grimes * 48df8bae1dSRodney W. Grimes * CARNEGIE MELLON ALLOWS FREE USE OF THIS SOFTWARE IN ITS "AS IS" 49df8bae1dSRodney W. Grimes * CONDITION. CARNEGIE MELLON DISCLAIMS ANY LIABILITY OF ANY KIND 50df8bae1dSRodney W. Grimes * FOR ANY DAMAGES WHATSOEVER RESULTING FROM THE USE OF THIS SOFTWARE. 51df8bae1dSRodney W. Grimes * 52df8bae1dSRodney W. Grimes * Carnegie Mellon requests users of this software to return to 53df8bae1dSRodney W. Grimes * 54df8bae1dSRodney W. Grimes * Software Distribution Coordinator or Software.Distribution@CS.CMU.EDU 55df8bae1dSRodney W. Grimes * School of Computer Science 56df8bae1dSRodney W. Grimes * Carnegie Mellon University 57df8bae1dSRodney W. Grimes * Pittsburgh PA 15213-3890 58df8bae1dSRodney W. Grimes * 59df8bae1dSRodney W. Grimes * any improvements or extensions that they make and grant Carnegie the 60df8bae1dSRodney W. Grimes * rights to redistribute these changes. 61df8bae1dSRodney W. Grimes */ 62df8bae1dSRodney W. Grimes 63df8bae1dSRodney W. Grimes /* 64df8bae1dSRodney W. Grimes * Initialize the Virtual Memory subsystem. 65df8bae1dSRodney W. Grimes */ 66df8bae1dSRodney W. Grimes 67874651b1SDavid E. O'Brien #include <sys/cdefs.h> 68874651b1SDavid E. O'Brien __FBSDID("$FreeBSD$"); 69874651b1SDavid E. O'Brien 70df8bae1dSRodney W. Grimes #include <sys/param.h> 7187ab1a10SMark Johnston #include <sys/domainset.h> 722b14f991SJulian Elischer #include <sys/kernel.h> 73fb919e4dSMark Murray #include <sys/lock.h> 74fb919e4dSMark Murray #include <sys/proc.h> 7589f6b863SAttilio Rao #include <sys/rwlock.h> 765df87b21SJeff Roberson #include <sys/malloc.h> 77f5fca0d8SKris Kennaway #include <sys/sysctl.h> 7805f0fdd2SPoul-Henning Kamp #include <sys/systm.h> 79cebde069SMike Silbersack #include <sys/selinfo.h> 8021fae961SJeff Roberson #include <sys/smp.h> 81cebde069SMike Silbersack #include <sys/pipe.h> 82219d632cSMatthew Dillon #include <sys/bio.h> 83219d632cSMatthew Dillon #include <sys/buf.h> 845f518366SJeff Roberson #include <sys/vmem.h> 857a469c8eSJeff Roberson #include <sys/vmmeter.h> 86df8bae1dSRodney W. Grimes 87df8bae1dSRodney W. Grimes #include <vm/vm.h> 88219d632cSMatthew Dillon #include <vm/vm_param.h> 89219d632cSMatthew Dillon #include <vm/vm_kern.h> 90efeaf95aSDavid Greenman #include <vm/vm_object.h> 91df8bae1dSRodney W. Grimes #include <vm/vm_page.h> 927a469c8eSJeff Roberson #include <vm/vm_phys.h> 93e2068d0bSJeff Roberson #include <vm/vm_pagequeue.h> 94efeaf95aSDavid Greenman #include <vm/vm_map.h> 9524a1cce3SDavid Greenman #include <vm/vm_pager.h> 96efeaf95aSDavid Greenman #include <vm/vm_extern.h> 97df8bae1dSRodney W. Grimes 98ae941b1bSGleb Smirnoff extern void uma_startup1(void); 99f7d35785SGleb Smirnoff extern void uma_startup2(void); 100ae941b1bSGleb Smirnoff extern void vm_radix_reserve_kva(void); 1017a469c8eSJeff Roberson 1020fca57b8SThomas Moestl long physmem; 1030fca57b8SThomas Moestl 104df8bae1dSRodney W. Grimes /* 1052b14f991SJulian Elischer * System initialization 1062b14f991SJulian Elischer */ 10711caded3SAlfred Perlstein static void vm_mem_init(void *); 108237fdd78SRobert Watson SYSINIT(vm_mem, SI_SUB_VM, SI_ORDER_FIRST, vm_mem_init, NULL); 1092b14f991SJulian Elischer 1102b14f991SJulian Elischer /* 111df8bae1dSRodney W. Grimes * vm_init initializes the virtual memory system. 112df8bae1dSRodney W. Grimes * This is done only by the first cpu up. 113df8bae1dSRodney W. Grimes * 114df8bae1dSRodney W. Grimes * The start and end address of physical memory is passed in. 115df8bae1dSRodney W. Grimes */ 1162b14f991SJulian Elischer static void 1171aed6d48SMark Johnston vm_mem_init(void *dummy) 118df8bae1dSRodney W. Grimes { 1195df87b21SJeff Roberson 120df8bae1dSRodney W. Grimes /* 12187ab1a10SMark Johnston * Initialize static domainsets, used by various allocators. 12287ab1a10SMark Johnston */ 12387ab1a10SMark Johnston domainset_init(); 12487ab1a10SMark Johnston 12587ab1a10SMark Johnston /* 126920239efSMark Johnston * Initialize resident memory structures. From here on, all physical 1270d94caffSDavid Greenman * memory is accounted for, and we use only virtual addresses. 128df8bae1dSRodney W. Grimes */ 12926f9a767SRodney W. Grimes vm_set_page_size(); 130889eb0fcSAlan Cox virtual_avail = vm_page_startup(virtual_avail); 131e7841165SDag-Erling Smørgrav 132920239efSMark Johnston /* 133920239efSMark Johnston * Set an initial domain policy for thread0 so that allocations 134920239efSMark Johnston * can work. 135920239efSMark Johnston */ 136920239efSMark Johnston domainset_zero(); 137920239efSMark Johnston 138ae941b1bSGleb Smirnoff #ifdef UMA_MD_SMALL_ALLOC 139ae941b1bSGleb Smirnoff /* Announce page availability to UMA. */ 140ae941b1bSGleb Smirnoff uma_startup1(); 141ae941b1bSGleb Smirnoff #endif 142df8bae1dSRodney W. Grimes /* 143df8bae1dSRodney W. Grimes * Initialize other VM packages 144df8bae1dSRodney W. Grimes */ 1455f518366SJeff Roberson vmem_startup(); 146a316d390SJohn Dyson vm_object_init(); 147df8bae1dSRodney W. Grimes vm_map_startup(); 148df8bae1dSRodney W. Grimes kmem_init(virtual_avail, virtual_end); 1495df87b21SJeff Roberson 150ae941b1bSGleb Smirnoff #ifndef UMA_MD_SMALL_ALLOC 151ae941b1bSGleb Smirnoff /* Set up radix zone to use noobj_alloc. */ 152ae941b1bSGleb Smirnoff vm_radix_reserve_kva(); 153ae941b1bSGleb Smirnoff #endif 154f7d35785SGleb Smirnoff /* Announce full page availability to UMA. */ 155f7d35785SGleb Smirnoff uma_startup2(); 1565df87b21SJeff Roberson kmem_init_zero_region(); 157bdb93eb2SAlan Cox pmap_init(); 158df8bae1dSRodney W. Grimes vm_pager_init(); 159df8bae1dSRodney W. Grimes } 160219d632cSMatthew Dillon 161219d632cSMatthew Dillon void 162219d632cSMatthew Dillon vm_ksubmap_init(struct kva_md_info *kmi) 163219d632cSMatthew Dillon { 164219d632cSMatthew Dillon vm_offset_t firstaddr; 165219d632cSMatthew Dillon caddr_t v; 166219d632cSMatthew Dillon vm_size_t size = 0; 167447b3772SPeter Wemm long physmem_est; 168219d632cSMatthew Dillon vm_offset_t minaddr; 169219d632cSMatthew Dillon vm_offset_t maxaddr; 170219d632cSMatthew Dillon 171219d632cSMatthew Dillon /* 172219d632cSMatthew Dillon * Allocate space for system data structures. 173219d632cSMatthew Dillon * The first available kernel virtual address is in "v". 174219d632cSMatthew Dillon * As pages of kernel virtual memory are allocated, "v" is incremented. 175219d632cSMatthew Dillon * As pages of memory are allocated and cleared, 176219d632cSMatthew Dillon * "firstaddr" is incremented. 177219d632cSMatthew Dillon */ 178219d632cSMatthew Dillon 179219d632cSMatthew Dillon /* 180219d632cSMatthew Dillon * Make two passes. The first pass calculates how much memory is 181219d632cSMatthew Dillon * needed and allocates it. The second pass assigns virtual 182219d632cSMatthew Dillon * addresses to the various data structures. 183219d632cSMatthew Dillon */ 184219d632cSMatthew Dillon firstaddr = 0; 185219d632cSMatthew Dillon again: 186219d632cSMatthew Dillon v = (caddr_t)firstaddr; 187219d632cSMatthew Dillon 188219d632cSMatthew Dillon /* 189219d632cSMatthew Dillon * Discount the physical memory larger than the size of kernel_map 190219d632cSMatthew Dillon * to avoid eating up all of KVA space. 191219d632cSMatthew Dillon */ 192f0165b1cSKonstantin Belousov physmem_est = lmin(physmem, btoc(vm_map_max(kernel_map) - 193f0165b1cSKonstantin Belousov vm_map_min(kernel_map))); 194219d632cSMatthew Dillon 195219d632cSMatthew Dillon v = kern_vfs_bio_buffer_alloc(v, physmem_est); 196219d632cSMatthew Dillon 197219d632cSMatthew Dillon /* 198219d632cSMatthew Dillon * End of first pass, size has been calculated so allocate memory 199219d632cSMatthew Dillon */ 200219d632cSMatthew Dillon if (firstaddr == 0) { 201857961d9SRobert Drehmel size = (vm_size_t)v; 202edb2994aSAndrew Gallatin #ifdef VM_FREELIST_DMA32 203edb2994aSAndrew Gallatin /* 204edb2994aSAndrew Gallatin * Try to protect 32-bit DMAable memory from the largest 205edb2994aSAndrew Gallatin * early alloc of wired mem. 206edb2994aSAndrew Gallatin */ 207db7c2a48SAlan Cox firstaddr = kmem_alloc_attr(size, M_ZERO | M_NOWAIT, 208db7c2a48SAlan Cox (vm_paddr_t)1 << 32, ~(vm_paddr_t)0, VM_MEMATTR_DEFAULT); 209edb2994aSAndrew Gallatin if (firstaddr == 0) 210edb2994aSAndrew Gallatin #endif 21183a90bffSAlan Cox firstaddr = kmem_malloc(size, M_ZERO | M_WAITOK); 212219d632cSMatthew Dillon if (firstaddr == 0) 213219d632cSMatthew Dillon panic("startup: no room for tables"); 214219d632cSMatthew Dillon goto again; 215219d632cSMatthew Dillon } 216219d632cSMatthew Dillon 217219d632cSMatthew Dillon /* 218219d632cSMatthew Dillon * End of second pass, addresses have been assigned 219219d632cSMatthew Dillon */ 220219d632cSMatthew Dillon if ((vm_size_t)((char *)v - firstaddr) != size) 221219d632cSMatthew Dillon panic("startup: table size inconsistency"); 222219d632cSMatthew Dillon 2235df87b21SJeff Roberson /* 224*46b0292aSGleb Smirnoff * Allocate the clean map to hold all of I/O virtual memory. 2255df87b21SJeff Roberson */ 226*46b0292aSGleb Smirnoff size = (long)nbuf * BKVASIZE + (long)bio_transient_maxcnt * MAXPHYS; 2275df87b21SJeff Roberson kmi->clean_sva = firstaddr = kva_alloc(size); 2285df87b21SJeff Roberson kmi->clean_eva = firstaddr + size; 2295f518366SJeff Roberson 2305df87b21SJeff Roberson /* 2315df87b21SJeff Roberson * Allocate the buffer arena. 23221fae961SJeff Roberson * 23321fae961SJeff Roberson * Enable the quantum cache if we have more than 4 cpus. This 23421fae961SJeff Roberson * avoids lock contention at the expense of some fragmentation. 2355df87b21SJeff Roberson */ 2365f518366SJeff Roberson size = (long)nbuf * BKVASIZE; 2375df87b21SJeff Roberson kmi->buffer_sva = firstaddr; 2385f518366SJeff Roberson kmi->buffer_eva = kmi->buffer_sva + size; 2395f518366SJeff Roberson vmem_init(buffer_arena, "buffer arena", kmi->buffer_sva, size, 24021fae961SJeff Roberson PAGE_SIZE, (mp_ncpus > 4) ? BKVASIZE * 8 : 0, 0); 2415df87b21SJeff Roberson firstaddr += size; 2425f518366SJeff Roberson 2435df87b21SJeff Roberson /* 2445df87b21SJeff Roberson * And optionally transient bio space. 2455df87b21SJeff Roberson */ 2467db07e1cSKonstantin Belousov if (bio_transient_maxcnt != 0) { 2475f518366SJeff Roberson size = (long)bio_transient_maxcnt * MAXPHYS; 2485f518366SJeff Roberson vmem_init(transient_arena, "transient arena", 2495df87b21SJeff Roberson firstaddr, size, PAGE_SIZE, 0, 0); 2505df87b21SJeff Roberson firstaddr += size; 2517db07e1cSKonstantin Belousov } 2525df87b21SJeff Roberson if (firstaddr != kmi->clean_eva) 2535df87b21SJeff Roberson panic("Clean map calculation incorrect"); 2545df87b21SJeff Roberson 2555df87b21SJeff Roberson /* 256ec492b13SMark Johnston * Allocate the pageable submaps. We may cache an exec map entry per 257ec492b13SMark Johnston * CPU, so we therefore need to reserve space for at least ncpu+1 258ec492b13SMark Johnston * entries to avoid deadlock. The exec map is also used by some image 259ec492b13SMark Johnston * activators, so we leave a fixed number of pages for their use. 2605df87b21SJeff Roberson */ 261ec492b13SMark Johnston #ifdef __LP64__ 262ec492b13SMark Johnston exec_map_entries = 8 * mp_ncpus; 263ec492b13SMark Johnston #else 2648d65cba2SMark Johnston exec_map_entries = 2 * mp_ncpus + 4; 265ec492b13SMark Johnston #endif 266ec492b13SMark Johnston exec_map_entry_size = round_page(PATH_MAX + ARG_MAX); 267219d632cSMatthew Dillon exec_map = kmem_suballoc(kernel_map, &minaddr, &maxaddr, 268ec492b13SMark Johnston exec_map_entries * exec_map_entry_size + 64 * PAGE_SIZE, FALSE); 2693202ed75SAlan Cox pipe_map = kmem_suballoc(kernel_map, &minaddr, &maxaddr, maxpipekva, 2703202ed75SAlan Cox FALSE); 271219d632cSMatthew Dillon } 272