11cdefd08SHans Petter Selasky /*- 21cdefd08SHans Petter Selasky * Copyright (c) 2010 Isilon Systems, Inc. 396fc97c8SStephen Hurd * Copyright (c) 2016 Matthew Macy (mmacy@mattmacy.io) 41cdefd08SHans Petter Selasky * Copyright (c) 2017 Mellanox Technologies, Ltd. 51cdefd08SHans Petter Selasky * All rights reserved. 61cdefd08SHans Petter Selasky * 71cdefd08SHans Petter Selasky * Redistribution and use in source and binary forms, with or without 81cdefd08SHans Petter Selasky * modification, are permitted provided that the following conditions 91cdefd08SHans Petter Selasky * are met: 101cdefd08SHans Petter Selasky * 1. Redistributions of source code must retain the above copyright 111cdefd08SHans Petter Selasky * notice unmodified, this list of conditions, and the following 121cdefd08SHans Petter Selasky * disclaimer. 131cdefd08SHans Petter Selasky * 2. Redistributions in binary form must reproduce the above copyright 141cdefd08SHans Petter Selasky * notice, this list of conditions and the following disclaimer in the 151cdefd08SHans Petter Selasky * documentation and/or other materials provided with the distribution. 161cdefd08SHans Petter Selasky * 171cdefd08SHans Petter Selasky * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 181cdefd08SHans Petter Selasky * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 191cdefd08SHans Petter Selasky * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 201cdefd08SHans Petter Selasky * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 211cdefd08SHans Petter Selasky * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 221cdefd08SHans Petter Selasky * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 231cdefd08SHans Petter Selasky * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 241cdefd08SHans Petter Selasky * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 251cdefd08SHans Petter Selasky * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 261cdefd08SHans Petter Selasky * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 271cdefd08SHans Petter Selasky */ 281cdefd08SHans Petter Selasky 291cdefd08SHans Petter Selasky #include <sys/cdefs.h> 301cdefd08SHans Petter Selasky __FBSDID("$FreeBSD$"); 311cdefd08SHans Petter Selasky 321cdefd08SHans Petter Selasky #include <sys/param.h> 331cdefd08SHans Petter Selasky #include <sys/systm.h> 341cdefd08SHans Petter Selasky #include <sys/malloc.h> 351cdefd08SHans Petter Selasky #include <sys/kernel.h> 361cdefd08SHans Petter Selasky #include <sys/sysctl.h> 371cdefd08SHans Petter Selasky #include <sys/lock.h> 381cdefd08SHans Petter Selasky #include <sys/mutex.h> 391cdefd08SHans Petter Selasky #include <sys/rwlock.h> 401cdefd08SHans Petter Selasky #include <sys/proc.h> 411cdefd08SHans Petter Selasky #include <sys/sched.h> 421cdefd08SHans Petter Selasky 431cdefd08SHans Petter Selasky #include <machine/bus.h> 441cdefd08SHans Petter Selasky 451cdefd08SHans Petter Selasky #include <vm/vm.h> 468186b527SHans Petter Selasky #include <vm/pmap.h> 478186b527SHans Petter Selasky #include <vm/vm_param.h> 488186b527SHans Petter Selasky #include <vm/vm_kern.h> 498186b527SHans Petter Selasky #include <vm/vm_object.h> 508186b527SHans Petter Selasky #include <vm/vm_map.h> 511cdefd08SHans Petter Selasky #include <vm/vm_page.h> 521cdefd08SHans Petter Selasky #include <vm/vm_pageout.h> 538186b527SHans Petter Selasky #include <vm/vm_pager.h> 548186b527SHans Petter Selasky #include <vm/vm_radix.h> 558186b527SHans Petter Selasky #include <vm/vm_reserv.h> 568186b527SHans Petter Selasky #include <vm/vm_extern.h> 578186b527SHans Petter Selasky 588186b527SHans Petter Selasky #include <vm/uma.h> 598186b527SHans Petter Selasky #include <vm/uma_int.h> 608186b527SHans Petter Selasky 618186b527SHans Petter Selasky #include <linux/gfp.h> 628186b527SHans Petter Selasky #include <linux/mm.h> 638186b527SHans Petter Selasky #include <linux/preempt.h> 64c05238a6SHans Petter Selasky #include <linux/fs.h> 651179b649SEmmanuel Vadot #include <linux/shmem_fs.h> 661cdefd08SHans Petter Selasky 678734a562SHans Petter Selasky void 688734a562SHans Petter Selasky si_meminfo(struct sysinfo *si) 698734a562SHans Petter Selasky { 708734a562SHans Petter Selasky si->totalram = physmem; 718734a562SHans Petter Selasky si->totalhigh = 0; 728734a562SHans Petter Selasky si->mem_unit = PAGE_SIZE; 738734a562SHans Petter Selasky } 748734a562SHans Petter Selasky 751cdefd08SHans Petter Selasky void * 761cdefd08SHans Petter Selasky linux_page_address(struct page *page) 771cdefd08SHans Petter Selasky { 78a8c348dbSHans Petter Selasky 79*546c117fSMark Johnston if (page->object != kernel_object) { 809a8196ceSNathan Whitehorn return (PMAP_HAS_DMAP ? 8151bd6f96SJustin Hibbits ((void *)(uintptr_t)PHYS_TO_DMAP(VM_PAGE_TO_PHYS(page))) : 8251bd6f96SJustin Hibbits NULL); 83a8c348dbSHans Petter Selasky } 841cdefd08SHans Petter Selasky return ((void *)(uintptr_t)(VM_MIN_KERNEL_ADDRESS + 851cdefd08SHans Petter Selasky IDX_TO_OFF(page->pindex))); 861cdefd08SHans Petter Selasky } 871cdefd08SHans Petter Selasky 881cdefd08SHans Petter Selasky vm_page_t 891cdefd08SHans Petter Selasky linux_alloc_pages(gfp_t flags, unsigned int order) 901cdefd08SHans Petter Selasky { 91ad6b97e7SNathan Whitehorn vm_page_t page; 92ad6b97e7SNathan Whitehorn 93ad6b97e7SNathan Whitehorn if (PMAP_HAS_DMAP) { 941cdefd08SHans Petter Selasky unsigned long npages = 1UL << order; 951ef5e651SMark Johnston int req = VM_ALLOC_NOOBJ | VM_ALLOC_WIRED | VM_ALLOC_NORMAL; 961cdefd08SHans Petter Selasky 971ef5e651SMark Johnston if ((flags & M_ZERO) != 0) 981ef5e651SMark Johnston req |= VM_ALLOC_ZERO; 991cdefd08SHans Petter Selasky if (order == 0 && (flags & GFP_DMA32) == 0) { 1001cdefd08SHans Petter Selasky page = vm_page_alloc(NULL, 0, req); 1011cdefd08SHans Petter Selasky if (page == NULL) 1021cdefd08SHans Petter Selasky return (NULL); 1031cdefd08SHans Petter Selasky } else { 1041cdefd08SHans Petter Selasky vm_paddr_t pmax = (flags & GFP_DMA32) ? 1051cdefd08SHans Petter Selasky BUS_SPACE_MAXADDR_32BIT : BUS_SPACE_MAXADDR; 1061cdefd08SHans Petter Selasky retry: 1071cdefd08SHans Petter Selasky page = vm_page_alloc_contig(NULL, 0, req, 1081cdefd08SHans Petter Selasky npages, 0, pmax, PAGE_SIZE, 0, VM_MEMATTR_DEFAULT); 1091cdefd08SHans Petter Selasky 1101cdefd08SHans Petter Selasky if (page == NULL) { 1111cdefd08SHans Petter Selasky if (flags & M_WAITOK) { 1121cdefd08SHans Petter Selasky if (!vm_page_reclaim_contig(req, 1131cdefd08SHans Petter Selasky npages, 0, pmax, PAGE_SIZE, 0)) { 1142c0f13aaSKonstantin Belousov vm_wait(NULL); 1151cdefd08SHans Petter Selasky } 1161cdefd08SHans Petter Selasky flags &= ~M_WAITOK; 1171cdefd08SHans Petter Selasky goto retry; 1181cdefd08SHans Petter Selasky } 1191cdefd08SHans Petter Selasky return (NULL); 1201cdefd08SHans Petter Selasky } 1211cdefd08SHans Petter Selasky } 1221cdefd08SHans Petter Selasky if (flags & M_ZERO) { 1231cdefd08SHans Petter Selasky unsigned long x; 1241cdefd08SHans Petter Selasky 1251cdefd08SHans Petter Selasky for (x = 0; x != npages; x++) { 1261cdefd08SHans Petter Selasky vm_page_t pgo = page + x; 1271cdefd08SHans Petter Selasky 1281cdefd08SHans Petter Selasky if ((pgo->flags & PG_ZERO) == 0) 1291cdefd08SHans Petter Selasky pmap_zero_page(pgo); 1301cdefd08SHans Petter Selasky } 1311cdefd08SHans Petter Selasky } 132ad6b97e7SNathan Whitehorn } else { 1331cdefd08SHans Petter Selasky vm_offset_t vaddr; 1341cdefd08SHans Petter Selasky 1351cdefd08SHans Petter Selasky vaddr = linux_alloc_kmem(flags, order); 1361cdefd08SHans Petter Selasky if (vaddr == 0) 1371cdefd08SHans Petter Selasky return (NULL); 1381cdefd08SHans Petter Selasky 1391cdefd08SHans Petter Selasky page = PHYS_TO_VM_PAGE(vtophys((void *)vaddr)); 1401cdefd08SHans Petter Selasky 1411cdefd08SHans Petter Selasky KASSERT(vaddr == (vm_offset_t)page_address(page), 1421cdefd08SHans Petter Selasky ("Page address mismatch")); 143ad6b97e7SNathan Whitehorn } 144ad6b97e7SNathan Whitehorn 1451cdefd08SHans Petter Selasky return (page); 1461cdefd08SHans Petter Selasky } 1471cdefd08SHans Petter Selasky 1481cdefd08SHans Petter Selasky void 1491cdefd08SHans Petter Selasky linux_free_pages(vm_page_t page, unsigned int order) 1501cdefd08SHans Petter Selasky { 1519a8196ceSNathan Whitehorn if (PMAP_HAS_DMAP) { 1521cdefd08SHans Petter Selasky unsigned long npages = 1UL << order; 1531cdefd08SHans Petter Selasky unsigned long x; 1541cdefd08SHans Petter Selasky 1551cdefd08SHans Petter Selasky for (x = 0; x != npages; x++) { 1561cdefd08SHans Petter Selasky vm_page_t pgo = page + x; 1571cdefd08SHans Petter Selasky 1581ef5e651SMark Johnston if (vm_page_unwire_noq(pgo)) 1591cdefd08SHans Petter Selasky vm_page_free(pgo); 1601cdefd08SHans Petter Selasky } 1619a8196ceSNathan Whitehorn } else { 1621cdefd08SHans Petter Selasky vm_offset_t vaddr; 1631cdefd08SHans Petter Selasky 1641cdefd08SHans Petter Selasky vaddr = (vm_offset_t)page_address(page); 1651cdefd08SHans Petter Selasky 1661cdefd08SHans Petter Selasky linux_free_kmem(vaddr, order); 1679a8196ceSNathan Whitehorn } 1681cdefd08SHans Petter Selasky } 1691cdefd08SHans Petter Selasky 1701cdefd08SHans Petter Selasky vm_offset_t 1711cdefd08SHans Petter Selasky linux_alloc_kmem(gfp_t flags, unsigned int order) 1721cdefd08SHans Petter Selasky { 1731cdefd08SHans Petter Selasky size_t size = ((size_t)PAGE_SIZE) << order; 1741cdefd08SHans Petter Selasky vm_offset_t addr; 1751cdefd08SHans Petter Selasky 1761cdefd08SHans Petter Selasky if ((flags & GFP_DMA32) == 0) { 17783a90bffSAlan Cox addr = kmem_malloc(size, flags & GFP_NATIVE_MASK); 1781cdefd08SHans Petter Selasky } else { 17944d0efb2SAlan Cox addr = kmem_alloc_contig(size, flags & GFP_NATIVE_MASK, 0, 18044d0efb2SAlan Cox BUS_SPACE_MAXADDR_32BIT, PAGE_SIZE, 0, VM_MEMATTR_DEFAULT); 1811cdefd08SHans Petter Selasky } 1821cdefd08SHans Petter Selasky return (addr); 1831cdefd08SHans Petter Selasky } 1841cdefd08SHans Petter Selasky 1851cdefd08SHans Petter Selasky void 1861cdefd08SHans Petter Selasky linux_free_kmem(vm_offset_t addr, unsigned int order) 1871cdefd08SHans Petter Selasky { 1881cdefd08SHans Petter Selasky size_t size = ((size_t)PAGE_SIZE) << order; 1891cdefd08SHans Petter Selasky 19049bfa624SAlan Cox kmem_free(addr, size); 1911cdefd08SHans Petter Selasky } 1928186b527SHans Petter Selasky 1938186b527SHans Petter Selasky static int 1948186b527SHans Petter Selasky linux_get_user_pages_internal(vm_map_t map, unsigned long start, int nr_pages, 1958186b527SHans Petter Selasky int write, struct page **pages) 1968186b527SHans Petter Selasky { 1978186b527SHans Petter Selasky vm_prot_t prot; 1988186b527SHans Petter Selasky size_t len; 1998186b527SHans Petter Selasky int count; 2008186b527SHans Petter Selasky 2018186b527SHans Petter Selasky prot = write ? (VM_PROT_READ | VM_PROT_WRITE) : VM_PROT_READ; 2028186b527SHans Petter Selasky len = ((size_t)nr_pages) << PAGE_SHIFT; 2038186b527SHans Petter Selasky count = vm_fault_quick_hold_pages(map, start, len, prot, pages, nr_pages); 204eeacb3b0SMark Johnston return (count == -1 ? -EFAULT : nr_pages); 2058186b527SHans Petter Selasky } 2068186b527SHans Petter Selasky 2078186b527SHans Petter Selasky int 2088186b527SHans Petter Selasky __get_user_pages_fast(unsigned long start, int nr_pages, int write, 2098186b527SHans Petter Selasky struct page **pages) 2108186b527SHans Petter Selasky { 2118186b527SHans Petter Selasky vm_map_t map; 2128186b527SHans Petter Selasky vm_page_t *mp; 2138186b527SHans Petter Selasky vm_offset_t va; 2148186b527SHans Petter Selasky vm_offset_t end; 2158186b527SHans Petter Selasky vm_prot_t prot; 2168186b527SHans Petter Selasky int count; 2178186b527SHans Petter Selasky 2188186b527SHans Petter Selasky if (nr_pages == 0 || in_interrupt()) 2198186b527SHans Petter Selasky return (0); 2208186b527SHans Petter Selasky 2218186b527SHans Petter Selasky MPASS(pages != NULL); 2228186b527SHans Petter Selasky va = start; 2238186b527SHans Petter Selasky map = &curthread->td_proc->p_vmspace->vm_map; 2248186b527SHans Petter Selasky end = start + (((size_t)nr_pages) << PAGE_SHIFT); 2258186b527SHans Petter Selasky if (start < vm_map_min(map) || end > vm_map_max(map)) 2268186b527SHans Petter Selasky return (-EINVAL); 2278186b527SHans Petter Selasky prot = write ? (VM_PROT_READ | VM_PROT_WRITE) : VM_PROT_READ; 2288186b527SHans Petter Selasky for (count = 0, mp = pages, va = start; va < end; 2298186b527SHans Petter Selasky mp++, va += PAGE_SIZE, count++) { 2308186b527SHans Petter Selasky *mp = pmap_extract_and_hold(map->pmap, va, prot); 2318186b527SHans Petter Selasky if (*mp == NULL) 2328186b527SHans Petter Selasky break; 2338186b527SHans Petter Selasky 2348186b527SHans Petter Selasky if ((prot & VM_PROT_WRITE) != 0 && 2358186b527SHans Petter Selasky (*mp)->dirty != VM_PAGE_BITS_ALL) { 2368186b527SHans Petter Selasky /* 2378186b527SHans Petter Selasky * Explicitly dirty the physical page. Otherwise, the 2388186b527SHans Petter Selasky * caller's changes may go unnoticed because they are 2398186b527SHans Petter Selasky * performed through an unmanaged mapping or by a DMA 2408186b527SHans Petter Selasky * operation. 2418186b527SHans Petter Selasky * 2428186b527SHans Petter Selasky * The object lock is not held here. 2438186b527SHans Petter Selasky * See vm_page_clear_dirty_mask(). 2448186b527SHans Petter Selasky */ 2458186b527SHans Petter Selasky vm_page_dirty(*mp); 2468186b527SHans Petter Selasky } 2478186b527SHans Petter Selasky } 2488186b527SHans Petter Selasky return (count); 2498186b527SHans Petter Selasky } 2508186b527SHans Petter Selasky 2518186b527SHans Petter Selasky long 2528186b527SHans Petter Selasky get_user_pages_remote(struct task_struct *task, struct mm_struct *mm, 2538186b527SHans Petter Selasky unsigned long start, unsigned long nr_pages, int gup_flags, 2548186b527SHans Petter Selasky struct page **pages, struct vm_area_struct **vmas) 2558186b527SHans Petter Selasky { 2568186b527SHans Petter Selasky vm_map_t map; 2578186b527SHans Petter Selasky 25868b9f2f0SHans Petter Selasky map = &task->task_thread->td_proc->p_vmspace->vm_map; 2598186b527SHans Petter Selasky return (linux_get_user_pages_internal(map, start, nr_pages, 2608186b527SHans Petter Selasky !!(gup_flags & FOLL_WRITE), pages)); 2618186b527SHans Petter Selasky } 2628186b527SHans Petter Selasky 2638186b527SHans Petter Selasky long 2648186b527SHans Petter Selasky get_user_pages(unsigned long start, unsigned long nr_pages, int gup_flags, 2658186b527SHans Petter Selasky struct page **pages, struct vm_area_struct **vmas) 2668186b527SHans Petter Selasky { 2678186b527SHans Petter Selasky vm_map_t map; 2688186b527SHans Petter Selasky 2698186b527SHans Petter Selasky map = &curthread->td_proc->p_vmspace->vm_map; 2708186b527SHans Petter Selasky return (linux_get_user_pages_internal(map, start, nr_pages, 2718186b527SHans Petter Selasky !!(gup_flags & FOLL_WRITE), pages)); 2728186b527SHans Petter Selasky } 2738186b527SHans Petter Selasky 2748186b527SHans Petter Selasky int 2758186b527SHans Petter Selasky is_vmalloc_addr(const void *addr) 2768186b527SHans Petter Selasky { 2778186b527SHans Petter Selasky return (vtoslab((vm_offset_t)addr & ~UMA_SLAB_MASK) != NULL); 2788186b527SHans Petter Selasky } 279