1c0587701SJoel Dahl /*- 2e3813573SMatthew D Fleming * Copyright (c) 2005, Bosko Milekic <bmilekic@FreeBSD.org>. 3e3813573SMatthew D Fleming * Copyright (c) 2010 Isilon Systems, Inc. (http://www.isilon.com/) 4e3813573SMatthew D Fleming * All rights reserved. 5e4eb384bSBosko Milekic * 6e4eb384bSBosko Milekic * Redistribution and use in source and binary forms, with or without 7e4eb384bSBosko Milekic * modification, are permitted provided that the following conditions 8e4eb384bSBosko Milekic * are met: 9e4eb384bSBosko Milekic * 1. Redistributions of source code must retain the above copyright 10e4eb384bSBosko Milekic * notice unmodified, this list of conditions, and the following 11e4eb384bSBosko Milekic * disclaimer. 12e4eb384bSBosko Milekic * 2. Redistributions in binary form must reproduce the above copyright 13e4eb384bSBosko Milekic * notice, this list of conditions and the following disclaimer in the 14e4eb384bSBosko Milekic * documentation and/or other materials provided with the distribution. 15e4eb384bSBosko Milekic * 16e4eb384bSBosko Milekic * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 17e4eb384bSBosko Milekic * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 18e4eb384bSBosko Milekic * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 19e4eb384bSBosko Milekic * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 20e4eb384bSBosko Milekic * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 21e4eb384bSBosko Milekic * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 22e4eb384bSBosko Milekic * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 23e4eb384bSBosko Milekic * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 24e4eb384bSBosko Milekic * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 25e4eb384bSBosko Milekic * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 26e4eb384bSBosko Milekic */ 27e4eb384bSBosko Milekic 28e4eb384bSBosko Milekic #include <sys/cdefs.h> 29e4eb384bSBosko Milekic __FBSDID("$FreeBSD$"); 30e4eb384bSBosko Milekic 31e4eb384bSBosko Milekic /* 32e4eb384bSBosko Milekic * MemGuard is a simple replacement allocator for debugging only 33e4eb384bSBosko Milekic * which provides ElectricFence-style memory barrier protection on 34e4eb384bSBosko Milekic * objects being allocated, and is used to detect tampering-after-free 35e4eb384bSBosko Milekic * scenarios. 36e4eb384bSBosko Milekic * 37e4eb384bSBosko Milekic * See the memguard(9) man page for more information on using MemGuard. 38e4eb384bSBosko Milekic */ 39e4eb384bSBosko Milekic 40f02d86e2SMatthew D Fleming #include "opt_vm.h" 41f02d86e2SMatthew D Fleming 42e4eb384bSBosko Milekic #include <sys/param.h> 43e4eb384bSBosko Milekic #include <sys/systm.h> 44e4eb384bSBosko Milekic #include <sys/kernel.h> 45e4eb384bSBosko Milekic #include <sys/types.h> 46e4eb384bSBosko Milekic #include <sys/queue.h> 47e4eb384bSBosko Milekic #include <sys/lock.h> 48e4eb384bSBosko Milekic #include <sys/mutex.h> 49e4eb384bSBosko Milekic #include <sys/malloc.h> 50d362c40dSPawel Jakub Dawidek #include <sys/sysctl.h> 515df87b21SJeff Roberson #include <sys/vmem.h> 52e4eb384bSBosko Milekic 53e4eb384bSBosko Milekic #include <vm/vm.h> 54e3813573SMatthew D Fleming #include <vm/uma.h> 5503412565SBosko Milekic #include <vm/vm_param.h> 56e4eb384bSBosko Milekic #include <vm/vm_page.h> 57e4eb384bSBosko Milekic #include <vm/vm_map.h> 58e3813573SMatthew D Fleming #include <vm/vm_object.h> 59*8441d1e8SJeff Roberson #include <vm/vm_kern.h> 60e4eb384bSBosko Milekic #include <vm/vm_extern.h> 618d689e04SGleb Smirnoff #include <vm/uma_int.h> 62e4eb384bSBosko Milekic #include <vm/memguard.h> 63e4eb384bSBosko Milekic 646472ac3dSEd Schouten static SYSCTL_NODE(_vm, OID_AUTO, memguard, CTLFLAG_RW, NULL, "MemGuard data"); 65d362c40dSPawel Jakub Dawidek /* 66d362c40dSPawel Jakub Dawidek * The vm_memguard_divisor variable controls how much of kmem_map should be 67d362c40dSPawel Jakub Dawidek * reserved for MemGuard. 68d362c40dSPawel Jakub Dawidek */ 69e3813573SMatthew D Fleming static u_int vm_memguard_divisor; 70e3813573SMatthew D Fleming SYSCTL_UINT(_vm_memguard, OID_AUTO, divisor, CTLFLAG_RDTUN, 71e3813573SMatthew D Fleming &vm_memguard_divisor, 72d362c40dSPawel Jakub Dawidek 0, "(kmem_size/memguard_divisor) == memguard submap size"); 73d362c40dSPawel Jakub Dawidek 74d362c40dSPawel Jakub Dawidek /* 75d362c40dSPawel Jakub Dawidek * Short description (ks_shortdesc) of memory type to monitor. 76d362c40dSPawel Jakub Dawidek */ 77d362c40dSPawel Jakub Dawidek static char vm_memguard_desc[128] = ""; 78d362c40dSPawel Jakub Dawidek static struct malloc_type *vm_memguard_mtype = NULL; 79d362c40dSPawel Jakub Dawidek TUNABLE_STR("vm.memguard.desc", vm_memguard_desc, sizeof(vm_memguard_desc)); 80d362c40dSPawel Jakub Dawidek static int 81d362c40dSPawel Jakub Dawidek memguard_sysctl_desc(SYSCTL_HANDLER_ARGS) 82d362c40dSPawel Jakub Dawidek { 83e3813573SMatthew D Fleming char desc[sizeof(vm_memguard_desc)]; 84e3813573SMatthew D Fleming int error; 85d362c40dSPawel Jakub Dawidek 86d362c40dSPawel Jakub Dawidek strlcpy(desc, vm_memguard_desc, sizeof(desc)); 87d362c40dSPawel Jakub Dawidek error = sysctl_handle_string(oidp, desc, sizeof(desc), req); 88d362c40dSPawel Jakub Dawidek if (error != 0 || req->newptr == NULL) 89d362c40dSPawel Jakub Dawidek return (error); 90d362c40dSPawel Jakub Dawidek 91d362c40dSPawel Jakub Dawidek mtx_lock(&malloc_mtx); 92d362c40dSPawel Jakub Dawidek /* 93d362c40dSPawel Jakub Dawidek * If mtp is NULL, it will be initialized in memguard_cmp(). 94d362c40dSPawel Jakub Dawidek */ 95e3813573SMatthew D Fleming vm_memguard_mtype = malloc_desc2type(desc); 96d362c40dSPawel Jakub Dawidek strlcpy(vm_memguard_desc, desc, sizeof(vm_memguard_desc)); 97d362c40dSPawel Jakub Dawidek mtx_unlock(&malloc_mtx); 98d362c40dSPawel Jakub Dawidek return (error); 99d362c40dSPawel Jakub Dawidek } 100e3813573SMatthew D Fleming SYSCTL_PROC(_vm_memguard, OID_AUTO, desc, 101e3813573SMatthew D Fleming CTLTYPE_STRING | CTLFLAG_RW | CTLFLAG_MPSAFE, 0, 0, 102d362c40dSPawel Jakub Dawidek memguard_sysctl_desc, "A", "Short description of memory type to monitor"); 103d362c40dSPawel Jakub Dawidek 104e3813573SMatthew D Fleming static vm_offset_t memguard_cursor; 1055df87b21SJeff Roberson static vm_offset_t memguard_base; 106e3813573SMatthew D Fleming static vm_size_t memguard_mapsize; 107e3813573SMatthew D Fleming static vm_size_t memguard_physlimit; 108e3813573SMatthew D Fleming static u_long memguard_wasted; 109e3813573SMatthew D Fleming static u_long memguard_wrap; 110e3813573SMatthew D Fleming static u_long memguard_succ; 111e3813573SMatthew D Fleming static u_long memguard_fail_kva; 112e3813573SMatthew D Fleming static u_long memguard_fail_pgs; 113e3813573SMatthew D Fleming 114e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, cursor, CTLFLAG_RD, 115e3813573SMatthew D Fleming &memguard_cursor, 0, "MemGuard cursor"); 116e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, mapsize, CTLFLAG_RD, 1175df87b21SJeff Roberson &memguard_mapsize, 0, "MemGuard private arena size"); 118e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, phys_limit, CTLFLAG_RD, 119e3813573SMatthew D Fleming &memguard_physlimit, 0, "Limit on MemGuard memory consumption"); 120e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, wasted, CTLFLAG_RD, 121e3813573SMatthew D Fleming &memguard_wasted, 0, "Excess memory used through page promotion"); 122e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, wrapcnt, CTLFLAG_RD, 123e3813573SMatthew D Fleming &memguard_wrap, 0, "MemGuard cursor wrap count"); 124e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, numalloc, CTLFLAG_RD, 125e3813573SMatthew D Fleming &memguard_succ, 0, "Count of successful MemGuard allocations"); 126e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, fail_kva, CTLFLAG_RD, 127e3813573SMatthew D Fleming &memguard_fail_kva, 0, "MemGuard failures due to lack of KVA"); 128e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, fail_pgs, CTLFLAG_RD, 129e3813573SMatthew D Fleming &memguard_fail_pgs, 0, "MemGuard failures due to lack of pages"); 130e3813573SMatthew D Fleming 1318d689e04SGleb Smirnoff #define MG_GUARD_AROUND 0x001 1328d689e04SGleb Smirnoff #define MG_GUARD_ALLLARGE 0x002 1338d689e04SGleb Smirnoff #define MG_GUARD_NOFREE 0x004 1348d689e04SGleb Smirnoff static int memguard_options = MG_GUARD_AROUND; 135e3813573SMatthew D Fleming TUNABLE_INT("vm.memguard.options", &memguard_options); 136e3813573SMatthew D Fleming SYSCTL_INT(_vm_memguard, OID_AUTO, options, CTLFLAG_RW, 137e3813573SMatthew D Fleming &memguard_options, 0, 138e3813573SMatthew D Fleming "MemGuard options:\n" 139e3813573SMatthew D Fleming "\t0x001 - add guard pages around each allocation\n" 1408d689e04SGleb Smirnoff "\t0x002 - always use MemGuard for allocations over a page\n" 1418d689e04SGleb Smirnoff "\t0x004 - guard uma(9) zones with UMA_ZONE_NOFREE flag"); 142e3813573SMatthew D Fleming 143e3813573SMatthew D Fleming static u_int memguard_minsize; 144e3813573SMatthew D Fleming static u_long memguard_minsize_reject; 145e3813573SMatthew D Fleming SYSCTL_UINT(_vm_memguard, OID_AUTO, minsize, CTLFLAG_RW, 146e3813573SMatthew D Fleming &memguard_minsize, 0, "Minimum size for page promotion"); 147e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, minsize_reject, CTLFLAG_RD, 148e3813573SMatthew D Fleming &memguard_minsize_reject, 0, "# times rejected for size"); 149e3813573SMatthew D Fleming 150e3813573SMatthew D Fleming static u_int memguard_frequency; 151e3813573SMatthew D Fleming static u_long memguard_frequency_hits; 152e3813573SMatthew D Fleming TUNABLE_INT("vm.memguard.frequency", &memguard_frequency); 153e3813573SMatthew D Fleming SYSCTL_UINT(_vm_memguard, OID_AUTO, frequency, CTLFLAG_RW, 154e3813573SMatthew D Fleming &memguard_frequency, 0, "Times in 100000 that MemGuard will randomly run"); 155e3813573SMatthew D Fleming SYSCTL_ULONG(_vm_memguard, OID_AUTO, frequency_hits, CTLFLAG_RD, 156e3813573SMatthew D Fleming &memguard_frequency_hits, 0, "# times MemGuard randomly chose"); 157e3813573SMatthew D Fleming 158e4eb384bSBosko Milekic 159e4eb384bSBosko Milekic /* 160e3813573SMatthew D Fleming * Return a fudged value to be used for vm_kmem_size for allocating 161e3813573SMatthew D Fleming * the kmem_map. The memguard memory will be a submap. 162e4eb384bSBosko Milekic */ 163e3813573SMatthew D Fleming unsigned long 164f806cdcfSMatthew D Fleming memguard_fudge(unsigned long km_size, const struct vm_map *parent_map) 165e3813573SMatthew D Fleming { 166f806cdcfSMatthew D Fleming u_long mem_pgs, parent_size; 167e4eb384bSBosko Milekic 168e3813573SMatthew D Fleming vm_memguard_divisor = 10; 169e3813573SMatthew D Fleming TUNABLE_INT_FETCH("vm.memguard.divisor", &vm_memguard_divisor); 170e3813573SMatthew D Fleming 171f806cdcfSMatthew D Fleming parent_size = vm_map_max(parent_map) - vm_map_min(parent_map) + 172f806cdcfSMatthew D Fleming PAGE_SIZE; 173e3813573SMatthew D Fleming /* Pick a conservative value if provided value sucks. */ 174e3813573SMatthew D Fleming if ((vm_memguard_divisor <= 0) || 175f806cdcfSMatthew D Fleming ((parent_size / vm_memguard_divisor) == 0)) 176e3813573SMatthew D Fleming vm_memguard_divisor = 10; 177e4eb384bSBosko Milekic /* 178e3813573SMatthew D Fleming * Limit consumption of physical pages to 179e3813573SMatthew D Fleming * 1/vm_memguard_divisor of system memory. If the KVA is 180e3813573SMatthew D Fleming * smaller than this then the KVA limit comes into play first. 181e3813573SMatthew D Fleming * This prevents memguard's page promotions from completely 182e3813573SMatthew D Fleming * using up memory, since most malloc(9) calls are sub-page. 183e4eb384bSBosko Milekic */ 184f806cdcfSMatthew D Fleming mem_pgs = cnt.v_page_count; 185e3813573SMatthew D Fleming memguard_physlimit = (mem_pgs / vm_memguard_divisor) * PAGE_SIZE; 186e3813573SMatthew D Fleming /* 187e3813573SMatthew D Fleming * We want as much KVA as we can take safely. Use at most our 188f806cdcfSMatthew D Fleming * allotted fraction of the parent map's size. Limit this to 189f806cdcfSMatthew D Fleming * twice the physical memory to avoid using too much memory as 190f806cdcfSMatthew D Fleming * pagetable pages (size must be multiple of PAGE_SIZE). 191e3813573SMatthew D Fleming */ 192f806cdcfSMatthew D Fleming memguard_mapsize = round_page(parent_size / vm_memguard_divisor); 193f806cdcfSMatthew D Fleming if (memguard_mapsize / (2 * PAGE_SIZE) > mem_pgs) 194e3813573SMatthew D Fleming memguard_mapsize = mem_pgs * 2 * PAGE_SIZE; 195f806cdcfSMatthew D Fleming if (km_size + memguard_mapsize > parent_size) 196f806cdcfSMatthew D Fleming memguard_mapsize = 0; 197e3813573SMatthew D Fleming return (km_size + memguard_mapsize); 198e3813573SMatthew D Fleming } 199e4eb384bSBosko Milekic 200e4eb384bSBosko Milekic /* 201e4eb384bSBosko Milekic * Initialize the MemGuard mock allocator. All objects from MemGuard come 202e4eb384bSBosko Milekic * out of a single VM map (contiguous chunk of address space). 203e4eb384bSBosko Milekic */ 204e4eb384bSBosko Milekic void 2055df87b21SJeff Roberson memguard_init(vmem_t *parent) 206e4eb384bSBosko Milekic { 2075df87b21SJeff Roberson vm_offset_t base; 208e4eb384bSBosko Milekic 209*8441d1e8SJeff Roberson vmem_alloc(parent, memguard_mapsize, M_BESTFIT | M_WAITOK, &base); 210*8441d1e8SJeff Roberson vmem_init(memguard_arena, "memguard arena", base, memguard_mapsize, 2115df87b21SJeff Roberson PAGE_SIZE, 0, M_WAITOK); 212e3813573SMatthew D Fleming memguard_cursor = base; 2135df87b21SJeff Roberson memguard_base = base; 214e4eb384bSBosko Milekic 215e4eb384bSBosko Milekic printf("MEMGUARD DEBUGGING ALLOCATOR INITIALIZED:\n"); 216e3813573SMatthew D Fleming printf("\tMEMGUARD map base: 0x%lx\n", (u_long)base); 217e3813573SMatthew D Fleming printf("\tMEMGUARD map size: %jd KBytes\n", 218e3813573SMatthew D Fleming (uintmax_t)memguard_mapsize >> 10); 219e4eb384bSBosko Milekic } 220e4eb384bSBosko Milekic 221e4eb384bSBosko Milekic /* 222e3813573SMatthew D Fleming * Run things that can't be done as early as memguard_init(). 223e3813573SMatthew D Fleming */ 224e3813573SMatthew D Fleming static void 225e3813573SMatthew D Fleming memguard_sysinit(void) 226e3813573SMatthew D Fleming { 227e3813573SMatthew D Fleming struct sysctl_oid_list *parent; 228e3813573SMatthew D Fleming 229e3813573SMatthew D Fleming parent = SYSCTL_STATIC_CHILDREN(_vm_memguard); 230e3813573SMatthew D Fleming 231e3813573SMatthew D Fleming SYSCTL_ADD_ULONG(NULL, parent, OID_AUTO, "mapstart", CTLFLAG_RD, 2325df87b21SJeff Roberson &memguard_base, "MemGuard KVA base"); 233e3813573SMatthew D Fleming SYSCTL_ADD_ULONG(NULL, parent, OID_AUTO, "maplimit", CTLFLAG_RD, 2345df87b21SJeff Roberson &memguard_mapsize, "MemGuard KVA size"); 2355df87b21SJeff Roberson #if 0 236e3813573SMatthew D Fleming SYSCTL_ADD_ULONG(NULL, parent, OID_AUTO, "mapused", CTLFLAG_RD, 237e3813573SMatthew D Fleming &memguard_map->size, "MemGuard KVA used"); 2385df87b21SJeff Roberson #endif 239e3813573SMatthew D Fleming } 240e3813573SMatthew D Fleming SYSINIT(memguard, SI_SUB_KLD, SI_ORDER_ANY, memguard_sysinit, NULL); 241e3813573SMatthew D Fleming 242e3813573SMatthew D Fleming /* 243e3813573SMatthew D Fleming * v2sizep() converts a virtual address of the first page allocated for 244e3813573SMatthew D Fleming * an item to a pointer to u_long recording the size of the original 245e3813573SMatthew D Fleming * allocation request. 246e3813573SMatthew D Fleming * 247e3813573SMatthew D Fleming * This routine is very similar to those defined by UMA in uma_int.h. 248e3813573SMatthew D Fleming * The difference is that this routine stores the originally allocated 249e3813573SMatthew D Fleming * size in one of the page's fields that is unused when the page is 250e3813573SMatthew D Fleming * wired rather than the object field, which is used. 251e3813573SMatthew D Fleming */ 252e3813573SMatthew D Fleming static u_long * 253e3813573SMatthew D Fleming v2sizep(vm_offset_t va) 254e3813573SMatthew D Fleming { 255a2a200a2SMatthew D Fleming vm_paddr_t pa; 256e3813573SMatthew D Fleming struct vm_page *p; 257e3813573SMatthew D Fleming 258a2a200a2SMatthew D Fleming pa = pmap_kextract(va); 259a2a200a2SMatthew D Fleming if (pa == 0) 260a2a200a2SMatthew D Fleming panic("MemGuard detected double-free of %p", (void *)va); 261a2a200a2SMatthew D Fleming p = PHYS_TO_VM_PAGE(pa); 262e3813573SMatthew D Fleming KASSERT(p->wire_count != 0 && p->queue == PQ_NONE, 263e3813573SMatthew D Fleming ("MEMGUARD: Expected wired page %p in vtomgfifo!", p)); 264c325e866SKonstantin Belousov return (&p->plinks.memguard.p); 265e3813573SMatthew D Fleming } 266e3813573SMatthew D Fleming 2675df87b21SJeff Roberson static u_long * 2685df87b21SJeff Roberson v2sizev(vm_offset_t va) 2695df87b21SJeff Roberson { 2705df87b21SJeff Roberson vm_paddr_t pa; 2715df87b21SJeff Roberson struct vm_page *p; 2725df87b21SJeff Roberson 2735df87b21SJeff Roberson pa = pmap_kextract(va); 2745df87b21SJeff Roberson if (pa == 0) 2755df87b21SJeff Roberson panic("MemGuard detected double-free of %p", (void *)va); 2765df87b21SJeff Roberson p = PHYS_TO_VM_PAGE(pa); 2775df87b21SJeff Roberson KASSERT(p->wire_count != 0 && p->queue == PQ_NONE, 2785df87b21SJeff Roberson ("MEMGUARD: Expected wired page %p in vtomgfifo!", p)); 279c325e866SKonstantin Belousov return (&p->plinks.memguard.v); 2805df87b21SJeff Roberson } 2815df87b21SJeff Roberson 282e3813573SMatthew D Fleming /* 283e3813573SMatthew D Fleming * Allocate a single object of specified size with specified flags 284e3813573SMatthew D Fleming * (either M_WAITOK or M_NOWAIT). 285e4eb384bSBosko Milekic */ 286e4eb384bSBosko Milekic void * 287e3813573SMatthew D Fleming memguard_alloc(unsigned long req_size, int flags) 288e4eb384bSBosko Milekic { 289e3813573SMatthew D Fleming vm_offset_t addr; 290e3813573SMatthew D Fleming u_long size_p, size_v; 291e3813573SMatthew D Fleming int do_guard, rv; 292e4eb384bSBosko Milekic 293e3813573SMatthew D Fleming size_p = round_page(req_size); 294e3813573SMatthew D Fleming if (size_p == 0) 295e3813573SMatthew D Fleming return (NULL); 296e4eb384bSBosko Milekic /* 297e3813573SMatthew D Fleming * To ensure there are holes on both sides of the allocation, 298e3813573SMatthew D Fleming * request 2 extra pages of KVA. We will only actually add a 299e3813573SMatthew D Fleming * vm_map_entry and get pages for the original request. Save 300e3813573SMatthew D Fleming * the value of memguard_options so we have a consistent 301e3813573SMatthew D Fleming * value. 302e4eb384bSBosko Milekic */ 303e3813573SMatthew D Fleming size_v = size_p; 3048d689e04SGleb Smirnoff do_guard = (memguard_options & MG_GUARD_AROUND) != 0; 305e3813573SMatthew D Fleming if (do_guard) 306e3813573SMatthew D Fleming size_v += 2 * PAGE_SIZE; 307e4eb384bSBosko Milekic 308e3813573SMatthew D Fleming /* 309e3813573SMatthew D Fleming * When we pass our memory limit, reject sub-page allocations. 310e3813573SMatthew D Fleming * Page-size and larger allocations will use the same amount 311e3813573SMatthew D Fleming * of physical memory whether we allocate or hand off to 312e3813573SMatthew D Fleming * uma_large_alloc(), so keep those. 313e3813573SMatthew D Fleming */ 314*8441d1e8SJeff Roberson if (vmem_size(memguard_arena, VMEM_ALLOC) >= memguard_physlimit && 315e3813573SMatthew D Fleming req_size < PAGE_SIZE) { 316e3813573SMatthew D Fleming addr = (vm_offset_t)NULL; 317e3813573SMatthew D Fleming memguard_fail_pgs++; 318e3813573SMatthew D Fleming goto out; 319e4eb384bSBosko Milekic } 320e3813573SMatthew D Fleming /* 321e3813573SMatthew D Fleming * Keep a moving cursor so we don't recycle KVA as long as 322e3813573SMatthew D Fleming * possible. It's not perfect, since we don't know in what 323e3813573SMatthew D Fleming * order previous allocations will be free'd, but it's simple 324e3813573SMatthew D Fleming * and fast, and requires O(1) additional storage if guard 325e3813573SMatthew D Fleming * pages are not used. 326e3813573SMatthew D Fleming * 327e3813573SMatthew D Fleming * XXX This scheme will lead to greater fragmentation of the 328e3813573SMatthew D Fleming * map, unless vm_map_findspace() is tweaked. 329e3813573SMatthew D Fleming */ 330e3813573SMatthew D Fleming for (;;) { 331*8441d1e8SJeff Roberson if (vmem_xalloc(memguard_arena, size_v, 0, 0, 0, 332*8441d1e8SJeff Roberson memguard_cursor, VMEM_ADDR_MAX, 333*8441d1e8SJeff Roberson M_BESTFIT | M_NOWAIT, &addr) == 0) 334e3813573SMatthew D Fleming break; 335e3813573SMatthew D Fleming /* 336e3813573SMatthew D Fleming * The map has no space. This may be due to 337e3813573SMatthew D Fleming * fragmentation, or because the cursor is near the 338e3813573SMatthew D Fleming * end of the map. 339e3813573SMatthew D Fleming */ 3405df87b21SJeff Roberson if (memguard_cursor == memguard_base) { 341e3813573SMatthew D Fleming memguard_fail_kva++; 342e3813573SMatthew D Fleming addr = (vm_offset_t)NULL; 343e3813573SMatthew D Fleming goto out; 344e3813573SMatthew D Fleming } 345e3813573SMatthew D Fleming memguard_wrap++; 3465df87b21SJeff Roberson memguard_cursor = memguard_base; 347e3813573SMatthew D Fleming } 348e3813573SMatthew D Fleming if (do_guard) 349e3813573SMatthew D Fleming addr += PAGE_SIZE; 3505df87b21SJeff Roberson rv = kmem_back(kmem_object, addr, size_p, flags); 351e3813573SMatthew D Fleming if (rv != KERN_SUCCESS) { 352*8441d1e8SJeff Roberson vmem_xfree(memguard_arena, addr, size_v); 353e3813573SMatthew D Fleming memguard_fail_pgs++; 354e3813573SMatthew D Fleming addr = (vm_offset_t)NULL; 355e3813573SMatthew D Fleming goto out; 356e3813573SMatthew D Fleming } 3575df87b21SJeff Roberson memguard_cursor = addr + size_v; 358e3813573SMatthew D Fleming *v2sizep(trunc_page(addr)) = req_size; 3595df87b21SJeff Roberson *v2sizev(trunc_page(addr)) = size_v; 360e3813573SMatthew D Fleming memguard_succ++; 361e3813573SMatthew D Fleming if (req_size < PAGE_SIZE) { 362e3813573SMatthew D Fleming memguard_wasted += (PAGE_SIZE - req_size); 363e3813573SMatthew D Fleming if (do_guard) { 364e3813573SMatthew D Fleming /* 365e3813573SMatthew D Fleming * Align the request to 16 bytes, and return 366e3813573SMatthew D Fleming * an address near the end of the page, to 367e3813573SMatthew D Fleming * better detect array overrun. 368e3813573SMatthew D Fleming */ 369e3813573SMatthew D Fleming req_size = roundup2(req_size, 16); 370e3813573SMatthew D Fleming addr += (PAGE_SIZE - req_size); 371e3813573SMatthew D Fleming } 372e3813573SMatthew D Fleming } 373e3813573SMatthew D Fleming out: 374e3813573SMatthew D Fleming return ((void *)addr); 375e3813573SMatthew D Fleming } 376e3813573SMatthew D Fleming 377e3813573SMatthew D Fleming int 378e3813573SMatthew D Fleming is_memguard_addr(void *addr) 379e3813573SMatthew D Fleming { 380e3813573SMatthew D Fleming vm_offset_t a = (vm_offset_t)(uintptr_t)addr; 381e3813573SMatthew D Fleming 3825df87b21SJeff Roberson return (a >= memguard_base && a < memguard_base + memguard_mapsize); 383e4eb384bSBosko Milekic } 384e4eb384bSBosko Milekic 385e4eb384bSBosko Milekic /* 386e4eb384bSBosko Milekic * Free specified single object. 387e4eb384bSBosko Milekic */ 388e4eb384bSBosko Milekic void 389e3813573SMatthew D Fleming memguard_free(void *ptr) 390e4eb384bSBosko Milekic { 391e3813573SMatthew D Fleming vm_offset_t addr; 3925df87b21SJeff Roberson u_long req_size, size, sizev; 393e3813573SMatthew D Fleming char *temp; 394e3813573SMatthew D Fleming int i; 395e4eb384bSBosko Milekic 396e3813573SMatthew D Fleming addr = trunc_page((uintptr_t)ptr); 397e3813573SMatthew D Fleming req_size = *v2sizep(addr); 3985df87b21SJeff Roberson sizev = *v2sizev(addr); 399e3813573SMatthew D Fleming size = round_page(req_size); 40003412565SBosko Milekic 40103412565SBosko Milekic /* 402e3813573SMatthew D Fleming * Page should not be guarded right now, so force a write. 403e3813573SMatthew D Fleming * The purpose of this is to increase the likelihood of 404e3813573SMatthew D Fleming * catching a double-free, but not necessarily a 405e3813573SMatthew D Fleming * tamper-after-free (the second thread freeing might not 406e3813573SMatthew D Fleming * write before freeing, so this forces it to and, 407e3813573SMatthew D Fleming * subsequently, trigger a fault). 40803412565SBosko Milekic */ 409e3813573SMatthew D Fleming temp = ptr; 410e3813573SMatthew D Fleming for (i = 0; i < size; i += PAGE_SIZE) 411e3813573SMatthew D Fleming temp[i] = 'M'; 41203412565SBosko Milekic 413e3813573SMatthew D Fleming /* 414e3813573SMatthew D Fleming * This requires carnal knowledge of the implementation of 415e3813573SMatthew D Fleming * kmem_free(), but since we've already replaced kmem_malloc() 416e3813573SMatthew D Fleming * above, it's not really any worse. We want to use the 417e3813573SMatthew D Fleming * vm_map lock to serialize updates to memguard_wasted, since 418e3813573SMatthew D Fleming * we had the lock at increment. 419e3813573SMatthew D Fleming */ 4205df87b21SJeff Roberson kmem_unback(kmem_object, addr, size); 4215df87b21SJeff Roberson if (sizev > size) 4225df87b21SJeff Roberson addr -= PAGE_SIZE; 423*8441d1e8SJeff Roberson vmem_xfree(memguard_arena, addr, sizev); 424e3813573SMatthew D Fleming if (req_size < PAGE_SIZE) 425e3813573SMatthew D Fleming memguard_wasted -= (PAGE_SIZE - req_size); 426e4eb384bSBosko Milekic } 427e4eb384bSBosko Milekic 4286d3ed393SMatthew D Fleming /* 4296d3ed393SMatthew D Fleming * Re-allocate an allocation that was originally guarded. 4306d3ed393SMatthew D Fleming */ 4316d3ed393SMatthew D Fleming void * 4326d3ed393SMatthew D Fleming memguard_realloc(void *addr, unsigned long size, struct malloc_type *mtp, 4336d3ed393SMatthew D Fleming int flags) 4346d3ed393SMatthew D Fleming { 4356d3ed393SMatthew D Fleming void *newaddr; 4366d3ed393SMatthew D Fleming u_long old_size; 4376d3ed393SMatthew D Fleming 4386d3ed393SMatthew D Fleming /* 4396d3ed393SMatthew D Fleming * Allocate the new block. Force the allocation to be guarded 4406d3ed393SMatthew D Fleming * as the original may have been guarded through random 4416d3ed393SMatthew D Fleming * chance, and that should be preserved. 4426d3ed393SMatthew D Fleming */ 4436d3ed393SMatthew D Fleming if ((newaddr = memguard_alloc(size, flags)) == NULL) 4446d3ed393SMatthew D Fleming return (NULL); 4456d3ed393SMatthew D Fleming 4466d3ed393SMatthew D Fleming /* Copy over original contents. */ 4476d3ed393SMatthew D Fleming old_size = *v2sizep(trunc_page((uintptr_t)addr)); 4486d3ed393SMatthew D Fleming bcopy(addr, newaddr, min(size, old_size)); 4496d3ed393SMatthew D Fleming memguard_free(addr); 4506d3ed393SMatthew D Fleming return (newaddr); 4516d3ed393SMatthew D Fleming } 4526d3ed393SMatthew D Fleming 4538d689e04SGleb Smirnoff static int 4548d689e04SGleb Smirnoff memguard_cmp(unsigned long size) 455d362c40dSPawel Jakub Dawidek { 456d362c40dSPawel Jakub Dawidek 457e3813573SMatthew D Fleming if (size < memguard_minsize) { 458e3813573SMatthew D Fleming memguard_minsize_reject++; 459e3813573SMatthew D Fleming return (0); 460e3813573SMatthew D Fleming } 4618d689e04SGleb Smirnoff if ((memguard_options & MG_GUARD_ALLLARGE) != 0 && size >= PAGE_SIZE) 462e3813573SMatthew D Fleming return (1); 463e3813573SMatthew D Fleming if (memguard_frequency > 0 && 464e3813573SMatthew D Fleming (random() % 100000) < memguard_frequency) { 465e3813573SMatthew D Fleming memguard_frequency_hits++; 466e3813573SMatthew D Fleming return (1); 467e3813573SMatthew D Fleming } 4688d689e04SGleb Smirnoff 4698d689e04SGleb Smirnoff return (0); 4708d689e04SGleb Smirnoff } 4718d689e04SGleb Smirnoff 4728d689e04SGleb Smirnoff int 4738d689e04SGleb Smirnoff memguard_cmp_mtp(struct malloc_type *mtp, unsigned long size) 4748d689e04SGleb Smirnoff { 4758d689e04SGleb Smirnoff 4768d689e04SGleb Smirnoff if (memguard_cmp(size)) 4778d689e04SGleb Smirnoff return(1); 4788d689e04SGleb Smirnoff 479d362c40dSPawel Jakub Dawidek #if 1 480d362c40dSPawel Jakub Dawidek /* 481d362c40dSPawel Jakub Dawidek * The safest way of comparsion is to always compare short description 482d362c40dSPawel Jakub Dawidek * string of memory type, but it is also the slowest way. 483d362c40dSPawel Jakub Dawidek */ 484d362c40dSPawel Jakub Dawidek return (strcmp(mtp->ks_shortdesc, vm_memguard_desc) == 0); 485d362c40dSPawel Jakub Dawidek #else 486d362c40dSPawel Jakub Dawidek /* 487d362c40dSPawel Jakub Dawidek * If we compare pointers, there are two possible problems: 488d362c40dSPawel Jakub Dawidek * 1. Memory type was unloaded and new memory type was allocated at the 489d362c40dSPawel Jakub Dawidek * same address. 490d362c40dSPawel Jakub Dawidek * 2. Memory type was unloaded and loaded again, but allocated at a 491d362c40dSPawel Jakub Dawidek * different address. 492d362c40dSPawel Jakub Dawidek */ 493d362c40dSPawel Jakub Dawidek if (vm_memguard_mtype != NULL) 494d362c40dSPawel Jakub Dawidek return (mtp == vm_memguard_mtype); 495d362c40dSPawel Jakub Dawidek if (strcmp(mtp->ks_shortdesc, vm_memguard_desc) == 0) { 496d362c40dSPawel Jakub Dawidek vm_memguard_mtype = mtp; 497d362c40dSPawel Jakub Dawidek return (1); 498d362c40dSPawel Jakub Dawidek } 499d362c40dSPawel Jakub Dawidek return (0); 500d362c40dSPawel Jakub Dawidek #endif 501d362c40dSPawel Jakub Dawidek } 5028d689e04SGleb Smirnoff 5038d689e04SGleb Smirnoff int 5048d689e04SGleb Smirnoff memguard_cmp_zone(uma_zone_t zone) 5058d689e04SGleb Smirnoff { 5068d689e04SGleb Smirnoff 5078d689e04SGleb Smirnoff if ((memguard_options & MG_GUARD_NOFREE) == 0 && 5088d689e04SGleb Smirnoff zone->uz_flags & UMA_ZONE_NOFREE) 5098d689e04SGleb Smirnoff return (0); 5108d689e04SGleb Smirnoff 5118d689e04SGleb Smirnoff if (memguard_cmp(zone->uz_size)) 5128d689e04SGleb Smirnoff return (1); 5138d689e04SGleb Smirnoff 5148d689e04SGleb Smirnoff /* 5158d689e04SGleb Smirnoff * The safest way of comparsion is to always compare zone name, 5168d689e04SGleb Smirnoff * but it is also the slowest way. 5178d689e04SGleb Smirnoff */ 5188d689e04SGleb Smirnoff return (strcmp(zone->uz_name, vm_memguard_desc) == 0); 5198d689e04SGleb Smirnoff } 520