1099a0e58SBosko Milekic /*- 28076cb52SBosko Milekic * Copyright (c) 2004, 2005, 38076cb52SBosko Milekic * Bosko Milekic <bmilekic@FreeBSD.org>. All rights reserved. 4099a0e58SBosko Milekic * 5099a0e58SBosko Milekic * Redistribution and use in source and binary forms, with or without 6099a0e58SBosko Milekic * modification, are permitted provided that the following conditions 7099a0e58SBosko Milekic * are met: 8099a0e58SBosko Milekic * 1. Redistributions of source code must retain the above copyright 9099a0e58SBosko Milekic * notice unmodified, this list of conditions and the following 10099a0e58SBosko Milekic * disclaimer. 11099a0e58SBosko Milekic * 2. Redistributions in binary form must reproduce the above copyright 12099a0e58SBosko Milekic * notice, this list of conditions and the following disclaimer in the 13099a0e58SBosko Milekic * documentation and/or other materials provided with the distribution. 14099a0e58SBosko Milekic * 15099a0e58SBosko Milekic * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 16099a0e58SBosko Milekic * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 17099a0e58SBosko Milekic * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 18099a0e58SBosko Milekic * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 19099a0e58SBosko Milekic * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 20099a0e58SBosko Milekic * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 21099a0e58SBosko Milekic * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 22099a0e58SBosko Milekic * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 23099a0e58SBosko Milekic * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 24099a0e58SBosko Milekic * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 25099a0e58SBosko Milekic * SUCH DAMAGE. 26099a0e58SBosko Milekic */ 27099a0e58SBosko Milekic 28099a0e58SBosko Milekic #include <sys/cdefs.h> 29099a0e58SBosko Milekic __FBSDID("$FreeBSD$"); 30099a0e58SBosko Milekic 31099a0e58SBosko Milekic #include "opt_mac.h" 32099a0e58SBosko Milekic #include "opt_param.h" 33099a0e58SBosko Milekic 34099a0e58SBosko Milekic #include <sys/param.h> 35099a0e58SBosko Milekic #include <sys/malloc.h> 36099a0e58SBosko Milekic #include <sys/systm.h> 37099a0e58SBosko Milekic #include <sys/mbuf.h> 38099a0e58SBosko Milekic #include <sys/domain.h> 39099a0e58SBosko Milekic #include <sys/eventhandler.h> 40099a0e58SBosko Milekic #include <sys/kernel.h> 41099a0e58SBosko Milekic #include <sys/protosw.h> 42099a0e58SBosko Milekic #include <sys/smp.h> 43099a0e58SBosko Milekic #include <sys/sysctl.h> 44099a0e58SBosko Milekic 45aed55708SRobert Watson #include <security/mac/mac_framework.h> 46aed55708SRobert Watson 47099a0e58SBosko Milekic #include <vm/vm.h> 48099a0e58SBosko Milekic #include <vm/vm_page.h> 49099a0e58SBosko Milekic #include <vm/uma.h> 50121f0509SMike Silbersack #include <vm/uma_int.h> 51121f0509SMike Silbersack #include <vm/uma_dbg.h> 52099a0e58SBosko Milekic 53099a0e58SBosko Milekic /* 54099a0e58SBosko Milekic * In FreeBSD, Mbufs and Mbuf Clusters are allocated from UMA 55099a0e58SBosko Milekic * Zones. 56099a0e58SBosko Milekic * 57099a0e58SBosko Milekic * Mbuf Clusters (2K, contiguous) are allocated from the Cluster 58099a0e58SBosko Milekic * Zone. The Zone can be capped at kern.ipc.nmbclusters, if the 59099a0e58SBosko Milekic * administrator so desires. 60099a0e58SBosko Milekic * 61099a0e58SBosko Milekic * Mbufs are allocated from a UMA Master Zone called the Mbuf 62099a0e58SBosko Milekic * Zone. 63099a0e58SBosko Milekic * 64099a0e58SBosko Milekic * Additionally, FreeBSD provides a Packet Zone, which it 65099a0e58SBosko Milekic * configures as a Secondary Zone to the Mbuf Master Zone, 66099a0e58SBosko Milekic * thus sharing backend Slab kegs with the Mbuf Master Zone. 67099a0e58SBosko Milekic * 68099a0e58SBosko Milekic * Thus common-case allocations and locking are simplified: 69099a0e58SBosko Milekic * 70099a0e58SBosko Milekic * m_clget() m_getcl() 71099a0e58SBosko Milekic * | | 72099a0e58SBosko Milekic * | .------------>[(Packet Cache)] m_get(), m_gethdr() 73099a0e58SBosko Milekic * | | [ Packet ] | 74099a0e58SBosko Milekic * [(Cluster Cache)] [ Secondary ] [ (Mbuf Cache) ] 75099a0e58SBosko Milekic * [ Cluster Zone ] [ Zone ] [ Mbuf Master Zone ] 76099a0e58SBosko Milekic * | \________ | 77099a0e58SBosko Milekic * [ Cluster Keg ] \ / 78099a0e58SBosko Milekic * | [ Mbuf Keg ] 79099a0e58SBosko Milekic * [ Cluster Slabs ] | 80099a0e58SBosko Milekic * | [ Mbuf Slabs ] 81099a0e58SBosko Milekic * \____________(VM)_________________/ 8256a4e45aSAndre Oppermann * 8356a4e45aSAndre Oppermann * 84fcf90618SGleb Smirnoff * Whenever an object is allocated with uma_zalloc() out of 8556a4e45aSAndre Oppermann * one of the Zones its _ctor_ function is executed. The same 86fcf90618SGleb Smirnoff * for any deallocation through uma_zfree() the _dtor_ function 8756a4e45aSAndre Oppermann * is executed. 8856a4e45aSAndre Oppermann * 8956a4e45aSAndre Oppermann * Caches are per-CPU and are filled from the Master Zone. 9056a4e45aSAndre Oppermann * 91fcf90618SGleb Smirnoff * Whenever an object is allocated from the underlying global 9256a4e45aSAndre Oppermann * memory pool it gets pre-initialized with the _zinit_ functions. 9356a4e45aSAndre Oppermann * When the Keg's are overfull objects get decomissioned with 9456a4e45aSAndre Oppermann * _zfini_ functions and free'd back to the global memory pool. 9556a4e45aSAndre Oppermann * 96099a0e58SBosko Milekic */ 97099a0e58SBosko Milekic 9856a4e45aSAndre Oppermann int nmbclusters; /* limits number of mbuf clusters */ 99ec63cb90SAndre Oppermann int nmbjumbop; /* limits number of page size jumbo clusters */ 10056a4e45aSAndre Oppermann int nmbjumbo9; /* limits number of 9k jumbo clusters */ 10156a4e45aSAndre Oppermann int nmbjumbo16; /* limits number of 16k jumbo clusters */ 102099a0e58SBosko Milekic struct mbstat mbstat; 103099a0e58SBosko Milekic 104099a0e58SBosko Milekic static void 105099a0e58SBosko Milekic tunable_mbinit(void *dummy) 106099a0e58SBosko Milekic { 107099a0e58SBosko Milekic 108099a0e58SBosko Milekic /* This has to be done before VM init. */ 109099a0e58SBosko Milekic nmbclusters = 1024 + maxusers * 64; 110099a0e58SBosko Milekic TUNABLE_INT_FETCH("kern.ipc.nmbclusters", &nmbclusters); 111099a0e58SBosko Milekic } 112099a0e58SBosko Milekic SYSINIT(tunable_mbinit, SI_SUB_TUNABLES, SI_ORDER_ANY, tunable_mbinit, NULL); 113099a0e58SBosko Milekic 11456a4e45aSAndre Oppermann /* XXX: These should be tuneables. Can't change UMA limits on the fly. */ 1154f590175SPaul Saab static int 1164f590175SPaul Saab sysctl_nmbclusters(SYSCTL_HANDLER_ARGS) 1174f590175SPaul Saab { 1184f590175SPaul Saab int error, newnmbclusters; 1194f590175SPaul Saab 1204f590175SPaul Saab newnmbclusters = nmbclusters; 121041b706bSDavid Malone error = sysctl_handle_int(oidp, &newnmbclusters, 0, req); 1224f590175SPaul Saab if (error == 0 && req->newptr) { 1234f590175SPaul Saab if (newnmbclusters > nmbclusters) { 1244f590175SPaul Saab nmbclusters = newnmbclusters; 1254f590175SPaul Saab uma_zone_set_max(zone_clust, nmbclusters); 1264f590175SPaul Saab EVENTHANDLER_INVOKE(nmbclusters_change); 1274f590175SPaul Saab } else 1284f590175SPaul Saab error = EINVAL; 1294f590175SPaul Saab } 1304f590175SPaul Saab return (error); 1314f590175SPaul Saab } 1324f590175SPaul Saab SYSCTL_PROC(_kern_ipc, OID_AUTO, nmbclusters, CTLTYPE_INT|CTLFLAG_RW, 1334f590175SPaul Saab &nmbclusters, 0, sysctl_nmbclusters, "IU", 134099a0e58SBosko Milekic "Maximum number of mbuf clusters allowed"); 135ec63cb90SAndre Oppermann SYSCTL_INT(_kern_ipc, OID_AUTO, nmbjumbop, CTLFLAG_RW, &nmbjumbop, 0, 136ec63cb90SAndre Oppermann "Maximum number of mbuf page size jumbo clusters allowed"); 13756a4e45aSAndre Oppermann SYSCTL_INT(_kern_ipc, OID_AUTO, nmbjumbo9, CTLFLAG_RW, &nmbjumbo9, 0, 13856a4e45aSAndre Oppermann "Maximum number of mbuf 9k jumbo clusters allowed"); 13956a4e45aSAndre Oppermann SYSCTL_INT(_kern_ipc, OID_AUTO, nmbjumbo16, CTLFLAG_RW, &nmbjumbo16, 0, 14056a4e45aSAndre Oppermann "Maximum number of mbuf 16k jumbo clusters allowed"); 141099a0e58SBosko Milekic SYSCTL_STRUCT(_kern_ipc, OID_AUTO, mbstat, CTLFLAG_RD, &mbstat, mbstat, 142099a0e58SBosko Milekic "Mbuf general information and statistics"); 143099a0e58SBosko Milekic 144099a0e58SBosko Milekic /* 145099a0e58SBosko Milekic * Zones from which we allocate. 146099a0e58SBosko Milekic */ 147099a0e58SBosko Milekic uma_zone_t zone_mbuf; 148099a0e58SBosko Milekic uma_zone_t zone_clust; 149099a0e58SBosko Milekic uma_zone_t zone_pack; 150ec63cb90SAndre Oppermann uma_zone_t zone_jumbop; 15156a4e45aSAndre Oppermann uma_zone_t zone_jumbo9; 15256a4e45aSAndre Oppermann uma_zone_t zone_jumbo16; 15356a4e45aSAndre Oppermann uma_zone_t zone_ext_refcnt; 154099a0e58SBosko Milekic 155099a0e58SBosko Milekic /* 156099a0e58SBosko Milekic * Local prototypes. 157099a0e58SBosko Milekic */ 158b23f72e9SBrian Feldman static int mb_ctor_mbuf(void *, int, void *, int); 159b23f72e9SBrian Feldman static int mb_ctor_clust(void *, int, void *, int); 160b23f72e9SBrian Feldman static int mb_ctor_pack(void *, int, void *, int); 161099a0e58SBosko Milekic static void mb_dtor_mbuf(void *, int, void *); 16256a4e45aSAndre Oppermann static void mb_dtor_clust(void *, int, void *); 16356a4e45aSAndre Oppermann static void mb_dtor_pack(void *, int, void *); 16456a4e45aSAndre Oppermann static int mb_zinit_pack(void *, int, int); 16556a4e45aSAndre Oppermann static void mb_zfini_pack(void *, int); 166099a0e58SBosko Milekic 167099a0e58SBosko Milekic static void mb_reclaim(void *); 168099a0e58SBosko Milekic static void mbuf_init(void *); 169099a0e58SBosko Milekic 170a04946cfSBrian Somers /* Ensure that MSIZE doesn't break dtom() - it must be a power of 2 */ 171a04946cfSBrian Somers CTASSERT((((MSIZE - 1) ^ MSIZE) + 1) >> 1 == MSIZE); 172a04946cfSBrian Somers 173099a0e58SBosko Milekic /* 174099a0e58SBosko Milekic * Initialize FreeBSD Network buffer allocation. 175099a0e58SBosko Milekic */ 176099a0e58SBosko Milekic SYSINIT(mbuf, SI_SUB_MBUF, SI_ORDER_FIRST, mbuf_init, NULL) 177099a0e58SBosko Milekic static void 178099a0e58SBosko Milekic mbuf_init(void *dummy) 179099a0e58SBosko Milekic { 180099a0e58SBosko Milekic 181099a0e58SBosko Milekic /* 182099a0e58SBosko Milekic * Configure UMA zones for Mbufs, Clusters, and Packets. 183099a0e58SBosko Milekic */ 18456a4e45aSAndre Oppermann zone_mbuf = uma_zcreate(MBUF_MEM_NAME, MSIZE, 18556a4e45aSAndre Oppermann mb_ctor_mbuf, mb_dtor_mbuf, 186121f0509SMike Silbersack #ifdef INVARIANTS 18756a4e45aSAndre Oppermann trash_init, trash_fini, 188121f0509SMike Silbersack #else 18956a4e45aSAndre Oppermann NULL, NULL, 190121f0509SMike Silbersack #endif 19156a4e45aSAndre Oppermann MSIZE - 1, UMA_ZONE_MAXBUCKET); 19256a4e45aSAndre Oppermann 19368352adfSRobert Watson zone_clust = uma_zcreate(MBUF_CLUSTER_MEM_NAME, MCLBYTES, 19456a4e45aSAndre Oppermann mb_ctor_clust, mb_dtor_clust, 195121f0509SMike Silbersack #ifdef INVARIANTS 19656a4e45aSAndre Oppermann trash_init, trash_fini, 197121f0509SMike Silbersack #else 19856a4e45aSAndre Oppermann NULL, NULL, 199121f0509SMike Silbersack #endif 20056a4e45aSAndre Oppermann UMA_ALIGN_PTR, UMA_ZONE_REFCNT); 201099a0e58SBosko Milekic if (nmbclusters > 0) 202099a0e58SBosko Milekic uma_zone_set_max(zone_clust, nmbclusters); 203099a0e58SBosko Milekic 20456a4e45aSAndre Oppermann zone_pack = uma_zsecond_create(MBUF_PACKET_MEM_NAME, mb_ctor_pack, 20556a4e45aSAndre Oppermann mb_dtor_pack, mb_zinit_pack, mb_zfini_pack, zone_mbuf); 20656a4e45aSAndre Oppermann 207fcf90618SGleb Smirnoff /* Make jumbo frame zone too. Page size, 9k and 16k. */ 208ec63cb90SAndre Oppermann zone_jumbop = uma_zcreate(MBUF_JUMBOP_MEM_NAME, MJUMPAGESIZE, 209d5269a63SAndre Oppermann mb_ctor_clust, mb_dtor_clust, 210d5269a63SAndre Oppermann #ifdef INVARIANTS 211d5269a63SAndre Oppermann trash_init, trash_fini, 212d5269a63SAndre Oppermann #else 213d5269a63SAndre Oppermann NULL, NULL, 214d5269a63SAndre Oppermann #endif 215d5269a63SAndre Oppermann UMA_ALIGN_PTR, UMA_ZONE_REFCNT); 216ec63cb90SAndre Oppermann if (nmbjumbop > 0) 217ec63cb90SAndre Oppermann uma_zone_set_max(zone_jumbop, nmbjumbop); 218d5269a63SAndre Oppermann 21956a4e45aSAndre Oppermann zone_jumbo9 = uma_zcreate(MBUF_JUMBO9_MEM_NAME, MJUM9BYTES, 22056a4e45aSAndre Oppermann mb_ctor_clust, mb_dtor_clust, 22156a4e45aSAndre Oppermann #ifdef INVARIANTS 22256a4e45aSAndre Oppermann trash_init, trash_fini, 22356a4e45aSAndre Oppermann #else 22456a4e45aSAndre Oppermann NULL, NULL, 22556a4e45aSAndre Oppermann #endif 22656a4e45aSAndre Oppermann UMA_ALIGN_PTR, UMA_ZONE_REFCNT); 22756a4e45aSAndre Oppermann if (nmbjumbo9 > 0) 22856a4e45aSAndre Oppermann uma_zone_set_max(zone_jumbo9, nmbjumbo9); 22956a4e45aSAndre Oppermann 23056a4e45aSAndre Oppermann zone_jumbo16 = uma_zcreate(MBUF_JUMBO16_MEM_NAME, MJUM16BYTES, 23156a4e45aSAndre Oppermann mb_ctor_clust, mb_dtor_clust, 23256a4e45aSAndre Oppermann #ifdef INVARIANTS 23356a4e45aSAndre Oppermann trash_init, trash_fini, 23456a4e45aSAndre Oppermann #else 23556a4e45aSAndre Oppermann NULL, NULL, 23656a4e45aSAndre Oppermann #endif 23756a4e45aSAndre Oppermann UMA_ALIGN_PTR, UMA_ZONE_REFCNT); 23856a4e45aSAndre Oppermann if (nmbjumbo16 > 0) 23956a4e45aSAndre Oppermann uma_zone_set_max(zone_jumbo16, nmbjumbo16); 24056a4e45aSAndre Oppermann 24156a4e45aSAndre Oppermann zone_ext_refcnt = uma_zcreate(MBUF_EXTREFCNT_MEM_NAME, sizeof(u_int), 24256a4e45aSAndre Oppermann NULL, NULL, 24356a4e45aSAndre Oppermann NULL, NULL, 24456a4e45aSAndre Oppermann UMA_ALIGN_PTR, UMA_ZONE_ZINIT); 24556a4e45aSAndre Oppermann 24656a4e45aSAndre Oppermann /* uma_prealloc() goes here... */ 247099a0e58SBosko Milekic 248099a0e58SBosko Milekic /* 249099a0e58SBosko Milekic * Hook event handler for low-memory situation, used to 250099a0e58SBosko Milekic * drain protocols and push data back to the caches (UMA 251099a0e58SBosko Milekic * later pushes it back to VM). 252099a0e58SBosko Milekic */ 253099a0e58SBosko Milekic EVENTHANDLER_REGISTER(vm_lowmem, mb_reclaim, NULL, 254099a0e58SBosko Milekic EVENTHANDLER_PRI_FIRST); 255099a0e58SBosko Milekic 256099a0e58SBosko Milekic /* 257099a0e58SBosko Milekic * [Re]set counters and local statistics knobs. 258099a0e58SBosko Milekic * XXX Some of these should go and be replaced, but UMA stat 259099a0e58SBosko Milekic * gathering needs to be revised. 260099a0e58SBosko Milekic */ 261099a0e58SBosko Milekic mbstat.m_mbufs = 0; 262099a0e58SBosko Milekic mbstat.m_mclusts = 0; 263099a0e58SBosko Milekic mbstat.m_drain = 0; 264099a0e58SBosko Milekic mbstat.m_msize = MSIZE; 265099a0e58SBosko Milekic mbstat.m_mclbytes = MCLBYTES; 266099a0e58SBosko Milekic mbstat.m_minclsize = MINCLSIZE; 267099a0e58SBosko Milekic mbstat.m_mlen = MLEN; 268099a0e58SBosko Milekic mbstat.m_mhlen = MHLEN; 269099a0e58SBosko Milekic mbstat.m_numtypes = MT_NTYPES; 270099a0e58SBosko Milekic 271099a0e58SBosko Milekic mbstat.m_mcfail = mbstat.m_mpfail = 0; 272099a0e58SBosko Milekic mbstat.sf_iocnt = 0; 273099a0e58SBosko Milekic mbstat.sf_allocwait = mbstat.sf_allocfail = 0; 274099a0e58SBosko Milekic } 275099a0e58SBosko Milekic 276099a0e58SBosko Milekic /* 277099a0e58SBosko Milekic * Constructor for Mbuf master zone. 278099a0e58SBosko Milekic * 279099a0e58SBosko Milekic * The 'arg' pointer points to a mb_args structure which 280099a0e58SBosko Milekic * contains call-specific information required to support the 28156a4e45aSAndre Oppermann * mbuf allocation API. See mbuf.h. 282099a0e58SBosko Milekic */ 283b23f72e9SBrian Feldman static int 284b23f72e9SBrian Feldman mb_ctor_mbuf(void *mem, int size, void *arg, int how) 285099a0e58SBosko Milekic { 286099a0e58SBosko Milekic struct mbuf *m; 287099a0e58SBosko Milekic struct mb_args *args; 288b23f72e9SBrian Feldman #ifdef MAC 289b23f72e9SBrian Feldman int error; 290b23f72e9SBrian Feldman #endif 291099a0e58SBosko Milekic int flags; 292099a0e58SBosko Milekic short type; 293099a0e58SBosko Milekic 294121f0509SMike Silbersack #ifdef INVARIANTS 295121f0509SMike Silbersack trash_ctor(mem, size, arg, how); 296121f0509SMike Silbersack #endif 297099a0e58SBosko Milekic m = (struct mbuf *)mem; 298099a0e58SBosko Milekic args = (struct mb_args *)arg; 299099a0e58SBosko Milekic flags = args->flags; 300099a0e58SBosko Milekic type = args->type; 301099a0e58SBosko Milekic 30256a4e45aSAndre Oppermann /* 30356a4e45aSAndre Oppermann * The mbuf is initialized later. The caller has the 304fcf90618SGleb Smirnoff * responsibility to set up any MAC labels too. 30556a4e45aSAndre Oppermann */ 30656a4e45aSAndre Oppermann if (type == MT_NOINIT) 30756a4e45aSAndre Oppermann return (0); 30856a4e45aSAndre Oppermann 309099a0e58SBosko Milekic m->m_next = NULL; 310099a0e58SBosko Milekic m->m_nextpkt = NULL; 31156a4e45aSAndre Oppermann m->m_len = 0; 3126bc72ab9SBosko Milekic m->m_flags = flags; 31356a4e45aSAndre Oppermann m->m_type = type; 314099a0e58SBosko Milekic if (flags & M_PKTHDR) { 315099a0e58SBosko Milekic m->m_data = m->m_pktdat; 316099a0e58SBosko Milekic m->m_pkthdr.rcvif = NULL; 31756a4e45aSAndre Oppermann m->m_pkthdr.len = 0; 31856a4e45aSAndre Oppermann m->m_pkthdr.header = NULL; 319099a0e58SBosko Milekic m->m_pkthdr.csum_flags = 0; 32056a4e45aSAndre Oppermann m->m_pkthdr.csum_data = 0; 321a855e2b4SAndre Oppermann m->m_pkthdr.tso_segsz = 0; 322a855e2b4SAndre Oppermann m->m_pkthdr.ether_vtag = 0; 323099a0e58SBosko Milekic SLIST_INIT(&m->m_pkthdr.tags); 324099a0e58SBosko Milekic #ifdef MAC 325099a0e58SBosko Milekic /* If the label init fails, fail the alloc */ 32630d239bcSRobert Watson error = mac_mbuf_init(m, how); 327b23f72e9SBrian Feldman if (error) 328b23f72e9SBrian Feldman return (error); 329099a0e58SBosko Milekic #endif 3306bc72ab9SBosko Milekic } else 331099a0e58SBosko Milekic m->m_data = m->m_dat; 332b23f72e9SBrian Feldman return (0); 333099a0e58SBosko Milekic } 334099a0e58SBosko Milekic 335099a0e58SBosko Milekic /* 33656a4e45aSAndre Oppermann * The Mbuf master zone destructor. 337099a0e58SBosko Milekic */ 338099a0e58SBosko Milekic static void 339099a0e58SBosko Milekic mb_dtor_mbuf(void *mem, int size, void *arg) 340099a0e58SBosko Milekic { 341099a0e58SBosko Milekic struct mbuf *m; 342629b9e08SKip Macy unsigned long flags; 343099a0e58SBosko Milekic 344099a0e58SBosko Milekic m = (struct mbuf *)mem; 345629b9e08SKip Macy flags = (unsigned long)arg; 346629b9e08SKip Macy 347629b9e08SKip Macy if ((flags & MB_NOTAGS) == 0 && (m->m_flags & M_PKTHDR) != 0) 348099a0e58SBosko Milekic m_tag_delete_chain(m, NULL); 34956a4e45aSAndre Oppermann KASSERT((m->m_flags & M_EXT) == 0, ("%s: M_EXT set", __func__)); 350457869b9SKip Macy KASSERT((m->m_flags & M_NOFREE) == 0, ("%s: M_NOFREE set", __func__)); 351121f0509SMike Silbersack #ifdef INVARIANTS 352121f0509SMike Silbersack trash_dtor(mem, size, arg); 353121f0509SMike Silbersack #endif 354099a0e58SBosko Milekic } 355099a0e58SBosko Milekic 35656a4e45aSAndre Oppermann /* 35756a4e45aSAndre Oppermann * The Mbuf Packet zone destructor. 35856a4e45aSAndre Oppermann */ 359099a0e58SBosko Milekic static void 360099a0e58SBosko Milekic mb_dtor_pack(void *mem, int size, void *arg) 361099a0e58SBosko Milekic { 362099a0e58SBosko Milekic struct mbuf *m; 363099a0e58SBosko Milekic 364099a0e58SBosko Milekic m = (struct mbuf *)mem; 365099a0e58SBosko Milekic if ((m->m_flags & M_PKTHDR) != 0) 366099a0e58SBosko Milekic m_tag_delete_chain(m, NULL); 36756a4e45aSAndre Oppermann 36856a4e45aSAndre Oppermann /* Make sure we've got a clean cluster back. */ 36956a4e45aSAndre Oppermann KASSERT((m->m_flags & M_EXT) == M_EXT, ("%s: M_EXT not set", __func__)); 37056a4e45aSAndre Oppermann KASSERT(m->m_ext.ext_buf != NULL, ("%s: ext_buf == NULL", __func__)); 37156a4e45aSAndre Oppermann KASSERT(m->m_ext.ext_free == NULL, ("%s: ext_free != NULL", __func__)); 37256a4e45aSAndre Oppermann KASSERT(m->m_ext.ext_args == NULL, ("%s: ext_args != NULL", __func__)); 37356a4e45aSAndre Oppermann KASSERT(m->m_ext.ext_size == MCLBYTES, ("%s: ext_size != MCLBYTES", __func__)); 37449d46b61SGleb Smirnoff KASSERT(m->m_ext.ext_type == EXT_PACKET, ("%s: ext_type != EXT_PACKET", __func__)); 37556a4e45aSAndre Oppermann KASSERT(*m->m_ext.ref_cnt == 1, ("%s: ref_cnt != 1", __func__)); 376121f0509SMike Silbersack #ifdef INVARIANTS 377121f0509SMike Silbersack trash_dtor(m->m_ext.ext_buf, MCLBYTES, arg); 378121f0509SMike Silbersack #endif 3796c125b8dSMohan Srinivasan /* 380ef44c8d2SDavid E. O'Brien * If there are processes blocked on zone_clust, waiting for pages 381ef44c8d2SDavid E. O'Brien * to be freed up, * cause them to be woken up by draining the 382ef44c8d2SDavid E. O'Brien * packet zone. We are exposed to a race here * (in the check for 383ef44c8d2SDavid E. O'Brien * the UMA_ZFLAG_FULL) where we might miss the flag set, but that 384ef44c8d2SDavid E. O'Brien * is deliberate. We don't want to acquire the zone lock for every 385ef44c8d2SDavid E. O'Brien * mbuf free. 3866c125b8dSMohan Srinivasan */ 3876c125b8dSMohan Srinivasan if (uma_zone_exhausted_nolock(zone_clust)) 3886c125b8dSMohan Srinivasan zone_drain(zone_pack); 389099a0e58SBosko Milekic } 390099a0e58SBosko Milekic 391099a0e58SBosko Milekic /* 392ec63cb90SAndre Oppermann * The Cluster and Jumbo[PAGESIZE|9|16] zone constructor. 393099a0e58SBosko Milekic * 394099a0e58SBosko Milekic * Here the 'arg' pointer points to the Mbuf which we 39556a4e45aSAndre Oppermann * are configuring cluster storage for. If 'arg' is 39656a4e45aSAndre Oppermann * empty we allocate just the cluster without setting 39756a4e45aSAndre Oppermann * the mbuf to it. See mbuf.h. 398099a0e58SBosko Milekic */ 399b23f72e9SBrian Feldman static int 400b23f72e9SBrian Feldman mb_ctor_clust(void *mem, int size, void *arg, int how) 401099a0e58SBosko Milekic { 402099a0e58SBosko Milekic struct mbuf *m; 40356a4e45aSAndre Oppermann u_int *refcnt; 4040f4d9d04SKip Macy int type; 4050f4d9d04SKip Macy uma_zone_t zone; 406099a0e58SBosko Milekic 407121f0509SMike Silbersack #ifdef INVARIANTS 408121f0509SMike Silbersack trash_ctor(mem, size, arg, how); 409121f0509SMike Silbersack #endif 41056a4e45aSAndre Oppermann switch (size) { 41156a4e45aSAndre Oppermann case MCLBYTES: 41256a4e45aSAndre Oppermann type = EXT_CLUSTER; 4130f4d9d04SKip Macy zone = zone_clust; 41456a4e45aSAndre Oppermann break; 415ec63cb90SAndre Oppermann #if MJUMPAGESIZE != MCLBYTES 416ec63cb90SAndre Oppermann case MJUMPAGESIZE: 417ec63cb90SAndre Oppermann type = EXT_JUMBOP; 4180f4d9d04SKip Macy zone = zone_jumbop; 419d5269a63SAndre Oppermann break; 42036ae3fd3SAndre Oppermann #endif 42156a4e45aSAndre Oppermann case MJUM9BYTES: 42256a4e45aSAndre Oppermann type = EXT_JUMBO9; 4230f4d9d04SKip Macy zone = zone_jumbo9; 42456a4e45aSAndre Oppermann break; 42556a4e45aSAndre Oppermann case MJUM16BYTES: 42656a4e45aSAndre Oppermann type = EXT_JUMBO16; 4270f4d9d04SKip Macy zone = zone_jumbo16; 42856a4e45aSAndre Oppermann break; 42956a4e45aSAndre Oppermann default: 43056a4e45aSAndre Oppermann panic("unknown cluster size"); 43156a4e45aSAndre Oppermann break; 43256a4e45aSAndre Oppermann } 4330f4d9d04SKip Macy 4340f4d9d04SKip Macy m = (struct mbuf *)arg; 4350f4d9d04SKip Macy refcnt = uma_find_refcnt(zone, mem); 4360f4d9d04SKip Macy *refcnt = 1; 4370f4d9d04SKip Macy if (m != NULL) { 438099a0e58SBosko Milekic m->m_ext.ext_buf = (caddr_t)mem; 439099a0e58SBosko Milekic m->m_data = m->m_ext.ext_buf; 440099a0e58SBosko Milekic m->m_flags |= M_EXT; 441099a0e58SBosko Milekic m->m_ext.ext_free = NULL; 442099a0e58SBosko Milekic m->m_ext.ext_args = NULL; 44356a4e45aSAndre Oppermann m->m_ext.ext_size = size; 44456a4e45aSAndre Oppermann m->m_ext.ext_type = type; 4450f4d9d04SKip Macy m->m_ext.ref_cnt = refcnt; 44656a4e45aSAndre Oppermann } 4470f4d9d04SKip Macy 448b23f72e9SBrian Feldman return (0); 449099a0e58SBosko Milekic } 450099a0e58SBosko Milekic 45156a4e45aSAndre Oppermann /* 45256a4e45aSAndre Oppermann * The Mbuf Cluster zone destructor. 45356a4e45aSAndre Oppermann */ 454099a0e58SBosko Milekic static void 455099a0e58SBosko Milekic mb_dtor_clust(void *mem, int size, void *arg) 456099a0e58SBosko Milekic { 457121f0509SMike Silbersack #ifdef INVARIANTS 4580f4d9d04SKip Macy uma_zone_t zone; 4590f4d9d04SKip Macy 4600f4d9d04SKip Macy zone = m_getzone(size); 4610f4d9d04SKip Macy KASSERT(*(uma_find_refcnt(zone, mem)) <= 1, 4620f4d9d04SKip Macy ("%s: refcnt incorrect %u", __func__, 4630f4d9d04SKip Macy *(uma_find_refcnt(zone, mem))) ); 4640f4d9d04SKip Macy 465121f0509SMike Silbersack trash_dtor(mem, size, arg); 466121f0509SMike Silbersack #endif 467099a0e58SBosko Milekic } 468099a0e58SBosko Milekic 469099a0e58SBosko Milekic /* 470099a0e58SBosko Milekic * The Packet secondary zone's init routine, executed on the 47156a4e45aSAndre Oppermann * object's transition from mbuf keg slab to zone cache. 472099a0e58SBosko Milekic */ 473b23f72e9SBrian Feldman static int 47456a4e45aSAndre Oppermann mb_zinit_pack(void *mem, int size, int how) 475099a0e58SBosko Milekic { 476099a0e58SBosko Milekic struct mbuf *m; 477099a0e58SBosko Milekic 47856a4e45aSAndre Oppermann m = (struct mbuf *)mem; /* m is virgin. */ 479a7bd90efSAndre Oppermann if (uma_zalloc_arg(zone_clust, m, how) == NULL || 480a7bd90efSAndre Oppermann m->m_ext.ext_buf == NULL) 481b23f72e9SBrian Feldman return (ENOMEM); 482cd5bb63bSAndre Oppermann m->m_ext.ext_type = EXT_PACKET; /* Override. */ 483121f0509SMike Silbersack #ifdef INVARIANTS 484121f0509SMike Silbersack trash_init(m->m_ext.ext_buf, MCLBYTES, how); 485121f0509SMike Silbersack #endif 486b23f72e9SBrian Feldman return (0); 487099a0e58SBosko Milekic } 488099a0e58SBosko Milekic 489099a0e58SBosko Milekic /* 490099a0e58SBosko Milekic * The Packet secondary zone's fini routine, executed on the 491099a0e58SBosko Milekic * object's transition from zone cache to keg slab. 492099a0e58SBosko Milekic */ 493099a0e58SBosko Milekic static void 49456a4e45aSAndre Oppermann mb_zfini_pack(void *mem, int size) 495099a0e58SBosko Milekic { 496099a0e58SBosko Milekic struct mbuf *m; 497099a0e58SBosko Milekic 498099a0e58SBosko Milekic m = (struct mbuf *)mem; 499121f0509SMike Silbersack #ifdef INVARIANTS 500121f0509SMike Silbersack trash_fini(m->m_ext.ext_buf, MCLBYTES); 501121f0509SMike Silbersack #endif 502099a0e58SBosko Milekic uma_zfree_arg(zone_clust, m->m_ext.ext_buf, NULL); 503a7b844d2SMike Silbersack #ifdef INVARIANTS 504a7b844d2SMike Silbersack trash_dtor(mem, size, NULL); 505a7b844d2SMike Silbersack #endif 506099a0e58SBosko Milekic } 507099a0e58SBosko Milekic 508099a0e58SBosko Milekic /* 509099a0e58SBosko Milekic * The "packet" keg constructor. 510099a0e58SBosko Milekic */ 511b23f72e9SBrian Feldman static int 512b23f72e9SBrian Feldman mb_ctor_pack(void *mem, int size, void *arg, int how) 513099a0e58SBosko Milekic { 514099a0e58SBosko Milekic struct mbuf *m; 515099a0e58SBosko Milekic struct mb_args *args; 516b23f72e9SBrian Feldman #ifdef MAC 517b23f72e9SBrian Feldman int error; 518b23f72e9SBrian Feldman #endif 519b23f72e9SBrian Feldman int flags; 520099a0e58SBosko Milekic short type; 521099a0e58SBosko Milekic 522099a0e58SBosko Milekic m = (struct mbuf *)mem; 523099a0e58SBosko Milekic args = (struct mb_args *)arg; 524099a0e58SBosko Milekic flags = args->flags; 525099a0e58SBosko Milekic type = args->type; 526099a0e58SBosko Milekic 527121f0509SMike Silbersack #ifdef INVARIANTS 528121f0509SMike Silbersack trash_ctor(m->m_ext.ext_buf, MCLBYTES, arg, how); 529121f0509SMike Silbersack #endif 530099a0e58SBosko Milekic m->m_next = NULL; 5316bc72ab9SBosko Milekic m->m_nextpkt = NULL; 532099a0e58SBosko Milekic m->m_data = m->m_ext.ext_buf; 53356a4e45aSAndre Oppermann m->m_len = 0; 53456a4e45aSAndre Oppermann m->m_flags = (flags | M_EXT); 53556a4e45aSAndre Oppermann m->m_type = type; 536099a0e58SBosko Milekic 537099a0e58SBosko Milekic if (flags & M_PKTHDR) { 538099a0e58SBosko Milekic m->m_pkthdr.rcvif = NULL; 53956a4e45aSAndre Oppermann m->m_pkthdr.len = 0; 54056a4e45aSAndre Oppermann m->m_pkthdr.header = NULL; 541099a0e58SBosko Milekic m->m_pkthdr.csum_flags = 0; 54256a4e45aSAndre Oppermann m->m_pkthdr.csum_data = 0; 543a855e2b4SAndre Oppermann m->m_pkthdr.tso_segsz = 0; 544a855e2b4SAndre Oppermann m->m_pkthdr.ether_vtag = 0; 545099a0e58SBosko Milekic SLIST_INIT(&m->m_pkthdr.tags); 546099a0e58SBosko Milekic #ifdef MAC 547099a0e58SBosko Milekic /* If the label init fails, fail the alloc */ 54830d239bcSRobert Watson error = mac_mbuf_init(m, how); 549b23f72e9SBrian Feldman if (error) 550b23f72e9SBrian Feldman return (error); 551099a0e58SBosko Milekic #endif 552099a0e58SBosko Milekic } 55356a4e45aSAndre Oppermann /* m_ext is already initialized. */ 55456a4e45aSAndre Oppermann 555b23f72e9SBrian Feldman return (0); 556099a0e58SBosko Milekic } 557099a0e58SBosko Milekic 558099a0e58SBosko Milekic /* 559099a0e58SBosko Milekic * This is the protocol drain routine. 560099a0e58SBosko Milekic * 561099a0e58SBosko Milekic * No locks should be held when this is called. The drain routines have to 562099a0e58SBosko Milekic * presently acquire some locks which raises the possibility of lock order 563099a0e58SBosko Milekic * reversal. 564099a0e58SBosko Milekic */ 565099a0e58SBosko Milekic static void 566099a0e58SBosko Milekic mb_reclaim(void *junk) 567099a0e58SBosko Milekic { 568099a0e58SBosko Milekic struct domain *dp; 569099a0e58SBosko Milekic struct protosw *pr; 570099a0e58SBosko Milekic 571099a0e58SBosko Milekic WITNESS_WARN(WARN_GIANTOK | WARN_SLEEPOK | WARN_PANIC, NULL, 572099a0e58SBosko Milekic "mb_reclaim()"); 573099a0e58SBosko Milekic 574099a0e58SBosko Milekic for (dp = domains; dp != NULL; dp = dp->dom_next) 575099a0e58SBosko Milekic for (pr = dp->dom_protosw; pr < dp->dom_protoswNPROTOSW; pr++) 576099a0e58SBosko Milekic if (pr->pr_drain != NULL) 577099a0e58SBosko Milekic (*pr->pr_drain)(); 578099a0e58SBosko Milekic } 579