11cafed39SJonathan Lemon /*- 2d4b5cae4SRobert Watson * Copyright (c) 2007-2009 Robert N. M. Watson 32d22f334SRobert Watson * Copyright (c) 2010 Juniper Networks, Inc. 4e3b6e33cSJake Burkholder * All rights reserved. 5e3b6e33cSJake Burkholder * 62d22f334SRobert Watson * This software was developed by Robert N. M. Watson under contract 72d22f334SRobert Watson * to Juniper Networks, Inc. 82d22f334SRobert Watson * 9e3b6e33cSJake Burkholder * Redistribution and use in source and binary forms, with or without 10e3b6e33cSJake Burkholder * modification, are permitted provided that the following conditions 11e3b6e33cSJake Burkholder * are met: 12e3b6e33cSJake Burkholder * 1. Redistributions of source code must retain the above copyright 131cafed39SJonathan Lemon * notice, this list of conditions and the following disclaimer. 14e3b6e33cSJake Burkholder * 2. Redistributions in binary form must reproduce the above copyright 15e3b6e33cSJake Burkholder * notice, this list of conditions and the following disclaimer in the 16e3b6e33cSJake Burkholder * documentation and/or other materials provided with the distribution. 17e3b6e33cSJake Burkholder * 181cafed39SJonathan Lemon * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 191cafed39SJonathan Lemon * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 201cafed39SJonathan Lemon * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 211cafed39SJonathan Lemon * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 221cafed39SJonathan Lemon * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 231cafed39SJonathan Lemon * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 241cafed39SJonathan Lemon * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 251cafed39SJonathan Lemon * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 261cafed39SJonathan Lemon * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 271cafed39SJonathan Lemon * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 281cafed39SJonathan Lemon * SUCH DAMAGE. 29e3b6e33cSJake Burkholder */ 30e3b6e33cSJake Burkholder 31d4b5cae4SRobert Watson #include <sys/cdefs.h> 32d4b5cae4SRobert Watson __FBSDID("$FreeBSD$"); 33d4b5cae4SRobert Watson 34d4b5cae4SRobert Watson /* 35d4b5cae4SRobert Watson * netisr is a packet dispatch service, allowing synchronous (directly 36d4b5cae4SRobert Watson * dispatched) and asynchronous (deferred dispatch) processing of packets by 37d4b5cae4SRobert Watson * registered protocol handlers. Callers pass a protocol identifier and 38d4b5cae4SRobert Watson * packet to netisr, along with a direct dispatch hint, and work will either 390a32e29fSRobert Watson * be immediately processed by the registered handler, or passed to a 400a32e29fSRobert Watson * software interrupt (SWI) thread for deferred dispatch. Callers will 410a32e29fSRobert Watson * generally select one or the other based on: 42d4b5cae4SRobert Watson * 430a32e29fSRobert Watson * - Whether directly dispatching a netisr handler lead to code reentrance or 44d4b5cae4SRobert Watson * lock recursion, such as entering the socket code from the socket code. 450a32e29fSRobert Watson * - Whether directly dispatching a netisr handler lead to recursive 46d4b5cae4SRobert Watson * processing, such as when decapsulating several wrapped layers of tunnel 47d4b5cae4SRobert Watson * information (IPSEC within IPSEC within ...). 48d4b5cae4SRobert Watson * 49d4b5cae4SRobert Watson * Maintaining ordering for protocol streams is a critical design concern. 50d4b5cae4SRobert Watson * Enforcing ordering limits the opportunity for concurrency, but maintains 51d4b5cae4SRobert Watson * the strong ordering requirements found in some protocols, such as TCP. Of 52d4b5cae4SRobert Watson * related concern is CPU affinity--it is desirable to process all data 53d4b5cae4SRobert Watson * associated with a particular stream on the same CPU over time in order to 54d4b5cae4SRobert Watson * avoid acquiring locks associated with the connection on different CPUs, 55d4b5cae4SRobert Watson * keep connection data in one cache, and to generally encourage associated 56d4b5cae4SRobert Watson * user threads to live on the same CPU as the stream. It's also desirable 57d4b5cae4SRobert Watson * to avoid lock migration and contention where locks are associated with 58d4b5cae4SRobert Watson * more than one flow. 59d4b5cae4SRobert Watson * 60d4b5cae4SRobert Watson * netisr supports several policy variations, represented by the 610a32e29fSRobert Watson * NETISR_POLICY_* constants, allowing protocols to play various roles in 62d4b5cae4SRobert Watson * identifying flows, assigning work to CPUs, etc. These are described in 630a32e29fSRobert Watson * netisr.h. 64d4b5cae4SRobert Watson */ 65d4b5cae4SRobert Watson 66d4b5cae4SRobert Watson #include "opt_ddb.h" 67f0796cd2SGleb Smirnoff #include "opt_device_polling.h" 681d8cd39eSRobert Watson 69e3b6e33cSJake Burkholder #include <sys/param.h> 70e3b6e33cSJake Burkholder #include <sys/bus.h> 71e3b6e33cSJake Burkholder #include <sys/kernel.h> 721cafed39SJonathan Lemon #include <sys/kthread.h> 73d4b5cae4SRobert Watson #include <sys/interrupt.h> 741cafed39SJonathan Lemon #include <sys/lock.h> 751cafed39SJonathan Lemon #include <sys/mbuf.h> 76d4b5cae4SRobert Watson #include <sys/mutex.h> 7753402767SRobert Watson #include <sys/pcpu.h> 78d4b5cae4SRobert Watson #include <sys/proc.h> 79d4b5cae4SRobert Watson #include <sys/rmlock.h> 80d4b5cae4SRobert Watson #include <sys/sched.h> 81d4b5cae4SRobert Watson #include <sys/smp.h> 821cafed39SJonathan Lemon #include <sys/socket.h> 83d4b5cae4SRobert Watson #include <sys/sysctl.h> 84d4b5cae4SRobert Watson #include <sys/systm.h> 85d4b5cae4SRobert Watson 86d4b5cae4SRobert Watson #ifdef DDB 87d4b5cae4SRobert Watson #include <ddb/ddb.h> 88d4b5cae4SRobert Watson #endif 891cafed39SJonathan Lemon 90938448cdSRobert Watson #define _WANT_NETISR_INTERNAL /* Enable definitions from netisr_internal.h */ 911cafed39SJonathan Lemon #include <net/if.h> 921cafed39SJonathan Lemon #include <net/if_var.h> 93e3b6e33cSJake Burkholder #include <net/netisr.h> 94938448cdSRobert Watson #include <net/netisr_internal.h> 95530c0060SRobert Watson #include <net/vnet.h> 96e3b6e33cSJake Burkholder 97d4b5cae4SRobert Watson /*- 98d4b5cae4SRobert Watson * Synchronize use and modification of the registered netisr data structures; 99d4b5cae4SRobert Watson * acquire a read lock while modifying the set of registered protocols to 100d4b5cae4SRobert Watson * prevent partially registered or unregistered protocols from being run. 101d4b5cae4SRobert Watson * 102d4b5cae4SRobert Watson * The following data structures and fields are protected by this lock: 103d4b5cae4SRobert Watson * 104938448cdSRobert Watson * - The netisr_proto array, including all fields of struct netisr_proto. 105d4b5cae4SRobert Watson * - The nws array, including all fields of struct netisr_worker. 106d4b5cae4SRobert Watson * - The nws_array array. 107d4b5cae4SRobert Watson * 108d4b5cae4SRobert Watson * Note: the NETISR_LOCKING define controls whether read locks are acquired 109d4b5cae4SRobert Watson * in packet processing paths requiring netisr registration stability. This 1100a32e29fSRobert Watson * is disabled by default as it can lead to measurable performance 111d4b5cae4SRobert Watson * degradation even with rmlocks (3%-6% for loopback ping-pong traffic), and 112d4b5cae4SRobert Watson * because netisr registration and unregistration is extremely rare at 113d4b5cae4SRobert Watson * runtime. If it becomes more common, this decision should be revisited. 114d4b5cae4SRobert Watson * 115d4b5cae4SRobert Watson * XXXRW: rmlocks don't support assertions. 116d4b5cae4SRobert Watson */ 117d4b5cae4SRobert Watson static struct rmlock netisr_rmlock; 118d4b5cae4SRobert Watson #define NETISR_LOCK_INIT() rm_init_flags(&netisr_rmlock, "netisr", \ 119d4b5cae4SRobert Watson RM_NOWITNESS) 120d4b5cae4SRobert Watson #define NETISR_LOCK_ASSERT() 121d4b5cae4SRobert Watson #define NETISR_RLOCK(tracker) rm_rlock(&netisr_rmlock, (tracker)) 122d4b5cae4SRobert Watson #define NETISR_RUNLOCK(tracker) rm_runlock(&netisr_rmlock, (tracker)) 123d4b5cae4SRobert Watson #define NETISR_WLOCK() rm_wlock(&netisr_rmlock) 124d4b5cae4SRobert Watson #define NETISR_WUNLOCK() rm_wunlock(&netisr_rmlock) 125d4b5cae4SRobert Watson /* #define NETISR_LOCKING */ 126e3b6e33cSJake Burkholder 127d4b5cae4SRobert Watson SYSCTL_NODE(_net, OID_AUTO, isr, CTLFLAG_RW, 0, "netisr"); 1281cafed39SJonathan Lemon 129d4b5cae4SRobert Watson /*- 130d4b5cae4SRobert Watson * Three direct dispatch policies are supported: 131d4b5cae4SRobert Watson * 132d4b5cae4SRobert Watson * - Always defer: all work is scheduled for a netisr, regardless of context. 133d4b5cae4SRobert Watson * (!direct) 134d4b5cae4SRobert Watson * 135d4b5cae4SRobert Watson * - Hybrid: if the executing context allows direct dispatch, and we're 136d4b5cae4SRobert Watson * running on the CPU the work would be done on, then direct dispatch if it 137d4b5cae4SRobert Watson * wouldn't violate ordering constraints on the workstream. 138d4b5cae4SRobert Watson * (direct && !direct_force) 139d4b5cae4SRobert Watson * 140d4b5cae4SRobert Watson * - Always direct: if the executing context allows direct dispatch, always 141d4b5cae4SRobert Watson * direct dispatch. (direct && direct_force) 142d4b5cae4SRobert Watson * 143d4b5cae4SRobert Watson * Notice that changing the global policy could lead to short periods of 144d4b5cae4SRobert Watson * misordered processing, but this is considered acceptable as compared to 145d4b5cae4SRobert Watson * the complexity of enforcing ordering during policy changes. 146d4b5cae4SRobert Watson */ 147d4b5cae4SRobert Watson static int netisr_direct_force = 1; /* Always direct dispatch. */ 148d4b5cae4SRobert Watson TUNABLE_INT("net.isr.direct_force", &netisr_direct_force); 149d4b5cae4SRobert Watson SYSCTL_INT(_net_isr, OID_AUTO, direct_force, CTLFLAG_RW, 150d4b5cae4SRobert Watson &netisr_direct_force, 0, "Force direct dispatch"); 151e3b6e33cSJake Burkholder 152d4b5cae4SRobert Watson static int netisr_direct = 1; /* Enable direct dispatch. */ 153cea2165bSRobert Watson TUNABLE_INT("net.isr.direct", &netisr_direct); 154d4b5cae4SRobert Watson SYSCTL_INT(_net_isr, OID_AUTO, direct, CTLFLAG_RW, 155d4b5cae4SRobert Watson &netisr_direct, 0, "Enable direct dispatch"); 1561cafed39SJonathan Lemon 1571cafed39SJonathan Lemon /* 158d4b5cae4SRobert Watson * Allow the administrator to limit the number of threads (CPUs) to use for 159d4b5cae4SRobert Watson * netisr. We don't check netisr_maxthreads before creating the thread for 160d4b5cae4SRobert Watson * CPU 0, so in practice we ignore values <= 1. This must be set at boot. 161d4b5cae4SRobert Watson * We will create at most one thread per CPU. 1625fd04e38SRobert Watson */ 1639e6e01ebSRobert Watson static int netisr_maxthreads = -1; /* Max number of threads. */ 164d4b5cae4SRobert Watson TUNABLE_INT("net.isr.maxthreads", &netisr_maxthreads); 16578494902SPawel Jakub Dawidek SYSCTL_INT(_net_isr, OID_AUTO, maxthreads, CTLFLAG_RDTUN, 166d4b5cae4SRobert Watson &netisr_maxthreads, 0, 167d4b5cae4SRobert Watson "Use at most this many CPUs for netisr processing"); 1685fd04e38SRobert Watson 169d4b5cae4SRobert Watson static int netisr_bindthreads = 0; /* Bind threads to CPUs. */ 170d4b5cae4SRobert Watson TUNABLE_INT("net.isr.bindthreads", &netisr_bindthreads); 17178494902SPawel Jakub Dawidek SYSCTL_INT(_net_isr, OID_AUTO, bindthreads, CTLFLAG_RDTUN, 172d4b5cae4SRobert Watson &netisr_bindthreads, 0, "Bind netisr threads to CPUs."); 173d4b5cae4SRobert Watson 174d4b5cae4SRobert Watson /* 1750a32e29fSRobert Watson * Limit per-workstream mbuf queue limits s to at most net.isr.maxqlimit, 1760a32e29fSRobert Watson * both for initial configuration and later modification using 1770a32e29fSRobert Watson * netisr_setqlimit(). 178d4b5cae4SRobert Watson */ 179d4b5cae4SRobert Watson #define NETISR_DEFAULT_MAXQLIMIT 10240 180d4b5cae4SRobert Watson static u_int netisr_maxqlimit = NETISR_DEFAULT_MAXQLIMIT; 181d4b5cae4SRobert Watson TUNABLE_INT("net.isr.maxqlimit", &netisr_maxqlimit); 18278494902SPawel Jakub Dawidek SYSCTL_INT(_net_isr, OID_AUTO, maxqlimit, CTLFLAG_RDTUN, 183d4b5cae4SRobert Watson &netisr_maxqlimit, 0, 184d4b5cae4SRobert Watson "Maximum netisr per-protocol, per-CPU queue depth."); 185d4b5cae4SRobert Watson 186d4b5cae4SRobert Watson /* 1870a32e29fSRobert Watson * The default per-workstream mbuf queue limit for protocols that don't 1880a32e29fSRobert Watson * initialize the nh_qlimit field of their struct netisr_handler. If this is 1890a32e29fSRobert Watson * set above netisr_maxqlimit, we truncate it to the maximum during boot. 190d4b5cae4SRobert Watson */ 191d4b5cae4SRobert Watson #define NETISR_DEFAULT_DEFAULTQLIMIT 256 192d4b5cae4SRobert Watson static u_int netisr_defaultqlimit = NETISR_DEFAULT_DEFAULTQLIMIT; 193d4b5cae4SRobert Watson TUNABLE_INT("net.isr.defaultqlimit", &netisr_defaultqlimit); 19478494902SPawel Jakub Dawidek SYSCTL_INT(_net_isr, OID_AUTO, defaultqlimit, CTLFLAG_RDTUN, 195d4b5cae4SRobert Watson &netisr_defaultqlimit, 0, 196d4b5cae4SRobert Watson "Default netisr per-protocol, per-CPU queue limit if not set by protocol"); 197d4b5cae4SRobert Watson 198d4b5cae4SRobert Watson /* 199938448cdSRobert Watson * Store and export the compile-time constant NETISR_MAXPROT limit on the 200938448cdSRobert Watson * number of protocols that can register with netisr at a time. This is 201938448cdSRobert Watson * required for crashdump analysis, as it sizes netisr_proto[]. 202d4b5cae4SRobert Watson */ 203938448cdSRobert Watson static u_int netisr_maxprot = NETISR_MAXPROT; 204938448cdSRobert Watson SYSCTL_INT(_net_isr, OID_AUTO, maxprot, CTLFLAG_RD, 205938448cdSRobert Watson &netisr_maxprot, 0, 206938448cdSRobert Watson "Compile-time limit on the number of protocols supported by netisr."); 207d4b5cae4SRobert Watson 208d4b5cae4SRobert Watson /* 209938448cdSRobert Watson * The netisr_proto array describes all registered protocols, indexed by 210938448cdSRobert Watson * protocol number. See netisr_internal.h for more details. 211d4b5cae4SRobert Watson */ 212938448cdSRobert Watson static struct netisr_proto netisr_proto[NETISR_MAXPROT]; 213d4b5cae4SRobert Watson 214d4b5cae4SRobert Watson /* 215938448cdSRobert Watson * Per-CPU workstream data. See netisr_internal.h for more details. 216d4b5cae4SRobert Watson */ 21753402767SRobert Watson DPCPU_DEFINE(struct netisr_workstream, nws); 218d4b5cae4SRobert Watson 219d4b5cae4SRobert Watson /* 220d4b5cae4SRobert Watson * Map contiguous values between 0 and nws_count into CPU IDs appropriate for 22153402767SRobert Watson * accessing workstreams. This allows constructions of the form 22253402767SRobert Watson * DPCPU_ID_GET(nws_array[arbitraryvalue % nws_count], nws). 223d4b5cae4SRobert Watson */ 224d4b5cae4SRobert Watson static u_int nws_array[MAXCPU]; 225d4b5cae4SRobert Watson 226d4b5cae4SRobert Watson /* 227d4b5cae4SRobert Watson * Number of registered workstreams. Will be at most the number of running 228d4b5cae4SRobert Watson * CPUs once fully started. 229d4b5cae4SRobert Watson */ 230d4b5cae4SRobert Watson static u_int nws_count; 231d4b5cae4SRobert Watson SYSCTL_INT(_net_isr, OID_AUTO, numthreads, CTLFLAG_RD, 232d4b5cae4SRobert Watson &nws_count, 0, "Number of extant netisr threads."); 233d4b5cae4SRobert Watson 234d4b5cae4SRobert Watson /* 235d4b5cae4SRobert Watson * Synchronization for each workstream: a mutex protects all mutable fields 236d4b5cae4SRobert Watson * in each stream, including per-protocol state (mbuf queues). The SWI is 237d4b5cae4SRobert Watson * woken up if asynchronous dispatch is required. 238d4b5cae4SRobert Watson */ 239d4b5cae4SRobert Watson #define NWS_LOCK(s) mtx_lock(&(s)->nws_mtx) 240d4b5cae4SRobert Watson #define NWS_LOCK_ASSERT(s) mtx_assert(&(s)->nws_mtx, MA_OWNED) 241d4b5cae4SRobert Watson #define NWS_UNLOCK(s) mtx_unlock(&(s)->nws_mtx) 242d4b5cae4SRobert Watson #define NWS_SIGNAL(s) swi_sched((s)->nws_swi_cookie, 0) 243d4b5cae4SRobert Watson 244d4b5cae4SRobert Watson /* 245d4b5cae4SRobert Watson * Utility routines for protocols that implement their own mapping of flows 246d4b5cae4SRobert Watson * to CPUs. 247d4b5cae4SRobert Watson */ 248d4b5cae4SRobert Watson u_int 249d4b5cae4SRobert Watson netisr_get_cpucount(void) 250d4b5cae4SRobert Watson { 251d4b5cae4SRobert Watson 252d4b5cae4SRobert Watson return (nws_count); 2535fd04e38SRobert Watson } 254d4b5cae4SRobert Watson 255d4b5cae4SRobert Watson u_int 256d4b5cae4SRobert Watson netisr_get_cpuid(u_int cpunumber) 257d4b5cae4SRobert Watson { 258d4b5cae4SRobert Watson 259d4b5cae4SRobert Watson KASSERT(cpunumber < nws_count, ("%s: %u > %u", __func__, cpunumber, 260d4b5cae4SRobert Watson nws_count)); 261d4b5cae4SRobert Watson 262d4b5cae4SRobert Watson return (nws_array[cpunumber]); 2635fd04e38SRobert Watson } 2645fd04e38SRobert Watson 2655fd04e38SRobert Watson /* 2660a32e29fSRobert Watson * The default implementation of flow -> CPU ID mapping. 267d4b5cae4SRobert Watson * 268d4b5cae4SRobert Watson * Non-static so that protocols can use it to map their own work to specific 269d4b5cae4SRobert Watson * CPUs in a manner consistent to netisr for affinity purposes. 270d4b5cae4SRobert Watson */ 271d4b5cae4SRobert Watson u_int 272d4b5cae4SRobert Watson netisr_default_flow2cpu(u_int flowid) 273d4b5cae4SRobert Watson { 274d4b5cae4SRobert Watson 275d4b5cae4SRobert Watson return (nws_array[flowid % nws_count]); 276d4b5cae4SRobert Watson } 277d4b5cae4SRobert Watson 278d4b5cae4SRobert Watson /* 279d4b5cae4SRobert Watson * Register a new netisr handler, which requires initializing per-protocol 280d4b5cae4SRobert Watson * fields for each workstream. All netisr work is briefly suspended while 281d4b5cae4SRobert Watson * the protocol is installed. 2821cafed39SJonathan Lemon */ 2831cafed39SJonathan Lemon void 284d4b5cae4SRobert Watson netisr_register(const struct netisr_handler *nhp) 2851cafed39SJonathan Lemon { 286d4b5cae4SRobert Watson struct netisr_work *npwp; 287d4b5cae4SRobert Watson const char *name; 288d4b5cae4SRobert Watson u_int i, proto; 2891cafed39SJonathan Lemon 290d4b5cae4SRobert Watson proto = nhp->nh_proto; 291d4b5cae4SRobert Watson name = nhp->nh_name; 29259dd72d0SRobert Watson 2937902224cSSam Leffler /* 294d4b5cae4SRobert Watson * Test that the requested registration is valid. 2957902224cSSam Leffler */ 296d4b5cae4SRobert Watson KASSERT(nhp->nh_name != NULL, 297d4b5cae4SRobert Watson ("%s: nh_name NULL for %u", __func__, proto)); 298d4b5cae4SRobert Watson KASSERT(nhp->nh_handler != NULL, 299d4b5cae4SRobert Watson ("%s: nh_handler NULL for %s", __func__, name)); 300d4b5cae4SRobert Watson KASSERT(nhp->nh_policy == NETISR_POLICY_SOURCE || 301d4b5cae4SRobert Watson nhp->nh_policy == NETISR_POLICY_FLOW || 302d4b5cae4SRobert Watson nhp->nh_policy == NETISR_POLICY_CPU, 303d4b5cae4SRobert Watson ("%s: unsupported nh_policy %u for %s", __func__, 304d4b5cae4SRobert Watson nhp->nh_policy, name)); 305d4b5cae4SRobert Watson KASSERT(nhp->nh_policy == NETISR_POLICY_FLOW || 306d4b5cae4SRobert Watson nhp->nh_m2flow == NULL, 307d4b5cae4SRobert Watson ("%s: nh_policy != FLOW but m2flow defined for %s", __func__, 308d4b5cae4SRobert Watson name)); 309d4b5cae4SRobert Watson KASSERT(nhp->nh_policy == NETISR_POLICY_CPU || nhp->nh_m2cpuid == NULL, 310d4b5cae4SRobert Watson ("%s: nh_policy != CPU but m2cpuid defined for %s", __func__, 311d4b5cae4SRobert Watson name)); 312d4b5cae4SRobert Watson KASSERT(nhp->nh_policy != NETISR_POLICY_CPU || nhp->nh_m2cpuid != NULL, 313d4b5cae4SRobert Watson ("%s: nh_policy == CPU but m2cpuid not defined for %s", __func__, 314d4b5cae4SRobert Watson name)); 315d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 316d4b5cae4SRobert Watson ("%s(%u, %s): protocol too big", __func__, proto, name)); 317d4b5cae4SRobert Watson 318d4b5cae4SRobert Watson /* 319d4b5cae4SRobert Watson * Test that no existing registration exists for this protocol. 320d4b5cae4SRobert Watson */ 321d4b5cae4SRobert Watson NETISR_WLOCK(); 322938448cdSRobert Watson KASSERT(netisr_proto[proto].np_name == NULL, 323d4b5cae4SRobert Watson ("%s(%u, %s): name present", __func__, proto, name)); 324938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler == NULL, 325d4b5cae4SRobert Watson ("%s(%u, %s): handler present", __func__, proto, name)); 326d4b5cae4SRobert Watson 327938448cdSRobert Watson netisr_proto[proto].np_name = name; 328938448cdSRobert Watson netisr_proto[proto].np_handler = nhp->nh_handler; 329938448cdSRobert Watson netisr_proto[proto].np_m2flow = nhp->nh_m2flow; 330938448cdSRobert Watson netisr_proto[proto].np_m2cpuid = nhp->nh_m2cpuid; 331938448cdSRobert Watson netisr_proto[proto].np_drainedcpu = nhp->nh_drainedcpu; 332d4b5cae4SRobert Watson if (nhp->nh_qlimit == 0) 333938448cdSRobert Watson netisr_proto[proto].np_qlimit = netisr_defaultqlimit; 334d4b5cae4SRobert Watson else if (nhp->nh_qlimit > netisr_maxqlimit) { 335d4b5cae4SRobert Watson printf("%s: %s requested queue limit %u capped to " 336d4b5cae4SRobert Watson "net.isr.maxqlimit %u\n", __func__, name, nhp->nh_qlimit, 337d4b5cae4SRobert Watson netisr_maxqlimit); 338938448cdSRobert Watson netisr_proto[proto].np_qlimit = netisr_maxqlimit; 339d4b5cae4SRobert Watson } else 340938448cdSRobert Watson netisr_proto[proto].np_qlimit = nhp->nh_qlimit; 341938448cdSRobert Watson netisr_proto[proto].np_policy = nhp->nh_policy; 342*3aa6d94eSJohn Baldwin CPU_FOREACH(i) { 34353402767SRobert Watson npwp = &(DPCPU_ID_PTR(i, nws))->nws_work[proto]; 344d4b5cae4SRobert Watson bzero(npwp, sizeof(*npwp)); 345938448cdSRobert Watson npwp->nw_qlimit = netisr_proto[proto].np_qlimit; 3461cafed39SJonathan Lemon } 347d4b5cae4SRobert Watson NETISR_WUNLOCK(); 3481cafed39SJonathan Lemon } 3491cafed39SJonathan Lemon 3501cafed39SJonathan Lemon /* 351d4b5cae4SRobert Watson * Clear drop counters across all workstreams for a protocol. 352d4b5cae4SRobert Watson */ 353d4b5cae4SRobert Watson void 354d4b5cae4SRobert Watson netisr_clearqdrops(const struct netisr_handler *nhp) 355d4b5cae4SRobert Watson { 356d4b5cae4SRobert Watson struct netisr_work *npwp; 357d4b5cae4SRobert Watson #ifdef INVARIANTS 358d4b5cae4SRobert Watson const char *name; 359d4b5cae4SRobert Watson #endif 360d4b5cae4SRobert Watson u_int i, proto; 361d4b5cae4SRobert Watson 362d4b5cae4SRobert Watson proto = nhp->nh_proto; 363d4b5cae4SRobert Watson #ifdef INVARIANTS 364d4b5cae4SRobert Watson name = nhp->nh_name; 365d4b5cae4SRobert Watson #endif 366d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 367d4b5cae4SRobert Watson ("%s(%u): protocol too big for %s", __func__, proto, name)); 368d4b5cae4SRobert Watson 369d4b5cae4SRobert Watson NETISR_WLOCK(); 370938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler != NULL, 371d4b5cae4SRobert Watson ("%s(%u): protocol not registered for %s", __func__, proto, 372d4b5cae4SRobert Watson name)); 373d4b5cae4SRobert Watson 374*3aa6d94eSJohn Baldwin CPU_FOREACH(i) { 37553402767SRobert Watson npwp = &(DPCPU_ID_PTR(i, nws))->nws_work[proto]; 376d4b5cae4SRobert Watson npwp->nw_qdrops = 0; 377d4b5cae4SRobert Watson } 378d4b5cae4SRobert Watson NETISR_WUNLOCK(); 379d4b5cae4SRobert Watson } 380d4b5cae4SRobert Watson 381d4b5cae4SRobert Watson /* 3820a32e29fSRobert Watson * Query current drop counters across all workstreams for a protocol. 383d4b5cae4SRobert Watson */ 384d4b5cae4SRobert Watson void 385d4b5cae4SRobert Watson netisr_getqdrops(const struct netisr_handler *nhp, u_int64_t *qdropp) 386d4b5cae4SRobert Watson { 387d4b5cae4SRobert Watson struct netisr_work *npwp; 388d4b5cae4SRobert Watson struct rm_priotracker tracker; 389d4b5cae4SRobert Watson #ifdef INVARIANTS 390d4b5cae4SRobert Watson const char *name; 391d4b5cae4SRobert Watson #endif 392d4b5cae4SRobert Watson u_int i, proto; 393d4b5cae4SRobert Watson 394d4b5cae4SRobert Watson *qdropp = 0; 395d4b5cae4SRobert Watson proto = nhp->nh_proto; 396d4b5cae4SRobert Watson #ifdef INVARIANTS 397d4b5cae4SRobert Watson name = nhp->nh_name; 398d4b5cae4SRobert Watson #endif 399d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 400d4b5cae4SRobert Watson ("%s(%u): protocol too big for %s", __func__, proto, name)); 401d4b5cae4SRobert Watson 402d4b5cae4SRobert Watson NETISR_RLOCK(&tracker); 403938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler != NULL, 404d4b5cae4SRobert Watson ("%s(%u): protocol not registered for %s", __func__, proto, 405d4b5cae4SRobert Watson name)); 406d4b5cae4SRobert Watson 407*3aa6d94eSJohn Baldwin CPU_FOREACH(i) { 40853402767SRobert Watson npwp = &(DPCPU_ID_PTR(i, nws))->nws_work[proto]; 409d4b5cae4SRobert Watson *qdropp += npwp->nw_qdrops; 410d4b5cae4SRobert Watson } 411d4b5cae4SRobert Watson NETISR_RUNLOCK(&tracker); 412d4b5cae4SRobert Watson } 413d4b5cae4SRobert Watson 414d4b5cae4SRobert Watson /* 4150a32e29fSRobert Watson * Query current per-workstream queue limit for a protocol. 416d4b5cae4SRobert Watson */ 417d4b5cae4SRobert Watson void 418d4b5cae4SRobert Watson netisr_getqlimit(const struct netisr_handler *nhp, u_int *qlimitp) 419d4b5cae4SRobert Watson { 420d4b5cae4SRobert Watson struct rm_priotracker tracker; 421d4b5cae4SRobert Watson #ifdef INVARIANTS 422d4b5cae4SRobert Watson const char *name; 423d4b5cae4SRobert Watson #endif 424d4b5cae4SRobert Watson u_int proto; 425d4b5cae4SRobert Watson 426d4b5cae4SRobert Watson proto = nhp->nh_proto; 427d4b5cae4SRobert Watson #ifdef INVARIANTS 428d4b5cae4SRobert Watson name = nhp->nh_name; 429d4b5cae4SRobert Watson #endif 430d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 431d4b5cae4SRobert Watson ("%s(%u): protocol too big for %s", __func__, proto, name)); 432d4b5cae4SRobert Watson 433d4b5cae4SRobert Watson NETISR_RLOCK(&tracker); 434938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler != NULL, 435d4b5cae4SRobert Watson ("%s(%u): protocol not registered for %s", __func__, proto, 436d4b5cae4SRobert Watson name)); 437938448cdSRobert Watson *qlimitp = netisr_proto[proto].np_qlimit; 438d4b5cae4SRobert Watson NETISR_RUNLOCK(&tracker); 439d4b5cae4SRobert Watson } 440d4b5cae4SRobert Watson 441d4b5cae4SRobert Watson /* 442d4b5cae4SRobert Watson * Update the queue limit across per-workstream queues for a protocol. We 443d4b5cae4SRobert Watson * simply change the limits, and don't drain overflowed packets as they will 444d4b5cae4SRobert Watson * (hopefully) take care of themselves shortly. 4451cafed39SJonathan Lemon */ 4461cafed39SJonathan Lemon int 447d4b5cae4SRobert Watson netisr_setqlimit(const struct netisr_handler *nhp, u_int qlimit) 4481cafed39SJonathan Lemon { 449d4b5cae4SRobert Watson struct netisr_work *npwp; 450d4b5cae4SRobert Watson #ifdef INVARIANTS 451d4b5cae4SRobert Watson const char *name; 452d4b5cae4SRobert Watson #endif 453d4b5cae4SRobert Watson u_int i, proto; 4541cafed39SJonathan Lemon 455d4b5cae4SRobert Watson if (qlimit > netisr_maxqlimit) 456d4b5cae4SRobert Watson return (EINVAL); 457d4b5cae4SRobert Watson 458d4b5cae4SRobert Watson proto = nhp->nh_proto; 459d4b5cae4SRobert Watson #ifdef INVARIANTS 460d4b5cae4SRobert Watson name = nhp->nh_name; 461d4b5cae4SRobert Watson #endif 462d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 463d4b5cae4SRobert Watson ("%s(%u): protocol too big for %s", __func__, proto, name)); 464d4b5cae4SRobert Watson 465d4b5cae4SRobert Watson NETISR_WLOCK(); 466938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler != NULL, 467d4b5cae4SRobert Watson ("%s(%u): protocol not registered for %s", __func__, proto, 468d4b5cae4SRobert Watson name)); 469d4b5cae4SRobert Watson 470938448cdSRobert Watson netisr_proto[proto].np_qlimit = qlimit; 471*3aa6d94eSJohn Baldwin CPU_FOREACH(i) { 47253402767SRobert Watson npwp = &(DPCPU_ID_PTR(i, nws))->nws_work[proto]; 473d4b5cae4SRobert Watson npwp->nw_qlimit = qlimit; 474fb68148fSJonathan Lemon } 475d4b5cae4SRobert Watson NETISR_WUNLOCK(); 4763161f583SAndre Oppermann return (0); 477e3b6e33cSJake Burkholder } 478e3b6e33cSJake Burkholder 479d4b5cae4SRobert Watson /* 480d4b5cae4SRobert Watson * Drain all packets currently held in a particular protocol work queue. 481d4b5cae4SRobert Watson */ 482e3b6e33cSJake Burkholder static void 483d4b5cae4SRobert Watson netisr_drain_proto(struct netisr_work *npwp) 484e3b6e33cSJake Burkholder { 485d4b5cae4SRobert Watson struct mbuf *m; 486d4b5cae4SRobert Watson 487d4b5cae4SRobert Watson /* 488d4b5cae4SRobert Watson * We would assert the lock on the workstream but it's not passed in. 489d4b5cae4SRobert Watson */ 490d4b5cae4SRobert Watson while ((m = npwp->nw_head) != NULL) { 491d4b5cae4SRobert Watson npwp->nw_head = m->m_nextpkt; 492d4b5cae4SRobert Watson m->m_nextpkt = NULL; 493d4b5cae4SRobert Watson if (npwp->nw_head == NULL) 494d4b5cae4SRobert Watson npwp->nw_tail = NULL; 495d4b5cae4SRobert Watson npwp->nw_len--; 496d4b5cae4SRobert Watson m_freem(m); 497d4b5cae4SRobert Watson } 498d4b5cae4SRobert Watson KASSERT(npwp->nw_tail == NULL, ("%s: tail", __func__)); 499d4b5cae4SRobert Watson KASSERT(npwp->nw_len == 0, ("%s: len", __func__)); 500d4b5cae4SRobert Watson } 501d4b5cae4SRobert Watson 502d4b5cae4SRobert Watson /* 503d4b5cae4SRobert Watson * Remove the registration of a network protocol, which requires clearing 504d4b5cae4SRobert Watson * per-protocol fields across all workstreams, including freeing all mbufs in 505d4b5cae4SRobert Watson * the queues at time of unregister. All work in netisr is briefly suspended 506d4b5cae4SRobert Watson * while this takes place. 507d4b5cae4SRobert Watson */ 508d4b5cae4SRobert Watson void 509d4b5cae4SRobert Watson netisr_unregister(const struct netisr_handler *nhp) 510d4b5cae4SRobert Watson { 511d4b5cae4SRobert Watson struct netisr_work *npwp; 512d4b5cae4SRobert Watson #ifdef INVARIANTS 513d4b5cae4SRobert Watson const char *name; 514d4b5cae4SRobert Watson #endif 515d4b5cae4SRobert Watson u_int i, proto; 516d4b5cae4SRobert Watson 517d4b5cae4SRobert Watson proto = nhp->nh_proto; 518d4b5cae4SRobert Watson #ifdef INVARIANTS 519d4b5cae4SRobert Watson name = nhp->nh_name; 520d4b5cae4SRobert Watson #endif 521d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 522d4b5cae4SRobert Watson ("%s(%u): protocol too big for %s", __func__, proto, name)); 523d4b5cae4SRobert Watson 524d4b5cae4SRobert Watson NETISR_WLOCK(); 525938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler != NULL, 526d4b5cae4SRobert Watson ("%s(%u): protocol not registered for %s", __func__, proto, 527d4b5cae4SRobert Watson name)); 528d4b5cae4SRobert Watson 529938448cdSRobert Watson netisr_proto[proto].np_name = NULL; 530938448cdSRobert Watson netisr_proto[proto].np_handler = NULL; 531938448cdSRobert Watson netisr_proto[proto].np_m2flow = NULL; 532938448cdSRobert Watson netisr_proto[proto].np_m2cpuid = NULL; 533938448cdSRobert Watson netisr_proto[proto].np_qlimit = 0; 534938448cdSRobert Watson netisr_proto[proto].np_policy = 0; 535*3aa6d94eSJohn Baldwin CPU_FOREACH(i) { 53653402767SRobert Watson npwp = &(DPCPU_ID_PTR(i, nws))->nws_work[proto]; 537d4b5cae4SRobert Watson netisr_drain_proto(npwp); 538d4b5cae4SRobert Watson bzero(npwp, sizeof(*npwp)); 539d4b5cae4SRobert Watson } 540d4b5cae4SRobert Watson NETISR_WUNLOCK(); 541d4b5cae4SRobert Watson } 542d4b5cae4SRobert Watson 543d4b5cae4SRobert Watson /* 544d4b5cae4SRobert Watson * Look up the workstream given a packet and source identifier. Do this by 545d4b5cae4SRobert Watson * checking the protocol's policy, and optionally call out to the protocol 546d4b5cae4SRobert Watson * for assistance if required. 547d4b5cae4SRobert Watson */ 548d4b5cae4SRobert Watson static struct mbuf * 549d4b5cae4SRobert Watson netisr_select_cpuid(struct netisr_proto *npp, uintptr_t source, 550d4b5cae4SRobert Watson struct mbuf *m, u_int *cpuidp) 551d4b5cae4SRobert Watson { 552d4b5cae4SRobert Watson struct ifnet *ifp; 553d4b5cae4SRobert Watson 554d4b5cae4SRobert Watson NETISR_LOCK_ASSERT(); 555d4b5cae4SRobert Watson 556d4b5cae4SRobert Watson /* 557d4b5cae4SRobert Watson * In the event we have only one worker, shortcut and deliver to it 558d4b5cae4SRobert Watson * without further ado. 559d4b5cae4SRobert Watson */ 560d4b5cae4SRobert Watson if (nws_count == 1) { 561d4b5cae4SRobert Watson *cpuidp = nws_array[0]; 562d4b5cae4SRobert Watson return (m); 563d4b5cae4SRobert Watson } 564d4b5cae4SRobert Watson 565d4b5cae4SRobert Watson /* 566d4b5cae4SRobert Watson * What happens next depends on the policy selected by the protocol. 567d4b5cae4SRobert Watson * If we want to support per-interface policies, we should do that 568d4b5cae4SRobert Watson * here first. 569d4b5cae4SRobert Watson */ 570d4b5cae4SRobert Watson switch (npp->np_policy) { 571d4b5cae4SRobert Watson case NETISR_POLICY_CPU: 572d4b5cae4SRobert Watson return (npp->np_m2cpuid(m, source, cpuidp)); 573d4b5cae4SRobert Watson 574d4b5cae4SRobert Watson case NETISR_POLICY_FLOW: 575d4b5cae4SRobert Watson if (!(m->m_flags & M_FLOWID) && npp->np_m2flow != NULL) { 576d4b5cae4SRobert Watson m = npp->np_m2flow(m, source); 577d4b5cae4SRobert Watson if (m == NULL) 578d4b5cae4SRobert Watson return (NULL); 579d4b5cae4SRobert Watson } 580d4b5cae4SRobert Watson if (m->m_flags & M_FLOWID) { 581d4b5cae4SRobert Watson *cpuidp = 582d4b5cae4SRobert Watson netisr_default_flow2cpu(m->m_pkthdr.flowid); 583d4b5cae4SRobert Watson return (m); 584d4b5cae4SRobert Watson } 585d4b5cae4SRobert Watson /* FALLTHROUGH */ 586d4b5cae4SRobert Watson 587d4b5cae4SRobert Watson case NETISR_POLICY_SOURCE: 588d4b5cae4SRobert Watson ifp = m->m_pkthdr.rcvif; 589d4b5cae4SRobert Watson if (ifp != NULL) 590d4b5cae4SRobert Watson *cpuidp = nws_array[(ifp->if_index + source) % 591d4b5cae4SRobert Watson nws_count]; 592d4b5cae4SRobert Watson else 593d4b5cae4SRobert Watson *cpuidp = nws_array[source % nws_count]; 594d4b5cae4SRobert Watson return (m); 595d4b5cae4SRobert Watson 596d4b5cae4SRobert Watson default: 597d4b5cae4SRobert Watson panic("%s: invalid policy %u for %s", __func__, 598d4b5cae4SRobert Watson npp->np_policy, npp->np_name); 599d4b5cae4SRobert Watson } 600d4b5cae4SRobert Watson } 601d4b5cae4SRobert Watson 602d4b5cae4SRobert Watson /* 603d4b5cae4SRobert Watson * Process packets associated with a workstream and protocol. For reasons of 604d4b5cae4SRobert Watson * fairness, we process up to one complete netisr queue at a time, moving the 605d4b5cae4SRobert Watson * queue to a stack-local queue for processing, but do not loop refreshing 606d4b5cae4SRobert Watson * from the global queue. The caller is responsible for deciding whether to 607d4b5cae4SRobert Watson * loop, and for setting the NWS_RUNNING flag. The passed workstream will be 608d4b5cae4SRobert Watson * locked on entry and relocked before return, but will be released while 609d4b5cae4SRobert Watson * processing. The number of packets processed is returned. 610d4b5cae4SRobert Watson */ 611d4b5cae4SRobert Watson static u_int 612d4b5cae4SRobert Watson netisr_process_workstream_proto(struct netisr_workstream *nwsp, u_int proto) 613d4b5cae4SRobert Watson { 614d4b5cae4SRobert Watson struct netisr_work local_npw, *npwp; 615d4b5cae4SRobert Watson u_int handled; 616d4b5cae4SRobert Watson struct mbuf *m; 617d4b5cae4SRobert Watson 618d4b5cae4SRobert Watson NETISR_LOCK_ASSERT(); 619d4b5cae4SRobert Watson NWS_LOCK_ASSERT(nwsp); 620d4b5cae4SRobert Watson 621d4b5cae4SRobert Watson KASSERT(nwsp->nws_flags & NWS_RUNNING, 622d4b5cae4SRobert Watson ("%s(%u): not running", __func__, proto)); 623d4b5cae4SRobert Watson KASSERT(proto >= 0 && proto < NETISR_MAXPROT, 624d4b5cae4SRobert Watson ("%s(%u): invalid proto\n", __func__, proto)); 625d4b5cae4SRobert Watson 626d4b5cae4SRobert Watson npwp = &nwsp->nws_work[proto]; 627d4b5cae4SRobert Watson if (npwp->nw_len == 0) 628d4b5cae4SRobert Watson return (0); 629d4b5cae4SRobert Watson 630d4b5cae4SRobert Watson /* 631d4b5cae4SRobert Watson * Move the global work queue to a thread-local work queue. 632d4b5cae4SRobert Watson * 633d4b5cae4SRobert Watson * Notice that this means the effective maximum length of the queue 634d4b5cae4SRobert Watson * is actually twice that of the maximum queue length specified in 635d4b5cae4SRobert Watson * the protocol registration call. 636d4b5cae4SRobert Watson */ 637d4b5cae4SRobert Watson handled = npwp->nw_len; 638d4b5cae4SRobert Watson local_npw = *npwp; 639d4b5cae4SRobert Watson npwp->nw_head = NULL; 640d4b5cae4SRobert Watson npwp->nw_tail = NULL; 641d4b5cae4SRobert Watson npwp->nw_len = 0; 642d4b5cae4SRobert Watson nwsp->nws_pendingbits &= ~(1 << proto); 643d4b5cae4SRobert Watson NWS_UNLOCK(nwsp); 644d4b5cae4SRobert Watson while ((m = local_npw.nw_head) != NULL) { 645d4b5cae4SRobert Watson local_npw.nw_head = m->m_nextpkt; 646d4b5cae4SRobert Watson m->m_nextpkt = NULL; 647d4b5cae4SRobert Watson if (local_npw.nw_head == NULL) 648d4b5cae4SRobert Watson local_npw.nw_tail = NULL; 649d4b5cae4SRobert Watson local_npw.nw_len--; 650d4b5cae4SRobert Watson VNET_ASSERT(m->m_pkthdr.rcvif != NULL); 651d4b5cae4SRobert Watson CURVNET_SET(m->m_pkthdr.rcvif->if_vnet); 652938448cdSRobert Watson netisr_proto[proto].np_handler(m); 653d4b5cae4SRobert Watson CURVNET_RESTORE(); 654d4b5cae4SRobert Watson } 655d4b5cae4SRobert Watson KASSERT(local_npw.nw_len == 0, 656d4b5cae4SRobert Watson ("%s(%u): len %u", __func__, proto, local_npw.nw_len)); 657938448cdSRobert Watson if (netisr_proto[proto].np_drainedcpu) 658938448cdSRobert Watson netisr_proto[proto].np_drainedcpu(nwsp->nws_cpu); 659d4b5cae4SRobert Watson NWS_LOCK(nwsp); 660d4b5cae4SRobert Watson npwp->nw_handled += handled; 661d4b5cae4SRobert Watson return (handled); 662d4b5cae4SRobert Watson } 663d4b5cae4SRobert Watson 664d4b5cae4SRobert Watson /* 6650a32e29fSRobert Watson * SWI handler for netisr -- processes packets in a set of workstreams that 666d4b5cae4SRobert Watson * it owns, woken up by calls to NWS_SIGNAL(). If this workstream is already 667d4b5cae4SRobert Watson * being direct dispatched, go back to sleep and wait for the dispatching 668d4b5cae4SRobert Watson * thread to wake us up again. 669d4b5cae4SRobert Watson */ 670d4b5cae4SRobert Watson static void 671d4b5cae4SRobert Watson swi_net(void *arg) 672d4b5cae4SRobert Watson { 673d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 674d4b5cae4SRobert Watson struct rm_priotracker tracker; 675d4b5cae4SRobert Watson #endif 676d4b5cae4SRobert Watson struct netisr_workstream *nwsp; 677d4b5cae4SRobert Watson u_int bits, prot; 678d4b5cae4SRobert Watson 679d4b5cae4SRobert Watson nwsp = arg; 680d4b5cae4SRobert Watson 6811cafed39SJonathan Lemon #ifdef DEVICE_POLLING 682d4b5cae4SRobert Watson KASSERT(nws_count == 1, 683d4b5cae4SRobert Watson ("%s: device_polling but nws_count != 1", __func__)); 684d4b5cae4SRobert Watson netisr_poll(); 685d4b5cae4SRobert Watson #endif 686d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 687d4b5cae4SRobert Watson NETISR_RLOCK(&tracker); 688d4b5cae4SRobert Watson #endif 689d4b5cae4SRobert Watson NWS_LOCK(nwsp); 690d4b5cae4SRobert Watson KASSERT(!(nwsp->nws_flags & NWS_RUNNING), ("swi_net: running")); 691d4b5cae4SRobert Watson if (nwsp->nws_flags & NWS_DISPATCHING) 692d4b5cae4SRobert Watson goto out; 693d4b5cae4SRobert Watson nwsp->nws_flags |= NWS_RUNNING; 694d4b5cae4SRobert Watson nwsp->nws_flags &= ~NWS_SCHEDULED; 695d4b5cae4SRobert Watson while ((bits = nwsp->nws_pendingbits) != 0) { 696d4b5cae4SRobert Watson while ((prot = ffs(bits)) != 0) { 697d4b5cae4SRobert Watson prot--; 698d4b5cae4SRobert Watson bits &= ~(1 << prot); 699d4b5cae4SRobert Watson (void)netisr_process_workstream_proto(nwsp, prot); 700d4b5cae4SRobert Watson } 701d4b5cae4SRobert Watson } 702d4b5cae4SRobert Watson nwsp->nws_flags &= ~NWS_RUNNING; 703d4b5cae4SRobert Watson out: 704d4b5cae4SRobert Watson NWS_UNLOCK(nwsp); 705d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 706d4b5cae4SRobert Watson NETISR_RUNLOCK(&tracker); 707d4b5cae4SRobert Watson #endif 708d4b5cae4SRobert Watson #ifdef DEVICE_POLLING 709d4b5cae4SRobert Watson netisr_pollmore(); 710d4b5cae4SRobert Watson #endif 711d4b5cae4SRobert Watson } 712d4b5cae4SRobert Watson 713d4b5cae4SRobert Watson static int 714d4b5cae4SRobert Watson netisr_queue_workstream(struct netisr_workstream *nwsp, u_int proto, 715d4b5cae4SRobert Watson struct netisr_work *npwp, struct mbuf *m, int *dosignalp) 716d4b5cae4SRobert Watson { 717d4b5cae4SRobert Watson 718d4b5cae4SRobert Watson NWS_LOCK_ASSERT(nwsp); 719d4b5cae4SRobert Watson 720d4b5cae4SRobert Watson *dosignalp = 0; 721d4b5cae4SRobert Watson if (npwp->nw_len < npwp->nw_qlimit) { 722d4b5cae4SRobert Watson m->m_nextpkt = NULL; 723d4b5cae4SRobert Watson if (npwp->nw_head == NULL) { 724d4b5cae4SRobert Watson npwp->nw_head = m; 725d4b5cae4SRobert Watson npwp->nw_tail = m; 726d4b5cae4SRobert Watson } else { 727d4b5cae4SRobert Watson npwp->nw_tail->m_nextpkt = m; 728d4b5cae4SRobert Watson npwp->nw_tail = m; 729d4b5cae4SRobert Watson } 730d4b5cae4SRobert Watson npwp->nw_len++; 731d4b5cae4SRobert Watson if (npwp->nw_len > npwp->nw_watermark) 732d4b5cae4SRobert Watson npwp->nw_watermark = npwp->nw_len; 7330a32e29fSRobert Watson 7340a32e29fSRobert Watson /* 7350a32e29fSRobert Watson * We must set the bit regardless of NWS_RUNNING, so that 7360a32e29fSRobert Watson * swi_net() keeps calling netisr_process_workstream_proto(). 7370a32e29fSRobert Watson */ 738d4b5cae4SRobert Watson nwsp->nws_pendingbits |= (1 << proto); 739d4b5cae4SRobert Watson if (!(nwsp->nws_flags & 740d4b5cae4SRobert Watson (NWS_RUNNING | NWS_DISPATCHING | NWS_SCHEDULED))) { 741d4b5cae4SRobert Watson nwsp->nws_flags |= NWS_SCHEDULED; 742d4b5cae4SRobert Watson *dosignalp = 1; /* Defer until unlocked. */ 743d4b5cae4SRobert Watson } 744d4b5cae4SRobert Watson npwp->nw_queued++; 745d4b5cae4SRobert Watson return (0); 746d4b5cae4SRobert Watson } else { 747ba3b25b3SBjoern A. Zeeb m_freem(m); 748d4b5cae4SRobert Watson npwp->nw_qdrops++; 749d4b5cae4SRobert Watson return (ENOBUFS); 750d4b5cae4SRobert Watson } 751d4b5cae4SRobert Watson } 752d4b5cae4SRobert Watson 753d4b5cae4SRobert Watson static int 754d4b5cae4SRobert Watson netisr_queue_internal(u_int proto, struct mbuf *m, u_int cpuid) 755d4b5cae4SRobert Watson { 756d4b5cae4SRobert Watson struct netisr_workstream *nwsp; 757d4b5cae4SRobert Watson struct netisr_work *npwp; 758d4b5cae4SRobert Watson int dosignal, error; 759d4b5cae4SRobert Watson 760d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 761d4b5cae4SRobert Watson NETISR_LOCK_ASSERT(); 762d4b5cae4SRobert Watson #endif 7639e6e01ebSRobert Watson KASSERT(cpuid <= mp_maxid, ("%s: cpuid too big (%u, %u)", __func__, 7649e6e01ebSRobert Watson cpuid, mp_maxid)); 76553402767SRobert Watson KASSERT(!CPU_ABSENT(cpuid), ("%s: CPU %u absent", __func__, cpuid)); 766d4b5cae4SRobert Watson 767d4b5cae4SRobert Watson dosignal = 0; 768d4b5cae4SRobert Watson error = 0; 76953402767SRobert Watson nwsp = DPCPU_ID_PTR(cpuid, nws); 770d4b5cae4SRobert Watson npwp = &nwsp->nws_work[proto]; 771d4b5cae4SRobert Watson NWS_LOCK(nwsp); 772d4b5cae4SRobert Watson error = netisr_queue_workstream(nwsp, proto, npwp, m, &dosignal); 773d4b5cae4SRobert Watson NWS_UNLOCK(nwsp); 774d4b5cae4SRobert Watson if (dosignal) 775d4b5cae4SRobert Watson NWS_SIGNAL(nwsp); 776d4b5cae4SRobert Watson return (error); 777d4b5cae4SRobert Watson } 778d4b5cae4SRobert Watson 779d4b5cae4SRobert Watson int 780d4b5cae4SRobert Watson netisr_queue_src(u_int proto, uintptr_t source, struct mbuf *m) 781d4b5cae4SRobert Watson { 782d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 783d4b5cae4SRobert Watson struct rm_priotracker tracker; 784d4b5cae4SRobert Watson #endif 785d4b5cae4SRobert Watson u_int cpuid; 786d4b5cae4SRobert Watson int error; 787d4b5cae4SRobert Watson 788d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 789d4b5cae4SRobert Watson ("%s: invalid proto %u", __func__, proto)); 790d4b5cae4SRobert Watson 791d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 792d4b5cae4SRobert Watson NETISR_RLOCK(&tracker); 793d4b5cae4SRobert Watson #endif 794938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler != NULL, 795d4b5cae4SRobert Watson ("%s: invalid proto %u", __func__, proto)); 796d4b5cae4SRobert Watson 797938448cdSRobert Watson m = netisr_select_cpuid(&netisr_proto[proto], source, m, &cpuid); 79853402767SRobert Watson if (m != NULL) { 79953402767SRobert Watson KASSERT(!CPU_ABSENT(cpuid), ("%s: CPU %u absent", __func__, 80053402767SRobert Watson cpuid)); 801d4b5cae4SRobert Watson error = netisr_queue_internal(proto, m, cpuid); 80253402767SRobert Watson } else 803d4b5cae4SRobert Watson error = ENOBUFS; 804d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 805d4b5cae4SRobert Watson NETISR_RUNLOCK(&tracker); 806d4b5cae4SRobert Watson #endif 807d4b5cae4SRobert Watson return (error); 808d4b5cae4SRobert Watson } 809d4b5cae4SRobert Watson 810d4b5cae4SRobert Watson int 811d4b5cae4SRobert Watson netisr_queue(u_int proto, struct mbuf *m) 812d4b5cae4SRobert Watson { 813d4b5cae4SRobert Watson 814d4b5cae4SRobert Watson return (netisr_queue_src(proto, 0, m)); 815d4b5cae4SRobert Watson } 816d4b5cae4SRobert Watson 817d4b5cae4SRobert Watson /* 8180a32e29fSRobert Watson * Dispatch a packet for netisr processing; direct dispatch is permitted by 819d4b5cae4SRobert Watson * calling context. 820d4b5cae4SRobert Watson */ 821d4b5cae4SRobert Watson int 822d4b5cae4SRobert Watson netisr_dispatch_src(u_int proto, uintptr_t source, struct mbuf *m) 823d4b5cae4SRobert Watson { 824d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 825d4b5cae4SRobert Watson struct rm_priotracker tracker; 826d4b5cae4SRobert Watson #endif 827d4b5cae4SRobert Watson struct netisr_workstream *nwsp; 828d4b5cae4SRobert Watson struct netisr_work *npwp; 829d4b5cae4SRobert Watson int dosignal, error; 830d4b5cae4SRobert Watson u_int cpuid; 831d4b5cae4SRobert Watson 832d4b5cae4SRobert Watson /* 833d4b5cae4SRobert Watson * If direct dispatch is entirely disabled, fall back on queueing. 834d4b5cae4SRobert Watson */ 835d4b5cae4SRobert Watson if (!netisr_direct) 836d4b5cae4SRobert Watson return (netisr_queue_src(proto, source, m)); 837d4b5cae4SRobert Watson 838d4b5cae4SRobert Watson KASSERT(proto < NETISR_MAXPROT, 839d4b5cae4SRobert Watson ("%s: invalid proto %u", __func__, proto)); 840d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 841d4b5cae4SRobert Watson NETISR_RLOCK(&tracker); 842d4b5cae4SRobert Watson #endif 843938448cdSRobert Watson KASSERT(netisr_proto[proto].np_handler != NULL, 844d4b5cae4SRobert Watson ("%s: invalid proto %u", __func__, proto)); 845d4b5cae4SRobert Watson 846d4b5cae4SRobert Watson /* 847d4b5cae4SRobert Watson * If direct dispatch is forced, then unconditionally dispatch 848d4b5cae4SRobert Watson * without a formal CPU selection. Borrow the current CPU's stats, 849d4b5cae4SRobert Watson * even if there's no worker on it. In this case we don't update 850d4b5cae4SRobert Watson * nws_flags because all netisr processing will be source ordered due 851d4b5cae4SRobert Watson * to always being forced to directly dispatch. 852d4b5cae4SRobert Watson */ 853d4b5cae4SRobert Watson if (netisr_direct_force) { 85453402767SRobert Watson nwsp = DPCPU_PTR(nws); 855d4b5cae4SRobert Watson npwp = &nwsp->nws_work[proto]; 856d4b5cae4SRobert Watson npwp->nw_dispatched++; 857d4b5cae4SRobert Watson npwp->nw_handled++; 858938448cdSRobert Watson netisr_proto[proto].np_handler(m); 859d4b5cae4SRobert Watson error = 0; 860d4b5cae4SRobert Watson goto out_unlock; 861d4b5cae4SRobert Watson } 862d4b5cae4SRobert Watson 863d4b5cae4SRobert Watson /* 864d4b5cae4SRobert Watson * Otherwise, we execute in a hybrid mode where we will try to direct 865d4b5cae4SRobert Watson * dispatch if we're on the right CPU and the netisr worker isn't 866d4b5cae4SRobert Watson * already running. 867d4b5cae4SRobert Watson */ 868938448cdSRobert Watson m = netisr_select_cpuid(&netisr_proto[proto], source, m, &cpuid); 869d4b5cae4SRobert Watson if (m == NULL) { 870d4b5cae4SRobert Watson error = ENOBUFS; 871d4b5cae4SRobert Watson goto out_unlock; 872d4b5cae4SRobert Watson } 87353402767SRobert Watson KASSERT(!CPU_ABSENT(cpuid), ("%s: CPU %u absent", __func__, cpuid)); 874d4b5cae4SRobert Watson sched_pin(); 875d4b5cae4SRobert Watson if (cpuid != curcpu) 876d4b5cae4SRobert Watson goto queue_fallback; 87753402767SRobert Watson nwsp = DPCPU_PTR(nws); 878d4b5cae4SRobert Watson npwp = &nwsp->nws_work[proto]; 879d4b5cae4SRobert Watson 880d4b5cae4SRobert Watson /*- 881d4b5cae4SRobert Watson * We are willing to direct dispatch only if three conditions hold: 882d4b5cae4SRobert Watson * 883d4b5cae4SRobert Watson * (1) The netisr worker isn't already running, 884d4b5cae4SRobert Watson * (2) Another thread isn't already directly dispatching, and 885d4b5cae4SRobert Watson * (3) The netisr hasn't already been woken up. 886d4b5cae4SRobert Watson */ 887d4b5cae4SRobert Watson NWS_LOCK(nwsp); 888d4b5cae4SRobert Watson if (nwsp->nws_flags & (NWS_RUNNING | NWS_DISPATCHING | NWS_SCHEDULED)) { 889d4b5cae4SRobert Watson error = netisr_queue_workstream(nwsp, proto, npwp, m, 890d4b5cae4SRobert Watson &dosignal); 89153402767SRobert Watson NWS_UNLOCK(nwsp); 892d4b5cae4SRobert Watson if (dosignal) 893d4b5cae4SRobert Watson NWS_SIGNAL(nwsp); 894d4b5cae4SRobert Watson goto out_unpin; 895d4b5cae4SRobert Watson } 896d4b5cae4SRobert Watson 897d4b5cae4SRobert Watson /* 898d4b5cae4SRobert Watson * The current thread is now effectively the netisr worker, so set 899d4b5cae4SRobert Watson * the dispatching flag to prevent concurrent processing of the 900d4b5cae4SRobert Watson * stream from another thread (even the netisr worker), which could 901d4b5cae4SRobert Watson * otherwise lead to effective misordering of the stream. 902d4b5cae4SRobert Watson */ 903d4b5cae4SRobert Watson nwsp->nws_flags |= NWS_DISPATCHING; 904d4b5cae4SRobert Watson NWS_UNLOCK(nwsp); 905938448cdSRobert Watson netisr_proto[proto].np_handler(m); 906d4b5cae4SRobert Watson NWS_LOCK(nwsp); 907d4b5cae4SRobert Watson nwsp->nws_flags &= ~NWS_DISPATCHING; 908d4b5cae4SRobert Watson npwp->nw_handled++; 909d4b5cae4SRobert Watson npwp->nw_hybrid_dispatched++; 910d4b5cae4SRobert Watson 911d4b5cae4SRobert Watson /* 912d4b5cae4SRobert Watson * If other work was enqueued by another thread while we were direct 913d4b5cae4SRobert Watson * dispatching, we need to signal the netisr worker to do that work. 914d4b5cae4SRobert Watson * In the future, we might want to do some of that work in the 915d4b5cae4SRobert Watson * current thread, rather than trigger further context switches. If 916d4b5cae4SRobert Watson * so, we'll want to establish a reasonable bound on the work done in 917d4b5cae4SRobert Watson * the "borrowed" context. 918d4b5cae4SRobert Watson */ 919d4b5cae4SRobert Watson if (nwsp->nws_pendingbits != 0) { 920d4b5cae4SRobert Watson nwsp->nws_flags |= NWS_SCHEDULED; 921d4b5cae4SRobert Watson dosignal = 1; 922d4b5cae4SRobert Watson } else 923d4b5cae4SRobert Watson dosignal = 0; 924d4b5cae4SRobert Watson NWS_UNLOCK(nwsp); 925d4b5cae4SRobert Watson if (dosignal) 926d4b5cae4SRobert Watson NWS_SIGNAL(nwsp); 927d4b5cae4SRobert Watson error = 0; 928d4b5cae4SRobert Watson goto out_unpin; 929d4b5cae4SRobert Watson 930d4b5cae4SRobert Watson queue_fallback: 931d4b5cae4SRobert Watson error = netisr_queue_internal(proto, m, cpuid); 932d4b5cae4SRobert Watson out_unpin: 933d4b5cae4SRobert Watson sched_unpin(); 934d4b5cae4SRobert Watson out_unlock: 935d4b5cae4SRobert Watson #ifdef NETISR_LOCKING 936d4b5cae4SRobert Watson NETISR_RUNLOCK(&tracker); 937d4b5cae4SRobert Watson #endif 938d4b5cae4SRobert Watson return (error); 939d4b5cae4SRobert Watson } 940d4b5cae4SRobert Watson 941d4b5cae4SRobert Watson int 942d4b5cae4SRobert Watson netisr_dispatch(u_int proto, struct mbuf *m) 943d4b5cae4SRobert Watson { 944d4b5cae4SRobert Watson 945d4b5cae4SRobert Watson return (netisr_dispatch_src(proto, 0, m)); 946d4b5cae4SRobert Watson } 947d4b5cae4SRobert Watson 948d4b5cae4SRobert Watson #ifdef DEVICE_POLLING 949d4b5cae4SRobert Watson /* 950d4b5cae4SRobert Watson * Kernel polling borrows a netisr thread to run interface polling in; this 951d4b5cae4SRobert Watson * function allows kernel polling to request that the netisr thread be 952d4b5cae4SRobert Watson * scheduled even if no packets are pending for protocols. 953d4b5cae4SRobert Watson */ 954d4b5cae4SRobert Watson void 955d4b5cae4SRobert Watson netisr_sched_poll(void) 956d4b5cae4SRobert Watson { 957d4b5cae4SRobert Watson struct netisr_workstream *nwsp; 958d4b5cae4SRobert Watson 95953402767SRobert Watson nwsp = DPCPU_ID_PTR(nws_array[0], nws); 960d4b5cae4SRobert Watson NWS_SIGNAL(nwsp); 961d4b5cae4SRobert Watson } 9621cafed39SJonathan Lemon #endif 963e3b6e33cSJake Burkholder 964d4b5cae4SRobert Watson static void 965d4b5cae4SRobert Watson netisr_start_swi(u_int cpuid, struct pcpu *pc) 966d4b5cae4SRobert Watson { 967d4b5cae4SRobert Watson char swiname[12]; 968d4b5cae4SRobert Watson struct netisr_workstream *nwsp; 969d4b5cae4SRobert Watson int error; 970d4b5cae4SRobert Watson 97153402767SRobert Watson KASSERT(!CPU_ABSENT(cpuid), ("%s: CPU %u absent", __func__, cpuid)); 97253402767SRobert Watson 97353402767SRobert Watson nwsp = DPCPU_ID_PTR(cpuid, nws); 974d4b5cae4SRobert Watson mtx_init(&nwsp->nws_mtx, "netisr_mtx", NULL, MTX_DEF); 975d4b5cae4SRobert Watson nwsp->nws_cpu = cpuid; 976d4b5cae4SRobert Watson snprintf(swiname, sizeof(swiname), "netisr %u", cpuid); 977d4b5cae4SRobert Watson error = swi_add(&nwsp->nws_intr_event, swiname, swi_net, nwsp, 978d4b5cae4SRobert Watson SWI_NET, INTR_MPSAFE, &nwsp->nws_swi_cookie); 979d4b5cae4SRobert Watson if (error) 980d4b5cae4SRobert Watson panic("%s: swi_add %d", __func__, error); 981d4b5cae4SRobert Watson pc->pc_netisr = nwsp->nws_intr_event; 982d4b5cae4SRobert Watson if (netisr_bindthreads) { 983d4b5cae4SRobert Watson error = intr_event_bind(nwsp->nws_intr_event, cpuid); 984d4b5cae4SRobert Watson if (error != 0) 985d4b5cae4SRobert Watson printf("%s: cpu %u: intr_event_bind: %d", __func__, 986d4b5cae4SRobert Watson cpuid, error); 987e3b6e33cSJake Burkholder } 988d4b5cae4SRobert Watson NETISR_WLOCK(); 989d4b5cae4SRobert Watson nws_array[nws_count] = nwsp->nws_cpu; 990d4b5cae4SRobert Watson nws_count++; 991d4b5cae4SRobert Watson NETISR_WUNLOCK(); 992e3b6e33cSJake Burkholder } 993e3b6e33cSJake Burkholder 994d4b5cae4SRobert Watson /* 995d4b5cae4SRobert Watson * Initialize the netisr subsystem. We rely on BSS and static initialization 996d4b5cae4SRobert Watson * of most fields in global data structures. 997d4b5cae4SRobert Watson * 998d4b5cae4SRobert Watson * Start a worker thread for the boot CPU so that we can support network 999d4b5cae4SRobert Watson * traffic immediately in case the network stack is used before additional 1000d4b5cae4SRobert Watson * CPUs are started (for example, diskless boot). 1001d4b5cae4SRobert Watson */ 1002e3b6e33cSJake Burkholder static void 1003d4b5cae4SRobert Watson netisr_init(void *arg) 1004e3b6e33cSJake Burkholder { 1005e3b6e33cSJake Burkholder 1006d4b5cae4SRobert Watson KASSERT(curcpu == 0, ("%s: not on CPU 0", __func__)); 1007d4b5cae4SRobert Watson 1008d4b5cae4SRobert Watson NETISR_LOCK_INIT(); 10099e6e01ebSRobert Watson if (netisr_maxthreads < 1) 1010d4b5cae4SRobert Watson netisr_maxthreads = 1; 10119e6e01ebSRobert Watson if (netisr_maxthreads > mp_ncpus) { 1012912f6323SRobert Watson printf("netisr_init: forcing maxthreads from %d to %d\n", 10139e6e01ebSRobert Watson netisr_maxthreads, mp_ncpus); 10149e6e01ebSRobert Watson netisr_maxthreads = mp_ncpus; 1015ed54411cSRobert Watson } 1016ed54411cSRobert Watson if (netisr_defaultqlimit > netisr_maxqlimit) { 1017912f6323SRobert Watson printf("netisr_init: forcing defaultqlimit from %d to %d\n", 10189e6e01ebSRobert Watson netisr_defaultqlimit, netisr_maxqlimit); 1019d4b5cae4SRobert Watson netisr_defaultqlimit = netisr_maxqlimit; 1020ed54411cSRobert Watson } 1021d4b5cae4SRobert Watson #ifdef DEVICE_POLLING 1022d4b5cae4SRobert Watson /* 1023d4b5cae4SRobert Watson * The device polling code is not yet aware of how to deal with 1024d4b5cae4SRobert Watson * multiple netisr threads, so for the time being compiling in device 1025d4b5cae4SRobert Watson * polling disables parallel netisr workers. 1026d4b5cae4SRobert Watson */ 1027ed54411cSRobert Watson if (netisr_maxthreads != 1 || netisr_bindthreads != 0) { 1028912f6323SRobert Watson printf("netisr_init: forcing maxthreads to 1 and " 1029912f6323SRobert Watson "bindthreads to 0 for device polling\n"); 1030d4b5cae4SRobert Watson netisr_maxthreads = 1; 1031d4b5cae4SRobert Watson netisr_bindthreads = 0; 1032ed54411cSRobert Watson } 1033d4b5cae4SRobert Watson #endif 1034d4b5cae4SRobert Watson 1035d4b5cae4SRobert Watson netisr_start_swi(curcpu, pcpu_find(curcpu)); 1036e3b6e33cSJake Burkholder } 1037d4b5cae4SRobert Watson SYSINIT(netisr_init, SI_SUB_SOFTINTR, SI_ORDER_FIRST, netisr_init, NULL); 1038d4b5cae4SRobert Watson 1039d4b5cae4SRobert Watson /* 1040d4b5cae4SRobert Watson * Start worker threads for additional CPUs. No attempt to gracefully handle 1041d4b5cae4SRobert Watson * work reassignment, we don't yet support dynamic reconfiguration. 1042d4b5cae4SRobert Watson */ 1043d4b5cae4SRobert Watson static void 1044d4b5cae4SRobert Watson netisr_start(void *arg) 1045d4b5cae4SRobert Watson { 1046d4b5cae4SRobert Watson struct pcpu *pc; 1047d4b5cae4SRobert Watson 1048d4b5cae4SRobert Watson SLIST_FOREACH(pc, &cpuhead, pc_allcpu) { 1049d4b5cae4SRobert Watson if (nws_count >= netisr_maxthreads) 1050d4b5cae4SRobert Watson break; 1051d4b5cae4SRobert Watson /* XXXRW: Is skipping absent CPUs still required here? */ 1052d4b5cae4SRobert Watson if (CPU_ABSENT(pc->pc_cpuid)) 1053d4b5cae4SRobert Watson continue; 1054d4b5cae4SRobert Watson /* Worker will already be present for boot CPU. */ 1055d4b5cae4SRobert Watson if (pc->pc_netisr != NULL) 1056d4b5cae4SRobert Watson continue; 1057d4b5cae4SRobert Watson netisr_start_swi(pc->pc_cpuid, pc); 1058d4b5cae4SRobert Watson } 1059d4b5cae4SRobert Watson } 1060d4b5cae4SRobert Watson SYSINIT(netisr_start, SI_SUB_SMP, SI_ORDER_MIDDLE, netisr_start, NULL); 1061d4b5cae4SRobert Watson 10622d22f334SRobert Watson /* 10632d22f334SRobert Watson * Sysctl monitoring for netisr: query a list of registered protocols. 10642d22f334SRobert Watson */ 10652d22f334SRobert Watson static int 10662d22f334SRobert Watson sysctl_netisr_proto(SYSCTL_HANDLER_ARGS) 10672d22f334SRobert Watson { 10682d22f334SRobert Watson struct rm_priotracker tracker; 10692d22f334SRobert Watson struct sysctl_netisr_proto *snpp, *snp_array; 10702d22f334SRobert Watson struct netisr_proto *npp; 10712d22f334SRobert Watson u_int counter, proto; 10722d22f334SRobert Watson int error; 10732d22f334SRobert Watson 10742d22f334SRobert Watson if (req->newptr != NULL) 10752d22f334SRobert Watson return (EINVAL); 10762d22f334SRobert Watson snp_array = malloc(sizeof(*snp_array) * NETISR_MAXPROT, M_TEMP, 10772d22f334SRobert Watson M_ZERO | M_WAITOK); 10782d22f334SRobert Watson counter = 0; 10792d22f334SRobert Watson NETISR_RLOCK(&tracker); 10802d22f334SRobert Watson for (proto = 0; proto < NETISR_MAXPROT; proto++) { 1081938448cdSRobert Watson npp = &netisr_proto[proto]; 10822d22f334SRobert Watson if (npp->np_name == NULL) 10832d22f334SRobert Watson continue; 10842d22f334SRobert Watson snpp = &snp_array[counter]; 10852d22f334SRobert Watson snpp->snp_version = sizeof(*snpp); 10862d22f334SRobert Watson strlcpy(snpp->snp_name, npp->np_name, NETISR_NAMEMAXLEN); 10872d22f334SRobert Watson snpp->snp_proto = proto; 10882d22f334SRobert Watson snpp->snp_qlimit = npp->np_qlimit; 10892d22f334SRobert Watson snpp->snp_policy = npp->np_policy; 10902d22f334SRobert Watson if (npp->np_m2flow != NULL) 10912d22f334SRobert Watson snpp->snp_flags |= NETISR_SNP_FLAGS_M2FLOW; 10922d22f334SRobert Watson if (npp->np_m2cpuid != NULL) 10932d22f334SRobert Watson snpp->snp_flags |= NETISR_SNP_FLAGS_M2CPUID; 10942d22f334SRobert Watson if (npp->np_drainedcpu != NULL) 10952d22f334SRobert Watson snpp->snp_flags |= NETISR_SNP_FLAGS_DRAINEDCPU; 10962d22f334SRobert Watson counter++; 10972d22f334SRobert Watson } 10982d22f334SRobert Watson NETISR_RUNLOCK(&tracker); 10997f450febSRobert Watson KASSERT(counter <= NETISR_MAXPROT, 11002d22f334SRobert Watson ("sysctl_netisr_proto: counter too big (%d)", counter)); 11012d22f334SRobert Watson error = SYSCTL_OUT(req, snp_array, sizeof(*snp_array) * counter); 11022d22f334SRobert Watson free(snp_array, M_TEMP); 11032d22f334SRobert Watson return (error); 11042d22f334SRobert Watson } 11052d22f334SRobert Watson 11062d22f334SRobert Watson SYSCTL_PROC(_net_isr, OID_AUTO, proto, 11072d22f334SRobert Watson CTLFLAG_RD|CTLTYPE_STRUCT|CTLFLAG_MPSAFE, 0, 0, sysctl_netisr_proto, 11082d22f334SRobert Watson "S,sysctl_netisr_proto", 11092d22f334SRobert Watson "Return list of protocols registered with netisr"); 11102d22f334SRobert Watson 11112d22f334SRobert Watson /* 11122d22f334SRobert Watson * Sysctl monitoring for netisr: query a list of workstreams. 11132d22f334SRobert Watson */ 11142d22f334SRobert Watson static int 11152d22f334SRobert Watson sysctl_netisr_workstream(SYSCTL_HANDLER_ARGS) 11162d22f334SRobert Watson { 11172d22f334SRobert Watson struct rm_priotracker tracker; 11182d22f334SRobert Watson struct sysctl_netisr_workstream *snwsp, *snws_array; 11192d22f334SRobert Watson struct netisr_workstream *nwsp; 11202d22f334SRobert Watson u_int counter, cpuid; 11212d22f334SRobert Watson int error; 11222d22f334SRobert Watson 11232d22f334SRobert Watson if (req->newptr != NULL) 11242d22f334SRobert Watson return (EINVAL); 11252d22f334SRobert Watson snws_array = malloc(sizeof(*snws_array) * MAXCPU, M_TEMP, 11262d22f334SRobert Watson M_ZERO | M_WAITOK); 11272d22f334SRobert Watson counter = 0; 11282d22f334SRobert Watson NETISR_RLOCK(&tracker); 1129*3aa6d94eSJohn Baldwin CPU_FOREACH(cpuid) { 11302d22f334SRobert Watson nwsp = DPCPU_ID_PTR(cpuid, nws); 11312d22f334SRobert Watson if (nwsp->nws_intr_event == NULL) 11322d22f334SRobert Watson continue; 11332d22f334SRobert Watson NWS_LOCK(nwsp); 11342d22f334SRobert Watson snwsp = &snws_array[counter]; 11352d22f334SRobert Watson snwsp->snws_version = sizeof(*snwsp); 11362d22f334SRobert Watson 11372d22f334SRobert Watson /* 11382d22f334SRobert Watson * For now, we equate workstream IDs and CPU IDs in the 11392d22f334SRobert Watson * kernel, but expose them independently to userspace in case 11402d22f334SRobert Watson * that assumption changes in the future. 11412d22f334SRobert Watson */ 11422d22f334SRobert Watson snwsp->snws_wsid = cpuid; 11432d22f334SRobert Watson snwsp->snws_cpu = cpuid; 11442d22f334SRobert Watson if (nwsp->nws_intr_event != NULL) 11452d22f334SRobert Watson snwsp->snws_flags |= NETISR_SNWS_FLAGS_INTR; 11462d22f334SRobert Watson NWS_UNLOCK(nwsp); 11472d22f334SRobert Watson counter++; 11482d22f334SRobert Watson } 11492d22f334SRobert Watson NETISR_RUNLOCK(&tracker); 11507f450febSRobert Watson KASSERT(counter <= MAXCPU, 11512d22f334SRobert Watson ("sysctl_netisr_workstream: counter too big (%d)", counter)); 11522d22f334SRobert Watson error = SYSCTL_OUT(req, snws_array, sizeof(*snws_array) * counter); 11532d22f334SRobert Watson free(snws_array, M_TEMP); 11542d22f334SRobert Watson return (error); 11552d22f334SRobert Watson } 11562d22f334SRobert Watson 11572d22f334SRobert Watson SYSCTL_PROC(_net_isr, OID_AUTO, workstream, 11582d22f334SRobert Watson CTLFLAG_RD|CTLTYPE_STRUCT|CTLFLAG_MPSAFE, 0, 0, sysctl_netisr_workstream, 11592d22f334SRobert Watson "S,sysctl_netisr_workstream", 11602d22f334SRobert Watson "Return list of workstreams implemented by netisr"); 11612d22f334SRobert Watson 11622d22f334SRobert Watson /* 11632d22f334SRobert Watson * Sysctl monitoring for netisr: query per-protocol data across all 11642d22f334SRobert Watson * workstreams. 11652d22f334SRobert Watson */ 11662d22f334SRobert Watson static int 11672d22f334SRobert Watson sysctl_netisr_work(SYSCTL_HANDLER_ARGS) 11682d22f334SRobert Watson { 11692d22f334SRobert Watson struct rm_priotracker tracker; 11702d22f334SRobert Watson struct sysctl_netisr_work *snwp, *snw_array; 11712d22f334SRobert Watson struct netisr_workstream *nwsp; 11722d22f334SRobert Watson struct netisr_proto *npp; 11732d22f334SRobert Watson struct netisr_work *nwp; 11742d22f334SRobert Watson u_int counter, cpuid, proto; 11752d22f334SRobert Watson int error; 11762d22f334SRobert Watson 11772d22f334SRobert Watson if (req->newptr != NULL) 11782d22f334SRobert Watson return (EINVAL); 11792d22f334SRobert Watson snw_array = malloc(sizeof(*snw_array) * MAXCPU * NETISR_MAXPROT, 11802d22f334SRobert Watson M_TEMP, M_ZERO | M_WAITOK); 11812d22f334SRobert Watson counter = 0; 11822d22f334SRobert Watson NETISR_RLOCK(&tracker); 1183*3aa6d94eSJohn Baldwin CPU_FOREACH(cpuid) { 11842d22f334SRobert Watson nwsp = DPCPU_ID_PTR(cpuid, nws); 11852d22f334SRobert Watson if (nwsp->nws_intr_event == NULL) 11862d22f334SRobert Watson continue; 11872d22f334SRobert Watson NWS_LOCK(nwsp); 11882d22f334SRobert Watson for (proto = 0; proto < NETISR_MAXPROT; proto++) { 1189938448cdSRobert Watson npp = &netisr_proto[proto]; 11902d22f334SRobert Watson if (npp->np_name == NULL) 11912d22f334SRobert Watson continue; 11922d22f334SRobert Watson nwp = &nwsp->nws_work[proto]; 11932d22f334SRobert Watson snwp = &snw_array[counter]; 11942d22f334SRobert Watson snwp->snw_version = sizeof(*snwp); 11952d22f334SRobert Watson snwp->snw_wsid = cpuid; /* See comment above. */ 11962d22f334SRobert Watson snwp->snw_proto = proto; 11972d22f334SRobert Watson snwp->snw_len = nwp->nw_len; 11982d22f334SRobert Watson snwp->snw_watermark = nwp->nw_watermark; 11992d22f334SRobert Watson snwp->snw_dispatched = nwp->nw_dispatched; 12002d22f334SRobert Watson snwp->snw_hybrid_dispatched = 12012d22f334SRobert Watson nwp->nw_hybrid_dispatched; 12022d22f334SRobert Watson snwp->snw_qdrops = nwp->nw_qdrops; 12032d22f334SRobert Watson snwp->snw_queued = nwp->nw_queued; 12042d22f334SRobert Watson snwp->snw_handled = nwp->nw_handled; 12052d22f334SRobert Watson counter++; 12062d22f334SRobert Watson } 12072d22f334SRobert Watson NWS_UNLOCK(nwsp); 12082d22f334SRobert Watson } 12097f450febSRobert Watson KASSERT(counter <= MAXCPU * NETISR_MAXPROT, 12102d22f334SRobert Watson ("sysctl_netisr_work: counter too big (%d)", counter)); 12112d22f334SRobert Watson NETISR_RUNLOCK(&tracker); 12122d22f334SRobert Watson error = SYSCTL_OUT(req, snw_array, sizeof(*snw_array) * counter); 12132d22f334SRobert Watson free(snw_array, M_TEMP); 12142d22f334SRobert Watson return (error); 12152d22f334SRobert Watson } 12162d22f334SRobert Watson 12172d22f334SRobert Watson SYSCTL_PROC(_net_isr, OID_AUTO, work, 12182d22f334SRobert Watson CTLFLAG_RD|CTLTYPE_STRUCT|CTLFLAG_MPSAFE, 0, 0, sysctl_netisr_work, 12192d22f334SRobert Watson "S,sysctl_netisr_work", 12202d22f334SRobert Watson "Return list of per-workstream, per-protocol work in netisr"); 12212d22f334SRobert Watson 1222d4b5cae4SRobert Watson #ifdef DDB 1223d4b5cae4SRobert Watson DB_SHOW_COMMAND(netisr, db_show_netisr) 1224d4b5cae4SRobert Watson { 1225d4b5cae4SRobert Watson struct netisr_workstream *nwsp; 1226d4b5cae4SRobert Watson struct netisr_work *nwp; 1227d4b5cae4SRobert Watson int first, proto; 122853402767SRobert Watson u_int cpuid; 1229d4b5cae4SRobert Watson 1230d4b5cae4SRobert Watson db_printf("%3s %6s %5s %5s %5s %8s %8s %8s %8s\n", "CPU", "Proto", 1231d4b5cae4SRobert Watson "Len", "WMark", "Max", "Disp", "HDisp", "Drop", "Queue"); 1232*3aa6d94eSJohn Baldwin CPU_FOREACH(cpuid) { 123353402767SRobert Watson nwsp = DPCPU_ID_PTR(cpuid, nws); 1234d4b5cae4SRobert Watson if (nwsp->nws_intr_event == NULL) 1235d4b5cae4SRobert Watson continue; 1236d4b5cae4SRobert Watson first = 1; 1237d4b5cae4SRobert Watson for (proto = 0; proto < NETISR_MAXPROT; proto++) { 1238938448cdSRobert Watson if (netisr_proto[proto].np_handler == NULL) 1239d4b5cae4SRobert Watson continue; 1240d4b5cae4SRobert Watson nwp = &nwsp->nws_work[proto]; 1241d4b5cae4SRobert Watson if (first) { 124253402767SRobert Watson db_printf("%3d ", cpuid); 1243d4b5cae4SRobert Watson first = 0; 1244d4b5cae4SRobert Watson } else 1245d4b5cae4SRobert Watson db_printf("%3s ", ""); 1246d4b5cae4SRobert Watson db_printf( 1247d4b5cae4SRobert Watson "%6s %5d %5d %5d %8ju %8ju %8ju %8ju\n", 1248938448cdSRobert Watson netisr_proto[proto].np_name, nwp->nw_len, 1249d4b5cae4SRobert Watson nwp->nw_watermark, nwp->nw_qlimit, 1250d4b5cae4SRobert Watson nwp->nw_dispatched, nwp->nw_hybrid_dispatched, 1251d4b5cae4SRobert Watson nwp->nw_qdrops, nwp->nw_queued); 1252d4b5cae4SRobert Watson } 1253d4b5cae4SRobert Watson } 1254d4b5cae4SRobert Watson } 1255d4b5cae4SRobert Watson #endif 1256