13b3a8eb9SGleb Smirnoff /*- 2fe267a55SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 3fe267a55SPedro F. Giffuni * 491336b40SDon Lewis * Codel/FQ_Codel and PIE/FQ-PIE Code: 591336b40SDon Lewis * Copyright (C) 2016 Centre for Advanced Internet Architectures, 691336b40SDon Lewis * Swinburne University of Technology, Melbourne, Australia. 791336b40SDon Lewis * Portions of this code were made possible in part by a gift from 891336b40SDon Lewis * The Comcast Innovation Fund. 991336b40SDon Lewis * Implemented by Rasool Al-Saadi <ralsaadi@swin.edu.au> 1091336b40SDon Lewis * 113b3a8eb9SGleb Smirnoff * Copyright (c) 1998-2002,2010 Luigi Rizzo, Universita` di Pisa 123b3a8eb9SGleb Smirnoff * Portions Copyright (c) 2000 Akamba Corp. 133b3a8eb9SGleb Smirnoff * All rights reserved 143b3a8eb9SGleb Smirnoff * 153b3a8eb9SGleb Smirnoff * Redistribution and use in source and binary forms, with or without 163b3a8eb9SGleb Smirnoff * modification, are permitted provided that the following conditions 173b3a8eb9SGleb Smirnoff * are met: 183b3a8eb9SGleb Smirnoff * 1. Redistributions of source code must retain the above copyright 193b3a8eb9SGleb Smirnoff * notice, this list of conditions and the following disclaimer. 203b3a8eb9SGleb Smirnoff * 2. Redistributions in binary form must reproduce the above copyright 213b3a8eb9SGleb Smirnoff * notice, this list of conditions and the following disclaimer in the 223b3a8eb9SGleb Smirnoff * documentation and/or other materials provided with the distribution. 233b3a8eb9SGleb Smirnoff * 243b3a8eb9SGleb Smirnoff * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 253b3a8eb9SGleb Smirnoff * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 263b3a8eb9SGleb Smirnoff * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 273b3a8eb9SGleb Smirnoff * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 283b3a8eb9SGleb Smirnoff * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 293b3a8eb9SGleb Smirnoff * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 303b3a8eb9SGleb Smirnoff * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 313b3a8eb9SGleb Smirnoff * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 323b3a8eb9SGleb Smirnoff * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 333b3a8eb9SGleb Smirnoff * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 343b3a8eb9SGleb Smirnoff * SUCH DAMAGE. 353b3a8eb9SGleb Smirnoff */ 363b3a8eb9SGleb Smirnoff 373b3a8eb9SGleb Smirnoff #include <sys/cdefs.h> 383b3a8eb9SGleb Smirnoff __FBSDID("$FreeBSD$"); 393b3a8eb9SGleb Smirnoff 403b3a8eb9SGleb Smirnoff /* 413b3a8eb9SGleb Smirnoff * Configuration and internal object management for dummynet. 423b3a8eb9SGleb Smirnoff */ 433b3a8eb9SGleb Smirnoff 443b3a8eb9SGleb Smirnoff #include "opt_inet6.h" 453b3a8eb9SGleb Smirnoff 463b3a8eb9SGleb Smirnoff #include <sys/param.h> 47*51d73df1SKristof Provost #include <sys/ck.h> 483b3a8eb9SGleb Smirnoff #include <sys/systm.h> 493b3a8eb9SGleb Smirnoff #include <sys/malloc.h> 503b3a8eb9SGleb Smirnoff #include <sys/mbuf.h> 513b3a8eb9SGleb Smirnoff #include <sys/kernel.h> 523b3a8eb9SGleb Smirnoff #include <sys/lock.h> 533b3a8eb9SGleb Smirnoff #include <sys/module.h> 54eedc7fd9SGleb Smirnoff #include <sys/mutex.h> 553b3a8eb9SGleb Smirnoff #include <sys/priv.h> 563b3a8eb9SGleb Smirnoff #include <sys/proc.h> 573b3a8eb9SGleb Smirnoff #include <sys/rwlock.h> 583b3a8eb9SGleb Smirnoff #include <sys/socket.h> 593b3a8eb9SGleb Smirnoff #include <sys/socketvar.h> 603b3a8eb9SGleb Smirnoff #include <sys/time.h> 613b3a8eb9SGleb Smirnoff #include <sys/taskqueue.h> 623b3a8eb9SGleb Smirnoff #include <net/if.h> /* IFNAMSIZ, struct ifaddr, ifq head, lock.h mutex.h */ 633b3a8eb9SGleb Smirnoff #include <netinet/in.h> 643b3a8eb9SGleb Smirnoff #include <netinet/ip_var.h> /* ip_output(), IP_FORWARDING */ 653b3a8eb9SGleb Smirnoff #include <netinet/ip_fw.h> 663b3a8eb9SGleb Smirnoff #include <netinet/ip_dummynet.h> 67fe3bcfbdSTom Jones #include <net/vnet.h> 683b3a8eb9SGleb Smirnoff 693b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/ip_fw_private.h> 703b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/dn_heap.h> 713b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/ip_dn_private.h> 7291336b40SDon Lewis #ifdef NEW_AQM 7391336b40SDon Lewis #include <netpfil/ipfw/dn_aqm.h> 7491336b40SDon Lewis #endif 753b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/dn_sched.h> 763b3a8eb9SGleb Smirnoff 773b3a8eb9SGleb Smirnoff /* which objects to copy */ 783b3a8eb9SGleb Smirnoff #define DN_C_LINK 0x01 793b3a8eb9SGleb Smirnoff #define DN_C_SCH 0x02 803b3a8eb9SGleb Smirnoff #define DN_C_FLOW 0x04 813b3a8eb9SGleb Smirnoff #define DN_C_FS 0x08 823b3a8eb9SGleb Smirnoff #define DN_C_QUEUE 0x10 833b3a8eb9SGleb Smirnoff 843b3a8eb9SGleb Smirnoff /* we use this argument in case of a schk_new */ 853b3a8eb9SGleb Smirnoff struct schk_new_arg { 863b3a8eb9SGleb Smirnoff struct dn_alg *fp; 873b3a8eb9SGleb Smirnoff struct dn_sch *sch; 883b3a8eb9SGleb Smirnoff }; 893b3a8eb9SGleb Smirnoff 903b3a8eb9SGleb Smirnoff /*---- callout hooks. ----*/ 913b3a8eb9SGleb Smirnoff static struct callout dn_timeout; 92fe3bcfbdSTom Jones static int dn_tasks_started = 0; 93c8cfbc06SHans Petter Selasky static int dn_gone; 943b3a8eb9SGleb Smirnoff static struct task dn_task; 953b3a8eb9SGleb Smirnoff static struct taskqueue *dn_tq = NULL; 963b3a8eb9SGleb Smirnoff 97fe3bcfbdSTom Jones /* global scheduler list */ 98*51d73df1SKristof Provost struct mtx sched_mtx; 99*51d73df1SKristof Provost CK_LIST_HEAD(, dn_alg) schedlist; 100fe3bcfbdSTom Jones #ifdef NEW_AQM 101*51d73df1SKristof Provost CK_LIST_HEAD(, dn_aqm) aqmlist; /* list of AQMs */ 102fe3bcfbdSTom Jones #endif 103fe3bcfbdSTom Jones 1043b3a8eb9SGleb Smirnoff static void 1053b3a8eb9SGleb Smirnoff dummynet(void *arg) 1063b3a8eb9SGleb Smirnoff { 1073b3a8eb9SGleb Smirnoff 1083b3a8eb9SGleb Smirnoff (void)arg; /* UNUSED */ 109cbc4d2dbSJohn Baldwin taskqueue_enqueue(dn_tq, &dn_task); 1103b3a8eb9SGleb Smirnoff } 1113b3a8eb9SGleb Smirnoff 1123b3a8eb9SGleb Smirnoff void 1133b3a8eb9SGleb Smirnoff dn_reschedule(void) 1143b3a8eb9SGleb Smirnoff { 1155f4fc3dbSAlexander Motin 116c8cfbc06SHans Petter Selasky if (dn_gone != 0) 117c8cfbc06SHans Petter Selasky return; 1185f4fc3dbSAlexander Motin callout_reset_sbt(&dn_timeout, tick_sbt, 0, dummynet, NULL, 1195f4fc3dbSAlexander Motin C_HARDCLOCK | C_DIRECT_EXEC); 1203b3a8eb9SGleb Smirnoff } 1213b3a8eb9SGleb Smirnoff /*----- end of callout hooks -----*/ 1223b3a8eb9SGleb Smirnoff 12391336b40SDon Lewis #ifdef NEW_AQM 12491336b40SDon Lewis /* Return AQM descriptor for given type or name. */ 12591336b40SDon Lewis static struct dn_aqm * 12691336b40SDon Lewis find_aqm_type(int type, char *name) 12791336b40SDon Lewis { 12891336b40SDon Lewis struct dn_aqm *d; 12991336b40SDon Lewis 130*51d73df1SKristof Provost NET_EPOCH_ASSERT(); 131*51d73df1SKristof Provost 132*51d73df1SKristof Provost CK_LIST_FOREACH(d, &aqmlist, next) { 13391336b40SDon Lewis if (d->type == type || (name && !strcasecmp(d->name, name))) 13491336b40SDon Lewis return d; 13591336b40SDon Lewis } 13691336b40SDon Lewis return NULL; /* not found */ 13791336b40SDon Lewis } 13891336b40SDon Lewis #endif 13991336b40SDon Lewis 1403b3a8eb9SGleb Smirnoff /* Return a scheduler descriptor given the type or name. */ 1413b3a8eb9SGleb Smirnoff static struct dn_alg * 1423b3a8eb9SGleb Smirnoff find_sched_type(int type, char *name) 1433b3a8eb9SGleb Smirnoff { 1443b3a8eb9SGleb Smirnoff struct dn_alg *d; 1453b3a8eb9SGleb Smirnoff 146*51d73df1SKristof Provost NET_EPOCH_ASSERT(); 147*51d73df1SKristof Provost 148*51d73df1SKristof Provost CK_LIST_FOREACH(d, &schedlist, next) { 1493b3a8eb9SGleb Smirnoff if (d->type == type || (name && !strcasecmp(d->name, name))) 1503b3a8eb9SGleb Smirnoff return d; 1513b3a8eb9SGleb Smirnoff } 1523b3a8eb9SGleb Smirnoff return NULL; /* not found */ 1533b3a8eb9SGleb Smirnoff } 1543b3a8eb9SGleb Smirnoff 1553b3a8eb9SGleb Smirnoff int 1563b3a8eb9SGleb Smirnoff ipdn_bound_var(int *v, int dflt, int lo, int hi, const char *msg) 1573b3a8eb9SGleb Smirnoff { 1583b3a8eb9SGleb Smirnoff int oldv = *v; 1593b3a8eb9SGleb Smirnoff const char *op = NULL; 1603b3a8eb9SGleb Smirnoff if (dflt < lo) 1613b3a8eb9SGleb Smirnoff dflt = lo; 1623b3a8eb9SGleb Smirnoff if (dflt > hi) 1633b3a8eb9SGleb Smirnoff dflt = hi; 1643b3a8eb9SGleb Smirnoff if (oldv < lo) { 1653b3a8eb9SGleb Smirnoff *v = dflt; 1663b3a8eb9SGleb Smirnoff op = "Bump"; 1673b3a8eb9SGleb Smirnoff } else if (oldv > hi) { 1683b3a8eb9SGleb Smirnoff *v = hi; 1693b3a8eb9SGleb Smirnoff op = "Clamp"; 1703b3a8eb9SGleb Smirnoff } else 1713b3a8eb9SGleb Smirnoff return *v; 1723b3a8eb9SGleb Smirnoff if (op && msg) 1733b3a8eb9SGleb Smirnoff printf("%s %s to %d (was %d)\n", op, msg, *v, oldv); 1743b3a8eb9SGleb Smirnoff return *v; 1753b3a8eb9SGleb Smirnoff } 1763b3a8eb9SGleb Smirnoff 1773b3a8eb9SGleb Smirnoff /*---- flow_id mask, hash and compare functions ---*/ 1783b3a8eb9SGleb Smirnoff /* 1793b3a8eb9SGleb Smirnoff * The flow_id includes the 5-tuple, the queue/pipe number 1803b3a8eb9SGleb Smirnoff * which we store in the extra area in host order, 1813b3a8eb9SGleb Smirnoff * and for ipv6 also the flow_id6. 1823b3a8eb9SGleb Smirnoff * XXX see if we want the tos byte (can store in 'flags') 1833b3a8eb9SGleb Smirnoff */ 1843b3a8eb9SGleb Smirnoff static struct ipfw_flow_id * 1853b3a8eb9SGleb Smirnoff flow_id_mask(struct ipfw_flow_id *mask, struct ipfw_flow_id *id) 1863b3a8eb9SGleb Smirnoff { 1873b3a8eb9SGleb Smirnoff int is_v6 = IS_IP6_FLOW_ID(id); 1883b3a8eb9SGleb Smirnoff 1893b3a8eb9SGleb Smirnoff id->dst_port &= mask->dst_port; 1903b3a8eb9SGleb Smirnoff id->src_port &= mask->src_port; 1913b3a8eb9SGleb Smirnoff id->proto &= mask->proto; 1923b3a8eb9SGleb Smirnoff id->extra &= mask->extra; 1933b3a8eb9SGleb Smirnoff if (is_v6) { 1943b3a8eb9SGleb Smirnoff APPLY_MASK(&id->dst_ip6, &mask->dst_ip6); 1953b3a8eb9SGleb Smirnoff APPLY_MASK(&id->src_ip6, &mask->src_ip6); 1963b3a8eb9SGleb Smirnoff id->flow_id6 &= mask->flow_id6; 1973b3a8eb9SGleb Smirnoff } else { 1983b3a8eb9SGleb Smirnoff id->dst_ip &= mask->dst_ip; 1993b3a8eb9SGleb Smirnoff id->src_ip &= mask->src_ip; 2003b3a8eb9SGleb Smirnoff } 2013b3a8eb9SGleb Smirnoff return id; 2023b3a8eb9SGleb Smirnoff } 2033b3a8eb9SGleb Smirnoff 2043b3a8eb9SGleb Smirnoff /* computes an OR of two masks, result in dst and also returned */ 2053b3a8eb9SGleb Smirnoff static struct ipfw_flow_id * 2063b3a8eb9SGleb Smirnoff flow_id_or(struct ipfw_flow_id *src, struct ipfw_flow_id *dst) 2073b3a8eb9SGleb Smirnoff { 2083b3a8eb9SGleb Smirnoff int is_v6 = IS_IP6_FLOW_ID(dst); 2093b3a8eb9SGleb Smirnoff 2103b3a8eb9SGleb Smirnoff dst->dst_port |= src->dst_port; 2113b3a8eb9SGleb Smirnoff dst->src_port |= src->src_port; 2123b3a8eb9SGleb Smirnoff dst->proto |= src->proto; 2133b3a8eb9SGleb Smirnoff dst->extra |= src->extra; 2143b3a8eb9SGleb Smirnoff if (is_v6) { 2153b3a8eb9SGleb Smirnoff #define OR_MASK(_d, _s) \ 2163b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[0] |= (_s)->__u6_addr.__u6_addr32[0]; \ 2173b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[1] |= (_s)->__u6_addr.__u6_addr32[1]; \ 2183b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[2] |= (_s)->__u6_addr.__u6_addr32[2]; \ 2193b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[3] |= (_s)->__u6_addr.__u6_addr32[3]; 2203b3a8eb9SGleb Smirnoff OR_MASK(&dst->dst_ip6, &src->dst_ip6); 2213b3a8eb9SGleb Smirnoff OR_MASK(&dst->src_ip6, &src->src_ip6); 2223b3a8eb9SGleb Smirnoff #undef OR_MASK 2233b3a8eb9SGleb Smirnoff dst->flow_id6 |= src->flow_id6; 2243b3a8eb9SGleb Smirnoff } else { 2253b3a8eb9SGleb Smirnoff dst->dst_ip |= src->dst_ip; 2263b3a8eb9SGleb Smirnoff dst->src_ip |= src->src_ip; 2273b3a8eb9SGleb Smirnoff } 2283b3a8eb9SGleb Smirnoff return dst; 2293b3a8eb9SGleb Smirnoff } 2303b3a8eb9SGleb Smirnoff 2313b3a8eb9SGleb Smirnoff static int 2323b3a8eb9SGleb Smirnoff nonzero_mask(struct ipfw_flow_id *m) 2333b3a8eb9SGleb Smirnoff { 2343b3a8eb9SGleb Smirnoff if (m->dst_port || m->src_port || m->proto || m->extra) 2353b3a8eb9SGleb Smirnoff return 1; 2363b3a8eb9SGleb Smirnoff if (IS_IP6_FLOW_ID(m)) { 2373b3a8eb9SGleb Smirnoff return 2383b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[0] || 2393b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[1] || 2403b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[2] || 2413b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[3] || 2423b3a8eb9SGleb Smirnoff m->src_ip6.__u6_addr.__u6_addr32[0] || 2433b3a8eb9SGleb Smirnoff m->src_ip6.__u6_addr.__u6_addr32[1] || 2443b3a8eb9SGleb Smirnoff m->src_ip6.__u6_addr.__u6_addr32[2] || 2453b3a8eb9SGleb Smirnoff m->src_ip6.__u6_addr.__u6_addr32[3] || 2463b3a8eb9SGleb Smirnoff m->flow_id6; 2473b3a8eb9SGleb Smirnoff } else { 2483b3a8eb9SGleb Smirnoff return m->dst_ip || m->src_ip; 2493b3a8eb9SGleb Smirnoff } 2503b3a8eb9SGleb Smirnoff } 2513b3a8eb9SGleb Smirnoff 2523b3a8eb9SGleb Smirnoff /* XXX we may want a better hash function */ 2533b3a8eb9SGleb Smirnoff static uint32_t 2543b3a8eb9SGleb Smirnoff flow_id_hash(struct ipfw_flow_id *id) 2553b3a8eb9SGleb Smirnoff { 2563b3a8eb9SGleb Smirnoff uint32_t i; 2573b3a8eb9SGleb Smirnoff 2583b3a8eb9SGleb Smirnoff if (IS_IP6_FLOW_ID(id)) { 2593b3a8eb9SGleb Smirnoff uint32_t *d = (uint32_t *)&id->dst_ip6; 2603b3a8eb9SGleb Smirnoff uint32_t *s = (uint32_t *)&id->src_ip6; 2613b3a8eb9SGleb Smirnoff i = (d[0] ) ^ (d[1]) ^ 2623b3a8eb9SGleb Smirnoff (d[2] ) ^ (d[3]) ^ 2633b3a8eb9SGleb Smirnoff (d[0] >> 15) ^ (d[1] >> 15) ^ 2643b3a8eb9SGleb Smirnoff (d[2] >> 15) ^ (d[3] >> 15) ^ 2653b3a8eb9SGleb Smirnoff (s[0] << 1) ^ (s[1] << 1) ^ 2663b3a8eb9SGleb Smirnoff (s[2] << 1) ^ (s[3] << 1) ^ 2673b3a8eb9SGleb Smirnoff (s[0] << 16) ^ (s[1] << 16) ^ 2683b3a8eb9SGleb Smirnoff (s[2] << 16) ^ (s[3] << 16) ^ 2693b3a8eb9SGleb Smirnoff (id->dst_port << 1) ^ (id->src_port) ^ 2703b3a8eb9SGleb Smirnoff (id->extra) ^ 2713b3a8eb9SGleb Smirnoff (id->proto ) ^ (id->flow_id6); 2723b3a8eb9SGleb Smirnoff } else { 2733b3a8eb9SGleb Smirnoff i = (id->dst_ip) ^ (id->dst_ip >> 15) ^ 2743b3a8eb9SGleb Smirnoff (id->src_ip << 1) ^ (id->src_ip >> 16) ^ 2753b3a8eb9SGleb Smirnoff (id->extra) ^ 2763b3a8eb9SGleb Smirnoff (id->dst_port << 1) ^ (id->src_port) ^ (id->proto); 2773b3a8eb9SGleb Smirnoff } 2783b3a8eb9SGleb Smirnoff return i; 2793b3a8eb9SGleb Smirnoff } 2803b3a8eb9SGleb Smirnoff 2813b3a8eb9SGleb Smirnoff /* Like bcmp, returns 0 if ids match, 1 otherwise. */ 2823b3a8eb9SGleb Smirnoff static int 2833b3a8eb9SGleb Smirnoff flow_id_cmp(struct ipfw_flow_id *id1, struct ipfw_flow_id *id2) 2843b3a8eb9SGleb Smirnoff { 2853b3a8eb9SGleb Smirnoff int is_v6 = IS_IP6_FLOW_ID(id1); 2863b3a8eb9SGleb Smirnoff 2873b3a8eb9SGleb Smirnoff if (!is_v6) { 2883b3a8eb9SGleb Smirnoff if (IS_IP6_FLOW_ID(id2)) 2893b3a8eb9SGleb Smirnoff return 1; /* different address families */ 2903b3a8eb9SGleb Smirnoff 2913b3a8eb9SGleb Smirnoff return (id1->dst_ip == id2->dst_ip && 2923b3a8eb9SGleb Smirnoff id1->src_ip == id2->src_ip && 2933b3a8eb9SGleb Smirnoff id1->dst_port == id2->dst_port && 2943b3a8eb9SGleb Smirnoff id1->src_port == id2->src_port && 2953b3a8eb9SGleb Smirnoff id1->proto == id2->proto && 2963b3a8eb9SGleb Smirnoff id1->extra == id2->extra) ? 0 : 1; 2973b3a8eb9SGleb Smirnoff } 2983b3a8eb9SGleb Smirnoff /* the ipv6 case */ 2993b3a8eb9SGleb Smirnoff return ( 3003b3a8eb9SGleb Smirnoff !bcmp(&id1->dst_ip6,&id2->dst_ip6, sizeof(id1->dst_ip6)) && 3013b3a8eb9SGleb Smirnoff !bcmp(&id1->src_ip6,&id2->src_ip6, sizeof(id1->src_ip6)) && 3023b3a8eb9SGleb Smirnoff id1->dst_port == id2->dst_port && 3033b3a8eb9SGleb Smirnoff id1->src_port == id2->src_port && 3043b3a8eb9SGleb Smirnoff id1->proto == id2->proto && 3053b3a8eb9SGleb Smirnoff id1->extra == id2->extra && 3063b3a8eb9SGleb Smirnoff id1->flow_id6 == id2->flow_id6) ? 0 : 1; 3073b3a8eb9SGleb Smirnoff } 3083b3a8eb9SGleb Smirnoff /*--------- end of flow-id mask, hash and compare ---------*/ 3093b3a8eb9SGleb Smirnoff 3103b3a8eb9SGleb Smirnoff /*--- support functions for the qht hashtable ---- 3113b3a8eb9SGleb Smirnoff * Entries are hashed by flow-id 3123b3a8eb9SGleb Smirnoff */ 3133b3a8eb9SGleb Smirnoff static uint32_t 3143b3a8eb9SGleb Smirnoff q_hash(uintptr_t key, int flags, void *arg) 3153b3a8eb9SGleb Smirnoff { 3163b3a8eb9SGleb Smirnoff /* compute the hash slot from the flow id */ 3173b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id = (flags & DNHT_KEY_IS_OBJ) ? 3183b3a8eb9SGleb Smirnoff &((struct dn_queue *)key)->ni.fid : 3193b3a8eb9SGleb Smirnoff (struct ipfw_flow_id *)key; 3203b3a8eb9SGleb Smirnoff 3213b3a8eb9SGleb Smirnoff return flow_id_hash(id); 3223b3a8eb9SGleb Smirnoff } 3233b3a8eb9SGleb Smirnoff 3243b3a8eb9SGleb Smirnoff static int 3253b3a8eb9SGleb Smirnoff q_match(void *obj, uintptr_t key, int flags, void *arg) 3263b3a8eb9SGleb Smirnoff { 3273b3a8eb9SGleb Smirnoff struct dn_queue *o = (struct dn_queue *)obj; 3283b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id2; 3293b3a8eb9SGleb Smirnoff 3303b3a8eb9SGleb Smirnoff if (flags & DNHT_KEY_IS_OBJ) { 3313b3a8eb9SGleb Smirnoff /* compare pointers */ 3323b3a8eb9SGleb Smirnoff id2 = &((struct dn_queue *)key)->ni.fid; 3333b3a8eb9SGleb Smirnoff } else { 3343b3a8eb9SGleb Smirnoff id2 = (struct ipfw_flow_id *)key; 3353b3a8eb9SGleb Smirnoff } 3363b3a8eb9SGleb Smirnoff return (0 == flow_id_cmp(&o->ni.fid, id2)); 3373b3a8eb9SGleb Smirnoff } 3383b3a8eb9SGleb Smirnoff 3393b3a8eb9SGleb Smirnoff /* 3403b3a8eb9SGleb Smirnoff * create a new queue instance for the given 'key'. 3413b3a8eb9SGleb Smirnoff */ 3423b3a8eb9SGleb Smirnoff static void * 3433b3a8eb9SGleb Smirnoff q_new(uintptr_t key, int flags, void *arg) 3443b3a8eb9SGleb Smirnoff { 3453b3a8eb9SGleb Smirnoff struct dn_queue *q, *template = arg; 3463b3a8eb9SGleb Smirnoff struct dn_fsk *fs = template->fs; 3473b3a8eb9SGleb Smirnoff int size = sizeof(*q) + fs->sched->fp->q_datalen; 3483b3a8eb9SGleb Smirnoff 3493b3a8eb9SGleb Smirnoff q = malloc(size, M_DUMMYNET, M_NOWAIT | M_ZERO); 3503b3a8eb9SGleb Smirnoff if (q == NULL) { 3513b3a8eb9SGleb Smirnoff D("no memory for new queue"); 3523b3a8eb9SGleb Smirnoff return NULL; 3533b3a8eb9SGleb Smirnoff } 3543b3a8eb9SGleb Smirnoff 3553b3a8eb9SGleb Smirnoff set_oid(&q->ni.oid, DN_QUEUE, size); 3563b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) 3573b3a8eb9SGleb Smirnoff q->ni.fid = *(struct ipfw_flow_id *)key; 3583b3a8eb9SGleb Smirnoff q->fs = fs; 3593b3a8eb9SGleb Smirnoff q->_si = template->_si; 3603b3a8eb9SGleb Smirnoff q->_si->q_count++; 3613b3a8eb9SGleb Smirnoff 3623b3a8eb9SGleb Smirnoff if (fs->sched->fp->new_queue) 3633b3a8eb9SGleb Smirnoff fs->sched->fp->new_queue(q); 36491336b40SDon Lewis 36591336b40SDon Lewis #ifdef NEW_AQM 36691336b40SDon Lewis /* call AQM init function after creating a queue*/ 36791336b40SDon Lewis if (fs->aqmfp && fs->aqmfp->init) 36891336b40SDon Lewis if(fs->aqmfp->init(q)) 36991336b40SDon Lewis D("unable to init AQM for fs %d", fs->fs.fs_nr); 37091336b40SDon Lewis #endif 371fe3bcfbdSTom Jones V_dn_cfg.queue_count++; 37291336b40SDon Lewis 3733b3a8eb9SGleb Smirnoff return q; 3743b3a8eb9SGleb Smirnoff } 3753b3a8eb9SGleb Smirnoff 3763b3a8eb9SGleb Smirnoff /* 3773b3a8eb9SGleb Smirnoff * Notify schedulers that a queue is going away. 3783b3a8eb9SGleb Smirnoff * If (flags & DN_DESTROY), also free the packets. 3793b3a8eb9SGleb Smirnoff * The version for callbacks is called q_delete_cb(). 3803b3a8eb9SGleb Smirnoff */ 3813b3a8eb9SGleb Smirnoff static void 3823b3a8eb9SGleb Smirnoff dn_delete_queue(struct dn_queue *q, int flags) 3833b3a8eb9SGleb Smirnoff { 3843b3a8eb9SGleb Smirnoff struct dn_fsk *fs = q->fs; 3853b3a8eb9SGleb Smirnoff 38691336b40SDon Lewis #ifdef NEW_AQM 38791336b40SDon Lewis /* clean up AQM status for queue 'q' 38891336b40SDon Lewis * cleanup here is called just with MULTIQUEUE 38991336b40SDon Lewis */ 39091336b40SDon Lewis if (fs && fs->aqmfp && fs->aqmfp->cleanup) 39191336b40SDon Lewis fs->aqmfp->cleanup(q); 39291336b40SDon Lewis #endif 3933b3a8eb9SGleb Smirnoff // D("fs %p si %p\n", fs, q->_si); 3943b3a8eb9SGleb Smirnoff /* notify the parent scheduler that the queue is going away */ 3953b3a8eb9SGleb Smirnoff if (fs && fs->sched->fp->free_queue) 3963b3a8eb9SGleb Smirnoff fs->sched->fp->free_queue(q); 3973b3a8eb9SGleb Smirnoff q->_si->q_count--; 3983b3a8eb9SGleb Smirnoff q->_si = NULL; 3993b3a8eb9SGleb Smirnoff if (flags & DN_DESTROY) { 4003b3a8eb9SGleb Smirnoff if (q->mq.head) 4013b3a8eb9SGleb Smirnoff dn_free_pkts(q->mq.head); 4023b3a8eb9SGleb Smirnoff bzero(q, sizeof(*q)); // safety 4033b3a8eb9SGleb Smirnoff free(q, M_DUMMYNET); 404fe3bcfbdSTom Jones V_dn_cfg.queue_count--; 4053b3a8eb9SGleb Smirnoff } 4063b3a8eb9SGleb Smirnoff } 4073b3a8eb9SGleb Smirnoff 4083b3a8eb9SGleb Smirnoff static int 4093b3a8eb9SGleb Smirnoff q_delete_cb(void *q, void *arg) 4103b3a8eb9SGleb Smirnoff { 4113b3a8eb9SGleb Smirnoff int flags = (int)(uintptr_t)arg; 4123b3a8eb9SGleb Smirnoff dn_delete_queue(q, flags); 4133b3a8eb9SGleb Smirnoff return (flags & DN_DESTROY) ? DNHT_SCAN_DEL : 0; 4143b3a8eb9SGleb Smirnoff } 4153b3a8eb9SGleb Smirnoff 4163b3a8eb9SGleb Smirnoff /* 4173b3a8eb9SGleb Smirnoff * calls dn_delete_queue/q_delete_cb on all queues, 4183b3a8eb9SGleb Smirnoff * which notifies the parent scheduler and possibly drains packets. 4193b3a8eb9SGleb Smirnoff * flags & DN_DESTROY: drains queues and destroy qht; 4203b3a8eb9SGleb Smirnoff */ 4213b3a8eb9SGleb Smirnoff static void 4223b3a8eb9SGleb Smirnoff qht_delete(struct dn_fsk *fs, int flags) 4233b3a8eb9SGleb Smirnoff { 4243b3a8eb9SGleb Smirnoff ND("fs %d start flags %d qht %p", 4253b3a8eb9SGleb Smirnoff fs->fs.fs_nr, flags, fs->qht); 4263b3a8eb9SGleb Smirnoff if (!fs->qht) 4273b3a8eb9SGleb Smirnoff return; 4283b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) { 4293b3a8eb9SGleb Smirnoff dn_ht_scan(fs->qht, q_delete_cb, (void *)(uintptr_t)flags); 4303b3a8eb9SGleb Smirnoff if (flags & DN_DESTROY) { 4313b3a8eb9SGleb Smirnoff dn_ht_free(fs->qht, 0); 4323b3a8eb9SGleb Smirnoff fs->qht = NULL; 4333b3a8eb9SGleb Smirnoff } 4343b3a8eb9SGleb Smirnoff } else { 4353b3a8eb9SGleb Smirnoff dn_delete_queue((struct dn_queue *)(fs->qht), flags); 4363b3a8eb9SGleb Smirnoff if (flags & DN_DESTROY) 4373b3a8eb9SGleb Smirnoff fs->qht = NULL; 4383b3a8eb9SGleb Smirnoff } 4393b3a8eb9SGleb Smirnoff } 4403b3a8eb9SGleb Smirnoff 4413b3a8eb9SGleb Smirnoff /* 4423b3a8eb9SGleb Smirnoff * Find and possibly create the queue for a MULTIQUEUE scheduler. 4433b3a8eb9SGleb Smirnoff * We never call it for !MULTIQUEUE (the queue is in the sch_inst). 4443b3a8eb9SGleb Smirnoff */ 4453b3a8eb9SGleb Smirnoff struct dn_queue * 4463b3a8eb9SGleb Smirnoff ipdn_q_find(struct dn_fsk *fs, struct dn_sch_inst *si, 4473b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id) 4483b3a8eb9SGleb Smirnoff { 4493b3a8eb9SGleb Smirnoff struct dn_queue template; 4503b3a8eb9SGleb Smirnoff 4513b3a8eb9SGleb Smirnoff template._si = si; 4523b3a8eb9SGleb Smirnoff template.fs = fs; 4533b3a8eb9SGleb Smirnoff 4543b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) { 4553b3a8eb9SGleb Smirnoff struct ipfw_flow_id masked_id; 4563b3a8eb9SGleb Smirnoff if (fs->qht == NULL) { 4573b3a8eb9SGleb Smirnoff fs->qht = dn_ht_init(NULL, fs->fs.buckets, 4583b3a8eb9SGleb Smirnoff offsetof(struct dn_queue, q_next), 4593b3a8eb9SGleb Smirnoff q_hash, q_match, q_new); 4603b3a8eb9SGleb Smirnoff if (fs->qht == NULL) 4613b3a8eb9SGleb Smirnoff return NULL; 4623b3a8eb9SGleb Smirnoff } 4633b3a8eb9SGleb Smirnoff masked_id = *id; 4643b3a8eb9SGleb Smirnoff flow_id_mask(&fs->fsk_mask, &masked_id); 4653b3a8eb9SGleb Smirnoff return dn_ht_find(fs->qht, (uintptr_t)&masked_id, 4663b3a8eb9SGleb Smirnoff DNHT_INSERT, &template); 4673b3a8eb9SGleb Smirnoff } else { 4683b3a8eb9SGleb Smirnoff if (fs->qht == NULL) 4693b3a8eb9SGleb Smirnoff fs->qht = q_new(0, 0, &template); 4703b3a8eb9SGleb Smirnoff return (struct dn_queue *)fs->qht; 4713b3a8eb9SGleb Smirnoff } 4723b3a8eb9SGleb Smirnoff } 4733b3a8eb9SGleb Smirnoff /*--- end of queue hash table ---*/ 4743b3a8eb9SGleb Smirnoff 4753b3a8eb9SGleb Smirnoff /*--- support functions for the sch_inst hashtable ---- 4763b3a8eb9SGleb Smirnoff * 4773b3a8eb9SGleb Smirnoff * These are hashed by flow-id 4783b3a8eb9SGleb Smirnoff */ 4793b3a8eb9SGleb Smirnoff static uint32_t 4803b3a8eb9SGleb Smirnoff si_hash(uintptr_t key, int flags, void *arg) 4813b3a8eb9SGleb Smirnoff { 4823b3a8eb9SGleb Smirnoff /* compute the hash slot from the flow id */ 4833b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id = (flags & DNHT_KEY_IS_OBJ) ? 4843b3a8eb9SGleb Smirnoff &((struct dn_sch_inst *)key)->ni.fid : 4853b3a8eb9SGleb Smirnoff (struct ipfw_flow_id *)key; 4863b3a8eb9SGleb Smirnoff 4873b3a8eb9SGleb Smirnoff return flow_id_hash(id); 4883b3a8eb9SGleb Smirnoff } 4893b3a8eb9SGleb Smirnoff 4903b3a8eb9SGleb Smirnoff static int 4913b3a8eb9SGleb Smirnoff si_match(void *obj, uintptr_t key, int flags, void *arg) 4923b3a8eb9SGleb Smirnoff { 4933b3a8eb9SGleb Smirnoff struct dn_sch_inst *o = obj; 4943b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id2; 4953b3a8eb9SGleb Smirnoff 4963b3a8eb9SGleb Smirnoff id2 = (flags & DNHT_KEY_IS_OBJ) ? 4973b3a8eb9SGleb Smirnoff &((struct dn_sch_inst *)key)->ni.fid : 4983b3a8eb9SGleb Smirnoff (struct ipfw_flow_id *)key; 4993b3a8eb9SGleb Smirnoff return flow_id_cmp(&o->ni.fid, id2) == 0; 5003b3a8eb9SGleb Smirnoff } 5013b3a8eb9SGleb Smirnoff 5023b3a8eb9SGleb Smirnoff /* 5033b3a8eb9SGleb Smirnoff * create a new instance for the given 'key' 5043b3a8eb9SGleb Smirnoff * Allocate memory for instance, delay line and scheduler private data. 5053b3a8eb9SGleb Smirnoff */ 5063b3a8eb9SGleb Smirnoff static void * 5073b3a8eb9SGleb Smirnoff si_new(uintptr_t key, int flags, void *arg) 5083b3a8eb9SGleb Smirnoff { 5093b3a8eb9SGleb Smirnoff struct dn_schk *s = arg; 5103b3a8eb9SGleb Smirnoff struct dn_sch_inst *si; 5113b3a8eb9SGleb Smirnoff int l = sizeof(*si) + s->fp->si_datalen; 5123b3a8eb9SGleb Smirnoff 5133b3a8eb9SGleb Smirnoff si = malloc(l, M_DUMMYNET, M_NOWAIT | M_ZERO); 5143b3a8eb9SGleb Smirnoff if (si == NULL) 5153b3a8eb9SGleb Smirnoff goto error; 5163b3a8eb9SGleb Smirnoff 5173b3a8eb9SGleb Smirnoff /* Set length only for the part passed up to userland. */ 5183b3a8eb9SGleb Smirnoff set_oid(&si->ni.oid, DN_SCH_I, sizeof(struct dn_flow)); 5193b3a8eb9SGleb Smirnoff set_oid(&(si->dline.oid), DN_DELAY_LINE, 5203b3a8eb9SGleb Smirnoff sizeof(struct delay_line)); 5213b3a8eb9SGleb Smirnoff /* mark si and dline as outside the event queue */ 5223b3a8eb9SGleb Smirnoff si->ni.oid.id = si->dline.oid.id = -1; 5233b3a8eb9SGleb Smirnoff 5243b3a8eb9SGleb Smirnoff si->sched = s; 5253b3a8eb9SGleb Smirnoff si->dline.si = si; 5263b3a8eb9SGleb Smirnoff 5273b3a8eb9SGleb Smirnoff if (s->fp->new_sched && s->fp->new_sched(si)) { 5283b3a8eb9SGleb Smirnoff D("new_sched error"); 5293b3a8eb9SGleb Smirnoff goto error; 5303b3a8eb9SGleb Smirnoff } 5313b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) 5323b3a8eb9SGleb Smirnoff si->ni.fid = *(struct ipfw_flow_id *)key; 5333b3a8eb9SGleb Smirnoff 53491336b40SDon Lewis #ifdef NEW_AQM 53591336b40SDon Lewis /* init AQM status for !DN_MULTIQUEUE sched*/ 53691336b40SDon Lewis if (!(s->fp->flags & DN_MULTIQUEUE)) 53791336b40SDon Lewis if (s->fs->aqmfp && s->fs->aqmfp->init) 53891336b40SDon Lewis if(s->fs->aqmfp->init((struct dn_queue *)(si + 1))) { 53991336b40SDon Lewis D("unable to init AQM for fs %d", s->fs->fs.fs_nr); 54091336b40SDon Lewis goto error; 54191336b40SDon Lewis } 54291336b40SDon Lewis #endif 54391336b40SDon Lewis 544fe3bcfbdSTom Jones V_dn_cfg.si_count++; 5453b3a8eb9SGleb Smirnoff return si; 5463b3a8eb9SGleb Smirnoff 5473b3a8eb9SGleb Smirnoff error: 5483b3a8eb9SGleb Smirnoff if (si) { 5493b3a8eb9SGleb Smirnoff bzero(si, sizeof(*si)); // safety 5503b3a8eb9SGleb Smirnoff free(si, M_DUMMYNET); 5513b3a8eb9SGleb Smirnoff } 5523b3a8eb9SGleb Smirnoff return NULL; 5533b3a8eb9SGleb Smirnoff } 5543b3a8eb9SGleb Smirnoff 5553b3a8eb9SGleb Smirnoff /* 5563b3a8eb9SGleb Smirnoff * Callback from siht to delete all scheduler instances. Remove 5573b3a8eb9SGleb Smirnoff * si and delay line from the system heap, destroy all queues. 5583b3a8eb9SGleb Smirnoff * We assume that all flowset have been notified and do not 5593b3a8eb9SGleb Smirnoff * point to us anymore. 5603b3a8eb9SGleb Smirnoff */ 5613b3a8eb9SGleb Smirnoff static int 5623b3a8eb9SGleb Smirnoff si_destroy(void *_si, void *arg) 5633b3a8eb9SGleb Smirnoff { 5643b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = _si; 5653b3a8eb9SGleb Smirnoff struct dn_schk *s = si->sched; 5663b3a8eb9SGleb Smirnoff struct delay_line *dl = &si->dline; 5673b3a8eb9SGleb Smirnoff 5683b3a8eb9SGleb Smirnoff if (dl->oid.subtype) /* remove delay line from event heap */ 569fe3bcfbdSTom Jones heap_extract(&V_dn_cfg.evheap, dl); 5703b3a8eb9SGleb Smirnoff dn_free_pkts(dl->mq.head); /* drain delay line */ 5713b3a8eb9SGleb Smirnoff if (si->kflags & DN_ACTIVE) /* remove si from event heap */ 572fe3bcfbdSTom Jones heap_extract(&V_dn_cfg.evheap, si); 57391336b40SDon Lewis 57491336b40SDon Lewis #ifdef NEW_AQM 57591336b40SDon Lewis /* clean up AQM status for !DN_MULTIQUEUE sched 57691336b40SDon Lewis * Note that all queues belong to fs were cleaned up in fsk_detach. 57791336b40SDon Lewis * When drain_scheduler is called s->fs and q->fs are pointing 57891336b40SDon Lewis * to a correct fs, so we can use fs in this case. 57991336b40SDon Lewis */ 58091336b40SDon Lewis if (!(s->fp->flags & DN_MULTIQUEUE)) { 58191336b40SDon Lewis struct dn_queue *q = (struct dn_queue *)(si + 1); 58291336b40SDon Lewis if (q->aqm_status && q->fs->aqmfp) 58391336b40SDon Lewis if (q->fs->aqmfp->cleanup) 58491336b40SDon Lewis q->fs->aqmfp->cleanup(q); 58591336b40SDon Lewis } 58691336b40SDon Lewis #endif 5873b3a8eb9SGleb Smirnoff if (s->fp->free_sched) 5883b3a8eb9SGleb Smirnoff s->fp->free_sched(si); 5893b3a8eb9SGleb Smirnoff bzero(si, sizeof(*si)); /* safety */ 5903b3a8eb9SGleb Smirnoff free(si, M_DUMMYNET); 591fe3bcfbdSTom Jones V_dn_cfg.si_count--; 5923b3a8eb9SGleb Smirnoff return DNHT_SCAN_DEL; 5933b3a8eb9SGleb Smirnoff } 5943b3a8eb9SGleb Smirnoff 5953b3a8eb9SGleb Smirnoff /* 5963b3a8eb9SGleb Smirnoff * Find the scheduler instance for this packet. If we need to apply 5973b3a8eb9SGleb Smirnoff * a mask, do on a local copy of the flow_id to preserve the original. 5983b3a8eb9SGleb Smirnoff * Assume siht is always initialized if we have a mask. 5993b3a8eb9SGleb Smirnoff */ 6003b3a8eb9SGleb Smirnoff struct dn_sch_inst * 6013b3a8eb9SGleb Smirnoff ipdn_si_find(struct dn_schk *s, struct ipfw_flow_id *id) 6023b3a8eb9SGleb Smirnoff { 6033b3a8eb9SGleb Smirnoff 6043b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 6053b3a8eb9SGleb Smirnoff struct ipfw_flow_id id_t = *id; 6063b3a8eb9SGleb Smirnoff flow_id_mask(&s->sch.sched_mask, &id_t); 6073b3a8eb9SGleb Smirnoff return dn_ht_find(s->siht, (uintptr_t)&id_t, 6083b3a8eb9SGleb Smirnoff DNHT_INSERT, s); 6093b3a8eb9SGleb Smirnoff } 6103b3a8eb9SGleb Smirnoff if (!s->siht) 6113b3a8eb9SGleb Smirnoff s->siht = si_new(0, 0, s); 6123b3a8eb9SGleb Smirnoff return (struct dn_sch_inst *)s->siht; 6133b3a8eb9SGleb Smirnoff } 6143b3a8eb9SGleb Smirnoff 6153b3a8eb9SGleb Smirnoff /* callback to flush credit for the scheduler instance */ 6163b3a8eb9SGleb Smirnoff static int 6173b3a8eb9SGleb Smirnoff si_reset_credit(void *_si, void *arg) 6183b3a8eb9SGleb Smirnoff { 6193b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = _si; 6203b3a8eb9SGleb Smirnoff struct dn_link *p = &si->sched->link; 6213b3a8eb9SGleb Smirnoff 622fe3bcfbdSTom Jones si->credit = p->burst + (V_dn_cfg.io_fast ? p->bandwidth : 0); 6233b3a8eb9SGleb Smirnoff return 0; 6243b3a8eb9SGleb Smirnoff } 6253b3a8eb9SGleb Smirnoff 6263b3a8eb9SGleb Smirnoff static void 6273b3a8eb9SGleb Smirnoff schk_reset_credit(struct dn_schk *s) 6283b3a8eb9SGleb Smirnoff { 6293b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) 6303b3a8eb9SGleb Smirnoff dn_ht_scan(s->siht, si_reset_credit, NULL); 6313b3a8eb9SGleb Smirnoff else if (s->siht) 6323b3a8eb9SGleb Smirnoff si_reset_credit(s->siht, NULL); 6333b3a8eb9SGleb Smirnoff } 6343b3a8eb9SGleb Smirnoff /*---- end of sch_inst hashtable ---------------------*/ 6353b3a8eb9SGleb Smirnoff 6363b3a8eb9SGleb Smirnoff /*------------------------------------------------------- 6373b3a8eb9SGleb Smirnoff * flowset hash (fshash) support. Entries are hashed by fs_nr. 6383b3a8eb9SGleb Smirnoff * New allocations are put in the fsunlinked list, from which 6393b3a8eb9SGleb Smirnoff * they are removed when they point to a specific scheduler. 6403b3a8eb9SGleb Smirnoff */ 6413b3a8eb9SGleb Smirnoff static uint32_t 6423b3a8eb9SGleb Smirnoff fsk_hash(uintptr_t key, int flags, void *arg) 6433b3a8eb9SGleb Smirnoff { 6443b3a8eb9SGleb Smirnoff uint32_t i = !(flags & DNHT_KEY_IS_OBJ) ? key : 6453b3a8eb9SGleb Smirnoff ((struct dn_fsk *)key)->fs.fs_nr; 6463b3a8eb9SGleb Smirnoff 6473b3a8eb9SGleb Smirnoff return ( (i>>8)^(i>>4)^i ); 6483b3a8eb9SGleb Smirnoff } 6493b3a8eb9SGleb Smirnoff 6503b3a8eb9SGleb Smirnoff static int 6513b3a8eb9SGleb Smirnoff fsk_match(void *obj, uintptr_t key, int flags, void *arg) 6523b3a8eb9SGleb Smirnoff { 6533b3a8eb9SGleb Smirnoff struct dn_fsk *fs = obj; 6543b3a8eb9SGleb Smirnoff int i = !(flags & DNHT_KEY_IS_OBJ) ? key : 6553b3a8eb9SGleb Smirnoff ((struct dn_fsk *)key)->fs.fs_nr; 6563b3a8eb9SGleb Smirnoff 6573b3a8eb9SGleb Smirnoff return (fs->fs.fs_nr == i); 6583b3a8eb9SGleb Smirnoff } 6593b3a8eb9SGleb Smirnoff 6603b3a8eb9SGleb Smirnoff static void * 6613b3a8eb9SGleb Smirnoff fsk_new(uintptr_t key, int flags, void *arg) 6623b3a8eb9SGleb Smirnoff { 6633b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 6643b3a8eb9SGleb Smirnoff 6653b3a8eb9SGleb Smirnoff fs = malloc(sizeof(*fs), M_DUMMYNET, M_NOWAIT | M_ZERO); 6663b3a8eb9SGleb Smirnoff if (fs) { 6673b3a8eb9SGleb Smirnoff set_oid(&fs->fs.oid, DN_FS, sizeof(fs->fs)); 668fe3bcfbdSTom Jones V_dn_cfg.fsk_count++; 6693b3a8eb9SGleb Smirnoff fs->drain_bucket = 0; 670fe3bcfbdSTom Jones SLIST_INSERT_HEAD(&V_dn_cfg.fsu, fs, sch_chain); 6713b3a8eb9SGleb Smirnoff } 6723b3a8eb9SGleb Smirnoff return fs; 6733b3a8eb9SGleb Smirnoff } 6743b3a8eb9SGleb Smirnoff 67591336b40SDon Lewis #ifdef NEW_AQM 67691336b40SDon Lewis /* callback function for cleaning up AQM queue status belongs to a flowset 67791336b40SDon Lewis * connected to scheduler instance '_si' (for !DN_MULTIQUEUE only). 67891336b40SDon Lewis */ 67991336b40SDon Lewis static int 68091336b40SDon Lewis si_cleanup_q(void *_si, void *arg) 68191336b40SDon Lewis { 68291336b40SDon Lewis struct dn_sch_inst *si = _si; 68391336b40SDon Lewis 68491336b40SDon Lewis if (!(si->sched->fp->flags & DN_MULTIQUEUE)) { 68591336b40SDon Lewis if (si->sched->fs->aqmfp && si->sched->fs->aqmfp->cleanup) 68691336b40SDon Lewis si->sched->fs->aqmfp->cleanup((struct dn_queue *) (si+1)); 68791336b40SDon Lewis } 68891336b40SDon Lewis return 0; 68991336b40SDon Lewis } 69091336b40SDon Lewis 69191336b40SDon Lewis /* callback to clean up queue AQM status.*/ 69291336b40SDon Lewis static int 69391336b40SDon Lewis q_cleanup_q(void *_q, void *arg) 69491336b40SDon Lewis { 69591336b40SDon Lewis struct dn_queue *q = _q; 69691336b40SDon Lewis q->fs->aqmfp->cleanup(q); 69791336b40SDon Lewis return 0; 69891336b40SDon Lewis } 69991336b40SDon Lewis 70091336b40SDon Lewis /* Clean up all AQM queues status belongs to flowset 'fs' and then 70191336b40SDon Lewis * deconfig AQM for flowset 'fs' 70291336b40SDon Lewis */ 70391336b40SDon Lewis static void 70491336b40SDon Lewis aqm_cleanup_deconfig_fs(struct dn_fsk *fs) 70591336b40SDon Lewis { 70691336b40SDon Lewis struct dn_sch_inst *si; 70791336b40SDon Lewis 70891336b40SDon Lewis /* clean up AQM status for all queues for !DN_MULTIQUEUE sched*/ 70991336b40SDon Lewis if (fs->fs.fs_nr > DN_MAX_ID) { 71091336b40SDon Lewis if (fs->sched && !(fs->sched->fp->flags & DN_MULTIQUEUE)) { 71191336b40SDon Lewis if (fs->sched->sch.flags & DN_HAVE_MASK) 71291336b40SDon Lewis dn_ht_scan(fs->sched->siht, si_cleanup_q, NULL); 71391336b40SDon Lewis else { 71491336b40SDon Lewis /* single si i.e. no sched mask */ 71591336b40SDon Lewis si = (struct dn_sch_inst *) fs->sched->siht; 71691336b40SDon Lewis if (si && fs->aqmfp && fs->aqmfp->cleanup) 71791336b40SDon Lewis fs->aqmfp->cleanup((struct dn_queue *) (si+1)); 71891336b40SDon Lewis } 71991336b40SDon Lewis } 72091336b40SDon Lewis } 72191336b40SDon Lewis 72291336b40SDon Lewis /* clean up AQM status for all queues for DN_MULTIQUEUE sched*/ 72391336b40SDon Lewis if (fs->sched && fs->sched->fp->flags & DN_MULTIQUEUE && fs->qht) { 72491336b40SDon Lewis if (fs->fs.flags & DN_QHT_HASH) 72591336b40SDon Lewis dn_ht_scan(fs->qht, q_cleanup_q, NULL); 72691336b40SDon Lewis else 72791336b40SDon Lewis fs->aqmfp->cleanup((struct dn_queue *)(fs->qht)); 72891336b40SDon Lewis } 72991336b40SDon Lewis 73091336b40SDon Lewis /* deconfig AQM */ 73191336b40SDon Lewis if(fs->aqmcfg && fs->aqmfp && fs->aqmfp->deconfig) 73291336b40SDon Lewis fs->aqmfp->deconfig(fs); 73391336b40SDon Lewis } 73491336b40SDon Lewis #endif 73591336b40SDon Lewis 7363b3a8eb9SGleb Smirnoff /* 7373b3a8eb9SGleb Smirnoff * detach flowset from its current scheduler. Flags as follows: 7383b3a8eb9SGleb Smirnoff * DN_DETACH removes from the fsk_list 7393b3a8eb9SGleb Smirnoff * DN_DESTROY deletes individual queues 7403b3a8eb9SGleb Smirnoff * DN_DELETE_FS destroys the flowset (otherwise goes in unlinked). 7413b3a8eb9SGleb Smirnoff */ 7423b3a8eb9SGleb Smirnoff static void 7433b3a8eb9SGleb Smirnoff fsk_detach(struct dn_fsk *fs, int flags) 7443b3a8eb9SGleb Smirnoff { 7453b3a8eb9SGleb Smirnoff if (flags & DN_DELETE_FS) 7463b3a8eb9SGleb Smirnoff flags |= DN_DESTROY; 7473b3a8eb9SGleb Smirnoff ND("fs %d from sched %d flags %s %s %s", 7483b3a8eb9SGleb Smirnoff fs->fs.fs_nr, fs->fs.sched_nr, 7493b3a8eb9SGleb Smirnoff (flags & DN_DELETE_FS) ? "DEL_FS":"", 7503b3a8eb9SGleb Smirnoff (flags & DN_DESTROY) ? "DEL":"", 7513b3a8eb9SGleb Smirnoff (flags & DN_DETACH) ? "DET":""); 7523b3a8eb9SGleb Smirnoff if (flags & DN_DETACH) { /* detach from the list */ 7533b3a8eb9SGleb Smirnoff struct dn_fsk_head *h; 754fe3bcfbdSTom Jones h = fs->sched ? &fs->sched->fsk_list : &V_dn_cfg.fsu; 7553b3a8eb9SGleb Smirnoff SLIST_REMOVE(h, fs, dn_fsk, sch_chain); 7563b3a8eb9SGleb Smirnoff } 7573b3a8eb9SGleb Smirnoff /* Free the RED parameters, they will be recomputed on 7583b3a8eb9SGleb Smirnoff * subsequent attach if needed. 7593b3a8eb9SGleb Smirnoff */ 7603b3a8eb9SGleb Smirnoff if (fs->w_q_lookup) 7613b3a8eb9SGleb Smirnoff free(fs->w_q_lookup, M_DUMMYNET); 7623b3a8eb9SGleb Smirnoff fs->w_q_lookup = NULL; 7633b3a8eb9SGleb Smirnoff qht_delete(fs, flags); 76491336b40SDon Lewis #ifdef NEW_AQM 76591336b40SDon Lewis aqm_cleanup_deconfig_fs(fs); 76691336b40SDon Lewis #endif 76791336b40SDon Lewis 7683b3a8eb9SGleb Smirnoff if (fs->sched && fs->sched->fp->free_fsk) 7693b3a8eb9SGleb Smirnoff fs->sched->fp->free_fsk(fs); 7703b3a8eb9SGleb Smirnoff fs->sched = NULL; 7713b3a8eb9SGleb Smirnoff if (flags & DN_DELETE_FS) { 772578acad3SEitan Adler bzero(fs, sizeof(*fs)); /* safety */ 7733b3a8eb9SGleb Smirnoff free(fs, M_DUMMYNET); 774fe3bcfbdSTom Jones V_dn_cfg.fsk_count--; 7753b3a8eb9SGleb Smirnoff } else { 776fe3bcfbdSTom Jones SLIST_INSERT_HEAD(&V_dn_cfg.fsu, fs, sch_chain); 7773b3a8eb9SGleb Smirnoff } 7783b3a8eb9SGleb Smirnoff } 7793b3a8eb9SGleb Smirnoff 7803b3a8eb9SGleb Smirnoff /* 7813b3a8eb9SGleb Smirnoff * Detach or destroy all flowsets in a list. 7823b3a8eb9SGleb Smirnoff * flags specifies what to do: 7833b3a8eb9SGleb Smirnoff * DN_DESTROY: flush all queues 7843b3a8eb9SGleb Smirnoff * DN_DELETE_FS: DN_DESTROY + destroy flowset 7853b3a8eb9SGleb Smirnoff * DN_DELETE_FS implies DN_DESTROY 7863b3a8eb9SGleb Smirnoff */ 7873b3a8eb9SGleb Smirnoff static void 7883b3a8eb9SGleb Smirnoff fsk_detach_list(struct dn_fsk_head *h, int flags) 7893b3a8eb9SGleb Smirnoff { 7903b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 7913b3a8eb9SGleb Smirnoff int n = 0; /* only for stats */ 7923b3a8eb9SGleb Smirnoff 7933b3a8eb9SGleb Smirnoff ND("head %p flags %x", h, flags); 7943b3a8eb9SGleb Smirnoff while ((fs = SLIST_FIRST(h))) { 7953b3a8eb9SGleb Smirnoff SLIST_REMOVE_HEAD(h, sch_chain); 7963b3a8eb9SGleb Smirnoff n++; 7973b3a8eb9SGleb Smirnoff fsk_detach(fs, flags); 7983b3a8eb9SGleb Smirnoff } 7993b3a8eb9SGleb Smirnoff ND("done %d flowsets", n); 8003b3a8eb9SGleb Smirnoff } 8013b3a8eb9SGleb Smirnoff 8023b3a8eb9SGleb Smirnoff /* 8033b3a8eb9SGleb Smirnoff * called on 'queue X delete' -- removes the flowset from fshash, 8043b3a8eb9SGleb Smirnoff * deletes all queues for the flowset, and removes the flowset. 8053b3a8eb9SGleb Smirnoff */ 8063b3a8eb9SGleb Smirnoff static int 8073b3a8eb9SGleb Smirnoff delete_fs(int i, int locked) 8083b3a8eb9SGleb Smirnoff { 8093b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 8103b3a8eb9SGleb Smirnoff int err = 0; 8113b3a8eb9SGleb Smirnoff 8123b3a8eb9SGleb Smirnoff if (!locked) 8133b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 814fe3bcfbdSTom Jones fs = dn_ht_find(V_dn_cfg.fshash, i, DNHT_REMOVE, NULL); 8153b3a8eb9SGleb Smirnoff ND("fs %d found %p", i, fs); 8163b3a8eb9SGleb Smirnoff if (fs) { 8173b3a8eb9SGleb Smirnoff fsk_detach(fs, DN_DETACH | DN_DELETE_FS); 8183b3a8eb9SGleb Smirnoff err = 0; 8193b3a8eb9SGleb Smirnoff } else 8203b3a8eb9SGleb Smirnoff err = EINVAL; 8213b3a8eb9SGleb Smirnoff if (!locked) 8223b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 8233b3a8eb9SGleb Smirnoff return err; 8243b3a8eb9SGleb Smirnoff } 8253b3a8eb9SGleb Smirnoff 8263b3a8eb9SGleb Smirnoff /*----- end of flowset hashtable support -------------*/ 8273b3a8eb9SGleb Smirnoff 8283b3a8eb9SGleb Smirnoff /*------------------------------------------------------------ 8293b3a8eb9SGleb Smirnoff * Scheduler hash. When searching by index we pass sched_nr, 8303b3a8eb9SGleb Smirnoff * otherwise we pass struct dn_sch * which is the first field in 8313b3a8eb9SGleb Smirnoff * struct dn_schk so we can cast between the two. We use this trick 8323b3a8eb9SGleb Smirnoff * because in the create phase (but it should be fixed). 8333b3a8eb9SGleb Smirnoff */ 8343b3a8eb9SGleb Smirnoff static uint32_t 8353b3a8eb9SGleb Smirnoff schk_hash(uintptr_t key, int flags, void *_arg) 8363b3a8eb9SGleb Smirnoff { 8373b3a8eb9SGleb Smirnoff uint32_t i = !(flags & DNHT_KEY_IS_OBJ) ? key : 8383b3a8eb9SGleb Smirnoff ((struct dn_schk *)key)->sch.sched_nr; 8393b3a8eb9SGleb Smirnoff return ( (i>>8)^(i>>4)^i ); 8403b3a8eb9SGleb Smirnoff } 8413b3a8eb9SGleb Smirnoff 8423b3a8eb9SGleb Smirnoff static int 8433b3a8eb9SGleb Smirnoff schk_match(void *obj, uintptr_t key, int flags, void *_arg) 8443b3a8eb9SGleb Smirnoff { 8453b3a8eb9SGleb Smirnoff struct dn_schk *s = (struct dn_schk *)obj; 8463b3a8eb9SGleb Smirnoff int i = !(flags & DNHT_KEY_IS_OBJ) ? key : 8473b3a8eb9SGleb Smirnoff ((struct dn_schk *)key)->sch.sched_nr; 8483b3a8eb9SGleb Smirnoff return (s->sch.sched_nr == i); 8493b3a8eb9SGleb Smirnoff } 8503b3a8eb9SGleb Smirnoff 8513b3a8eb9SGleb Smirnoff /* 8523b3a8eb9SGleb Smirnoff * Create the entry and intialize with the sched hash if needed. 8533b3a8eb9SGleb Smirnoff * Leave s->fp unset so we can tell whether a dn_ht_find() returns 8543b3a8eb9SGleb Smirnoff * a new object or a previously existing one. 8553b3a8eb9SGleb Smirnoff */ 8563b3a8eb9SGleb Smirnoff static void * 8573b3a8eb9SGleb Smirnoff schk_new(uintptr_t key, int flags, void *arg) 8583b3a8eb9SGleb Smirnoff { 8593b3a8eb9SGleb Smirnoff struct schk_new_arg *a = arg; 8603b3a8eb9SGleb Smirnoff struct dn_schk *s; 8613b3a8eb9SGleb Smirnoff int l = sizeof(*s) +a->fp->schk_datalen; 8623b3a8eb9SGleb Smirnoff 8633b3a8eb9SGleb Smirnoff s = malloc(l, M_DUMMYNET, M_NOWAIT | M_ZERO); 8643b3a8eb9SGleb Smirnoff if (s == NULL) 8653b3a8eb9SGleb Smirnoff return NULL; 8663b3a8eb9SGleb Smirnoff set_oid(&s->link.oid, DN_LINK, sizeof(s->link)); 8673b3a8eb9SGleb Smirnoff s->sch = *a->sch; // copy initial values 8683b3a8eb9SGleb Smirnoff s->link.link_nr = s->sch.sched_nr; 8693b3a8eb9SGleb Smirnoff SLIST_INIT(&s->fsk_list); 8703b3a8eb9SGleb Smirnoff /* initialize the hash table or create the single instance */ 8713b3a8eb9SGleb Smirnoff s->fp = a->fp; /* si_new needs this */ 8723b3a8eb9SGleb Smirnoff s->drain_bucket = 0; 8733b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 8743b3a8eb9SGleb Smirnoff s->siht = dn_ht_init(NULL, s->sch.buckets, 8753b3a8eb9SGleb Smirnoff offsetof(struct dn_sch_inst, si_next), 8763b3a8eb9SGleb Smirnoff si_hash, si_match, si_new); 8773b3a8eb9SGleb Smirnoff if (s->siht == NULL) { 8783b3a8eb9SGleb Smirnoff free(s, M_DUMMYNET); 8793b3a8eb9SGleb Smirnoff return NULL; 8803b3a8eb9SGleb Smirnoff } 8813b3a8eb9SGleb Smirnoff } 8823b3a8eb9SGleb Smirnoff s->fp = NULL; /* mark as a new scheduler */ 883fe3bcfbdSTom Jones V_dn_cfg.schk_count++; 8843b3a8eb9SGleb Smirnoff return s; 8853b3a8eb9SGleb Smirnoff } 8863b3a8eb9SGleb Smirnoff 8873b3a8eb9SGleb Smirnoff /* 8883b3a8eb9SGleb Smirnoff * Callback for sched delete. Notify all attached flowsets to 8893b3a8eb9SGleb Smirnoff * detach from the scheduler, destroy the internal flowset, and 8903b3a8eb9SGleb Smirnoff * all instances. The scheduler goes away too. 8913b3a8eb9SGleb Smirnoff * arg is 0 (only detach flowsets and destroy instances) 8923b3a8eb9SGleb Smirnoff * DN_DESTROY (detach & delete queues, delete schk) 8933b3a8eb9SGleb Smirnoff * or DN_DELETE_FS (delete queues and flowsets, delete schk) 8943b3a8eb9SGleb Smirnoff */ 8953b3a8eb9SGleb Smirnoff static int 8963b3a8eb9SGleb Smirnoff schk_delete_cb(void *obj, void *arg) 8973b3a8eb9SGleb Smirnoff { 8983b3a8eb9SGleb Smirnoff struct dn_schk *s = obj; 8993b3a8eb9SGleb Smirnoff #if 0 9003b3a8eb9SGleb Smirnoff int a = (int)arg; 9013b3a8eb9SGleb Smirnoff ND("sched %d arg %s%s", 9023b3a8eb9SGleb Smirnoff s->sch.sched_nr, 9033b3a8eb9SGleb Smirnoff a&DN_DESTROY ? "DEL ":"", 9043b3a8eb9SGleb Smirnoff a&DN_DELETE_FS ? "DEL_FS":""); 9053b3a8eb9SGleb Smirnoff #endif 9063b3a8eb9SGleb Smirnoff fsk_detach_list(&s->fsk_list, arg ? DN_DESTROY : 0); 9073b3a8eb9SGleb Smirnoff /* no more flowset pointing to us now */ 9083b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 9093b3a8eb9SGleb Smirnoff dn_ht_scan(s->siht, si_destroy, NULL); 9103b3a8eb9SGleb Smirnoff dn_ht_free(s->siht, 0); 9113b3a8eb9SGleb Smirnoff } else if (s->siht) 9123b3a8eb9SGleb Smirnoff si_destroy(s->siht, NULL); 9133b3a8eb9SGleb Smirnoff if (s->profile) { 9143b3a8eb9SGleb Smirnoff free(s->profile, M_DUMMYNET); 9153b3a8eb9SGleb Smirnoff s->profile = NULL; 9163b3a8eb9SGleb Smirnoff } 9173b3a8eb9SGleb Smirnoff s->siht = NULL; 9183b3a8eb9SGleb Smirnoff if (s->fp->destroy) 9193b3a8eb9SGleb Smirnoff s->fp->destroy(s); 9203b3a8eb9SGleb Smirnoff bzero(s, sizeof(*s)); // safety 9213b3a8eb9SGleb Smirnoff free(obj, M_DUMMYNET); 922fe3bcfbdSTom Jones V_dn_cfg.schk_count--; 9233b3a8eb9SGleb Smirnoff return DNHT_SCAN_DEL; 9243b3a8eb9SGleb Smirnoff } 9253b3a8eb9SGleb Smirnoff 9263b3a8eb9SGleb Smirnoff /* 9273b3a8eb9SGleb Smirnoff * called on a 'sched X delete' command. Deletes a single scheduler. 9283b3a8eb9SGleb Smirnoff * This is done by removing from the schedhash, unlinking all 9293b3a8eb9SGleb Smirnoff * flowsets and deleting their traffic. 9303b3a8eb9SGleb Smirnoff */ 9313b3a8eb9SGleb Smirnoff static int 9323b3a8eb9SGleb Smirnoff delete_schk(int i) 9333b3a8eb9SGleb Smirnoff { 9343b3a8eb9SGleb Smirnoff struct dn_schk *s; 9353b3a8eb9SGleb Smirnoff 936fe3bcfbdSTom Jones s = dn_ht_find(V_dn_cfg.schedhash, i, DNHT_REMOVE, NULL); 9373b3a8eb9SGleb Smirnoff ND("%d %p", i, s); 9383b3a8eb9SGleb Smirnoff if (!s) 9393b3a8eb9SGleb Smirnoff return EINVAL; 9403b3a8eb9SGleb Smirnoff delete_fs(i + DN_MAX_ID, 1); /* first delete internal fs */ 9413b3a8eb9SGleb Smirnoff /* then detach flowsets, delete traffic */ 9423b3a8eb9SGleb Smirnoff schk_delete_cb(s, (void*)(uintptr_t)DN_DESTROY); 9433b3a8eb9SGleb Smirnoff return 0; 9443b3a8eb9SGleb Smirnoff } 9453b3a8eb9SGleb Smirnoff /*--- end of schk hashtable support ---*/ 9463b3a8eb9SGleb Smirnoff 9473b3a8eb9SGleb Smirnoff static int 9483b3a8eb9SGleb Smirnoff copy_obj(char **start, char *end, void *_o, const char *msg, int i) 9493b3a8eb9SGleb Smirnoff { 9500ac43d97SMarius Strobl struct dn_id o; 9510ac43d97SMarius Strobl union { 9520ac43d97SMarius Strobl struct dn_link l; 9530ac43d97SMarius Strobl struct dn_schk s; 9540ac43d97SMarius Strobl } dn; 9553b3a8eb9SGleb Smirnoff int have = end - *start; 9563b3a8eb9SGleb Smirnoff 9570ac43d97SMarius Strobl memcpy(&o, _o, sizeof(o)); 9580ac43d97SMarius Strobl if (have < o.len || o.len == 0 || o.type == 0) { 9593b3a8eb9SGleb Smirnoff D("(WARN) type %d %s %d have %d need %d", 9600ac43d97SMarius Strobl o.type, msg, i, have, o.len); 9613b3a8eb9SGleb Smirnoff return 1; 9623b3a8eb9SGleb Smirnoff } 9630ac43d97SMarius Strobl ND("type %d %s %d len %d", o.type, msg, i, o.len); 9640ac43d97SMarius Strobl if (o.type == DN_LINK) { 9650ac43d97SMarius Strobl memcpy(&dn.l, _o, sizeof(dn.l)); 9663b3a8eb9SGleb Smirnoff /* Adjust burst parameter for link */ 9670ac43d97SMarius Strobl dn.l.burst = div64(dn.l.burst, 8 * hz); 9680ac43d97SMarius Strobl dn.l.delay = dn.l.delay * 1000 / hz; 9690ac43d97SMarius Strobl memcpy(*start, &dn.l, sizeof(dn.l)); 9700ac43d97SMarius Strobl } else if (o.type == DN_SCH) { 9710ac43d97SMarius Strobl /* Set dn.s.sch.oid.id to the number of instances */ 9720ac43d97SMarius Strobl memcpy(&dn.s, _o, sizeof(dn.s)); 9730ac43d97SMarius Strobl dn.s.sch.oid.id = (dn.s.sch.flags & DN_HAVE_MASK) ? 9740ac43d97SMarius Strobl dn_ht_entries(dn.s.siht) : (dn.s.siht ? 1 : 0); 9750ac43d97SMarius Strobl memcpy(*start, &dn.s, sizeof(dn.s)); 9760ac43d97SMarius Strobl } else 9770ac43d97SMarius Strobl memcpy(*start, _o, o.len); 9780ac43d97SMarius Strobl *start += o.len; 9793b3a8eb9SGleb Smirnoff return 0; 9803b3a8eb9SGleb Smirnoff } 9813b3a8eb9SGleb Smirnoff 9823b3a8eb9SGleb Smirnoff /* Specific function to copy a queue. 9833b3a8eb9SGleb Smirnoff * Copies only the user-visible part of a queue (which is in 9843b3a8eb9SGleb Smirnoff * a struct dn_flow), and sets len accordingly. 9853b3a8eb9SGleb Smirnoff */ 9863b3a8eb9SGleb Smirnoff static int 9873b3a8eb9SGleb Smirnoff copy_obj_q(char **start, char *end, void *_o, const char *msg, int i) 9883b3a8eb9SGleb Smirnoff { 9893b3a8eb9SGleb Smirnoff struct dn_id *o = _o; 9903b3a8eb9SGleb Smirnoff int have = end - *start; 9913b3a8eb9SGleb Smirnoff int len = sizeof(struct dn_flow); /* see above comment */ 9923b3a8eb9SGleb Smirnoff 9933b3a8eb9SGleb Smirnoff if (have < len || o->len == 0 || o->type != DN_QUEUE) { 9943b3a8eb9SGleb Smirnoff D("ERROR type %d %s %d have %d need %d", 9953b3a8eb9SGleb Smirnoff o->type, msg, i, have, len); 9963b3a8eb9SGleb Smirnoff return 1; 9973b3a8eb9SGleb Smirnoff } 9983b3a8eb9SGleb Smirnoff ND("type %d %s %d len %d", o->type, msg, i, len); 9990ac43d97SMarius Strobl memcpy(*start, _o, len); 10003b3a8eb9SGleb Smirnoff ((struct dn_id*)(*start))->len = len; 10013b3a8eb9SGleb Smirnoff *start += len; 10023b3a8eb9SGleb Smirnoff return 0; 10033b3a8eb9SGleb Smirnoff } 10043b3a8eb9SGleb Smirnoff 10053b3a8eb9SGleb Smirnoff static int 10063b3a8eb9SGleb Smirnoff copy_q_cb(void *obj, void *arg) 10073b3a8eb9SGleb Smirnoff { 10083b3a8eb9SGleb Smirnoff struct dn_queue *q = obj; 10093b3a8eb9SGleb Smirnoff struct copy_args *a = arg; 10103b3a8eb9SGleb Smirnoff struct dn_flow *ni = (struct dn_flow *)(*a->start); 10113b3a8eb9SGleb Smirnoff if (copy_obj_q(a->start, a->end, &q->ni, "queue", -1)) 10123b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 10133b3a8eb9SGleb Smirnoff ni->oid.type = DN_FLOW; /* override the DN_QUEUE */ 10143b3a8eb9SGleb Smirnoff ni->oid.id = si_hash((uintptr_t)&ni->fid, 0, NULL); 10153b3a8eb9SGleb Smirnoff return 0; 10163b3a8eb9SGleb Smirnoff } 10173b3a8eb9SGleb Smirnoff 10183b3a8eb9SGleb Smirnoff static int 10193b3a8eb9SGleb Smirnoff copy_q(struct copy_args *a, struct dn_fsk *fs, int flags) 10203b3a8eb9SGleb Smirnoff { 10213b3a8eb9SGleb Smirnoff if (!fs->qht) 10223b3a8eb9SGleb Smirnoff return 0; 10233b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) 10243b3a8eb9SGleb Smirnoff dn_ht_scan(fs->qht, copy_q_cb, a); 10253b3a8eb9SGleb Smirnoff else 10263b3a8eb9SGleb Smirnoff copy_q_cb(fs->qht, a); 10273b3a8eb9SGleb Smirnoff return 0; 10283b3a8eb9SGleb Smirnoff } 10293b3a8eb9SGleb Smirnoff 10303b3a8eb9SGleb Smirnoff /* 10313b3a8eb9SGleb Smirnoff * This routine only copies the initial part of a profile ? XXX 10323b3a8eb9SGleb Smirnoff */ 10333b3a8eb9SGleb Smirnoff static int 10343b3a8eb9SGleb Smirnoff copy_profile(struct copy_args *a, struct dn_profile *p) 10353b3a8eb9SGleb Smirnoff { 10363b3a8eb9SGleb Smirnoff int have = a->end - *a->start; 10373b3a8eb9SGleb Smirnoff /* XXX here we check for max length */ 10383b3a8eb9SGleb Smirnoff int profile_len = sizeof(struct dn_profile) - 10393b3a8eb9SGleb Smirnoff ED_MAX_SAMPLES_NO*sizeof(int); 10403b3a8eb9SGleb Smirnoff 10413b3a8eb9SGleb Smirnoff if (p == NULL) 10423b3a8eb9SGleb Smirnoff return 0; 10433b3a8eb9SGleb Smirnoff if (have < profile_len) { 10443b3a8eb9SGleb Smirnoff D("error have %d need %d", have, profile_len); 10453b3a8eb9SGleb Smirnoff return 1; 10463b3a8eb9SGleb Smirnoff } 10470ac43d97SMarius Strobl memcpy(*a->start, p, profile_len); 10483b3a8eb9SGleb Smirnoff ((struct dn_id *)(*a->start))->len = profile_len; 10493b3a8eb9SGleb Smirnoff *a->start += profile_len; 10503b3a8eb9SGleb Smirnoff return 0; 10513b3a8eb9SGleb Smirnoff } 10523b3a8eb9SGleb Smirnoff 10533b3a8eb9SGleb Smirnoff static int 10543b3a8eb9SGleb Smirnoff copy_flowset(struct copy_args *a, struct dn_fsk *fs, int flags) 10553b3a8eb9SGleb Smirnoff { 10563b3a8eb9SGleb Smirnoff struct dn_fs *ufs = (struct dn_fs *)(*a->start); 10573b3a8eb9SGleb Smirnoff if (!fs) 10583b3a8eb9SGleb Smirnoff return 0; 10593b3a8eb9SGleb Smirnoff ND("flowset %d", fs->fs.fs_nr); 10603b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, &fs->fs, "flowset", fs->fs.fs_nr)) 10613b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 10623b3a8eb9SGleb Smirnoff ufs->oid.id = (fs->fs.flags & DN_QHT_HASH) ? 10633b3a8eb9SGleb Smirnoff dn_ht_entries(fs->qht) : (fs->qht ? 1 : 0); 10643b3a8eb9SGleb Smirnoff if (flags) { /* copy queues */ 10653b3a8eb9SGleb Smirnoff copy_q(a, fs, 0); 10663b3a8eb9SGleb Smirnoff } 10673b3a8eb9SGleb Smirnoff return 0; 10683b3a8eb9SGleb Smirnoff } 10693b3a8eb9SGleb Smirnoff 10703b3a8eb9SGleb Smirnoff static int 10713b3a8eb9SGleb Smirnoff copy_si_cb(void *obj, void *arg) 10723b3a8eb9SGleb Smirnoff { 10733b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = obj; 10743b3a8eb9SGleb Smirnoff struct copy_args *a = arg; 10753b3a8eb9SGleb Smirnoff struct dn_flow *ni = (struct dn_flow *)(*a->start); 10763b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, &si->ni, "inst", 10773b3a8eb9SGleb Smirnoff si->sched->sch.sched_nr)) 10783b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 10793b3a8eb9SGleb Smirnoff ni->oid.type = DN_FLOW; /* override the DN_SCH_I */ 10803b3a8eb9SGleb Smirnoff ni->oid.id = si_hash((uintptr_t)si, DNHT_KEY_IS_OBJ, NULL); 10813b3a8eb9SGleb Smirnoff return 0; 10823b3a8eb9SGleb Smirnoff } 10833b3a8eb9SGleb Smirnoff 10843b3a8eb9SGleb Smirnoff static int 10853b3a8eb9SGleb Smirnoff copy_si(struct copy_args *a, struct dn_schk *s, int flags) 10863b3a8eb9SGleb Smirnoff { 10873b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) 10883b3a8eb9SGleb Smirnoff dn_ht_scan(s->siht, copy_si_cb, a); 10893b3a8eb9SGleb Smirnoff else if (s->siht) 10903b3a8eb9SGleb Smirnoff copy_si_cb(s->siht, a); 10913b3a8eb9SGleb Smirnoff return 0; 10923b3a8eb9SGleb Smirnoff } 10933b3a8eb9SGleb Smirnoff 10943b3a8eb9SGleb Smirnoff /* 10953b3a8eb9SGleb Smirnoff * compute a list of children of a scheduler and copy up 10963b3a8eb9SGleb Smirnoff */ 10973b3a8eb9SGleb Smirnoff static int 10983b3a8eb9SGleb Smirnoff copy_fsk_list(struct copy_args *a, struct dn_schk *s, int flags) 10993b3a8eb9SGleb Smirnoff { 11003b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 11013b3a8eb9SGleb Smirnoff struct dn_id *o; 11023b3a8eb9SGleb Smirnoff uint32_t *p; 11033b3a8eb9SGleb Smirnoff 11043b3a8eb9SGleb Smirnoff int n = 0, space = sizeof(*o); 11053b3a8eb9SGleb Smirnoff SLIST_FOREACH(fs, &s->fsk_list, sch_chain) { 11063b3a8eb9SGleb Smirnoff if (fs->fs.fs_nr < DN_MAX_ID) 11073b3a8eb9SGleb Smirnoff n++; 11083b3a8eb9SGleb Smirnoff } 11093b3a8eb9SGleb Smirnoff space += n * sizeof(uint32_t); 11103b3a8eb9SGleb Smirnoff DX(3, "sched %d has %d flowsets", s->sch.sched_nr, n); 11113b3a8eb9SGleb Smirnoff if (a->end - *(a->start) < space) 11123b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11133b3a8eb9SGleb Smirnoff o = (struct dn_id *)(*(a->start)); 11143b3a8eb9SGleb Smirnoff o->len = space; 11153b3a8eb9SGleb Smirnoff *a->start += o->len; 11163b3a8eb9SGleb Smirnoff o->type = DN_TEXT; 11173b3a8eb9SGleb Smirnoff p = (uint32_t *)(o+1); 11183b3a8eb9SGleb Smirnoff SLIST_FOREACH(fs, &s->fsk_list, sch_chain) 11193b3a8eb9SGleb Smirnoff if (fs->fs.fs_nr < DN_MAX_ID) 11203b3a8eb9SGleb Smirnoff *p++ = fs->fs.fs_nr; 11213b3a8eb9SGleb Smirnoff return 0; 11223b3a8eb9SGleb Smirnoff } 11233b3a8eb9SGleb Smirnoff 11243b3a8eb9SGleb Smirnoff static int 11253b3a8eb9SGleb Smirnoff copy_data_helper(void *_o, void *_arg) 11263b3a8eb9SGleb Smirnoff { 11273b3a8eb9SGleb Smirnoff struct copy_args *a = _arg; 11283b3a8eb9SGleb Smirnoff uint32_t *r = a->extra->r; /* start of first range */ 11293b3a8eb9SGleb Smirnoff uint32_t *lim; /* first invalid pointer */ 11303b3a8eb9SGleb Smirnoff int n; 11313b3a8eb9SGleb Smirnoff 11323b3a8eb9SGleb Smirnoff lim = (uint32_t *)((char *)(a->extra) + a->extra->o.len); 11333b3a8eb9SGleb Smirnoff 11343b3a8eb9SGleb Smirnoff if (a->type == DN_LINK || a->type == DN_SCH) { 11353b3a8eb9SGleb Smirnoff /* pipe|sched show, we receive a dn_schk */ 11363b3a8eb9SGleb Smirnoff struct dn_schk *s = _o; 11373b3a8eb9SGleb Smirnoff 11383b3a8eb9SGleb Smirnoff n = s->sch.sched_nr; 11393b3a8eb9SGleb Smirnoff if (a->type == DN_SCH && n >= DN_MAX_ID) 11403b3a8eb9SGleb Smirnoff return 0; /* not a scheduler */ 11413b3a8eb9SGleb Smirnoff if (a->type == DN_LINK && n <= DN_MAX_ID) 11423b3a8eb9SGleb Smirnoff return 0; /* not a pipe */ 11433b3a8eb9SGleb Smirnoff 11443b3a8eb9SGleb Smirnoff /* see if the object is within one of our ranges */ 11453b3a8eb9SGleb Smirnoff for (;r < lim; r += 2) { 11463b3a8eb9SGleb Smirnoff if (n < r[0] || n > r[1]) 11473b3a8eb9SGleb Smirnoff continue; 11483b3a8eb9SGleb Smirnoff /* Found a valid entry, copy and we are done */ 11493b3a8eb9SGleb Smirnoff if (a->flags & DN_C_LINK) { 11503b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, 11513b3a8eb9SGleb Smirnoff &s->link, "link", n)) 11523b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11533b3a8eb9SGleb Smirnoff if (copy_profile(a, s->profile)) 11543b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11553b3a8eb9SGleb Smirnoff if (copy_flowset(a, s->fs, 0)) 11563b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11573b3a8eb9SGleb Smirnoff } 11583b3a8eb9SGleb Smirnoff if (a->flags & DN_C_SCH) { 11593b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, 11603b3a8eb9SGleb Smirnoff &s->sch, "sched", n)) 11613b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11623b3a8eb9SGleb Smirnoff /* list all attached flowsets */ 11633b3a8eb9SGleb Smirnoff if (copy_fsk_list(a, s, 0)) 11643b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11653b3a8eb9SGleb Smirnoff } 11663b3a8eb9SGleb Smirnoff if (a->flags & DN_C_FLOW) 11673b3a8eb9SGleb Smirnoff copy_si(a, s, 0); 11683b3a8eb9SGleb Smirnoff break; 11693b3a8eb9SGleb Smirnoff } 11703b3a8eb9SGleb Smirnoff } else if (a->type == DN_FS) { 11713b3a8eb9SGleb Smirnoff /* queue show, skip internal flowsets */ 11723b3a8eb9SGleb Smirnoff struct dn_fsk *fs = _o; 11733b3a8eb9SGleb Smirnoff 11743b3a8eb9SGleb Smirnoff n = fs->fs.fs_nr; 11753b3a8eb9SGleb Smirnoff if (n >= DN_MAX_ID) 11763b3a8eb9SGleb Smirnoff return 0; 11773b3a8eb9SGleb Smirnoff /* see if the object is within one of our ranges */ 11783b3a8eb9SGleb Smirnoff for (;r < lim; r += 2) { 11793b3a8eb9SGleb Smirnoff if (n < r[0] || n > r[1]) 11803b3a8eb9SGleb Smirnoff continue; 11813b3a8eb9SGleb Smirnoff if (copy_flowset(a, fs, 0)) 11823b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11833b3a8eb9SGleb Smirnoff copy_q(a, fs, 0); 11843b3a8eb9SGleb Smirnoff break; /* we are done */ 11853b3a8eb9SGleb Smirnoff } 11863b3a8eb9SGleb Smirnoff } 11873b3a8eb9SGleb Smirnoff return 0; 11883b3a8eb9SGleb Smirnoff } 11893b3a8eb9SGleb Smirnoff 11903b3a8eb9SGleb Smirnoff static inline struct dn_schk * 11913b3a8eb9SGleb Smirnoff locate_scheduler(int i) 11923b3a8eb9SGleb Smirnoff { 1193fe3bcfbdSTom Jones return dn_ht_find(V_dn_cfg.schedhash, i, 0, NULL); 11943b3a8eb9SGleb Smirnoff } 11953b3a8eb9SGleb Smirnoff 11963b3a8eb9SGleb Smirnoff /* 11973b3a8eb9SGleb Smirnoff * red parameters are in fixed point arithmetic. 11983b3a8eb9SGleb Smirnoff */ 11993b3a8eb9SGleb Smirnoff static int 12003b3a8eb9SGleb Smirnoff config_red(struct dn_fsk *fs) 12013b3a8eb9SGleb Smirnoff { 12023b3a8eb9SGleb Smirnoff int64_t s, idle, weight, w0; 12033b3a8eb9SGleb Smirnoff int t, i; 12043b3a8eb9SGleb Smirnoff 12053b3a8eb9SGleb Smirnoff fs->w_q = fs->fs.w_q; 12063b3a8eb9SGleb Smirnoff fs->max_p = fs->fs.max_p; 12073b3a8eb9SGleb Smirnoff ND("called"); 12083b3a8eb9SGleb Smirnoff /* Doing stuff that was in userland */ 12093b3a8eb9SGleb Smirnoff i = fs->sched->link.bandwidth; 12103b3a8eb9SGleb Smirnoff s = (i <= 0) ? 0 : 1211fe3bcfbdSTom Jones hz * V_dn_cfg.red_avg_pkt_size * 8 * SCALE(1) / i; 12123b3a8eb9SGleb Smirnoff 12133b3a8eb9SGleb Smirnoff idle = div64((s * 3) , fs->w_q); /* s, fs->w_q scaled; idle not scaled */ 1214fe3bcfbdSTom Jones fs->lookup_step = div64(idle , V_dn_cfg.red_lookup_depth); 12153b3a8eb9SGleb Smirnoff /* fs->lookup_step not scaled, */ 12163b3a8eb9SGleb Smirnoff if (!fs->lookup_step) 12173b3a8eb9SGleb Smirnoff fs->lookup_step = 1; 12183b3a8eb9SGleb Smirnoff w0 = weight = SCALE(1) - fs->w_q; //fs->w_q scaled 12193b3a8eb9SGleb Smirnoff 12203b3a8eb9SGleb Smirnoff for (t = fs->lookup_step; t > 1; --t) 12213b3a8eb9SGleb Smirnoff weight = SCALE_MUL(weight, w0); 12223b3a8eb9SGleb Smirnoff fs->lookup_weight = (int)(weight); // scaled 12233b3a8eb9SGleb Smirnoff 12243b3a8eb9SGleb Smirnoff /* Now doing stuff that was in kerneland */ 12253b3a8eb9SGleb Smirnoff fs->min_th = SCALE(fs->fs.min_th); 12263b3a8eb9SGleb Smirnoff fs->max_th = SCALE(fs->fs.max_th); 12273b3a8eb9SGleb Smirnoff 1228fc5e1956SHiren Panchasara if (fs->fs.max_th == fs->fs.min_th) 1229fc5e1956SHiren Panchasara fs->c_1 = fs->max_p; 1230fc5e1956SHiren Panchasara else 1231fc5e1956SHiren Panchasara fs->c_1 = SCALE((int64_t)(fs->max_p)) / (fs->fs.max_th - fs->fs.min_th); 12323b3a8eb9SGleb Smirnoff fs->c_2 = SCALE_MUL(fs->c_1, SCALE(fs->fs.min_th)); 12333b3a8eb9SGleb Smirnoff 12343b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_IS_GENTLE_RED) { 12353b3a8eb9SGleb Smirnoff fs->c_3 = (SCALE(1) - fs->max_p) / fs->fs.max_th; 12363b3a8eb9SGleb Smirnoff fs->c_4 = SCALE(1) - 2 * fs->max_p; 12373b3a8eb9SGleb Smirnoff } 12383b3a8eb9SGleb Smirnoff 12393b3a8eb9SGleb Smirnoff /* If the lookup table already exist, free and create it again. */ 12403b3a8eb9SGleb Smirnoff if (fs->w_q_lookup) { 12413b3a8eb9SGleb Smirnoff free(fs->w_q_lookup, M_DUMMYNET); 12423b3a8eb9SGleb Smirnoff fs->w_q_lookup = NULL; 12433b3a8eb9SGleb Smirnoff } 1244fe3bcfbdSTom Jones if (V_dn_cfg.red_lookup_depth == 0) { 12453b3a8eb9SGleb Smirnoff printf("\ndummynet: net.inet.ip.dummynet.red_lookup_depth" 12463b3a8eb9SGleb Smirnoff "must be > 0\n"); 12473b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_RED; 12483b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_GENTLE_RED; 12493b3a8eb9SGleb Smirnoff return (EINVAL); 12503b3a8eb9SGleb Smirnoff } 1251fe3bcfbdSTom Jones fs->lookup_depth = V_dn_cfg.red_lookup_depth; 12523b3a8eb9SGleb Smirnoff fs->w_q_lookup = (u_int *)malloc(fs->lookup_depth * sizeof(int), 12533b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT); 12543b3a8eb9SGleb Smirnoff if (fs->w_q_lookup == NULL) { 12553b3a8eb9SGleb Smirnoff printf("dummynet: sorry, cannot allocate red lookup table\n"); 12563b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_RED; 12573b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_GENTLE_RED; 12583b3a8eb9SGleb Smirnoff return(ENOSPC); 12593b3a8eb9SGleb Smirnoff } 12603b3a8eb9SGleb Smirnoff 12613b3a8eb9SGleb Smirnoff /* Fill the lookup table with (1 - w_q)^x */ 12623b3a8eb9SGleb Smirnoff fs->w_q_lookup[0] = SCALE(1) - fs->w_q; 12633b3a8eb9SGleb Smirnoff 12643b3a8eb9SGleb Smirnoff for (i = 1; i < fs->lookup_depth; i++) 12653b3a8eb9SGleb Smirnoff fs->w_q_lookup[i] = 12663b3a8eb9SGleb Smirnoff SCALE_MUL(fs->w_q_lookup[i - 1], fs->lookup_weight); 12673b3a8eb9SGleb Smirnoff 1268fe3bcfbdSTom Jones if (V_dn_cfg.red_avg_pkt_size < 1) 1269fe3bcfbdSTom Jones V_dn_cfg.red_avg_pkt_size = 512; 1270fe3bcfbdSTom Jones fs->avg_pkt_size = V_dn_cfg.red_avg_pkt_size; 1271fe3bcfbdSTom Jones if (V_dn_cfg.red_max_pkt_size < 1) 1272fe3bcfbdSTom Jones V_dn_cfg.red_max_pkt_size = 1500; 1273fe3bcfbdSTom Jones fs->max_pkt_size = V_dn_cfg.red_max_pkt_size; 12743b3a8eb9SGleb Smirnoff ND("exit"); 12753b3a8eb9SGleb Smirnoff return 0; 12763b3a8eb9SGleb Smirnoff } 12773b3a8eb9SGleb Smirnoff 12783b3a8eb9SGleb Smirnoff /* Scan all flowset attached to this scheduler and update red */ 12793b3a8eb9SGleb Smirnoff static void 12803b3a8eb9SGleb Smirnoff update_red(struct dn_schk *s) 12813b3a8eb9SGleb Smirnoff { 12823b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 12833b3a8eb9SGleb Smirnoff SLIST_FOREACH(fs, &s->fsk_list, sch_chain) { 12843b3a8eb9SGleb Smirnoff if (fs && (fs->fs.flags & DN_IS_RED)) 12853b3a8eb9SGleb Smirnoff config_red(fs); 12863b3a8eb9SGleb Smirnoff } 12873b3a8eb9SGleb Smirnoff } 12883b3a8eb9SGleb Smirnoff 12893b3a8eb9SGleb Smirnoff /* attach flowset to scheduler s, possibly requeue */ 12903b3a8eb9SGleb Smirnoff static void 12913b3a8eb9SGleb Smirnoff fsk_attach(struct dn_fsk *fs, struct dn_schk *s) 12923b3a8eb9SGleb Smirnoff { 12933b3a8eb9SGleb Smirnoff ND("remove fs %d from fsunlinked, link to sched %d", 12943b3a8eb9SGleb Smirnoff fs->fs.fs_nr, s->sch.sched_nr); 1295fe3bcfbdSTom Jones SLIST_REMOVE(&V_dn_cfg.fsu, fs, dn_fsk, sch_chain); 12963b3a8eb9SGleb Smirnoff fs->sched = s; 12973b3a8eb9SGleb Smirnoff SLIST_INSERT_HEAD(&s->fsk_list, fs, sch_chain); 12983b3a8eb9SGleb Smirnoff if (s->fp->new_fsk) 12993b3a8eb9SGleb Smirnoff s->fp->new_fsk(fs); 13003b3a8eb9SGleb Smirnoff /* XXX compute fsk_mask */ 13013b3a8eb9SGleb Smirnoff fs->fsk_mask = fs->fs.flow_mask; 13023b3a8eb9SGleb Smirnoff if (fs->sched->sch.flags & DN_HAVE_MASK) 13033b3a8eb9SGleb Smirnoff flow_id_or(&fs->sched->sch.sched_mask, &fs->fsk_mask); 13043b3a8eb9SGleb Smirnoff if (fs->qht) { 13053b3a8eb9SGleb Smirnoff /* 13063b3a8eb9SGleb Smirnoff * we must drain qht according to the old 13073b3a8eb9SGleb Smirnoff * type, and reinsert according to the new one. 13083b3a8eb9SGleb Smirnoff * The requeue is complex -- in general we need to 13093b3a8eb9SGleb Smirnoff * reclassify every single packet. 13103b3a8eb9SGleb Smirnoff * For the time being, let's hope qht is never set 13113b3a8eb9SGleb Smirnoff * when we reach this point. 13123b3a8eb9SGleb Smirnoff */ 13133b3a8eb9SGleb Smirnoff D("XXX TODO requeue from fs %d to sch %d", 13143b3a8eb9SGleb Smirnoff fs->fs.fs_nr, s->sch.sched_nr); 13153b3a8eb9SGleb Smirnoff fs->qht = NULL; 13163b3a8eb9SGleb Smirnoff } 13173b3a8eb9SGleb Smirnoff /* set the new type for qht */ 13183b3a8eb9SGleb Smirnoff if (nonzero_mask(&fs->fsk_mask)) 13193b3a8eb9SGleb Smirnoff fs->fs.flags |= DN_QHT_HASH; 13203b3a8eb9SGleb Smirnoff else 13213b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_QHT_HASH; 13223b3a8eb9SGleb Smirnoff 13233b3a8eb9SGleb Smirnoff /* XXX config_red() can fail... */ 13243b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_IS_RED) 13253b3a8eb9SGleb Smirnoff config_red(fs); 13263b3a8eb9SGleb Smirnoff } 13273b3a8eb9SGleb Smirnoff 13283b3a8eb9SGleb Smirnoff /* update all flowsets which may refer to this scheduler */ 13293b3a8eb9SGleb Smirnoff static void 13303b3a8eb9SGleb Smirnoff update_fs(struct dn_schk *s) 13313b3a8eb9SGleb Smirnoff { 13323b3a8eb9SGleb Smirnoff struct dn_fsk *fs, *tmp; 13333b3a8eb9SGleb Smirnoff 1334fe3bcfbdSTom Jones SLIST_FOREACH_SAFE(fs, &V_dn_cfg.fsu, sch_chain, tmp) { 13353b3a8eb9SGleb Smirnoff if (s->sch.sched_nr != fs->fs.sched_nr) { 13363b3a8eb9SGleb Smirnoff D("fs %d for sch %d not %d still unlinked", 13373b3a8eb9SGleb Smirnoff fs->fs.fs_nr, fs->fs.sched_nr, 13383b3a8eb9SGleb Smirnoff s->sch.sched_nr); 13393b3a8eb9SGleb Smirnoff continue; 13403b3a8eb9SGleb Smirnoff } 13413b3a8eb9SGleb Smirnoff fsk_attach(fs, s); 13423b3a8eb9SGleb Smirnoff } 13433b3a8eb9SGleb Smirnoff } 13443b3a8eb9SGleb Smirnoff 134591336b40SDon Lewis #ifdef NEW_AQM 134691336b40SDon Lewis /* Retrieve AQM configurations to ipfw userland 134791336b40SDon Lewis */ 134891336b40SDon Lewis static int 134991336b40SDon Lewis get_aqm_parms(struct sockopt *sopt) 135091336b40SDon Lewis { 135191336b40SDon Lewis struct dn_extra_parms *ep; 135291336b40SDon Lewis struct dn_fsk *fs; 135391336b40SDon Lewis size_t sopt_valsize; 135491336b40SDon Lewis int l, err = 0; 135591336b40SDon Lewis 135691336b40SDon Lewis sopt_valsize = sopt->sopt_valsize; 135791336b40SDon Lewis l = sizeof(*ep); 135891336b40SDon Lewis if (sopt->sopt_valsize < l) { 135991336b40SDon Lewis D("bad len sopt->sopt_valsize %d len %d", 136091336b40SDon Lewis (int) sopt->sopt_valsize , l); 136191336b40SDon Lewis err = EINVAL; 136291336b40SDon Lewis return err; 136391336b40SDon Lewis } 1364*51d73df1SKristof Provost ep = malloc(l, M_DUMMYNET, M_NOWAIT); 136591336b40SDon Lewis if(!ep) { 136691336b40SDon Lewis err = ENOMEM ; 136791336b40SDon Lewis return err; 136891336b40SDon Lewis } 136991336b40SDon Lewis do { 137091336b40SDon Lewis err = sooptcopyin(sopt, ep, l, l); 137191336b40SDon Lewis if(err) 137291336b40SDon Lewis break; 137391336b40SDon Lewis sopt->sopt_valsize = sopt_valsize; 137491336b40SDon Lewis if (ep->oid.len < l) { 137591336b40SDon Lewis err = EINVAL; 137691336b40SDon Lewis break; 137791336b40SDon Lewis } 137891336b40SDon Lewis 1379fe3bcfbdSTom Jones fs = dn_ht_find(V_dn_cfg.fshash, ep->nr, 0, NULL); 138091336b40SDon Lewis if (!fs) { 138191336b40SDon Lewis D("fs %d not found", ep->nr); 138291336b40SDon Lewis err = EINVAL; 138391336b40SDon Lewis break; 138491336b40SDon Lewis } 138591336b40SDon Lewis 138691336b40SDon Lewis if (fs->aqmfp && fs->aqmfp->getconfig) { 138791336b40SDon Lewis if(fs->aqmfp->getconfig(fs, ep)) { 138891336b40SDon Lewis D("Error while trying to get AQM params"); 138991336b40SDon Lewis err = EINVAL; 139091336b40SDon Lewis break; 139191336b40SDon Lewis } 139291336b40SDon Lewis ep->oid.len = l; 139391336b40SDon Lewis err = sooptcopyout(sopt, ep, l); 139491336b40SDon Lewis } 139591336b40SDon Lewis }while(0); 139691336b40SDon Lewis 139791336b40SDon Lewis free(ep, M_DUMMYNET); 139891336b40SDon Lewis return err; 139991336b40SDon Lewis } 140091336b40SDon Lewis 140191336b40SDon Lewis /* Retrieve AQM configurations to ipfw userland 140291336b40SDon Lewis */ 140391336b40SDon Lewis static int 140491336b40SDon Lewis get_sched_parms(struct sockopt *sopt) 140591336b40SDon Lewis { 140691336b40SDon Lewis struct dn_extra_parms *ep; 140791336b40SDon Lewis struct dn_schk *schk; 140891336b40SDon Lewis size_t sopt_valsize; 140991336b40SDon Lewis int l, err = 0; 141091336b40SDon Lewis 141191336b40SDon Lewis sopt_valsize = sopt->sopt_valsize; 141291336b40SDon Lewis l = sizeof(*ep); 141391336b40SDon Lewis if (sopt->sopt_valsize < l) { 141491336b40SDon Lewis D("bad len sopt->sopt_valsize %d len %d", 141591336b40SDon Lewis (int) sopt->sopt_valsize , l); 141691336b40SDon Lewis err = EINVAL; 141791336b40SDon Lewis return err; 141891336b40SDon Lewis } 1419*51d73df1SKristof Provost ep = malloc(l, M_DUMMYNET, M_NOWAIT); 142091336b40SDon Lewis if(!ep) { 142191336b40SDon Lewis err = ENOMEM ; 142291336b40SDon Lewis return err; 142391336b40SDon Lewis } 142491336b40SDon Lewis do { 142591336b40SDon Lewis err = sooptcopyin(sopt, ep, l, l); 142691336b40SDon Lewis if(err) 142791336b40SDon Lewis break; 142891336b40SDon Lewis sopt->sopt_valsize = sopt_valsize; 142991336b40SDon Lewis if (ep->oid.len < l) { 143091336b40SDon Lewis err = EINVAL; 143191336b40SDon Lewis break; 143291336b40SDon Lewis } 143391336b40SDon Lewis 143491336b40SDon Lewis schk = locate_scheduler(ep->nr); 143591336b40SDon Lewis if (!schk) { 143691336b40SDon Lewis D("sched %d not found", ep->nr); 143791336b40SDon Lewis err = EINVAL; 143891336b40SDon Lewis break; 143991336b40SDon Lewis } 144091336b40SDon Lewis 144191336b40SDon Lewis if (schk->fp && schk->fp->getconfig) { 144291336b40SDon Lewis if(schk->fp->getconfig(schk, ep)) { 144391336b40SDon Lewis D("Error while trying to get sched params"); 144491336b40SDon Lewis err = EINVAL; 144591336b40SDon Lewis break; 144691336b40SDon Lewis } 144791336b40SDon Lewis ep->oid.len = l; 144891336b40SDon Lewis err = sooptcopyout(sopt, ep, l); 144991336b40SDon Lewis } 145091336b40SDon Lewis }while(0); 145191336b40SDon Lewis free(ep, M_DUMMYNET); 145291336b40SDon Lewis 145391336b40SDon Lewis return err; 145491336b40SDon Lewis } 145591336b40SDon Lewis 145691336b40SDon Lewis /* Configure AQM for flowset 'fs'. 145791336b40SDon Lewis * extra parameters are passed from userland. 145891336b40SDon Lewis */ 145991336b40SDon Lewis static int 146091336b40SDon Lewis config_aqm(struct dn_fsk *fs, struct dn_extra_parms *ep, int busy) 146191336b40SDon Lewis { 146291336b40SDon Lewis int err = 0; 146391336b40SDon Lewis 1464*51d73df1SKristof Provost NET_EPOCH_ASSERT(); 1465*51d73df1SKristof Provost 146691336b40SDon Lewis do { 146791336b40SDon Lewis /* no configurations */ 146891336b40SDon Lewis if (!ep) { 146991336b40SDon Lewis err = 0; 147091336b40SDon Lewis break; 147191336b40SDon Lewis } 147291336b40SDon Lewis 147391336b40SDon Lewis /* no AQM for this flowset*/ 147491336b40SDon Lewis if (!strcmp(ep->name,"")) { 147591336b40SDon Lewis err = 0; 147691336b40SDon Lewis break; 147791336b40SDon Lewis } 147891336b40SDon Lewis if (ep->oid.len < sizeof(*ep)) { 147991336b40SDon Lewis D("short aqm len %d", ep->oid.len); 148091336b40SDon Lewis err = EINVAL; 148191336b40SDon Lewis break; 148291336b40SDon Lewis } 148391336b40SDon Lewis 148491336b40SDon Lewis if (busy) { 148591336b40SDon Lewis D("Unable to configure flowset, flowset busy!"); 148691336b40SDon Lewis err = EINVAL; 148791336b40SDon Lewis break; 148891336b40SDon Lewis } 148991336b40SDon Lewis 149091336b40SDon Lewis /* deconfigure old aqm if exist */ 149191336b40SDon Lewis if (fs->aqmcfg && fs->aqmfp && fs->aqmfp->deconfig) { 149291336b40SDon Lewis aqm_cleanup_deconfig_fs(fs); 149391336b40SDon Lewis } 149491336b40SDon Lewis 149591336b40SDon Lewis if (!(fs->aqmfp = find_aqm_type(0, ep->name))) { 149691336b40SDon Lewis D("AQM functions not found for type %s!", ep->name); 149791336b40SDon Lewis fs->fs.flags &= ~DN_IS_AQM; 149891336b40SDon Lewis err = EINVAL; 149991336b40SDon Lewis break; 150091336b40SDon Lewis } else 150191336b40SDon Lewis fs->fs.flags |= DN_IS_AQM; 150291336b40SDon Lewis 150391336b40SDon Lewis if (ep->oid.subtype != DN_AQM_PARAMS) { 150491336b40SDon Lewis D("Wrong subtype"); 150591336b40SDon Lewis err = EINVAL; 150691336b40SDon Lewis break; 150791336b40SDon Lewis } 150891336b40SDon Lewis 150991336b40SDon Lewis if (fs->aqmfp->config) { 151091336b40SDon Lewis err = fs->aqmfp->config(fs, ep, ep->oid.len); 151191336b40SDon Lewis if (err) { 151291336b40SDon Lewis D("Unable to configure AQM for FS %d", fs->fs.fs_nr ); 151391336b40SDon Lewis fs->fs.flags &= ~DN_IS_AQM; 151491336b40SDon Lewis fs->aqmfp = NULL; 151591336b40SDon Lewis break; 151691336b40SDon Lewis } 151791336b40SDon Lewis } 151891336b40SDon Lewis } while(0); 151991336b40SDon Lewis 152091336b40SDon Lewis return err; 152191336b40SDon Lewis } 152291336b40SDon Lewis #endif 152391336b40SDon Lewis 15243b3a8eb9SGleb Smirnoff /* 15253b3a8eb9SGleb Smirnoff * Configuration -- to preserve backward compatibility we use 15263b3a8eb9SGleb Smirnoff * the following scheme (N is 65536) 15273b3a8eb9SGleb Smirnoff * NUMBER SCHED LINK FLOWSET 15283b3a8eb9SGleb Smirnoff * 1 .. N-1 (1)WFQ (2)WFQ (3)queue 15293b3a8eb9SGleb Smirnoff * N+1 .. 2N-1 (4)FIFO (5)FIFO (6)FIFO for sched 1..N-1 15303b3a8eb9SGleb Smirnoff * 2N+1 .. 3N-1 -- -- (7)FIFO for sched N+1..2N-1 15313b3a8eb9SGleb Smirnoff * 15323b3a8eb9SGleb Smirnoff * "pipe i config" configures #1, #2 and #3 15333b3a8eb9SGleb Smirnoff * "sched i config" configures #1 and possibly #6 15343b3a8eb9SGleb Smirnoff * "queue i config" configures #3 15353b3a8eb9SGleb Smirnoff * #1 is configured with 'pipe i config' or 'sched i config' 15363b3a8eb9SGleb Smirnoff * #2 is configured with 'pipe i config', and created if not 15373b3a8eb9SGleb Smirnoff * existing with 'sched i config' 15383b3a8eb9SGleb Smirnoff * #3 is configured with 'queue i config' 15393b3a8eb9SGleb Smirnoff * #4 is automatically configured after #1, can only be FIFO 15403b3a8eb9SGleb Smirnoff * #5 is automatically configured after #2 15413b3a8eb9SGleb Smirnoff * #6 is automatically created when #1 is !MULTIQUEUE, 15423b3a8eb9SGleb Smirnoff * and can be updated. 15433b3a8eb9SGleb Smirnoff * #7 is automatically configured after #2 15443b3a8eb9SGleb Smirnoff */ 15453b3a8eb9SGleb Smirnoff 15463b3a8eb9SGleb Smirnoff /* 15473b3a8eb9SGleb Smirnoff * configure a link (and its FIFO instance) 15483b3a8eb9SGleb Smirnoff */ 15493b3a8eb9SGleb Smirnoff static int 15503b3a8eb9SGleb Smirnoff config_link(struct dn_link *p, struct dn_id *arg) 15513b3a8eb9SGleb Smirnoff { 15523b3a8eb9SGleb Smirnoff int i; 15533b3a8eb9SGleb Smirnoff 15543b3a8eb9SGleb Smirnoff if (p->oid.len != sizeof(*p)) { 15553b3a8eb9SGleb Smirnoff D("invalid pipe len %d", p->oid.len); 15563b3a8eb9SGleb Smirnoff return EINVAL; 15573b3a8eb9SGleb Smirnoff } 15583b3a8eb9SGleb Smirnoff i = p->link_nr; 15593b3a8eb9SGleb Smirnoff if (i <= 0 || i >= DN_MAX_ID) 15603b3a8eb9SGleb Smirnoff return EINVAL; 15613b3a8eb9SGleb Smirnoff /* 15623b3a8eb9SGleb Smirnoff * The config program passes parameters as follows: 15633b3a8eb9SGleb Smirnoff * bw = bits/second (0 means no limits), 15643b3a8eb9SGleb Smirnoff * delay = ms, must be translated into ticks. 15653b3a8eb9SGleb Smirnoff * qsize = slots/bytes 15663b3a8eb9SGleb Smirnoff * burst ??? 15673b3a8eb9SGleb Smirnoff */ 15683b3a8eb9SGleb Smirnoff p->delay = (p->delay * hz) / 1000; 15693b3a8eb9SGleb Smirnoff /* Scale burst size: bytes -> bits * hz */ 15703b3a8eb9SGleb Smirnoff p->burst *= 8 * hz; 15713b3a8eb9SGleb Smirnoff 15723b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 15733b3a8eb9SGleb Smirnoff /* do it twice, base link and FIFO link */ 15743b3a8eb9SGleb Smirnoff for (; i < 2*DN_MAX_ID; i += DN_MAX_ID) { 15753b3a8eb9SGleb Smirnoff struct dn_schk *s = locate_scheduler(i); 15763b3a8eb9SGleb Smirnoff if (s == NULL) { 15773b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 15783b3a8eb9SGleb Smirnoff D("sched %d not found", i); 15793b3a8eb9SGleb Smirnoff return EINVAL; 15803b3a8eb9SGleb Smirnoff } 15813b3a8eb9SGleb Smirnoff /* remove profile if exists */ 15823b3a8eb9SGleb Smirnoff if (s->profile) { 15833b3a8eb9SGleb Smirnoff free(s->profile, M_DUMMYNET); 15843b3a8eb9SGleb Smirnoff s->profile = NULL; 15853b3a8eb9SGleb Smirnoff } 15863b3a8eb9SGleb Smirnoff /* copy all parameters */ 15873b3a8eb9SGleb Smirnoff s->link.oid = p->oid; 15883b3a8eb9SGleb Smirnoff s->link.link_nr = i; 15893b3a8eb9SGleb Smirnoff s->link.delay = p->delay; 15903b3a8eb9SGleb Smirnoff if (s->link.bandwidth != p->bandwidth) { 15913b3a8eb9SGleb Smirnoff /* XXX bandwidth changes, need to update red params */ 15923b3a8eb9SGleb Smirnoff s->link.bandwidth = p->bandwidth; 15933b3a8eb9SGleb Smirnoff update_red(s); 15943b3a8eb9SGleb Smirnoff } 15953b3a8eb9SGleb Smirnoff s->link.burst = p->burst; 15963b3a8eb9SGleb Smirnoff schk_reset_credit(s); 15973b3a8eb9SGleb Smirnoff } 1598fe3bcfbdSTom Jones V_dn_cfg.id++; 15993b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 16003b3a8eb9SGleb Smirnoff return 0; 16013b3a8eb9SGleb Smirnoff } 16023b3a8eb9SGleb Smirnoff 16033b3a8eb9SGleb Smirnoff /* 16043b3a8eb9SGleb Smirnoff * configure a flowset. Can be called from inside with locked=1, 16053b3a8eb9SGleb Smirnoff */ 16063b3a8eb9SGleb Smirnoff static struct dn_fsk * 16073b3a8eb9SGleb Smirnoff config_fs(struct dn_fs *nfs, struct dn_id *arg, int locked) 16083b3a8eb9SGleb Smirnoff { 16093b3a8eb9SGleb Smirnoff int i; 16103b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 16110ac43d97SMarius Strobl #ifdef NEW_AQM 16120ac43d97SMarius Strobl struct dn_extra_parms *ep; 16130ac43d97SMarius Strobl #endif 16143b3a8eb9SGleb Smirnoff 16153b3a8eb9SGleb Smirnoff if (nfs->oid.len != sizeof(*nfs)) { 16163b3a8eb9SGleb Smirnoff D("invalid flowset len %d", nfs->oid.len); 16173b3a8eb9SGleb Smirnoff return NULL; 16183b3a8eb9SGleb Smirnoff } 16193b3a8eb9SGleb Smirnoff i = nfs->fs_nr; 16203b3a8eb9SGleb Smirnoff if (i <= 0 || i >= 3*DN_MAX_ID) 16213b3a8eb9SGleb Smirnoff return NULL; 16220ac43d97SMarius Strobl #ifdef NEW_AQM 16230ac43d97SMarius Strobl ep = NULL; 16240ac43d97SMarius Strobl if (arg != NULL) { 1625*51d73df1SKristof Provost ep = malloc(sizeof(*ep), M_TEMP, M_NOWAIT); 16260ac43d97SMarius Strobl if (ep == NULL) 16270ac43d97SMarius Strobl return (NULL); 16280ac43d97SMarius Strobl memcpy(ep, arg, sizeof(*ep)); 16290ac43d97SMarius Strobl } 16300ac43d97SMarius Strobl #endif 16313b3a8eb9SGleb Smirnoff ND("flowset %d", i); 16323b3a8eb9SGleb Smirnoff /* XXX other sanity checks */ 16333b3a8eb9SGleb Smirnoff if (nfs->flags & DN_QSIZE_BYTES) { 16343b3a8eb9SGleb Smirnoff ipdn_bound_var(&nfs->qsize, 16384, 1635fe3bcfbdSTom Jones 1500, V_dn_cfg.byte_limit, NULL); // "queue byte size"); 16363b3a8eb9SGleb Smirnoff } else { 16373b3a8eb9SGleb Smirnoff ipdn_bound_var(&nfs->qsize, 50, 1638fe3bcfbdSTom Jones 1, V_dn_cfg.slot_limit, NULL); // "queue slot size"); 16393b3a8eb9SGleb Smirnoff } 16403b3a8eb9SGleb Smirnoff if (nfs->flags & DN_HAVE_MASK) { 16413b3a8eb9SGleb Smirnoff /* make sure we have some buckets */ 1642fe3bcfbdSTom Jones ipdn_bound_var((int *)&nfs->buckets, V_dn_cfg.hash_size, 1643fe3bcfbdSTom Jones 1, V_dn_cfg.max_hash_size, "flowset buckets"); 16443b3a8eb9SGleb Smirnoff } else { 16453b3a8eb9SGleb Smirnoff nfs->buckets = 1; /* we only need 1 */ 16463b3a8eb9SGleb Smirnoff } 16473b3a8eb9SGleb Smirnoff if (!locked) 16483b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 16493b3a8eb9SGleb Smirnoff do { /* exit with break when done */ 16503b3a8eb9SGleb Smirnoff struct dn_schk *s; 16513b3a8eb9SGleb Smirnoff int flags = nfs->sched_nr ? DNHT_INSERT : 0; 16523b3a8eb9SGleb Smirnoff int j; 1653fe3bcfbdSTom Jones int oldc = V_dn_cfg.fsk_count; 1654fe3bcfbdSTom Jones fs = dn_ht_find(V_dn_cfg.fshash, i, flags, NULL); 16553b3a8eb9SGleb Smirnoff if (fs == NULL) { 16563b3a8eb9SGleb Smirnoff D("missing sched for flowset %d", i); 16573b3a8eb9SGleb Smirnoff break; 16583b3a8eb9SGleb Smirnoff } 16593b3a8eb9SGleb Smirnoff /* grab some defaults from the existing one */ 16603b3a8eb9SGleb Smirnoff if (nfs->sched_nr == 0) /* reuse */ 16613b3a8eb9SGleb Smirnoff nfs->sched_nr = fs->fs.sched_nr; 16623b3a8eb9SGleb Smirnoff for (j = 0; j < sizeof(nfs->par)/sizeof(nfs->par[0]); j++) { 16633b3a8eb9SGleb Smirnoff if (nfs->par[j] == -1) /* reuse */ 16643b3a8eb9SGleb Smirnoff nfs->par[j] = fs->fs.par[j]; 16653b3a8eb9SGleb Smirnoff } 16663b3a8eb9SGleb Smirnoff if (bcmp(&fs->fs, nfs, sizeof(*nfs)) == 0) { 16673b3a8eb9SGleb Smirnoff ND("flowset %d unchanged", i); 166891336b40SDon Lewis #ifdef NEW_AQM 16690ac43d97SMarius Strobl if (ep != NULL) { 16700ac43d97SMarius Strobl /* 16710ac43d97SMarius Strobl * Reconfigure AQM as the parameters can be changed. 16720ac43d97SMarius Strobl * We consider the flowset as busy if it has scheduler 16730ac43d97SMarius Strobl * instance(s). 167491336b40SDon Lewis */ 167591336b40SDon Lewis s = locate_scheduler(nfs->sched_nr); 16760ac43d97SMarius Strobl config_aqm(fs, ep, s != NULL && s->siht != NULL); 16770ac43d97SMarius Strobl } 167891336b40SDon Lewis #endif 16793b3a8eb9SGleb Smirnoff break; /* no change, nothing to do */ 16803b3a8eb9SGleb Smirnoff } 1681fe3bcfbdSTom Jones if (oldc != V_dn_cfg.fsk_count) /* new item */ 1682fe3bcfbdSTom Jones V_dn_cfg.id++; 16833b3a8eb9SGleb Smirnoff s = locate_scheduler(nfs->sched_nr); 16843b3a8eb9SGleb Smirnoff /* detach from old scheduler if needed, preserving 16853b3a8eb9SGleb Smirnoff * queues if we need to reattach. Then update the 16863b3a8eb9SGleb Smirnoff * configuration, and possibly attach to the new sched. 16873b3a8eb9SGleb Smirnoff */ 16883b3a8eb9SGleb Smirnoff DX(2, "fs %d changed sched %d@%p to %d@%p", 16893b3a8eb9SGleb Smirnoff fs->fs.fs_nr, 16903b3a8eb9SGleb Smirnoff fs->fs.sched_nr, fs->sched, nfs->sched_nr, s); 16913b3a8eb9SGleb Smirnoff if (fs->sched) { 16923b3a8eb9SGleb Smirnoff int flags = s ? DN_DETACH : (DN_DETACH | DN_DESTROY); 16933b3a8eb9SGleb Smirnoff flags |= DN_DESTROY; /* XXX temporary */ 16943b3a8eb9SGleb Smirnoff fsk_detach(fs, flags); 16953b3a8eb9SGleb Smirnoff } 16963b3a8eb9SGleb Smirnoff fs->fs = *nfs; /* copy configuration */ 169791336b40SDon Lewis #ifdef NEW_AQM 169891336b40SDon Lewis fs->aqmfp = NULL; 16990ac43d97SMarius Strobl if (ep != NULL) 17000ac43d97SMarius Strobl config_aqm(fs, ep, s != NULL && 17010ac43d97SMarius Strobl s->siht != NULL); 170291336b40SDon Lewis #endif 17033b3a8eb9SGleb Smirnoff if (s != NULL) 17043b3a8eb9SGleb Smirnoff fsk_attach(fs, s); 17053b3a8eb9SGleb Smirnoff } while (0); 17063b3a8eb9SGleb Smirnoff if (!locked) 17073b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 17080ac43d97SMarius Strobl #ifdef NEW_AQM 17090ac43d97SMarius Strobl if (ep != NULL) 17100ac43d97SMarius Strobl free(ep, M_TEMP); 17110ac43d97SMarius Strobl #endif 17123b3a8eb9SGleb Smirnoff return fs; 17133b3a8eb9SGleb Smirnoff } 17143b3a8eb9SGleb Smirnoff 17153b3a8eb9SGleb Smirnoff /* 17163b3a8eb9SGleb Smirnoff * config/reconfig a scheduler and its FIFO variant. 17173b3a8eb9SGleb Smirnoff * For !MULTIQUEUE schedulers, also set up the flowset. 17183b3a8eb9SGleb Smirnoff * 17193b3a8eb9SGleb Smirnoff * On reconfigurations (detected because s->fp is set), 17203b3a8eb9SGleb Smirnoff * detach existing flowsets preserving traffic, preserve link, 17213b3a8eb9SGleb Smirnoff * and delete the old scheduler creating a new one. 17223b3a8eb9SGleb Smirnoff */ 17233b3a8eb9SGleb Smirnoff static int 17243b3a8eb9SGleb Smirnoff config_sched(struct dn_sch *_nsch, struct dn_id *arg) 17253b3a8eb9SGleb Smirnoff { 17263b3a8eb9SGleb Smirnoff struct dn_schk *s; 17273b3a8eb9SGleb Smirnoff struct schk_new_arg a; /* argument for schk_new */ 17283b3a8eb9SGleb Smirnoff int i; 17293b3a8eb9SGleb Smirnoff struct dn_link p; /* copy of oldlink */ 17303b3a8eb9SGleb Smirnoff struct dn_profile *pf = NULL; /* copy of old link profile */ 17313b3a8eb9SGleb Smirnoff /* Used to preserv mask parameter */ 17323b3a8eb9SGleb Smirnoff struct ipfw_flow_id new_mask; 17333b3a8eb9SGleb Smirnoff int new_buckets = 0; 17343b3a8eb9SGleb Smirnoff int new_flags = 0; 17353b3a8eb9SGleb Smirnoff int pipe_cmd; 17363b3a8eb9SGleb Smirnoff int err = ENOMEM; 17373b3a8eb9SGleb Smirnoff 1738*51d73df1SKristof Provost NET_EPOCH_ASSERT(); 1739*51d73df1SKristof Provost 17403b3a8eb9SGleb Smirnoff a.sch = _nsch; 17413b3a8eb9SGleb Smirnoff if (a.sch->oid.len != sizeof(*a.sch)) { 17423b3a8eb9SGleb Smirnoff D("bad sched len %d", a.sch->oid.len); 17433b3a8eb9SGleb Smirnoff return EINVAL; 17443b3a8eb9SGleb Smirnoff } 17453b3a8eb9SGleb Smirnoff i = a.sch->sched_nr; 17463b3a8eb9SGleb Smirnoff if (i <= 0 || i >= DN_MAX_ID) 17473b3a8eb9SGleb Smirnoff return EINVAL; 17483b3a8eb9SGleb Smirnoff /* make sure we have some buckets */ 17493b3a8eb9SGleb Smirnoff if (a.sch->flags & DN_HAVE_MASK) 1750fe3bcfbdSTom Jones ipdn_bound_var((int *)&a.sch->buckets, V_dn_cfg.hash_size, 1751fe3bcfbdSTom Jones 1, V_dn_cfg.max_hash_size, "sched buckets"); 17523b3a8eb9SGleb Smirnoff /* XXX other sanity checks */ 17533b3a8eb9SGleb Smirnoff bzero(&p, sizeof(p)); 17543b3a8eb9SGleb Smirnoff 17553b3a8eb9SGleb Smirnoff pipe_cmd = a.sch->flags & DN_PIPE_CMD; 17563b3a8eb9SGleb Smirnoff a.sch->flags &= ~DN_PIPE_CMD; //XXX do it even if is not set? 17573b3a8eb9SGleb Smirnoff if (pipe_cmd) { 17583b3a8eb9SGleb Smirnoff /* Copy mask parameter */ 17593b3a8eb9SGleb Smirnoff new_mask = a.sch->sched_mask; 17603b3a8eb9SGleb Smirnoff new_buckets = a.sch->buckets; 17613b3a8eb9SGleb Smirnoff new_flags = a.sch->flags; 17623b3a8eb9SGleb Smirnoff } 17633b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 17643b3a8eb9SGleb Smirnoff again: /* run twice, for wfq and fifo */ 17653b3a8eb9SGleb Smirnoff /* 17663b3a8eb9SGleb Smirnoff * lookup the type. If not supplied, use the previous one 17673b3a8eb9SGleb Smirnoff * or default to WF2Q+. Otherwise, return an error. 17683b3a8eb9SGleb Smirnoff */ 1769fe3bcfbdSTom Jones V_dn_cfg.id++; 17703b3a8eb9SGleb Smirnoff a.fp = find_sched_type(a.sch->oid.subtype, a.sch->name); 17713b3a8eb9SGleb Smirnoff if (a.fp != NULL) { 17723b3a8eb9SGleb Smirnoff /* found. Lookup or create entry */ 1773fe3bcfbdSTom Jones s = dn_ht_find(V_dn_cfg.schedhash, i, DNHT_INSERT, &a); 17743b3a8eb9SGleb Smirnoff } else if (a.sch->oid.subtype == 0 && !a.sch->name[0]) { 17753b3a8eb9SGleb Smirnoff /* No type. search existing s* or retry with WF2Q+ */ 1776fe3bcfbdSTom Jones s = dn_ht_find(V_dn_cfg.schedhash, i, 0, &a); 17773b3a8eb9SGleb Smirnoff if (s != NULL) { 17783b3a8eb9SGleb Smirnoff a.fp = s->fp; 17793b3a8eb9SGleb Smirnoff /* Scheduler exists, skip to FIFO scheduler 17803b3a8eb9SGleb Smirnoff * if command was pipe config... 17813b3a8eb9SGleb Smirnoff */ 17823b3a8eb9SGleb Smirnoff if (pipe_cmd) 17833b3a8eb9SGleb Smirnoff goto next; 17843b3a8eb9SGleb Smirnoff } else { 17853b3a8eb9SGleb Smirnoff /* New scheduler, create a wf2q+ with no mask 17863b3a8eb9SGleb Smirnoff * if command was pipe config... 17873b3a8eb9SGleb Smirnoff */ 17883b3a8eb9SGleb Smirnoff if (pipe_cmd) { 17893b3a8eb9SGleb Smirnoff /* clear mask parameter */ 17903b3a8eb9SGleb Smirnoff bzero(&a.sch->sched_mask, sizeof(new_mask)); 17913b3a8eb9SGleb Smirnoff a.sch->buckets = 0; 17923b3a8eb9SGleb Smirnoff a.sch->flags &= ~DN_HAVE_MASK; 17933b3a8eb9SGleb Smirnoff } 17943b3a8eb9SGleb Smirnoff a.sch->oid.subtype = DN_SCHED_WF2QP; 17953b3a8eb9SGleb Smirnoff goto again; 17963b3a8eb9SGleb Smirnoff } 17973b3a8eb9SGleb Smirnoff } else { 17983b3a8eb9SGleb Smirnoff D("invalid scheduler type %d %s", 17993b3a8eb9SGleb Smirnoff a.sch->oid.subtype, a.sch->name); 18003b3a8eb9SGleb Smirnoff err = EINVAL; 18013b3a8eb9SGleb Smirnoff goto error; 18023b3a8eb9SGleb Smirnoff } 18033b3a8eb9SGleb Smirnoff /* normalize name and subtype */ 18043b3a8eb9SGleb Smirnoff a.sch->oid.subtype = a.fp->type; 18053b3a8eb9SGleb Smirnoff bzero(a.sch->name, sizeof(a.sch->name)); 18063b3a8eb9SGleb Smirnoff strlcpy(a.sch->name, a.fp->name, sizeof(a.sch->name)); 18073b3a8eb9SGleb Smirnoff if (s == NULL) { 18083b3a8eb9SGleb Smirnoff D("cannot allocate scheduler %d", i); 18093b3a8eb9SGleb Smirnoff goto error; 18103b3a8eb9SGleb Smirnoff } 18113b3a8eb9SGleb Smirnoff /* restore existing link if any */ 18123b3a8eb9SGleb Smirnoff if (p.link_nr) { 18133b3a8eb9SGleb Smirnoff s->link = p; 18143b3a8eb9SGleb Smirnoff if (!pf || pf->link_nr != p.link_nr) { /* no saved value */ 18153b3a8eb9SGleb Smirnoff s->profile = NULL; /* XXX maybe not needed */ 18163b3a8eb9SGleb Smirnoff } else { 18173b3a8eb9SGleb Smirnoff s->profile = malloc(sizeof(struct dn_profile), 18183b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT | M_ZERO); 18193b3a8eb9SGleb Smirnoff if (s->profile == NULL) { 18203b3a8eb9SGleb Smirnoff D("cannot allocate profile"); 18213b3a8eb9SGleb Smirnoff goto error; //XXX 18223b3a8eb9SGleb Smirnoff } 18230ac43d97SMarius Strobl memcpy(s->profile, pf, sizeof(*pf)); 18243b3a8eb9SGleb Smirnoff } 18253b3a8eb9SGleb Smirnoff } 18263b3a8eb9SGleb Smirnoff p.link_nr = 0; 18273b3a8eb9SGleb Smirnoff if (s->fp == NULL) { 18283b3a8eb9SGleb Smirnoff DX(2, "sched %d new type %s", i, a.fp->name); 18293b3a8eb9SGleb Smirnoff } else if (s->fp != a.fp || 18303b3a8eb9SGleb Smirnoff bcmp(a.sch, &s->sch, sizeof(*a.sch)) ) { 18313b3a8eb9SGleb Smirnoff /* already existing. */ 18323b3a8eb9SGleb Smirnoff DX(2, "sched %d type changed from %s to %s", 18333b3a8eb9SGleb Smirnoff i, s->fp->name, a.fp->name); 18343b3a8eb9SGleb Smirnoff DX(4, " type/sub %d/%d -> %d/%d", 18353b3a8eb9SGleb Smirnoff s->sch.oid.type, s->sch.oid.subtype, 18363b3a8eb9SGleb Smirnoff a.sch->oid.type, a.sch->oid.subtype); 18373b3a8eb9SGleb Smirnoff if (s->link.link_nr == 0) 18383b3a8eb9SGleb Smirnoff D("XXX WARNING link 0 for sched %d", i); 18393b3a8eb9SGleb Smirnoff p = s->link; /* preserve link */ 18403b3a8eb9SGleb Smirnoff if (s->profile) {/* preserve profile */ 18413b3a8eb9SGleb Smirnoff if (!pf) 18423b3a8eb9SGleb Smirnoff pf = malloc(sizeof(*pf), 18433b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT | M_ZERO); 18443b3a8eb9SGleb Smirnoff if (pf) /* XXX should issue a warning otherwise */ 18450ac43d97SMarius Strobl memcpy(pf, s->profile, sizeof(*pf)); 18463b3a8eb9SGleb Smirnoff } 18473b3a8eb9SGleb Smirnoff /* remove from the hash */ 1848fe3bcfbdSTom Jones dn_ht_find(V_dn_cfg.schedhash, i, DNHT_REMOVE, NULL); 18493b3a8eb9SGleb Smirnoff /* Detach flowsets, preserve queues. */ 18503b3a8eb9SGleb Smirnoff // schk_delete_cb(s, NULL); 18513b3a8eb9SGleb Smirnoff // XXX temporarily, kill queues 18523b3a8eb9SGleb Smirnoff schk_delete_cb(s, (void *)DN_DESTROY); 18533b3a8eb9SGleb Smirnoff goto again; 18543b3a8eb9SGleb Smirnoff } else { 18553b3a8eb9SGleb Smirnoff DX(4, "sched %d unchanged type %s", i, a.fp->name); 18563b3a8eb9SGleb Smirnoff } 18573b3a8eb9SGleb Smirnoff /* complete initialization */ 18583b3a8eb9SGleb Smirnoff s->sch = *a.sch; 18593b3a8eb9SGleb Smirnoff s->fp = a.fp; 18603b3a8eb9SGleb Smirnoff s->cfg = arg; 18613b3a8eb9SGleb Smirnoff // XXX schk_reset_credit(s); 18623b3a8eb9SGleb Smirnoff /* create the internal flowset if needed, 18633b3a8eb9SGleb Smirnoff * trying to reuse existing ones if available 18643b3a8eb9SGleb Smirnoff */ 18653b3a8eb9SGleb Smirnoff if (!(s->fp->flags & DN_MULTIQUEUE) && !s->fs) { 1866fe3bcfbdSTom Jones s->fs = dn_ht_find(V_dn_cfg.fshash, i, 0, NULL); 18673b3a8eb9SGleb Smirnoff if (!s->fs) { 18683b3a8eb9SGleb Smirnoff struct dn_fs fs; 18693b3a8eb9SGleb Smirnoff bzero(&fs, sizeof(fs)); 18703b3a8eb9SGleb Smirnoff set_oid(&fs.oid, DN_FS, sizeof(fs)); 18713b3a8eb9SGleb Smirnoff fs.fs_nr = i + DN_MAX_ID; 18723b3a8eb9SGleb Smirnoff fs.sched_nr = i; 18733b3a8eb9SGleb Smirnoff s->fs = config_fs(&fs, NULL, 1 /* locked */); 18743b3a8eb9SGleb Smirnoff } 18753b3a8eb9SGleb Smirnoff if (!s->fs) { 18763b3a8eb9SGleb Smirnoff schk_delete_cb(s, (void *)DN_DESTROY); 18773b3a8eb9SGleb Smirnoff D("error creating internal fs for %d", i); 18783b3a8eb9SGleb Smirnoff goto error; 18793b3a8eb9SGleb Smirnoff } 18803b3a8eb9SGleb Smirnoff } 18813b3a8eb9SGleb Smirnoff /* call init function after the flowset is created */ 18823b3a8eb9SGleb Smirnoff if (s->fp->config) 18833b3a8eb9SGleb Smirnoff s->fp->config(s); 18843b3a8eb9SGleb Smirnoff update_fs(s); 18853b3a8eb9SGleb Smirnoff next: 18863b3a8eb9SGleb Smirnoff if (i < DN_MAX_ID) { /* now configure the FIFO instance */ 18873b3a8eb9SGleb Smirnoff i += DN_MAX_ID; 18883b3a8eb9SGleb Smirnoff if (pipe_cmd) { 18893b3a8eb9SGleb Smirnoff /* Restore mask parameter for FIFO */ 18903b3a8eb9SGleb Smirnoff a.sch->sched_mask = new_mask; 18913b3a8eb9SGleb Smirnoff a.sch->buckets = new_buckets; 18923b3a8eb9SGleb Smirnoff a.sch->flags = new_flags; 18933b3a8eb9SGleb Smirnoff } else { 18943b3a8eb9SGleb Smirnoff /* sched config shouldn't modify the FIFO scheduler */ 1895fe3bcfbdSTom Jones if (dn_ht_find(V_dn_cfg.schedhash, i, 0, &a) != NULL) { 18963b3a8eb9SGleb Smirnoff /* FIFO already exist, don't touch it */ 18973b3a8eb9SGleb Smirnoff err = 0; /* and this is not an error */ 18983b3a8eb9SGleb Smirnoff goto error; 18993b3a8eb9SGleb Smirnoff } 19003b3a8eb9SGleb Smirnoff } 19013b3a8eb9SGleb Smirnoff a.sch->sched_nr = i; 19023b3a8eb9SGleb Smirnoff a.sch->oid.subtype = DN_SCHED_FIFO; 19033b3a8eb9SGleb Smirnoff bzero(a.sch->name, sizeof(a.sch->name)); 19043b3a8eb9SGleb Smirnoff goto again; 19053b3a8eb9SGleb Smirnoff } 19063b3a8eb9SGleb Smirnoff err = 0; 19073b3a8eb9SGleb Smirnoff error: 19083b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 19093b3a8eb9SGleb Smirnoff if (pf) 19103b3a8eb9SGleb Smirnoff free(pf, M_DUMMYNET); 19113b3a8eb9SGleb Smirnoff return err; 19123b3a8eb9SGleb Smirnoff } 19133b3a8eb9SGleb Smirnoff 19143b3a8eb9SGleb Smirnoff /* 19153b3a8eb9SGleb Smirnoff * attach a profile to a link 19163b3a8eb9SGleb Smirnoff */ 19173b3a8eb9SGleb Smirnoff static int 19183b3a8eb9SGleb Smirnoff config_profile(struct dn_profile *pf, struct dn_id *arg) 19193b3a8eb9SGleb Smirnoff { 19203b3a8eb9SGleb Smirnoff struct dn_schk *s; 19213b3a8eb9SGleb Smirnoff int i, olen, err = 0; 19223b3a8eb9SGleb Smirnoff 19233b3a8eb9SGleb Smirnoff if (pf->oid.len < sizeof(*pf)) { 19243b3a8eb9SGleb Smirnoff D("short profile len %d", pf->oid.len); 19253b3a8eb9SGleb Smirnoff return EINVAL; 19263b3a8eb9SGleb Smirnoff } 19273b3a8eb9SGleb Smirnoff i = pf->link_nr; 19283b3a8eb9SGleb Smirnoff if (i <= 0 || i >= DN_MAX_ID) 19293b3a8eb9SGleb Smirnoff return EINVAL; 19303b3a8eb9SGleb Smirnoff /* XXX other sanity checks */ 19313b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 19323b3a8eb9SGleb Smirnoff for (; i < 2*DN_MAX_ID; i += DN_MAX_ID) { 19333b3a8eb9SGleb Smirnoff s = locate_scheduler(i); 19343b3a8eb9SGleb Smirnoff 19353b3a8eb9SGleb Smirnoff if (s == NULL) { 19363b3a8eb9SGleb Smirnoff err = EINVAL; 19373b3a8eb9SGleb Smirnoff break; 19383b3a8eb9SGleb Smirnoff } 1939fe3bcfbdSTom Jones V_dn_cfg.id++; 19403b3a8eb9SGleb Smirnoff /* 19413b3a8eb9SGleb Smirnoff * If we had a profile and the new one does not fit, 19423b3a8eb9SGleb Smirnoff * or it is deleted, then we need to free memory. 19433b3a8eb9SGleb Smirnoff */ 19443b3a8eb9SGleb Smirnoff if (s->profile && (pf->samples_no == 0 || 19453b3a8eb9SGleb Smirnoff s->profile->oid.len < pf->oid.len)) { 19463b3a8eb9SGleb Smirnoff free(s->profile, M_DUMMYNET); 19473b3a8eb9SGleb Smirnoff s->profile = NULL; 19483b3a8eb9SGleb Smirnoff } 19493b3a8eb9SGleb Smirnoff if (pf->samples_no == 0) 19503b3a8eb9SGleb Smirnoff continue; 19513b3a8eb9SGleb Smirnoff /* 19523b3a8eb9SGleb Smirnoff * new profile, possibly allocate memory 19533b3a8eb9SGleb Smirnoff * and copy data. 19543b3a8eb9SGleb Smirnoff */ 19553b3a8eb9SGleb Smirnoff if (s->profile == NULL) 19563b3a8eb9SGleb Smirnoff s->profile = malloc(pf->oid.len, 19573b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT | M_ZERO); 19583b3a8eb9SGleb Smirnoff if (s->profile == NULL) { 19593b3a8eb9SGleb Smirnoff D("no memory for profile %d", i); 19603b3a8eb9SGleb Smirnoff err = ENOMEM; 19613b3a8eb9SGleb Smirnoff break; 19623b3a8eb9SGleb Smirnoff } 19633b3a8eb9SGleb Smirnoff /* preserve larger length XXX double check */ 19643b3a8eb9SGleb Smirnoff olen = s->profile->oid.len; 19653b3a8eb9SGleb Smirnoff if (olen < pf->oid.len) 19663b3a8eb9SGleb Smirnoff olen = pf->oid.len; 19670ac43d97SMarius Strobl memcpy(s->profile, pf, pf->oid.len); 19683b3a8eb9SGleb Smirnoff s->profile->oid.len = olen; 19693b3a8eb9SGleb Smirnoff } 19703b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 19713b3a8eb9SGleb Smirnoff return err; 19723b3a8eb9SGleb Smirnoff } 19733b3a8eb9SGleb Smirnoff 19743b3a8eb9SGleb Smirnoff /* 19753b3a8eb9SGleb Smirnoff * Delete all objects: 19763b3a8eb9SGleb Smirnoff */ 19773b3a8eb9SGleb Smirnoff static void 19783b3a8eb9SGleb Smirnoff dummynet_flush(void) 19793b3a8eb9SGleb Smirnoff { 19803b3a8eb9SGleb Smirnoff 19813b3a8eb9SGleb Smirnoff /* delete all schedulers and related links/queues/flowsets */ 1982fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.schedhash, schk_delete_cb, 19833b3a8eb9SGleb Smirnoff (void *)(uintptr_t)DN_DELETE_FS); 19843b3a8eb9SGleb Smirnoff /* delete all remaining (unlinked) flowsets */ 1985fe3bcfbdSTom Jones DX(4, "still %d unlinked fs", V_dn_cfg.fsk_count); 1986fe3bcfbdSTom Jones dn_ht_free(V_dn_cfg.fshash, DNHT_REMOVE); 1987fe3bcfbdSTom Jones fsk_detach_list(&V_dn_cfg.fsu, DN_DELETE_FS); 19883b3a8eb9SGleb Smirnoff /* Reinitialize system heap... */ 1989fe3bcfbdSTom Jones heap_init(&V_dn_cfg.evheap, 16, offsetof(struct dn_id, id)); 19903b3a8eb9SGleb Smirnoff } 19913b3a8eb9SGleb Smirnoff 19923b3a8eb9SGleb Smirnoff /* 19933b3a8eb9SGleb Smirnoff * Main handler for configuration. We are guaranteed to be called 19943b3a8eb9SGleb Smirnoff * with an oid which is at least a dn_id. 19953b3a8eb9SGleb Smirnoff * - the first object is the command (config, delete, flush, ...) 19963b3a8eb9SGleb Smirnoff * - config_link must be issued after the corresponding config_sched 1997a4641f4eSPedro F. Giffuni * - parameters (DN_TXT) for an object must precede the object 19983b3a8eb9SGleb Smirnoff * processed on a config_sched. 19993b3a8eb9SGleb Smirnoff */ 20003b3a8eb9SGleb Smirnoff int 20013b3a8eb9SGleb Smirnoff do_config(void *p, int l) 20023b3a8eb9SGleb Smirnoff { 20030ac43d97SMarius Strobl struct dn_id o; 20040ac43d97SMarius Strobl union { 20050ac43d97SMarius Strobl struct dn_profile profile; 20060ac43d97SMarius Strobl struct dn_fs fs; 20070ac43d97SMarius Strobl struct dn_link link; 20080ac43d97SMarius Strobl struct dn_sch sched; 20090ac43d97SMarius Strobl } *dn; 20100ac43d97SMarius Strobl struct dn_id *arg; 20110ac43d97SMarius Strobl uintptr_t a; 20120ac43d97SMarius Strobl int err, err2, off; 20133b3a8eb9SGleb Smirnoff 20140ac43d97SMarius Strobl memcpy(&o, p, sizeof(o)); 20150ac43d97SMarius Strobl if (o.id != DN_API_VERSION) { 20160ac43d97SMarius Strobl D("invalid api version got %d need %d", o.id, DN_API_VERSION); 20173b3a8eb9SGleb Smirnoff return EINVAL; 20183b3a8eb9SGleb Smirnoff } 20190ac43d97SMarius Strobl arg = NULL; 20200ac43d97SMarius Strobl dn = NULL; 20210ac43d97SMarius Strobl for (off = 0; l >= sizeof(o); memcpy(&o, (char *)p + off, sizeof(o))) { 20220ac43d97SMarius Strobl if (o.len < sizeof(o) || l < o.len) { 20230ac43d97SMarius Strobl D("bad len o.len %d len %d", o.len, l); 20243b3a8eb9SGleb Smirnoff err = EINVAL; 20253b3a8eb9SGleb Smirnoff break; 20263b3a8eb9SGleb Smirnoff } 20270ac43d97SMarius Strobl l -= o.len; 20283b3a8eb9SGleb Smirnoff err = 0; 20290ac43d97SMarius Strobl switch (o.type) { 20303b3a8eb9SGleb Smirnoff default: 20310ac43d97SMarius Strobl D("cmd %d not implemented", o.type); 20323b3a8eb9SGleb Smirnoff break; 20333b3a8eb9SGleb Smirnoff 20343b3a8eb9SGleb Smirnoff #ifdef EMULATE_SYSCTL 20353b3a8eb9SGleb Smirnoff /* sysctl emulation. 20363b3a8eb9SGleb Smirnoff * if we recognize the command, jump to the correct 20373b3a8eb9SGleb Smirnoff * handler and return 20383b3a8eb9SGleb Smirnoff */ 20393b3a8eb9SGleb Smirnoff case DN_SYSCTL_SET: 20403b3a8eb9SGleb Smirnoff err = kesysctl_emu_set(p, l); 20413b3a8eb9SGleb Smirnoff return err; 20423b3a8eb9SGleb Smirnoff #endif 20433b3a8eb9SGleb Smirnoff 20443b3a8eb9SGleb Smirnoff case DN_CMD_CONFIG: /* simply a header */ 20453b3a8eb9SGleb Smirnoff break; 20463b3a8eb9SGleb Smirnoff 20473b3a8eb9SGleb Smirnoff case DN_CMD_DELETE: 20483b3a8eb9SGleb Smirnoff /* the argument is in the first uintptr_t after o */ 20490ac43d97SMarius Strobl if (o.len < sizeof(o) + sizeof(a)) { 20503b3a8eb9SGleb Smirnoff err = EINVAL; 20513b3a8eb9SGleb Smirnoff break; 20523b3a8eb9SGleb Smirnoff } 20530ac43d97SMarius Strobl memcpy(&a, (char *)p + off + sizeof(o), sizeof(a)); 20540ac43d97SMarius Strobl switch (o.subtype) { 20553b3a8eb9SGleb Smirnoff case DN_LINK: 20563b3a8eb9SGleb Smirnoff /* delete base and derived schedulers */ 20573b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 20580ac43d97SMarius Strobl err = delete_schk(a); 20590ac43d97SMarius Strobl err2 = delete_schk(a + DN_MAX_ID); 20603b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 20613b3a8eb9SGleb Smirnoff if (!err) 20623b3a8eb9SGleb Smirnoff err = err2; 20633b3a8eb9SGleb Smirnoff break; 20643b3a8eb9SGleb Smirnoff 20653b3a8eb9SGleb Smirnoff default: 20660ac43d97SMarius Strobl D("invalid delete type %d", o.subtype); 20673b3a8eb9SGleb Smirnoff err = EINVAL; 20683b3a8eb9SGleb Smirnoff break; 20693b3a8eb9SGleb Smirnoff 20703b3a8eb9SGleb Smirnoff case DN_FS: 20710ac43d97SMarius Strobl err = (a < 1 || a >= DN_MAX_ID) ? 20720ac43d97SMarius Strobl EINVAL : delete_fs(a, 0) ; 20733b3a8eb9SGleb Smirnoff break; 20743b3a8eb9SGleb Smirnoff } 20753b3a8eb9SGleb Smirnoff break; 20763b3a8eb9SGleb Smirnoff 20773b3a8eb9SGleb Smirnoff case DN_CMD_FLUSH: 20783b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 20793b3a8eb9SGleb Smirnoff dummynet_flush(); 20803b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 20813b3a8eb9SGleb Smirnoff break; 20820ac43d97SMarius Strobl case DN_TEXT: /* store argument of next block */ 20830ac43d97SMarius Strobl free(arg, M_TEMP); 2084*51d73df1SKristof Provost arg = malloc(o.len, M_TEMP, M_NOWAIT); 2085*51d73df1SKristof Provost if (arg == NULL) { 2086*51d73df1SKristof Provost err = ENOMEM; 2087*51d73df1SKristof Provost break; 2088*51d73df1SKristof Provost } 20890ac43d97SMarius Strobl memcpy(arg, (char *)p + off, o.len); 20903b3a8eb9SGleb Smirnoff break; 20913b3a8eb9SGleb Smirnoff case DN_LINK: 20920ac43d97SMarius Strobl if (dn == NULL) 2093*51d73df1SKristof Provost dn = malloc(sizeof(*dn), M_TEMP, M_NOWAIT); 2094*51d73df1SKristof Provost if (dn == NULL) { 2095*51d73df1SKristof Provost err = ENOMEM; 2096*51d73df1SKristof Provost break; 2097*51d73df1SKristof Provost } 20980ac43d97SMarius Strobl memcpy(&dn->link, (char *)p + off, sizeof(dn->link)); 20990ac43d97SMarius Strobl err = config_link(&dn->link, arg); 21003b3a8eb9SGleb Smirnoff break; 21013b3a8eb9SGleb Smirnoff case DN_PROFILE: 21020ac43d97SMarius Strobl if (dn == NULL) 2103*51d73df1SKristof Provost dn = malloc(sizeof(*dn), M_TEMP, M_NOWAIT); 2104*51d73df1SKristof Provost if (dn == NULL) { 2105*51d73df1SKristof Provost err = ENOMEM; 2106*51d73df1SKristof Provost break; 2107*51d73df1SKristof Provost } 21080ac43d97SMarius Strobl memcpy(&dn->profile, (char *)p + off, 21090ac43d97SMarius Strobl sizeof(dn->profile)); 21100ac43d97SMarius Strobl err = config_profile(&dn->profile, arg); 21113b3a8eb9SGleb Smirnoff break; 21123b3a8eb9SGleb Smirnoff case DN_SCH: 21130ac43d97SMarius Strobl if (dn == NULL) 2114*51d73df1SKristof Provost dn = malloc(sizeof(*dn), M_TEMP, M_NOWAIT); 2115*51d73df1SKristof Provost if (dn == NULL) { 2116*51d73df1SKristof Provost err = ENOMEM; 2117*51d73df1SKristof Provost break; 2118*51d73df1SKristof Provost } 21190ac43d97SMarius Strobl memcpy(&dn->sched, (char *)p + off, 21200ac43d97SMarius Strobl sizeof(dn->sched)); 21210ac43d97SMarius Strobl err = config_sched(&dn->sched, arg); 21223b3a8eb9SGleb Smirnoff break; 21233b3a8eb9SGleb Smirnoff case DN_FS: 21240ac43d97SMarius Strobl if (dn == NULL) 2125*51d73df1SKristof Provost dn = malloc(sizeof(*dn), M_TEMP, M_NOWAIT); 2126*51d73df1SKristof Provost if (dn == NULL) { 2127*51d73df1SKristof Provost err = ENOMEM; 2128*51d73df1SKristof Provost break; 2129*51d73df1SKristof Provost } 21300ac43d97SMarius Strobl memcpy(&dn->fs, (char *)p + off, sizeof(dn->fs)); 21310ac43d97SMarius Strobl err = (NULL == config_fs(&dn->fs, arg, 0)); 21323b3a8eb9SGleb Smirnoff break; 21333b3a8eb9SGleb Smirnoff } 21343b3a8eb9SGleb Smirnoff if (err != 0) 21353b3a8eb9SGleb Smirnoff break; 21360ac43d97SMarius Strobl off += o.len; 21373b3a8eb9SGleb Smirnoff } 21380ac43d97SMarius Strobl if (arg != NULL) 21390ac43d97SMarius Strobl free(arg, M_TEMP); 21400ac43d97SMarius Strobl if (dn != NULL) 21410ac43d97SMarius Strobl free(dn, M_TEMP); 21423b3a8eb9SGleb Smirnoff return err; 21433b3a8eb9SGleb Smirnoff } 21443b3a8eb9SGleb Smirnoff 21453b3a8eb9SGleb Smirnoff static int 21463b3a8eb9SGleb Smirnoff compute_space(struct dn_id *cmd, struct copy_args *a) 21473b3a8eb9SGleb Smirnoff { 21483b3a8eb9SGleb Smirnoff int x = 0, need = 0; 21493b3a8eb9SGleb Smirnoff int profile_size = sizeof(struct dn_profile) - 21503b3a8eb9SGleb Smirnoff ED_MAX_SAMPLES_NO*sizeof(int); 21513b3a8eb9SGleb Smirnoff 21523b3a8eb9SGleb Smirnoff /* NOTE about compute space: 2153fe3bcfbdSTom Jones * NP = V_dn_cfg.schk_count 2154fe3bcfbdSTom Jones * NSI = V_dn_cfg.si_count 2155fe3bcfbdSTom Jones * NF = V_dn_cfg.fsk_count 2156fe3bcfbdSTom Jones * NQ = V_dn_cfg.queue_count 21573b3a8eb9SGleb Smirnoff * - ipfw pipe show 21583b3a8eb9SGleb Smirnoff * (NP/2)*(dn_link + dn_sch + dn_id + dn_fs) only half scheduler 21593b3a8eb9SGleb Smirnoff * link, scheduler template, flowset 21603b3a8eb9SGleb Smirnoff * integrated in scheduler and header 21613b3a8eb9SGleb Smirnoff * for flowset list 21623b3a8eb9SGleb Smirnoff * (NSI)*(dn_flow) all scheduler instance (includes 21633b3a8eb9SGleb Smirnoff * the queue instance) 21643b3a8eb9SGleb Smirnoff * - ipfw sched show 21653b3a8eb9SGleb Smirnoff * (NP/2)*(dn_link + dn_sch + dn_id + dn_fs) only half scheduler 21663b3a8eb9SGleb Smirnoff * link, scheduler template, flowset 21673b3a8eb9SGleb Smirnoff * integrated in scheduler and header 21683b3a8eb9SGleb Smirnoff * for flowset list 21693b3a8eb9SGleb Smirnoff * (NSI * dn_flow) all scheduler instances 21703b3a8eb9SGleb Smirnoff * (NF * sizeof(uint_32)) space for flowset list linked to scheduler 21713b3a8eb9SGleb Smirnoff * (NQ * dn_queue) all queue [XXXfor now not listed] 21723b3a8eb9SGleb Smirnoff * - ipfw queue show 21733b3a8eb9SGleb Smirnoff * (NF * dn_fs) all flowset 21743b3a8eb9SGleb Smirnoff * (NQ * dn_queue) all queues 21753b3a8eb9SGleb Smirnoff */ 21763b3a8eb9SGleb Smirnoff switch (cmd->subtype) { 21773b3a8eb9SGleb Smirnoff default: 21783b3a8eb9SGleb Smirnoff return -1; 21793b3a8eb9SGleb Smirnoff /* XXX where do LINK and SCH differ ? */ 21803b3a8eb9SGleb Smirnoff /* 'ipfw sched show' could list all queues associated to 21813b3a8eb9SGleb Smirnoff * a scheduler. This feature for now is disabled 21823b3a8eb9SGleb Smirnoff */ 21833b3a8eb9SGleb Smirnoff case DN_LINK: /* pipe show */ 21843b3a8eb9SGleb Smirnoff x = DN_C_LINK | DN_C_SCH | DN_C_FLOW; 2185fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * 21863b3a8eb9SGleb Smirnoff (sizeof(struct dn_fs) + profile_size) / 2; 2187fe3bcfbdSTom Jones need += V_dn_cfg.fsk_count * sizeof(uint32_t); 21883b3a8eb9SGleb Smirnoff break; 21893b3a8eb9SGleb Smirnoff case DN_SCH: /* sched show */ 2190fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * 21913b3a8eb9SGleb Smirnoff (sizeof(struct dn_fs) + profile_size) / 2; 2192fe3bcfbdSTom Jones need += V_dn_cfg.fsk_count * sizeof(uint32_t); 21933b3a8eb9SGleb Smirnoff x = DN_C_SCH | DN_C_LINK | DN_C_FLOW; 21943b3a8eb9SGleb Smirnoff break; 21953b3a8eb9SGleb Smirnoff case DN_FS: /* queue show */ 21963b3a8eb9SGleb Smirnoff x = DN_C_FS | DN_C_QUEUE; 21973b3a8eb9SGleb Smirnoff break; 21983b3a8eb9SGleb Smirnoff case DN_GET_COMPAT: /* compatibility mode */ 21993b3a8eb9SGleb Smirnoff need = dn_compat_calc_size(); 22003b3a8eb9SGleb Smirnoff break; 22013b3a8eb9SGleb Smirnoff } 22023b3a8eb9SGleb Smirnoff a->flags = x; 22033b3a8eb9SGleb Smirnoff if (x & DN_C_SCH) { 2204fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * sizeof(struct dn_sch) / 2; 22053b3a8eb9SGleb Smirnoff /* NOT also, each fs might be attached to a sched */ 2206fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * sizeof(struct dn_id) / 2; 22073b3a8eb9SGleb Smirnoff } 22083b3a8eb9SGleb Smirnoff if (x & DN_C_FS) 2209fe3bcfbdSTom Jones need += V_dn_cfg.fsk_count * sizeof(struct dn_fs); 22103b3a8eb9SGleb Smirnoff if (x & DN_C_LINK) { 2211fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * sizeof(struct dn_link) / 2; 22123b3a8eb9SGleb Smirnoff } 22133b3a8eb9SGleb Smirnoff /* 22143b3a8eb9SGleb Smirnoff * When exporting a queue to userland, only pass up the 22153b3a8eb9SGleb Smirnoff * struct dn_flow, which is the only visible part. 22163b3a8eb9SGleb Smirnoff */ 22173b3a8eb9SGleb Smirnoff 22183b3a8eb9SGleb Smirnoff if (x & DN_C_QUEUE) 2219fe3bcfbdSTom Jones need += V_dn_cfg.queue_count * sizeof(struct dn_flow); 22203b3a8eb9SGleb Smirnoff if (x & DN_C_FLOW) 2221fe3bcfbdSTom Jones need += V_dn_cfg.si_count * (sizeof(struct dn_flow)); 22223b3a8eb9SGleb Smirnoff return need; 22233b3a8eb9SGleb Smirnoff } 22243b3a8eb9SGleb Smirnoff 22253b3a8eb9SGleb Smirnoff /* 22263b3a8eb9SGleb Smirnoff * If compat != NULL dummynet_get is called in compatibility mode. 22273b3a8eb9SGleb Smirnoff * *compat will be the pointer to the buffer to pass to ipfw 22283b3a8eb9SGleb Smirnoff */ 22293b3a8eb9SGleb Smirnoff int 22303b3a8eb9SGleb Smirnoff dummynet_get(struct sockopt *sopt, void **compat) 22313b3a8eb9SGleb Smirnoff { 22323b3a8eb9SGleb Smirnoff int have, i, need, error; 22333b3a8eb9SGleb Smirnoff char *start = NULL, *buf; 22343b3a8eb9SGleb Smirnoff size_t sopt_valsize; 22353b3a8eb9SGleb Smirnoff struct dn_id *cmd; 22363b3a8eb9SGleb Smirnoff struct copy_args a; 22373b3a8eb9SGleb Smirnoff struct copy_range r; 22383b3a8eb9SGleb Smirnoff int l = sizeof(struct dn_id); 22393b3a8eb9SGleb Smirnoff 22403b3a8eb9SGleb Smirnoff bzero(&a, sizeof(a)); 22413b3a8eb9SGleb Smirnoff bzero(&r, sizeof(r)); 22423b3a8eb9SGleb Smirnoff 22433b3a8eb9SGleb Smirnoff /* save and restore original sopt_valsize around copyin */ 22443b3a8eb9SGleb Smirnoff sopt_valsize = sopt->sopt_valsize; 22453b3a8eb9SGleb Smirnoff 22463b3a8eb9SGleb Smirnoff cmd = &r.o; 22473b3a8eb9SGleb Smirnoff 22483b3a8eb9SGleb Smirnoff if (!compat) { 22493b3a8eb9SGleb Smirnoff /* copy at least an oid, and possibly a full object */ 22503b3a8eb9SGleb Smirnoff error = sooptcopyin(sopt, cmd, sizeof(r), sizeof(*cmd)); 22513b3a8eb9SGleb Smirnoff sopt->sopt_valsize = sopt_valsize; 22523b3a8eb9SGleb Smirnoff if (error) 22533b3a8eb9SGleb Smirnoff goto done; 22543b3a8eb9SGleb Smirnoff l = cmd->len; 22553b3a8eb9SGleb Smirnoff #ifdef EMULATE_SYSCTL 22563b3a8eb9SGleb Smirnoff /* sysctl emulation. */ 22573b3a8eb9SGleb Smirnoff if (cmd->type == DN_SYSCTL_GET) 22583b3a8eb9SGleb Smirnoff return kesysctl_emu_get(sopt); 22593b3a8eb9SGleb Smirnoff #endif 22603b3a8eb9SGleb Smirnoff if (l > sizeof(r)) { 22613b3a8eb9SGleb Smirnoff /* request larger than default, allocate buffer */ 2262*51d73df1SKristof Provost cmd = malloc(l, M_DUMMYNET, M_NOWAIT); 2263*51d73df1SKristof Provost if (cmd == NULL) { 2264*51d73df1SKristof Provost error = ENOMEM; 2265*51d73df1SKristof Provost goto done; 2266*51d73df1SKristof Provost } 22673b3a8eb9SGleb Smirnoff error = sooptcopyin(sopt, cmd, l, l); 22683b3a8eb9SGleb Smirnoff sopt->sopt_valsize = sopt_valsize; 22693b3a8eb9SGleb Smirnoff if (error) 22703b3a8eb9SGleb Smirnoff goto done; 22713b3a8eb9SGleb Smirnoff } 22723b3a8eb9SGleb Smirnoff } else { /* compatibility */ 22733b3a8eb9SGleb Smirnoff error = 0; 22743b3a8eb9SGleb Smirnoff cmd->type = DN_CMD_GET; 22753b3a8eb9SGleb Smirnoff cmd->len = sizeof(struct dn_id); 22763b3a8eb9SGleb Smirnoff cmd->subtype = DN_GET_COMPAT; 22773b3a8eb9SGleb Smirnoff // cmd->id = sopt_valsize; 22783b3a8eb9SGleb Smirnoff D("compatibility mode"); 22793b3a8eb9SGleb Smirnoff } 228091336b40SDon Lewis 228191336b40SDon Lewis #ifdef NEW_AQM 228291336b40SDon Lewis /* get AQM params */ 228391336b40SDon Lewis if(cmd->subtype == DN_AQM_PARAMS) { 228491336b40SDon Lewis error = get_aqm_parms(sopt); 228591336b40SDon Lewis goto done; 228691336b40SDon Lewis /* get Scheduler params */ 228791336b40SDon Lewis } else if (cmd->subtype == DN_SCH_PARAMS) { 228891336b40SDon Lewis error = get_sched_parms(sopt); 228991336b40SDon Lewis goto done; 229091336b40SDon Lewis } 229191336b40SDon Lewis #endif 229291336b40SDon Lewis 22933b3a8eb9SGleb Smirnoff a.extra = (struct copy_range *)cmd; 22943b3a8eb9SGleb Smirnoff if (cmd->len == sizeof(*cmd)) { /* no range, create a default */ 22953b3a8eb9SGleb Smirnoff uint32_t *rp = (uint32_t *)(cmd + 1); 22963b3a8eb9SGleb Smirnoff cmd->len += 2* sizeof(uint32_t); 22973b3a8eb9SGleb Smirnoff rp[0] = 1; 22983b3a8eb9SGleb Smirnoff rp[1] = DN_MAX_ID - 1; 22993b3a8eb9SGleb Smirnoff if (cmd->subtype == DN_LINK) { 23003b3a8eb9SGleb Smirnoff rp[0] += DN_MAX_ID; 23013b3a8eb9SGleb Smirnoff rp[1] += DN_MAX_ID; 23023b3a8eb9SGleb Smirnoff } 23033b3a8eb9SGleb Smirnoff } 23043b3a8eb9SGleb Smirnoff /* Count space (under lock) and allocate (outside lock). 23053b3a8eb9SGleb Smirnoff * Exit with lock held if we manage to get enough buffer. 23063b3a8eb9SGleb Smirnoff * Try a few times then give up. 23073b3a8eb9SGleb Smirnoff */ 23083b3a8eb9SGleb Smirnoff for (have = 0, i = 0; i < 10; i++) { 23093b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 23103b3a8eb9SGleb Smirnoff need = compute_space(cmd, &a); 23113b3a8eb9SGleb Smirnoff 23123b3a8eb9SGleb Smirnoff /* if there is a range, ignore value from compute_space() */ 23133b3a8eb9SGleb Smirnoff if (l > sizeof(*cmd)) 23143b3a8eb9SGleb Smirnoff need = sopt_valsize - sizeof(*cmd); 23153b3a8eb9SGleb Smirnoff 23163b3a8eb9SGleb Smirnoff if (need < 0) { 23173b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 23183b3a8eb9SGleb Smirnoff error = EINVAL; 23193b3a8eb9SGleb Smirnoff goto done; 23203b3a8eb9SGleb Smirnoff } 23213b3a8eb9SGleb Smirnoff need += sizeof(*cmd); 23223b3a8eb9SGleb Smirnoff cmd->id = need; 23233b3a8eb9SGleb Smirnoff if (have >= need) 23243b3a8eb9SGleb Smirnoff break; 23253b3a8eb9SGleb Smirnoff 23263b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 23273b3a8eb9SGleb Smirnoff if (start) 23283b3a8eb9SGleb Smirnoff free(start, M_DUMMYNET); 23293b3a8eb9SGleb Smirnoff start = NULL; 23303b3a8eb9SGleb Smirnoff if (need > sopt_valsize) 23313b3a8eb9SGleb Smirnoff break; 23323b3a8eb9SGleb Smirnoff 23333b3a8eb9SGleb Smirnoff have = need; 2334*51d73df1SKristof Provost start = malloc(have, M_DUMMYNET, M_NOWAIT | M_ZERO); 23353b3a8eb9SGleb Smirnoff } 23363b3a8eb9SGleb Smirnoff 23373b3a8eb9SGleb Smirnoff if (start == NULL) { 23383b3a8eb9SGleb Smirnoff if (compat) { 23393b3a8eb9SGleb Smirnoff *compat = NULL; 23403b3a8eb9SGleb Smirnoff error = 1; // XXX 23413b3a8eb9SGleb Smirnoff } else { 23423b3a8eb9SGleb Smirnoff error = sooptcopyout(sopt, cmd, sizeof(*cmd)); 23433b3a8eb9SGleb Smirnoff } 23443b3a8eb9SGleb Smirnoff goto done; 23453b3a8eb9SGleb Smirnoff } 23463b3a8eb9SGleb Smirnoff ND("have %d:%d sched %d, %d:%d links %d, %d:%d flowsets %d, " 23473b3a8eb9SGleb Smirnoff "%d:%d si %d, %d:%d queues %d", 2348fe3bcfbdSTom Jones V_dn_cfg.schk_count, sizeof(struct dn_sch), DN_SCH, 2349fe3bcfbdSTom Jones V_dn_cfg.schk_count, sizeof(struct dn_link), DN_LINK, 2350fe3bcfbdSTom Jones V_dn_cfg.fsk_count, sizeof(struct dn_fs), DN_FS, 2351fe3bcfbdSTom Jones V_dn_cfg.si_count, sizeof(struct dn_flow), DN_SCH_I, 2352fe3bcfbdSTom Jones V_dn_cfg.queue_count, sizeof(struct dn_queue), DN_QUEUE); 23533b3a8eb9SGleb Smirnoff sopt->sopt_valsize = sopt_valsize; 23543b3a8eb9SGleb Smirnoff a.type = cmd->subtype; 23553b3a8eb9SGleb Smirnoff 23563b3a8eb9SGleb Smirnoff if (compat == NULL) { 23570ac43d97SMarius Strobl memcpy(start, cmd, sizeof(*cmd)); 23583b3a8eb9SGleb Smirnoff ((struct dn_id*)(start))->len = sizeof(struct dn_id); 23593b3a8eb9SGleb Smirnoff buf = start + sizeof(*cmd); 23603b3a8eb9SGleb Smirnoff } else 23613b3a8eb9SGleb Smirnoff buf = start; 23623b3a8eb9SGleb Smirnoff a.start = &buf; 23633b3a8eb9SGleb Smirnoff a.end = start + have; 23643b3a8eb9SGleb Smirnoff /* start copying other objects */ 23653b3a8eb9SGleb Smirnoff if (compat) { 23663b3a8eb9SGleb Smirnoff a.type = DN_COMPAT_PIPE; 2367fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.schedhash, copy_data_helper_compat, &a); 23683b3a8eb9SGleb Smirnoff a.type = DN_COMPAT_QUEUE; 2369fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.fshash, copy_data_helper_compat, &a); 23703b3a8eb9SGleb Smirnoff } else if (a.type == DN_FS) { 2371fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.fshash, copy_data_helper, &a); 23723b3a8eb9SGleb Smirnoff } else { 2373fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.schedhash, copy_data_helper, &a); 23743b3a8eb9SGleb Smirnoff } 23753b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 23763b3a8eb9SGleb Smirnoff 23773b3a8eb9SGleb Smirnoff if (compat) { 23783b3a8eb9SGleb Smirnoff *compat = start; 23793b3a8eb9SGleb Smirnoff sopt->sopt_valsize = buf - start; 23803b3a8eb9SGleb Smirnoff /* free() is done by ip_dummynet_compat() */ 23813b3a8eb9SGleb Smirnoff start = NULL; //XXX hack 23823b3a8eb9SGleb Smirnoff } else { 23833b3a8eb9SGleb Smirnoff error = sooptcopyout(sopt, start, buf - start); 23843b3a8eb9SGleb Smirnoff } 23853b3a8eb9SGleb Smirnoff done: 23863b3a8eb9SGleb Smirnoff if (cmd && cmd != &r.o) 23873b3a8eb9SGleb Smirnoff free(cmd, M_DUMMYNET); 23883b3a8eb9SGleb Smirnoff if (start) 23893b3a8eb9SGleb Smirnoff free(start, M_DUMMYNET); 23903b3a8eb9SGleb Smirnoff return error; 23913b3a8eb9SGleb Smirnoff } 23923b3a8eb9SGleb Smirnoff 23933b3a8eb9SGleb Smirnoff /* Callback called on scheduler instance to delete it if idle */ 23943b3a8eb9SGleb Smirnoff static int 23953b3a8eb9SGleb Smirnoff drain_scheduler_cb(void *_si, void *arg) 23963b3a8eb9SGleb Smirnoff { 23973b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = _si; 23983b3a8eb9SGleb Smirnoff 23993b3a8eb9SGleb Smirnoff if ((si->kflags & DN_ACTIVE) || si->dline.mq.head != NULL) 24003b3a8eb9SGleb Smirnoff return 0; 24013b3a8eb9SGleb Smirnoff 24023b3a8eb9SGleb Smirnoff if (si->sched->fp->flags & DN_MULTIQUEUE) { 24033b3a8eb9SGleb Smirnoff if (si->q_count == 0) 24043b3a8eb9SGleb Smirnoff return si_destroy(si, NULL); 24053b3a8eb9SGleb Smirnoff else 24063b3a8eb9SGleb Smirnoff return 0; 24073b3a8eb9SGleb Smirnoff } else { /* !DN_MULTIQUEUE */ 24083b3a8eb9SGleb Smirnoff if ((si+1)->ni.length == 0) 24093b3a8eb9SGleb Smirnoff return si_destroy(si, NULL); 24103b3a8eb9SGleb Smirnoff else 24113b3a8eb9SGleb Smirnoff return 0; 24123b3a8eb9SGleb Smirnoff } 24133b3a8eb9SGleb Smirnoff return 0; /* unreachable */ 24143b3a8eb9SGleb Smirnoff } 24153b3a8eb9SGleb Smirnoff 24163b3a8eb9SGleb Smirnoff /* Callback called on scheduler to check if it has instances */ 24173b3a8eb9SGleb Smirnoff static int 24183b3a8eb9SGleb Smirnoff drain_scheduler_sch_cb(void *_s, void *arg) 24193b3a8eb9SGleb Smirnoff { 24203b3a8eb9SGleb Smirnoff struct dn_schk *s = _s; 24213b3a8eb9SGleb Smirnoff 24223b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 24233b3a8eb9SGleb Smirnoff dn_ht_scan_bucket(s->siht, &s->drain_bucket, 24243b3a8eb9SGleb Smirnoff drain_scheduler_cb, NULL); 24253b3a8eb9SGleb Smirnoff s->drain_bucket++; 24263b3a8eb9SGleb Smirnoff } else { 24273b3a8eb9SGleb Smirnoff if (s->siht) { 24283b3a8eb9SGleb Smirnoff if (drain_scheduler_cb(s->siht, NULL) == DNHT_SCAN_DEL) 24293b3a8eb9SGleb Smirnoff s->siht = NULL; 24303b3a8eb9SGleb Smirnoff } 24313b3a8eb9SGleb Smirnoff } 24323b3a8eb9SGleb Smirnoff return 0; 24333b3a8eb9SGleb Smirnoff } 24343b3a8eb9SGleb Smirnoff 24353b3a8eb9SGleb Smirnoff /* Called every tick, try to delete a 'bucket' of scheduler */ 24363b3a8eb9SGleb Smirnoff void 24373b3a8eb9SGleb Smirnoff dn_drain_scheduler(void) 24383b3a8eb9SGleb Smirnoff { 2439fe3bcfbdSTom Jones dn_ht_scan_bucket(V_dn_cfg.schedhash, &V_dn_cfg.drain_sch, 24403b3a8eb9SGleb Smirnoff drain_scheduler_sch_cb, NULL); 2441fe3bcfbdSTom Jones V_dn_cfg.drain_sch++; 24423b3a8eb9SGleb Smirnoff } 24433b3a8eb9SGleb Smirnoff 24443b3a8eb9SGleb Smirnoff /* Callback called on queue to delete if it is idle */ 24453b3a8eb9SGleb Smirnoff static int 24463b3a8eb9SGleb Smirnoff drain_queue_cb(void *_q, void *arg) 24473b3a8eb9SGleb Smirnoff { 24483b3a8eb9SGleb Smirnoff struct dn_queue *q = _q; 24493b3a8eb9SGleb Smirnoff 24503b3a8eb9SGleb Smirnoff if (q->ni.length == 0) { 24513b3a8eb9SGleb Smirnoff dn_delete_queue(q, DN_DESTROY); 24523b3a8eb9SGleb Smirnoff return DNHT_SCAN_DEL; /* queue is deleted */ 24533b3a8eb9SGleb Smirnoff } 24543b3a8eb9SGleb Smirnoff 24553b3a8eb9SGleb Smirnoff return 0; /* queue isn't deleted */ 24563b3a8eb9SGleb Smirnoff } 24573b3a8eb9SGleb Smirnoff 24583b3a8eb9SGleb Smirnoff /* Callback called on flowset used to check if it has queues */ 24593b3a8eb9SGleb Smirnoff static int 24603b3a8eb9SGleb Smirnoff drain_queue_fs_cb(void *_fs, void *arg) 24613b3a8eb9SGleb Smirnoff { 24623b3a8eb9SGleb Smirnoff struct dn_fsk *fs = _fs; 24633b3a8eb9SGleb Smirnoff 24643b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) { 24653b3a8eb9SGleb Smirnoff /* Flowset has a hash table for queues */ 24663b3a8eb9SGleb Smirnoff dn_ht_scan_bucket(fs->qht, &fs->drain_bucket, 24673b3a8eb9SGleb Smirnoff drain_queue_cb, NULL); 24683b3a8eb9SGleb Smirnoff fs->drain_bucket++; 24693b3a8eb9SGleb Smirnoff } else { 24703b3a8eb9SGleb Smirnoff /* No hash table for this flowset, null the pointer 24713b3a8eb9SGleb Smirnoff * if the queue is deleted 24723b3a8eb9SGleb Smirnoff */ 24733b3a8eb9SGleb Smirnoff if (fs->qht) { 24743b3a8eb9SGleb Smirnoff if (drain_queue_cb(fs->qht, NULL) == DNHT_SCAN_DEL) 24753b3a8eb9SGleb Smirnoff fs->qht = NULL; 24763b3a8eb9SGleb Smirnoff } 24773b3a8eb9SGleb Smirnoff } 24783b3a8eb9SGleb Smirnoff return 0; 24793b3a8eb9SGleb Smirnoff } 24803b3a8eb9SGleb Smirnoff 24813b3a8eb9SGleb Smirnoff /* Called every tick, try to delete a 'bucket' of queue */ 24823b3a8eb9SGleb Smirnoff void 24833b3a8eb9SGleb Smirnoff dn_drain_queue(void) 24843b3a8eb9SGleb Smirnoff { 24853b3a8eb9SGleb Smirnoff /* scan a bucket of flowset */ 2486fe3bcfbdSTom Jones dn_ht_scan_bucket(V_dn_cfg.fshash, &V_dn_cfg.drain_fs, 24873b3a8eb9SGleb Smirnoff drain_queue_fs_cb, NULL); 2488fe3bcfbdSTom Jones V_dn_cfg.drain_fs++; 24893b3a8eb9SGleb Smirnoff } 24903b3a8eb9SGleb Smirnoff 24913b3a8eb9SGleb Smirnoff /* 24923b3a8eb9SGleb Smirnoff * Handler for the various dummynet socket options 24933b3a8eb9SGleb Smirnoff */ 24943b3a8eb9SGleb Smirnoff static int 24953b3a8eb9SGleb Smirnoff ip_dn_ctl(struct sockopt *sopt) 24963b3a8eb9SGleb Smirnoff { 2497*51d73df1SKristof Provost struct epoch_tracker et; 24983b3a8eb9SGleb Smirnoff void *p = NULL; 24993b3a8eb9SGleb Smirnoff int error, l; 25003b3a8eb9SGleb Smirnoff 25013b3a8eb9SGleb Smirnoff error = priv_check(sopt->sopt_td, PRIV_NETINET_DUMMYNET); 25023b3a8eb9SGleb Smirnoff if (error) 25033b3a8eb9SGleb Smirnoff return (error); 25043b3a8eb9SGleb Smirnoff 25053b3a8eb9SGleb Smirnoff /* Disallow sets in really-really secure mode. */ 25063b3a8eb9SGleb Smirnoff if (sopt->sopt_dir == SOPT_SET) { 25073b3a8eb9SGleb Smirnoff error = securelevel_ge(sopt->sopt_td->td_ucred, 3); 25083b3a8eb9SGleb Smirnoff if (error) 25093b3a8eb9SGleb Smirnoff return (error); 25103b3a8eb9SGleb Smirnoff } 25113b3a8eb9SGleb Smirnoff 2512*51d73df1SKristof Provost NET_EPOCH_ENTER(et); 2513*51d73df1SKristof Provost 25143b3a8eb9SGleb Smirnoff switch (sopt->sopt_name) { 25153b3a8eb9SGleb Smirnoff default : 25163b3a8eb9SGleb Smirnoff D("dummynet: unknown option %d", sopt->sopt_name); 25173b3a8eb9SGleb Smirnoff error = EINVAL; 25183b3a8eb9SGleb Smirnoff break; 25193b3a8eb9SGleb Smirnoff 25203b3a8eb9SGleb Smirnoff case IP_DUMMYNET_FLUSH: 25213b3a8eb9SGleb Smirnoff case IP_DUMMYNET_CONFIGURE: 25223b3a8eb9SGleb Smirnoff case IP_DUMMYNET_DEL: /* remove a pipe or queue */ 25233b3a8eb9SGleb Smirnoff case IP_DUMMYNET_GET: 25243b3a8eb9SGleb Smirnoff D("dummynet: compat option %d", sopt->sopt_name); 25253b3a8eb9SGleb Smirnoff error = ip_dummynet_compat(sopt); 25263b3a8eb9SGleb Smirnoff break; 25273b3a8eb9SGleb Smirnoff 25283b3a8eb9SGleb Smirnoff case IP_DUMMYNET3 : 25293b3a8eb9SGleb Smirnoff if (sopt->sopt_dir == SOPT_GET) { 25303b3a8eb9SGleb Smirnoff error = dummynet_get(sopt, NULL); 25313b3a8eb9SGleb Smirnoff break; 25323b3a8eb9SGleb Smirnoff } 25333b3a8eb9SGleb Smirnoff l = sopt->sopt_valsize; 25343b3a8eb9SGleb Smirnoff if (l < sizeof(struct dn_id) || l > 12000) { 25353b3a8eb9SGleb Smirnoff D("argument len %d invalid", l); 25363b3a8eb9SGleb Smirnoff break; 25373b3a8eb9SGleb Smirnoff } 2538*51d73df1SKristof Provost p = malloc(l, M_TEMP, M_NOWAIT); 2539*51d73df1SKristof Provost if (p == NULL) { 2540*51d73df1SKristof Provost error = ENOMEM; 2541*51d73df1SKristof Provost break; 2542*51d73df1SKristof Provost } 25433b3a8eb9SGleb Smirnoff error = sooptcopyin(sopt, p, l, l); 25443b3a8eb9SGleb Smirnoff if (error) 25453b3a8eb9SGleb Smirnoff break ; 25463b3a8eb9SGleb Smirnoff error = do_config(p, l); 25473b3a8eb9SGleb Smirnoff break; 25483b3a8eb9SGleb Smirnoff } 25493b3a8eb9SGleb Smirnoff 25503b3a8eb9SGleb Smirnoff if (p != NULL) 25513b3a8eb9SGleb Smirnoff free(p, M_TEMP); 25523b3a8eb9SGleb Smirnoff 2553*51d73df1SKristof Provost NET_EPOCH_EXIT(et); 2554*51d73df1SKristof Provost 25553b3a8eb9SGleb Smirnoff return error ; 25563b3a8eb9SGleb Smirnoff } 25573b3a8eb9SGleb Smirnoff 25583b3a8eb9SGleb Smirnoff static void 2559fe3bcfbdSTom Jones ip_dn_vnet_init(void) 25603b3a8eb9SGleb Smirnoff { 2561fe3bcfbdSTom Jones if (V_dn_cfg.init_done) 25623b3a8eb9SGleb Smirnoff return; 2563fe3bcfbdSTom Jones V_dn_cfg.init_done = 1; 25643b3a8eb9SGleb Smirnoff /* Set defaults here. MSVC does not accept initializers, 25653b3a8eb9SGleb Smirnoff * and this is also useful for vimages 25663b3a8eb9SGleb Smirnoff */ 25673b3a8eb9SGleb Smirnoff /* queue limits */ 2568fe3bcfbdSTom Jones V_dn_cfg.slot_limit = 100; /* Foot shooting limit for queues. */ 2569fe3bcfbdSTom Jones V_dn_cfg.byte_limit = 1024 * 1024; 2570fe3bcfbdSTom Jones V_dn_cfg.expire = 1; 25713b3a8eb9SGleb Smirnoff 25723b3a8eb9SGleb Smirnoff /* RED parameters */ 2573fe3bcfbdSTom Jones V_dn_cfg.red_lookup_depth = 256; /* default lookup table depth */ 2574fe3bcfbdSTom Jones V_dn_cfg.red_avg_pkt_size = 512; /* default medium packet size */ 2575fe3bcfbdSTom Jones V_dn_cfg.red_max_pkt_size = 1500; /* default max packet size */ 25763b3a8eb9SGleb Smirnoff 25773b3a8eb9SGleb Smirnoff /* hash tables */ 2578fe3bcfbdSTom Jones V_dn_cfg.max_hash_size = 65536; /* max in the hash tables */ 2579fe3bcfbdSTom Jones V_dn_cfg.hash_size = 64; /* default hash size */ 25803b3a8eb9SGleb Smirnoff 25813b3a8eb9SGleb Smirnoff /* create hash tables for schedulers and flowsets. 25823b3a8eb9SGleb Smirnoff * In both we search by key and by pointer. 25833b3a8eb9SGleb Smirnoff */ 2584fe3bcfbdSTom Jones V_dn_cfg.schedhash = dn_ht_init(NULL, V_dn_cfg.hash_size, 25853b3a8eb9SGleb Smirnoff offsetof(struct dn_schk, schk_next), 25863b3a8eb9SGleb Smirnoff schk_hash, schk_match, schk_new); 2587fe3bcfbdSTom Jones V_dn_cfg.fshash = dn_ht_init(NULL, V_dn_cfg.hash_size, 25883b3a8eb9SGleb Smirnoff offsetof(struct dn_fsk, fsk_next), 25893b3a8eb9SGleb Smirnoff fsk_hash, fsk_match, fsk_new); 25903b3a8eb9SGleb Smirnoff 25913b3a8eb9SGleb Smirnoff /* bucket index to drain object */ 2592fe3bcfbdSTom Jones V_dn_cfg.drain_fs = 0; 2593fe3bcfbdSTom Jones V_dn_cfg.drain_sch = 0; 25943b3a8eb9SGleb Smirnoff 2595fe3bcfbdSTom Jones heap_init(&V_dn_cfg.evheap, 16, offsetof(struct dn_id, id)); 2596fe3bcfbdSTom Jones SLIST_INIT(&V_dn_cfg.fsu); 25973b3a8eb9SGleb Smirnoff 25983b3a8eb9SGleb Smirnoff DN_LOCK_INIT(); 25993b3a8eb9SGleb Smirnoff 2600fe3bcfbdSTom Jones /* Initialize curr_time adjustment mechanics. */ 2601fe3bcfbdSTom Jones getmicrouptime(&V_dn_cfg.prev_t); 2602fe3bcfbdSTom Jones } 2603fe3bcfbdSTom Jones 2604fe3bcfbdSTom Jones static void 2605fe3bcfbdSTom Jones ip_dn_vnet_destroy(void) 2606fe3bcfbdSTom Jones { 2607fe3bcfbdSTom Jones DN_BH_WLOCK(); 2608fe3bcfbdSTom Jones dummynet_flush(); 2609fe3bcfbdSTom Jones DN_BH_WUNLOCK(); 2610fe3bcfbdSTom Jones 2611fe3bcfbdSTom Jones dn_ht_free(V_dn_cfg.schedhash, 0); 2612fe3bcfbdSTom Jones dn_ht_free(V_dn_cfg.fshash, 0); 2613fe3bcfbdSTom Jones heap_free(&V_dn_cfg.evheap); 2614fe3bcfbdSTom Jones 2615fe3bcfbdSTom Jones DN_LOCK_DESTROY(); 2616fe3bcfbdSTom Jones } 2617fe3bcfbdSTom Jones 2618fe3bcfbdSTom Jones static void 2619fe3bcfbdSTom Jones ip_dn_init(void) 2620fe3bcfbdSTom Jones { 2621fe3bcfbdSTom Jones if (dn_tasks_started) 2622fe3bcfbdSTom Jones return; 2623*51d73df1SKristof Provost 2624*51d73df1SKristof Provost mtx_init(&sched_mtx, "dn_sched", NULL, MTX_DEF); 2625*51d73df1SKristof Provost 2626fe3bcfbdSTom Jones dn_tasks_started = 1; 2627fe3bcfbdSTom Jones TASK_INIT(&dn_task, 0, dummynet_task, NULL); 26285f4fc3dbSAlexander Motin dn_tq = taskqueue_create_fast("dummynet", M_WAITOK, 26293b3a8eb9SGleb Smirnoff taskqueue_thread_enqueue, &dn_tq); 26303b3a8eb9SGleb Smirnoff taskqueue_start_threads(&dn_tq, 1, PI_NET, "dummynet"); 26313b3a8eb9SGleb Smirnoff 2632*51d73df1SKristof Provost CK_LIST_INIT(&schedlist); 2633fd90e2edSJung-uk Kim callout_init(&dn_timeout, 1); 26345f4fc3dbSAlexander Motin dn_reschedule(); 26353b3a8eb9SGleb Smirnoff } 26363b3a8eb9SGleb Smirnoff 26373b3a8eb9SGleb Smirnoff static void 26383b3a8eb9SGleb Smirnoff ip_dn_destroy(int last) 26393b3a8eb9SGleb Smirnoff { 2640c8cfbc06SHans Petter Selasky /* ensure no more callouts are started */ 2641c8cfbc06SHans Petter Selasky dn_gone = 1; 2642c8cfbc06SHans Petter Selasky 2643c8cfbc06SHans Petter Selasky /* check for last */ 26443b3a8eb9SGleb Smirnoff if (last) { 26453b3a8eb9SGleb Smirnoff ND("removing last instance\n"); 26463b3a8eb9SGleb Smirnoff ip_dn_ctl_ptr = NULL; 26473b3a8eb9SGleb Smirnoff ip_dn_io_ptr = NULL; 26483b3a8eb9SGleb Smirnoff } 26493b3a8eb9SGleb Smirnoff 2650c8cfbc06SHans Petter Selasky callout_drain(&dn_timeout); 26513b3a8eb9SGleb Smirnoff taskqueue_drain(dn_tq, &dn_task); 26523b3a8eb9SGleb Smirnoff taskqueue_free(dn_tq); 26533b3a8eb9SGleb Smirnoff } 26543b3a8eb9SGleb Smirnoff 26553b3a8eb9SGleb Smirnoff static int 26563b3a8eb9SGleb Smirnoff dummynet_modevent(module_t mod, int type, void *data) 26573b3a8eb9SGleb Smirnoff { 26583b3a8eb9SGleb Smirnoff 26593b3a8eb9SGleb Smirnoff if (type == MOD_LOAD) { 26603b3a8eb9SGleb Smirnoff if (ip_dn_io_ptr) { 26613b3a8eb9SGleb Smirnoff printf("DUMMYNET already loaded\n"); 26623b3a8eb9SGleb Smirnoff return EEXIST ; 26633b3a8eb9SGleb Smirnoff } 26643b3a8eb9SGleb Smirnoff ip_dn_init(); 26653b3a8eb9SGleb Smirnoff ip_dn_ctl_ptr = ip_dn_ctl; 26663b3a8eb9SGleb Smirnoff ip_dn_io_ptr = dummynet_io; 26673b3a8eb9SGleb Smirnoff return 0; 26683b3a8eb9SGleb Smirnoff } else if (type == MOD_UNLOAD) { 26693b3a8eb9SGleb Smirnoff ip_dn_destroy(1 /* last */); 26703b3a8eb9SGleb Smirnoff return 0; 26713b3a8eb9SGleb Smirnoff } else 26723b3a8eb9SGleb Smirnoff return EOPNOTSUPP; 26733b3a8eb9SGleb Smirnoff } 26743b3a8eb9SGleb Smirnoff 26753b3a8eb9SGleb Smirnoff /* modevent helpers for the modules */ 26763b3a8eb9SGleb Smirnoff static int 26773b3a8eb9SGleb Smirnoff load_dn_sched(struct dn_alg *d) 26783b3a8eb9SGleb Smirnoff { 26793b3a8eb9SGleb Smirnoff struct dn_alg *s; 26803b3a8eb9SGleb Smirnoff 26813b3a8eb9SGleb Smirnoff if (d == NULL) 26823b3a8eb9SGleb Smirnoff return 1; /* error */ 26833b3a8eb9SGleb Smirnoff ip_dn_init(); /* just in case, we need the lock */ 26843b3a8eb9SGleb Smirnoff 26853b3a8eb9SGleb Smirnoff /* Check that mandatory funcs exists */ 26863b3a8eb9SGleb Smirnoff if (d->enqueue == NULL || d->dequeue == NULL) { 26873b3a8eb9SGleb Smirnoff D("missing enqueue or dequeue for %s", d->name); 26883b3a8eb9SGleb Smirnoff return 1; 26893b3a8eb9SGleb Smirnoff } 26903b3a8eb9SGleb Smirnoff 26913b3a8eb9SGleb Smirnoff /* Search if scheduler already exists */ 2692*51d73df1SKristof Provost mtx_lock(&sched_mtx); 2693*51d73df1SKristof Provost CK_LIST_FOREACH(s, &schedlist, next) { 26943b3a8eb9SGleb Smirnoff if (strcmp(s->name, d->name) == 0) { 26953b3a8eb9SGleb Smirnoff D("%s already loaded", d->name); 26963b3a8eb9SGleb Smirnoff break; /* scheduler already exists */ 26973b3a8eb9SGleb Smirnoff } 26983b3a8eb9SGleb Smirnoff } 26993b3a8eb9SGleb Smirnoff if (s == NULL) 2700*51d73df1SKristof Provost CK_LIST_INSERT_HEAD(&schedlist, d, next); 2701*51d73df1SKristof Provost mtx_unlock(&sched_mtx); 27023b3a8eb9SGleb Smirnoff D("dn_sched %s %sloaded", d->name, s ? "not ":""); 27033b3a8eb9SGleb Smirnoff return s ? 1 : 0; 27043b3a8eb9SGleb Smirnoff } 27053b3a8eb9SGleb Smirnoff 27063b3a8eb9SGleb Smirnoff static int 27073b3a8eb9SGleb Smirnoff unload_dn_sched(struct dn_alg *s) 27083b3a8eb9SGleb Smirnoff { 27093b3a8eb9SGleb Smirnoff struct dn_alg *tmp, *r; 27103b3a8eb9SGleb Smirnoff int err = EINVAL; 27113b3a8eb9SGleb Smirnoff 27123b3a8eb9SGleb Smirnoff ND("called for %s", s->name); 27133b3a8eb9SGleb Smirnoff 2714*51d73df1SKristof Provost mtx_lock(&sched_mtx); 2715*51d73df1SKristof Provost CK_LIST_FOREACH_SAFE(r, &schedlist, next, tmp) { 27163b3a8eb9SGleb Smirnoff if (strcmp(s->name, r->name) != 0) 27173b3a8eb9SGleb Smirnoff continue; 27183b3a8eb9SGleb Smirnoff ND("ref_count = %d", r->ref_count); 27193b3a8eb9SGleb Smirnoff err = (r->ref_count != 0) ? EBUSY : 0; 27203b3a8eb9SGleb Smirnoff if (err == 0) 2721*51d73df1SKristof Provost CK_LIST_REMOVE(r, next); 27223b3a8eb9SGleb Smirnoff break; 27233b3a8eb9SGleb Smirnoff } 2724*51d73df1SKristof Provost mtx_unlock(&sched_mtx); 2725*51d73df1SKristof Provost NET_EPOCH_WAIT(); 27263b3a8eb9SGleb Smirnoff D("dn_sched %s %sunloaded", s->name, err ? "not ":""); 27273b3a8eb9SGleb Smirnoff return err; 27283b3a8eb9SGleb Smirnoff } 27293b3a8eb9SGleb Smirnoff 27303b3a8eb9SGleb Smirnoff int 27313b3a8eb9SGleb Smirnoff dn_sched_modevent(module_t mod, int cmd, void *arg) 27323b3a8eb9SGleb Smirnoff { 27333b3a8eb9SGleb Smirnoff struct dn_alg *sch = arg; 27343b3a8eb9SGleb Smirnoff 27353b3a8eb9SGleb Smirnoff if (cmd == MOD_LOAD) 27363b3a8eb9SGleb Smirnoff return load_dn_sched(sch); 27373b3a8eb9SGleb Smirnoff else if (cmd == MOD_UNLOAD) 27383b3a8eb9SGleb Smirnoff return unload_dn_sched(sch); 27393b3a8eb9SGleb Smirnoff else 27403b3a8eb9SGleb Smirnoff return EINVAL; 27413b3a8eb9SGleb Smirnoff } 27423b3a8eb9SGleb Smirnoff 27433b3a8eb9SGleb Smirnoff static moduledata_t dummynet_mod = { 27443b3a8eb9SGleb Smirnoff "dummynet", dummynet_modevent, NULL 27453b3a8eb9SGleb Smirnoff }; 27463b3a8eb9SGleb Smirnoff 274789856f7eSBjoern A. Zeeb #define DN_SI_SUB SI_SUB_PROTO_FIREWALL 27483b3a8eb9SGleb Smirnoff #define DN_MODEV_ORD (SI_ORDER_ANY - 128) /* after ipfw */ 27493b3a8eb9SGleb Smirnoff DECLARE_MODULE(dummynet, dummynet_mod, DN_SI_SUB, DN_MODEV_ORD); 2750f9ab623bSAlexander V. Chernikov MODULE_DEPEND(dummynet, ipfw, 3, 3, 3); 27513b3a8eb9SGleb Smirnoff MODULE_VERSION(dummynet, 3); 27523b3a8eb9SGleb Smirnoff 27533b3a8eb9SGleb Smirnoff /* 27543b3a8eb9SGleb Smirnoff * Starting up. Done in order after dummynet_modevent() has been called. 27553b3a8eb9SGleb Smirnoff * VNET_SYSINIT is also called for each existing vnet and each new vnet. 27563b3a8eb9SGleb Smirnoff */ 2757fe3bcfbdSTom Jones VNET_SYSINIT(vnet_dn_init, DN_SI_SUB, DN_MODEV_ORD+2, ip_dn_vnet_init, NULL); 27583b3a8eb9SGleb Smirnoff 27593b3a8eb9SGleb Smirnoff /* 27603b3a8eb9SGleb Smirnoff * Shutdown handlers up shop. These are done in REVERSE ORDER, but still 27613b3a8eb9SGleb Smirnoff * after dummynet_modevent() has been called. Not called on reboot. 27623b3a8eb9SGleb Smirnoff * VNET_SYSUNINIT is also called for each exiting vnet as it exits. 27633b3a8eb9SGleb Smirnoff * or when the module is unloaded. 27643b3a8eb9SGleb Smirnoff */ 2765fe3bcfbdSTom Jones VNET_SYSUNINIT(vnet_dn_uninit, DN_SI_SUB, DN_MODEV_ORD+2, ip_dn_vnet_destroy, NULL); 27663b3a8eb9SGleb Smirnoff 276791336b40SDon Lewis #ifdef NEW_AQM 276891336b40SDon Lewis 276991336b40SDon Lewis /* modevent helpers for the AQM modules */ 277091336b40SDon Lewis static int 277191336b40SDon Lewis load_dn_aqm(struct dn_aqm *d) 277291336b40SDon Lewis { 277391336b40SDon Lewis struct dn_aqm *aqm=NULL; 277491336b40SDon Lewis 277591336b40SDon Lewis if (d == NULL) 277691336b40SDon Lewis return 1; /* error */ 277791336b40SDon Lewis ip_dn_init(); /* just in case, we need the lock */ 277891336b40SDon Lewis 277991336b40SDon Lewis /* Check that mandatory funcs exists */ 278091336b40SDon Lewis if (d->enqueue == NULL || d->dequeue == NULL) { 278191336b40SDon Lewis D("missing enqueue or dequeue for %s", d->name); 278291336b40SDon Lewis return 1; 278391336b40SDon Lewis } 278491336b40SDon Lewis 2785*51d73df1SKristof Provost mtx_lock(&sched_mtx); 2786*51d73df1SKristof Provost 278791336b40SDon Lewis /* Search if AQM already exists */ 2788*51d73df1SKristof Provost CK_LIST_FOREACH(aqm, &aqmlist, next) { 278991336b40SDon Lewis if (strcmp(aqm->name, d->name) == 0) { 279091336b40SDon Lewis D("%s already loaded", d->name); 279191336b40SDon Lewis break; /* AQM already exists */ 279291336b40SDon Lewis } 279391336b40SDon Lewis } 279491336b40SDon Lewis if (aqm == NULL) 2795*51d73df1SKristof Provost CK_LIST_INSERT_HEAD(&aqmlist, d, next); 2796*51d73df1SKristof Provost 2797*51d73df1SKristof Provost mtx_unlock(&sched_mtx); 2798*51d73df1SKristof Provost 279991336b40SDon Lewis D("dn_aqm %s %sloaded", d->name, aqm ? "not ":""); 280091336b40SDon Lewis return aqm ? 1 : 0; 280191336b40SDon Lewis } 280291336b40SDon Lewis 280391336b40SDon Lewis /* Callback to clean up AQM status for queues connected to a flowset 280491336b40SDon Lewis * and then deconfigure the flowset. 280591336b40SDon Lewis * This function is called before an AQM module is unloaded 280691336b40SDon Lewis */ 280791336b40SDon Lewis static int 280891336b40SDon Lewis fs_cleanup(void *_fs, void *arg) 280991336b40SDon Lewis { 281091336b40SDon Lewis struct dn_fsk *fs = _fs; 281191336b40SDon Lewis uint32_t type = *(uint32_t *)arg; 281291336b40SDon Lewis 281391336b40SDon Lewis if (fs->aqmfp && fs->aqmfp->type == type) 281491336b40SDon Lewis aqm_cleanup_deconfig_fs(fs); 281591336b40SDon Lewis 281691336b40SDon Lewis return 0; 281791336b40SDon Lewis } 281891336b40SDon Lewis 281991336b40SDon Lewis static int 282091336b40SDon Lewis unload_dn_aqm(struct dn_aqm *aqm) 282191336b40SDon Lewis { 282291336b40SDon Lewis struct dn_aqm *tmp, *r; 282391336b40SDon Lewis int err = EINVAL; 282491336b40SDon Lewis err = 0; 282591336b40SDon Lewis ND("called for %s", aqm->name); 282691336b40SDon Lewis 282791336b40SDon Lewis /* clean up AQM status and deconfig flowset */ 2828fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.fshash, fs_cleanup, &aqm->type); 282991336b40SDon Lewis 2830*51d73df1SKristof Provost mtx_lock(&sched_mtx); 2831*51d73df1SKristof Provost 2832*51d73df1SKristof Provost CK_LIST_FOREACH_SAFE(r, &aqmlist, next, tmp) { 283391336b40SDon Lewis if (strcmp(aqm->name, r->name) != 0) 283491336b40SDon Lewis continue; 283591336b40SDon Lewis ND("ref_count = %d", r->ref_count); 283691336b40SDon Lewis err = (r->ref_count != 0 || r->cfg_ref_count != 0) ? EBUSY : 0; 283791336b40SDon Lewis if (err == 0) 2838*51d73df1SKristof Provost CK_LIST_REMOVE(r, next); 283991336b40SDon Lewis break; 284091336b40SDon Lewis } 2841*51d73df1SKristof Provost 2842*51d73df1SKristof Provost mtx_unlock(&sched_mtx); 2843*51d73df1SKristof Provost NET_EPOCH_WAIT(); 2844*51d73df1SKristof Provost 284591336b40SDon Lewis D("%s %sunloaded", aqm->name, err ? "not ":""); 284691336b40SDon Lewis if (err) 284791336b40SDon Lewis D("ref_count=%d, cfg_ref_count=%d", r->ref_count, r->cfg_ref_count); 284891336b40SDon Lewis return err; 284991336b40SDon Lewis } 285091336b40SDon Lewis 285191336b40SDon Lewis int 285291336b40SDon Lewis dn_aqm_modevent(module_t mod, int cmd, void *arg) 285391336b40SDon Lewis { 285491336b40SDon Lewis struct dn_aqm *aqm = arg; 285591336b40SDon Lewis 285691336b40SDon Lewis if (cmd == MOD_LOAD) 285791336b40SDon Lewis return load_dn_aqm(aqm); 285891336b40SDon Lewis else if (cmd == MOD_UNLOAD) 285991336b40SDon Lewis return unload_dn_aqm(aqm); 286091336b40SDon Lewis else 286191336b40SDon Lewis return EINVAL; 286291336b40SDon Lewis } 286391336b40SDon Lewis #endif 286491336b40SDon Lewis 28653b3a8eb9SGleb Smirnoff /* end of file */ 2866