13b3a8eb9SGleb Smirnoff /*- 2fe267a55SPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 3fe267a55SPedro F. Giffuni * 491336b40SDon Lewis * Codel/FQ_Codel and PIE/FQ-PIE Code: 591336b40SDon Lewis * Copyright (C) 2016 Centre for Advanced Internet Architectures, 691336b40SDon Lewis * Swinburne University of Technology, Melbourne, Australia. 791336b40SDon Lewis * Portions of this code were made possible in part by a gift from 891336b40SDon Lewis * The Comcast Innovation Fund. 991336b40SDon Lewis * Implemented by Rasool Al-Saadi <ralsaadi@swin.edu.au> 1091336b40SDon Lewis * 113b3a8eb9SGleb Smirnoff * Copyright (c) 1998-2002,2010 Luigi Rizzo, Universita` di Pisa 123b3a8eb9SGleb Smirnoff * Portions Copyright (c) 2000 Akamba Corp. 133b3a8eb9SGleb Smirnoff * All rights reserved 143b3a8eb9SGleb Smirnoff * 153b3a8eb9SGleb Smirnoff * Redistribution and use in source and binary forms, with or without 163b3a8eb9SGleb Smirnoff * modification, are permitted provided that the following conditions 173b3a8eb9SGleb Smirnoff * are met: 183b3a8eb9SGleb Smirnoff * 1. Redistributions of source code must retain the above copyright 193b3a8eb9SGleb Smirnoff * notice, this list of conditions and the following disclaimer. 203b3a8eb9SGleb Smirnoff * 2. Redistributions in binary form must reproduce the above copyright 213b3a8eb9SGleb Smirnoff * notice, this list of conditions and the following disclaimer in the 223b3a8eb9SGleb Smirnoff * documentation and/or other materials provided with the distribution. 233b3a8eb9SGleb Smirnoff * 243b3a8eb9SGleb Smirnoff * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 253b3a8eb9SGleb Smirnoff * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 263b3a8eb9SGleb Smirnoff * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 273b3a8eb9SGleb Smirnoff * ARE DISCLAIMED. 
IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 283b3a8eb9SGleb Smirnoff * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 293b3a8eb9SGleb Smirnoff * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 303b3a8eb9SGleb Smirnoff * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 313b3a8eb9SGleb Smirnoff * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 323b3a8eb9SGleb Smirnoff * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 333b3a8eb9SGleb Smirnoff * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 343b3a8eb9SGleb Smirnoff * SUCH DAMAGE. 353b3a8eb9SGleb Smirnoff */ 363b3a8eb9SGleb Smirnoff 373b3a8eb9SGleb Smirnoff #include <sys/cdefs.h> 383b3a8eb9SGleb Smirnoff __FBSDID("$FreeBSD$"); 393b3a8eb9SGleb Smirnoff 403b3a8eb9SGleb Smirnoff /* 413b3a8eb9SGleb Smirnoff * Configuration and internal object management for dummynet. 423b3a8eb9SGleb Smirnoff */ 433b3a8eb9SGleb Smirnoff 443b3a8eb9SGleb Smirnoff #include "opt_inet6.h" 453b3a8eb9SGleb Smirnoff 463b3a8eb9SGleb Smirnoff #include <sys/param.h> 4751d73df1SKristof Provost #include <sys/ck.h> 483b3a8eb9SGleb Smirnoff #include <sys/systm.h> 493b3a8eb9SGleb Smirnoff #include <sys/malloc.h> 503b3a8eb9SGleb Smirnoff #include <sys/mbuf.h> 513b3a8eb9SGleb Smirnoff #include <sys/kernel.h> 523b3a8eb9SGleb Smirnoff #include <sys/lock.h> 533b3a8eb9SGleb Smirnoff #include <sys/module.h> 54eedc7fd9SGleb Smirnoff #include <sys/mutex.h> 553b3a8eb9SGleb Smirnoff #include <sys/priv.h> 563b3a8eb9SGleb Smirnoff #include <sys/proc.h> 573b3a8eb9SGleb Smirnoff #include <sys/rwlock.h> 583b3a8eb9SGleb Smirnoff #include <sys/socket.h> 593b3a8eb9SGleb Smirnoff #include <sys/socketvar.h> 603b3a8eb9SGleb Smirnoff #include <sys/time.h> 613b3a8eb9SGleb Smirnoff #include <sys/taskqueue.h> 623b3a8eb9SGleb Smirnoff #include <net/if.h> /* IFNAMSIZ, struct ifaddr, ifq head, lock.h mutex.h */ 633b3a8eb9SGleb 
Smirnoff #include <netinet/in.h> 643b3a8eb9SGleb Smirnoff #include <netinet/ip_var.h> /* ip_output(), IP_FORWARDING */ 653b3a8eb9SGleb Smirnoff #include <netinet/ip_fw.h> 663b3a8eb9SGleb Smirnoff #include <netinet/ip_dummynet.h> 67fe3bcfbdSTom Jones #include <net/vnet.h> 683b3a8eb9SGleb Smirnoff 693b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/ip_fw_private.h> 703b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/dn_heap.h> 713b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/ip_dn_private.h> 7291336b40SDon Lewis #ifdef NEW_AQM 7391336b40SDon Lewis #include <netpfil/ipfw/dn_aqm.h> 7491336b40SDon Lewis #endif 753b3a8eb9SGleb Smirnoff #include <netpfil/ipfw/dn_sched.h> 763b3a8eb9SGleb Smirnoff 773b3a8eb9SGleb Smirnoff /* which objects to copy */ 783b3a8eb9SGleb Smirnoff #define DN_C_LINK 0x01 793b3a8eb9SGleb Smirnoff #define DN_C_SCH 0x02 803b3a8eb9SGleb Smirnoff #define DN_C_FLOW 0x04 813b3a8eb9SGleb Smirnoff #define DN_C_FS 0x08 823b3a8eb9SGleb Smirnoff #define DN_C_QUEUE 0x10 833b3a8eb9SGleb Smirnoff 843b3a8eb9SGleb Smirnoff /* we use this argument in case of a schk_new */ 853b3a8eb9SGleb Smirnoff struct schk_new_arg { 863b3a8eb9SGleb Smirnoff struct dn_alg *fp; 873b3a8eb9SGleb Smirnoff struct dn_sch *sch; 883b3a8eb9SGleb Smirnoff }; 893b3a8eb9SGleb Smirnoff 903b3a8eb9SGleb Smirnoff /*---- callout hooks. 
----*/ 913b3a8eb9SGleb Smirnoff static struct callout dn_timeout; 92fe3bcfbdSTom Jones static int dn_tasks_started = 0; 93c8cfbc06SHans Petter Selasky static int dn_gone; 943b3a8eb9SGleb Smirnoff static struct task dn_task; 953b3a8eb9SGleb Smirnoff static struct taskqueue *dn_tq = NULL; 963b3a8eb9SGleb Smirnoff 97fe3bcfbdSTom Jones /* global scheduler list */ 9851d73df1SKristof Provost struct mtx sched_mtx; 9951d73df1SKristof Provost CK_LIST_HEAD(, dn_alg) schedlist; 100fe3bcfbdSTom Jones #ifdef NEW_AQM 10151d73df1SKristof Provost CK_LIST_HEAD(, dn_aqm) aqmlist; /* list of AQMs */ 102fe3bcfbdSTom Jones #endif 103fe3bcfbdSTom Jones 1043b3a8eb9SGleb Smirnoff static void 1053b3a8eb9SGleb Smirnoff dummynet(void *arg) 1063b3a8eb9SGleb Smirnoff { 1073b3a8eb9SGleb Smirnoff 1083b3a8eb9SGleb Smirnoff (void)arg; /* UNUSED */ 109cbc4d2dbSJohn Baldwin taskqueue_enqueue(dn_tq, &dn_task); 1103b3a8eb9SGleb Smirnoff } 1113b3a8eb9SGleb Smirnoff 1123b3a8eb9SGleb Smirnoff void 1133b3a8eb9SGleb Smirnoff dn_reschedule(void) 1143b3a8eb9SGleb Smirnoff { 1155f4fc3dbSAlexander Motin 116c8cfbc06SHans Petter Selasky if (dn_gone != 0) 117c8cfbc06SHans Petter Selasky return; 1185f4fc3dbSAlexander Motin callout_reset_sbt(&dn_timeout, tick_sbt, 0, dummynet, NULL, 1195f4fc3dbSAlexander Motin C_HARDCLOCK | C_DIRECT_EXEC); 1203b3a8eb9SGleb Smirnoff } 1213b3a8eb9SGleb Smirnoff /*----- end of callout hooks -----*/ 1223b3a8eb9SGleb Smirnoff 12391336b40SDon Lewis #ifdef NEW_AQM 12491336b40SDon Lewis /* Return AQM descriptor for given type or name. 
*/ 12591336b40SDon Lewis static struct dn_aqm * 12691336b40SDon Lewis find_aqm_type(int type, char *name) 12791336b40SDon Lewis { 12891336b40SDon Lewis struct dn_aqm *d; 12991336b40SDon Lewis 13051d73df1SKristof Provost NET_EPOCH_ASSERT(); 13151d73df1SKristof Provost 13251d73df1SKristof Provost CK_LIST_FOREACH(d, &aqmlist, next) { 13391336b40SDon Lewis if (d->type == type || (name && !strcasecmp(d->name, name))) 13491336b40SDon Lewis return d; 13591336b40SDon Lewis } 13691336b40SDon Lewis return NULL; /* not found */ 13791336b40SDon Lewis } 13891336b40SDon Lewis #endif 13991336b40SDon Lewis 1403b3a8eb9SGleb Smirnoff /* Return a scheduler descriptor given the type or name. */ 1413b3a8eb9SGleb Smirnoff static struct dn_alg * 1423b3a8eb9SGleb Smirnoff find_sched_type(int type, char *name) 1433b3a8eb9SGleb Smirnoff { 1443b3a8eb9SGleb Smirnoff struct dn_alg *d; 1453b3a8eb9SGleb Smirnoff 14651d73df1SKristof Provost NET_EPOCH_ASSERT(); 14751d73df1SKristof Provost 14851d73df1SKristof Provost CK_LIST_FOREACH(d, &schedlist, next) { 1493b3a8eb9SGleb Smirnoff if (d->type == type || (name && !strcasecmp(d->name, name))) 1503b3a8eb9SGleb Smirnoff return d; 1513b3a8eb9SGleb Smirnoff } 1523b3a8eb9SGleb Smirnoff return NULL; /* not found */ 1533b3a8eb9SGleb Smirnoff } 1543b3a8eb9SGleb Smirnoff 1553b3a8eb9SGleb Smirnoff int 1563b3a8eb9SGleb Smirnoff ipdn_bound_var(int *v, int dflt, int lo, int hi, const char *msg) 1573b3a8eb9SGleb Smirnoff { 1583b3a8eb9SGleb Smirnoff int oldv = *v; 1593b3a8eb9SGleb Smirnoff const char *op = NULL; 1603b3a8eb9SGleb Smirnoff if (dflt < lo) 1613b3a8eb9SGleb Smirnoff dflt = lo; 1623b3a8eb9SGleb Smirnoff if (dflt > hi) 1633b3a8eb9SGleb Smirnoff dflt = hi; 1643b3a8eb9SGleb Smirnoff if (oldv < lo) { 1653b3a8eb9SGleb Smirnoff *v = dflt; 1663b3a8eb9SGleb Smirnoff op = "Bump"; 1673b3a8eb9SGleb Smirnoff } else if (oldv > hi) { 1683b3a8eb9SGleb Smirnoff *v = hi; 1693b3a8eb9SGleb Smirnoff op = "Clamp"; 1703b3a8eb9SGleb Smirnoff } else 1713b3a8eb9SGleb Smirnoff 
return *v; 1723b3a8eb9SGleb Smirnoff if (op && msg) 1733b3a8eb9SGleb Smirnoff printf("%s %s to %d (was %d)\n", op, msg, *v, oldv); 1743b3a8eb9SGleb Smirnoff return *v; 1753b3a8eb9SGleb Smirnoff } 1763b3a8eb9SGleb Smirnoff 1773b3a8eb9SGleb Smirnoff /*---- flow_id mask, hash and compare functions ---*/ 1783b3a8eb9SGleb Smirnoff /* 1793b3a8eb9SGleb Smirnoff * The flow_id includes the 5-tuple, the queue/pipe number 1803b3a8eb9SGleb Smirnoff * which we store in the extra area in host order, 1813b3a8eb9SGleb Smirnoff * and for ipv6 also the flow_id6. 1823b3a8eb9SGleb Smirnoff * XXX see if we want the tos byte (can store in 'flags') 1833b3a8eb9SGleb Smirnoff */ 1843b3a8eb9SGleb Smirnoff static struct ipfw_flow_id * 1853b3a8eb9SGleb Smirnoff flow_id_mask(struct ipfw_flow_id *mask, struct ipfw_flow_id *id) 1863b3a8eb9SGleb Smirnoff { 1873b3a8eb9SGleb Smirnoff int is_v6 = IS_IP6_FLOW_ID(id); 1883b3a8eb9SGleb Smirnoff 1893b3a8eb9SGleb Smirnoff id->dst_port &= mask->dst_port; 1903b3a8eb9SGleb Smirnoff id->src_port &= mask->src_port; 1913b3a8eb9SGleb Smirnoff id->proto &= mask->proto; 1923b3a8eb9SGleb Smirnoff id->extra &= mask->extra; 1933b3a8eb9SGleb Smirnoff if (is_v6) { 1943b3a8eb9SGleb Smirnoff APPLY_MASK(&id->dst_ip6, &mask->dst_ip6); 1953b3a8eb9SGleb Smirnoff APPLY_MASK(&id->src_ip6, &mask->src_ip6); 1963b3a8eb9SGleb Smirnoff id->flow_id6 &= mask->flow_id6; 1973b3a8eb9SGleb Smirnoff } else { 1983b3a8eb9SGleb Smirnoff id->dst_ip &= mask->dst_ip; 1993b3a8eb9SGleb Smirnoff id->src_ip &= mask->src_ip; 2003b3a8eb9SGleb Smirnoff } 2013b3a8eb9SGleb Smirnoff return id; 2023b3a8eb9SGleb Smirnoff } 2033b3a8eb9SGleb Smirnoff 2043b3a8eb9SGleb Smirnoff /* computes an OR of two masks, result in dst and also returned */ 2053b3a8eb9SGleb Smirnoff static struct ipfw_flow_id * 2063b3a8eb9SGleb Smirnoff flow_id_or(struct ipfw_flow_id *src, struct ipfw_flow_id *dst) 2073b3a8eb9SGleb Smirnoff { 2083b3a8eb9SGleb Smirnoff int is_v6 = IS_IP6_FLOW_ID(dst); 2093b3a8eb9SGleb Smirnoff 
2103b3a8eb9SGleb Smirnoff dst->dst_port |= src->dst_port; 2113b3a8eb9SGleb Smirnoff dst->src_port |= src->src_port; 2123b3a8eb9SGleb Smirnoff dst->proto |= src->proto; 2133b3a8eb9SGleb Smirnoff dst->extra |= src->extra; 2143b3a8eb9SGleb Smirnoff if (is_v6) { 2153b3a8eb9SGleb Smirnoff #define OR_MASK(_d, _s) \ 2163b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[0] |= (_s)->__u6_addr.__u6_addr32[0]; \ 2173b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[1] |= (_s)->__u6_addr.__u6_addr32[1]; \ 2183b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[2] |= (_s)->__u6_addr.__u6_addr32[2]; \ 2193b3a8eb9SGleb Smirnoff (_d)->__u6_addr.__u6_addr32[3] |= (_s)->__u6_addr.__u6_addr32[3]; 2203b3a8eb9SGleb Smirnoff OR_MASK(&dst->dst_ip6, &src->dst_ip6); 2213b3a8eb9SGleb Smirnoff OR_MASK(&dst->src_ip6, &src->src_ip6); 2223b3a8eb9SGleb Smirnoff #undef OR_MASK 2233b3a8eb9SGleb Smirnoff dst->flow_id6 |= src->flow_id6; 2243b3a8eb9SGleb Smirnoff } else { 2253b3a8eb9SGleb Smirnoff dst->dst_ip |= src->dst_ip; 2263b3a8eb9SGleb Smirnoff dst->src_ip |= src->src_ip; 2273b3a8eb9SGleb Smirnoff } 2283b3a8eb9SGleb Smirnoff return dst; 2293b3a8eb9SGleb Smirnoff } 2303b3a8eb9SGleb Smirnoff 2313b3a8eb9SGleb Smirnoff static int 2323b3a8eb9SGleb Smirnoff nonzero_mask(struct ipfw_flow_id *m) 2333b3a8eb9SGleb Smirnoff { 2343b3a8eb9SGleb Smirnoff if (m->dst_port || m->src_port || m->proto || m->extra) 2353b3a8eb9SGleb Smirnoff return 1; 2363b3a8eb9SGleb Smirnoff if (IS_IP6_FLOW_ID(m)) { 2373b3a8eb9SGleb Smirnoff return 2383b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[0] || 2393b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[1] || 2403b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[2] || 2413b3a8eb9SGleb Smirnoff m->dst_ip6.__u6_addr.__u6_addr32[3] || 2423b3a8eb9SGleb Smirnoff m->src_ip6.__u6_addr.__u6_addr32[0] || 2433b3a8eb9SGleb Smirnoff m->src_ip6.__u6_addr.__u6_addr32[1] || 2443b3a8eb9SGleb Smirnoff m->src_ip6.__u6_addr.__u6_addr32[2] || 2453b3a8eb9SGleb Smirnoff 
m->src_ip6.__u6_addr.__u6_addr32[3] || 2463b3a8eb9SGleb Smirnoff m->flow_id6; 2473b3a8eb9SGleb Smirnoff } else { 2483b3a8eb9SGleb Smirnoff return m->dst_ip || m->src_ip; 2493b3a8eb9SGleb Smirnoff } 2503b3a8eb9SGleb Smirnoff } 2513b3a8eb9SGleb Smirnoff 2523b3a8eb9SGleb Smirnoff /* XXX we may want a better hash function */ 2533b3a8eb9SGleb Smirnoff static uint32_t 2543b3a8eb9SGleb Smirnoff flow_id_hash(struct ipfw_flow_id *id) 2553b3a8eb9SGleb Smirnoff { 2563b3a8eb9SGleb Smirnoff uint32_t i; 2573b3a8eb9SGleb Smirnoff 2583b3a8eb9SGleb Smirnoff if (IS_IP6_FLOW_ID(id)) { 2593b3a8eb9SGleb Smirnoff uint32_t *d = (uint32_t *)&id->dst_ip6; 2603b3a8eb9SGleb Smirnoff uint32_t *s = (uint32_t *)&id->src_ip6; 2613b3a8eb9SGleb Smirnoff i = (d[0] ) ^ (d[1]) ^ 2623b3a8eb9SGleb Smirnoff (d[2] ) ^ (d[3]) ^ 2633b3a8eb9SGleb Smirnoff (d[0] >> 15) ^ (d[1] >> 15) ^ 2643b3a8eb9SGleb Smirnoff (d[2] >> 15) ^ (d[3] >> 15) ^ 2653b3a8eb9SGleb Smirnoff (s[0] << 1) ^ (s[1] << 1) ^ 2663b3a8eb9SGleb Smirnoff (s[2] << 1) ^ (s[3] << 1) ^ 2673b3a8eb9SGleb Smirnoff (s[0] << 16) ^ (s[1] << 16) ^ 2683b3a8eb9SGleb Smirnoff (s[2] << 16) ^ (s[3] << 16) ^ 2693b3a8eb9SGleb Smirnoff (id->dst_port << 1) ^ (id->src_port) ^ 2703b3a8eb9SGleb Smirnoff (id->extra) ^ 2713b3a8eb9SGleb Smirnoff (id->proto ) ^ (id->flow_id6); 2723b3a8eb9SGleb Smirnoff } else { 2733b3a8eb9SGleb Smirnoff i = (id->dst_ip) ^ (id->dst_ip >> 15) ^ 2743b3a8eb9SGleb Smirnoff (id->src_ip << 1) ^ (id->src_ip >> 16) ^ 2753b3a8eb9SGleb Smirnoff (id->extra) ^ 2763b3a8eb9SGleb Smirnoff (id->dst_port << 1) ^ (id->src_port) ^ (id->proto); 2773b3a8eb9SGleb Smirnoff } 2783b3a8eb9SGleb Smirnoff return i; 2793b3a8eb9SGleb Smirnoff } 2803b3a8eb9SGleb Smirnoff 2813b3a8eb9SGleb Smirnoff /* Like bcmp, returns 0 if ids match, 1 otherwise. 
*/ 2823b3a8eb9SGleb Smirnoff static int 2833b3a8eb9SGleb Smirnoff flow_id_cmp(struct ipfw_flow_id *id1, struct ipfw_flow_id *id2) 2843b3a8eb9SGleb Smirnoff { 2853b3a8eb9SGleb Smirnoff int is_v6 = IS_IP6_FLOW_ID(id1); 2863b3a8eb9SGleb Smirnoff 2873b3a8eb9SGleb Smirnoff if (!is_v6) { 2883b3a8eb9SGleb Smirnoff if (IS_IP6_FLOW_ID(id2)) 2893b3a8eb9SGleb Smirnoff return 1; /* different address families */ 2903b3a8eb9SGleb Smirnoff 2913b3a8eb9SGleb Smirnoff return (id1->dst_ip == id2->dst_ip && 2923b3a8eb9SGleb Smirnoff id1->src_ip == id2->src_ip && 2933b3a8eb9SGleb Smirnoff id1->dst_port == id2->dst_port && 2943b3a8eb9SGleb Smirnoff id1->src_port == id2->src_port && 2953b3a8eb9SGleb Smirnoff id1->proto == id2->proto && 2963b3a8eb9SGleb Smirnoff id1->extra == id2->extra) ? 0 : 1; 2973b3a8eb9SGleb Smirnoff } 2983b3a8eb9SGleb Smirnoff /* the ipv6 case */ 2993b3a8eb9SGleb Smirnoff return ( 3003b3a8eb9SGleb Smirnoff !bcmp(&id1->dst_ip6,&id2->dst_ip6, sizeof(id1->dst_ip6)) && 3013b3a8eb9SGleb Smirnoff !bcmp(&id1->src_ip6,&id2->src_ip6, sizeof(id1->src_ip6)) && 3023b3a8eb9SGleb Smirnoff id1->dst_port == id2->dst_port && 3033b3a8eb9SGleb Smirnoff id1->src_port == id2->src_port && 3043b3a8eb9SGleb Smirnoff id1->proto == id2->proto && 3053b3a8eb9SGleb Smirnoff id1->extra == id2->extra && 3063b3a8eb9SGleb Smirnoff id1->flow_id6 == id2->flow_id6) ? 0 : 1; 3073b3a8eb9SGleb Smirnoff } 3083b3a8eb9SGleb Smirnoff /*--------- end of flow-id mask, hash and compare ---------*/ 3093b3a8eb9SGleb Smirnoff 3103b3a8eb9SGleb Smirnoff /*--- support functions for the qht hashtable ---- 3113b3a8eb9SGleb Smirnoff * Entries are hashed by flow-id 3123b3a8eb9SGleb Smirnoff */ 3133b3a8eb9SGleb Smirnoff static uint32_t 3143b3a8eb9SGleb Smirnoff q_hash(uintptr_t key, int flags, void *arg) 3153b3a8eb9SGleb Smirnoff { 3163b3a8eb9SGleb Smirnoff /* compute the hash slot from the flow id */ 3173b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id = (flags & DNHT_KEY_IS_OBJ) ? 
3183b3a8eb9SGleb Smirnoff &((struct dn_queue *)key)->ni.fid : 3193b3a8eb9SGleb Smirnoff (struct ipfw_flow_id *)key; 3203b3a8eb9SGleb Smirnoff 3213b3a8eb9SGleb Smirnoff return flow_id_hash(id); 3223b3a8eb9SGleb Smirnoff } 3233b3a8eb9SGleb Smirnoff 3243b3a8eb9SGleb Smirnoff static int 3253b3a8eb9SGleb Smirnoff q_match(void *obj, uintptr_t key, int flags, void *arg) 3263b3a8eb9SGleb Smirnoff { 3273b3a8eb9SGleb Smirnoff struct dn_queue *o = (struct dn_queue *)obj; 3283b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id2; 3293b3a8eb9SGleb Smirnoff 3303b3a8eb9SGleb Smirnoff if (flags & DNHT_KEY_IS_OBJ) { 3313b3a8eb9SGleb Smirnoff /* compare pointers */ 3323b3a8eb9SGleb Smirnoff id2 = &((struct dn_queue *)key)->ni.fid; 3333b3a8eb9SGleb Smirnoff } else { 3343b3a8eb9SGleb Smirnoff id2 = (struct ipfw_flow_id *)key; 3353b3a8eb9SGleb Smirnoff } 3363b3a8eb9SGleb Smirnoff return (0 == flow_id_cmp(&o->ni.fid, id2)); 3373b3a8eb9SGleb Smirnoff } 3383b3a8eb9SGleb Smirnoff 3393b3a8eb9SGleb Smirnoff /* 3403b3a8eb9SGleb Smirnoff * create a new queue instance for the given 'key'. 
3413b3a8eb9SGleb Smirnoff */ 3423b3a8eb9SGleb Smirnoff static void * 3433b3a8eb9SGleb Smirnoff q_new(uintptr_t key, int flags, void *arg) 3443b3a8eb9SGleb Smirnoff { 3453b3a8eb9SGleb Smirnoff struct dn_queue *q, *template = arg; 3463b3a8eb9SGleb Smirnoff struct dn_fsk *fs = template->fs; 3473b3a8eb9SGleb Smirnoff int size = sizeof(*q) + fs->sched->fp->q_datalen; 3483b3a8eb9SGleb Smirnoff 3493b3a8eb9SGleb Smirnoff q = malloc(size, M_DUMMYNET, M_NOWAIT | M_ZERO); 3503b3a8eb9SGleb Smirnoff if (q == NULL) { 3513b3a8eb9SGleb Smirnoff D("no memory for new queue"); 3523b3a8eb9SGleb Smirnoff return NULL; 3533b3a8eb9SGleb Smirnoff } 3543b3a8eb9SGleb Smirnoff 3553b3a8eb9SGleb Smirnoff set_oid(&q->ni.oid, DN_QUEUE, size); 3563b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) 3573b3a8eb9SGleb Smirnoff q->ni.fid = *(struct ipfw_flow_id *)key; 3583b3a8eb9SGleb Smirnoff q->fs = fs; 3593b3a8eb9SGleb Smirnoff q->_si = template->_si; 3603b3a8eb9SGleb Smirnoff q->_si->q_count++; 3613b3a8eb9SGleb Smirnoff 3623b3a8eb9SGleb Smirnoff if (fs->sched->fp->new_queue) 3633b3a8eb9SGleb Smirnoff fs->sched->fp->new_queue(q); 36491336b40SDon Lewis 36591336b40SDon Lewis #ifdef NEW_AQM 36691336b40SDon Lewis /* call AQM init function after creating a queue*/ 36791336b40SDon Lewis if (fs->aqmfp && fs->aqmfp->init) 36891336b40SDon Lewis if(fs->aqmfp->init(q)) 36991336b40SDon Lewis D("unable to init AQM for fs %d", fs->fs.fs_nr); 37091336b40SDon Lewis #endif 371fe3bcfbdSTom Jones V_dn_cfg.queue_count++; 37291336b40SDon Lewis 3733b3a8eb9SGleb Smirnoff return q; 3743b3a8eb9SGleb Smirnoff } 3753b3a8eb9SGleb Smirnoff 3763b3a8eb9SGleb Smirnoff /* 3773b3a8eb9SGleb Smirnoff * Notify schedulers that a queue is going away. 3783b3a8eb9SGleb Smirnoff * If (flags & DN_DESTROY), also free the packets. 3793b3a8eb9SGleb Smirnoff * The version for callbacks is called q_delete_cb(). 
3803b3a8eb9SGleb Smirnoff */ 3813b3a8eb9SGleb Smirnoff static void 3823b3a8eb9SGleb Smirnoff dn_delete_queue(struct dn_queue *q, int flags) 3833b3a8eb9SGleb Smirnoff { 3843b3a8eb9SGleb Smirnoff struct dn_fsk *fs = q->fs; 3853b3a8eb9SGleb Smirnoff 38691336b40SDon Lewis #ifdef NEW_AQM 38791336b40SDon Lewis /* clean up AQM status for queue 'q' 38891336b40SDon Lewis * cleanup here is called just with MULTIQUEUE 38991336b40SDon Lewis */ 39091336b40SDon Lewis if (fs && fs->aqmfp && fs->aqmfp->cleanup) 39191336b40SDon Lewis fs->aqmfp->cleanup(q); 39291336b40SDon Lewis #endif 3933b3a8eb9SGleb Smirnoff // D("fs %p si %p\n", fs, q->_si); 3943b3a8eb9SGleb Smirnoff /* notify the parent scheduler that the queue is going away */ 3953b3a8eb9SGleb Smirnoff if (fs && fs->sched->fp->free_queue) 3963b3a8eb9SGleb Smirnoff fs->sched->fp->free_queue(q); 3973b3a8eb9SGleb Smirnoff q->_si->q_count--; 3983b3a8eb9SGleb Smirnoff q->_si = NULL; 3993b3a8eb9SGleb Smirnoff if (flags & DN_DESTROY) { 4003b3a8eb9SGleb Smirnoff if (q->mq.head) 4013b3a8eb9SGleb Smirnoff dn_free_pkts(q->mq.head); 4023b3a8eb9SGleb Smirnoff bzero(q, sizeof(*q)); // safety 4033b3a8eb9SGleb Smirnoff free(q, M_DUMMYNET); 404fe3bcfbdSTom Jones V_dn_cfg.queue_count--; 4053b3a8eb9SGleb Smirnoff } 4063b3a8eb9SGleb Smirnoff } 4073b3a8eb9SGleb Smirnoff 4083b3a8eb9SGleb Smirnoff static int 4093b3a8eb9SGleb Smirnoff q_delete_cb(void *q, void *arg) 4103b3a8eb9SGleb Smirnoff { 4113b3a8eb9SGleb Smirnoff int flags = (int)(uintptr_t)arg; 4123b3a8eb9SGleb Smirnoff dn_delete_queue(q, flags); 4133b3a8eb9SGleb Smirnoff return (flags & DN_DESTROY) ? DNHT_SCAN_DEL : 0; 4143b3a8eb9SGleb Smirnoff } 4153b3a8eb9SGleb Smirnoff 4163b3a8eb9SGleb Smirnoff /* 4173b3a8eb9SGleb Smirnoff * calls dn_delete_queue/q_delete_cb on all queues, 4183b3a8eb9SGleb Smirnoff * which notifies the parent scheduler and possibly drains packets. 
4193b3a8eb9SGleb Smirnoff * flags & DN_DESTROY: drains queues and destroy qht; 4203b3a8eb9SGleb Smirnoff */ 4213b3a8eb9SGleb Smirnoff static void 4223b3a8eb9SGleb Smirnoff qht_delete(struct dn_fsk *fs, int flags) 4233b3a8eb9SGleb Smirnoff { 4243b3a8eb9SGleb Smirnoff ND("fs %d start flags %d qht %p", 4253b3a8eb9SGleb Smirnoff fs->fs.fs_nr, flags, fs->qht); 4263b3a8eb9SGleb Smirnoff if (!fs->qht) 4273b3a8eb9SGleb Smirnoff return; 4283b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) { 4293b3a8eb9SGleb Smirnoff dn_ht_scan(fs->qht, q_delete_cb, (void *)(uintptr_t)flags); 4303b3a8eb9SGleb Smirnoff if (flags & DN_DESTROY) { 4313b3a8eb9SGleb Smirnoff dn_ht_free(fs->qht, 0); 4323b3a8eb9SGleb Smirnoff fs->qht = NULL; 4333b3a8eb9SGleb Smirnoff } 4343b3a8eb9SGleb Smirnoff } else { 4353b3a8eb9SGleb Smirnoff dn_delete_queue((struct dn_queue *)(fs->qht), flags); 4363b3a8eb9SGleb Smirnoff if (flags & DN_DESTROY) 4373b3a8eb9SGleb Smirnoff fs->qht = NULL; 4383b3a8eb9SGleb Smirnoff } 4393b3a8eb9SGleb Smirnoff } 4403b3a8eb9SGleb Smirnoff 4413b3a8eb9SGleb Smirnoff /* 4423b3a8eb9SGleb Smirnoff * Find and possibly create the queue for a MULTIQUEUE scheduler. 4433b3a8eb9SGleb Smirnoff * We never call it for !MULTIQUEUE (the queue is in the sch_inst). 
4443b3a8eb9SGleb Smirnoff */ 4453b3a8eb9SGleb Smirnoff struct dn_queue * 4463b3a8eb9SGleb Smirnoff ipdn_q_find(struct dn_fsk *fs, struct dn_sch_inst *si, 4473b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id) 4483b3a8eb9SGleb Smirnoff { 4493b3a8eb9SGleb Smirnoff struct dn_queue template; 4503b3a8eb9SGleb Smirnoff 4513b3a8eb9SGleb Smirnoff template._si = si; 4523b3a8eb9SGleb Smirnoff template.fs = fs; 4533b3a8eb9SGleb Smirnoff 4543b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) { 4553b3a8eb9SGleb Smirnoff struct ipfw_flow_id masked_id; 4563b3a8eb9SGleb Smirnoff if (fs->qht == NULL) { 4573b3a8eb9SGleb Smirnoff fs->qht = dn_ht_init(NULL, fs->fs.buckets, 4583b3a8eb9SGleb Smirnoff offsetof(struct dn_queue, q_next), 4593b3a8eb9SGleb Smirnoff q_hash, q_match, q_new); 4603b3a8eb9SGleb Smirnoff if (fs->qht == NULL) 4613b3a8eb9SGleb Smirnoff return NULL; 4623b3a8eb9SGleb Smirnoff } 4633b3a8eb9SGleb Smirnoff masked_id = *id; 4643b3a8eb9SGleb Smirnoff flow_id_mask(&fs->fsk_mask, &masked_id); 4653b3a8eb9SGleb Smirnoff return dn_ht_find(fs->qht, (uintptr_t)&masked_id, 4663b3a8eb9SGleb Smirnoff DNHT_INSERT, &template); 4673b3a8eb9SGleb Smirnoff } else { 4683b3a8eb9SGleb Smirnoff if (fs->qht == NULL) 4693b3a8eb9SGleb Smirnoff fs->qht = q_new(0, 0, &template); 4703b3a8eb9SGleb Smirnoff return (struct dn_queue *)fs->qht; 4713b3a8eb9SGleb Smirnoff } 4723b3a8eb9SGleb Smirnoff } 4733b3a8eb9SGleb Smirnoff /*--- end of queue hash table ---*/ 4743b3a8eb9SGleb Smirnoff 4753b3a8eb9SGleb Smirnoff /*--- support functions for the sch_inst hashtable ---- 4763b3a8eb9SGleb Smirnoff * 4773b3a8eb9SGleb Smirnoff * These are hashed by flow-id 4783b3a8eb9SGleb Smirnoff */ 4793b3a8eb9SGleb Smirnoff static uint32_t 4803b3a8eb9SGleb Smirnoff si_hash(uintptr_t key, int flags, void *arg) 4813b3a8eb9SGleb Smirnoff { 4823b3a8eb9SGleb Smirnoff /* compute the hash slot from the flow id */ 4833b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id = (flags & DNHT_KEY_IS_OBJ) ? 
4843b3a8eb9SGleb Smirnoff &((struct dn_sch_inst *)key)->ni.fid : 4853b3a8eb9SGleb Smirnoff (struct ipfw_flow_id *)key; 4863b3a8eb9SGleb Smirnoff 4873b3a8eb9SGleb Smirnoff return flow_id_hash(id); 4883b3a8eb9SGleb Smirnoff } 4893b3a8eb9SGleb Smirnoff 4903b3a8eb9SGleb Smirnoff static int 4913b3a8eb9SGleb Smirnoff si_match(void *obj, uintptr_t key, int flags, void *arg) 4923b3a8eb9SGleb Smirnoff { 4933b3a8eb9SGleb Smirnoff struct dn_sch_inst *o = obj; 4943b3a8eb9SGleb Smirnoff struct ipfw_flow_id *id2; 4953b3a8eb9SGleb Smirnoff 4963b3a8eb9SGleb Smirnoff id2 = (flags & DNHT_KEY_IS_OBJ) ? 4973b3a8eb9SGleb Smirnoff &((struct dn_sch_inst *)key)->ni.fid : 4983b3a8eb9SGleb Smirnoff (struct ipfw_flow_id *)key; 4993b3a8eb9SGleb Smirnoff return flow_id_cmp(&o->ni.fid, id2) == 0; 5003b3a8eb9SGleb Smirnoff } 5013b3a8eb9SGleb Smirnoff 5023b3a8eb9SGleb Smirnoff /* 5033b3a8eb9SGleb Smirnoff * create a new instance for the given 'key' 5043b3a8eb9SGleb Smirnoff * Allocate memory for instance, delay line and scheduler private data. 5053b3a8eb9SGleb Smirnoff */ 5063b3a8eb9SGleb Smirnoff static void * 5073b3a8eb9SGleb Smirnoff si_new(uintptr_t key, int flags, void *arg) 5083b3a8eb9SGleb Smirnoff { 5093b3a8eb9SGleb Smirnoff struct dn_schk *s = arg; 5103b3a8eb9SGleb Smirnoff struct dn_sch_inst *si; 5113b3a8eb9SGleb Smirnoff int l = sizeof(*si) + s->fp->si_datalen; 5123b3a8eb9SGleb Smirnoff 5133b3a8eb9SGleb Smirnoff si = malloc(l, M_DUMMYNET, M_NOWAIT | M_ZERO); 5143b3a8eb9SGleb Smirnoff if (si == NULL) 5153b3a8eb9SGleb Smirnoff goto error; 5163b3a8eb9SGleb Smirnoff 5173b3a8eb9SGleb Smirnoff /* Set length only for the part passed up to userland. 
*/ 5183b3a8eb9SGleb Smirnoff set_oid(&si->ni.oid, DN_SCH_I, sizeof(struct dn_flow)); 5193b3a8eb9SGleb Smirnoff set_oid(&(si->dline.oid), DN_DELAY_LINE, 5203b3a8eb9SGleb Smirnoff sizeof(struct delay_line)); 5213b3a8eb9SGleb Smirnoff /* mark si and dline as outside the event queue */ 5223b3a8eb9SGleb Smirnoff si->ni.oid.id = si->dline.oid.id = -1; 5233b3a8eb9SGleb Smirnoff 5243b3a8eb9SGleb Smirnoff si->sched = s; 5253b3a8eb9SGleb Smirnoff si->dline.si = si; 5263b3a8eb9SGleb Smirnoff 5273b3a8eb9SGleb Smirnoff if (s->fp->new_sched && s->fp->new_sched(si)) { 5283b3a8eb9SGleb Smirnoff D("new_sched error"); 5293b3a8eb9SGleb Smirnoff goto error; 5303b3a8eb9SGleb Smirnoff } 5313b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) 5323b3a8eb9SGleb Smirnoff si->ni.fid = *(struct ipfw_flow_id *)key; 5333b3a8eb9SGleb Smirnoff 53491336b40SDon Lewis #ifdef NEW_AQM 53591336b40SDon Lewis /* init AQM status for !DN_MULTIQUEUE sched*/ 53691336b40SDon Lewis if (!(s->fp->flags & DN_MULTIQUEUE)) 53791336b40SDon Lewis if (s->fs->aqmfp && s->fs->aqmfp->init) 53891336b40SDon Lewis if(s->fs->aqmfp->init((struct dn_queue *)(si + 1))) { 53991336b40SDon Lewis D("unable to init AQM for fs %d", s->fs->fs.fs_nr); 54091336b40SDon Lewis goto error; 54191336b40SDon Lewis } 54291336b40SDon Lewis #endif 54391336b40SDon Lewis 544fe3bcfbdSTom Jones V_dn_cfg.si_count++; 5453b3a8eb9SGleb Smirnoff return si; 5463b3a8eb9SGleb Smirnoff 5473b3a8eb9SGleb Smirnoff error: 5483b3a8eb9SGleb Smirnoff if (si) { 5493b3a8eb9SGleb Smirnoff bzero(si, sizeof(*si)); // safety 5503b3a8eb9SGleb Smirnoff free(si, M_DUMMYNET); 5513b3a8eb9SGleb Smirnoff } 5523b3a8eb9SGleb Smirnoff return NULL; 5533b3a8eb9SGleb Smirnoff } 5543b3a8eb9SGleb Smirnoff 5553b3a8eb9SGleb Smirnoff /* 5563b3a8eb9SGleb Smirnoff * Callback from siht to delete all scheduler instances. Remove 5573b3a8eb9SGleb Smirnoff * si and delay line from the system heap, destroy all queues. 
5583b3a8eb9SGleb Smirnoff * We assume that all flowset have been notified and do not 5593b3a8eb9SGleb Smirnoff * point to us anymore. 5603b3a8eb9SGleb Smirnoff */ 5613b3a8eb9SGleb Smirnoff static int 5623b3a8eb9SGleb Smirnoff si_destroy(void *_si, void *arg) 5633b3a8eb9SGleb Smirnoff { 5643b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = _si; 5653b3a8eb9SGleb Smirnoff struct dn_schk *s = si->sched; 5663b3a8eb9SGleb Smirnoff struct delay_line *dl = &si->dline; 5673b3a8eb9SGleb Smirnoff 5683b3a8eb9SGleb Smirnoff if (dl->oid.subtype) /* remove delay line from event heap */ 569fe3bcfbdSTom Jones heap_extract(&V_dn_cfg.evheap, dl); 5703b3a8eb9SGleb Smirnoff dn_free_pkts(dl->mq.head); /* drain delay line */ 5713b3a8eb9SGleb Smirnoff if (si->kflags & DN_ACTIVE) /* remove si from event heap */ 572fe3bcfbdSTom Jones heap_extract(&V_dn_cfg.evheap, si); 57391336b40SDon Lewis 57491336b40SDon Lewis #ifdef NEW_AQM 57591336b40SDon Lewis /* clean up AQM status for !DN_MULTIQUEUE sched 57691336b40SDon Lewis * Note that all queues belong to fs were cleaned up in fsk_detach. 57791336b40SDon Lewis * When drain_scheduler is called s->fs and q->fs are pointing 57891336b40SDon Lewis * to a correct fs, so we can use fs in this case. 
57991336b40SDon Lewis */ 58091336b40SDon Lewis if (!(s->fp->flags & DN_MULTIQUEUE)) { 58191336b40SDon Lewis struct dn_queue *q = (struct dn_queue *)(si + 1); 58291336b40SDon Lewis if (q->aqm_status && q->fs->aqmfp) 58391336b40SDon Lewis if (q->fs->aqmfp->cleanup) 58491336b40SDon Lewis q->fs->aqmfp->cleanup(q); 58591336b40SDon Lewis } 58691336b40SDon Lewis #endif 5873b3a8eb9SGleb Smirnoff if (s->fp->free_sched) 5883b3a8eb9SGleb Smirnoff s->fp->free_sched(si); 5893b3a8eb9SGleb Smirnoff bzero(si, sizeof(*si)); /* safety */ 5903b3a8eb9SGleb Smirnoff free(si, M_DUMMYNET); 591fe3bcfbdSTom Jones V_dn_cfg.si_count--; 5923b3a8eb9SGleb Smirnoff return DNHT_SCAN_DEL; 5933b3a8eb9SGleb Smirnoff } 5943b3a8eb9SGleb Smirnoff 5953b3a8eb9SGleb Smirnoff /* 5963b3a8eb9SGleb Smirnoff * Find the scheduler instance for this packet. If we need to apply 5973b3a8eb9SGleb Smirnoff * a mask, do on a local copy of the flow_id to preserve the original. 5983b3a8eb9SGleb Smirnoff * Assume siht is always initialized if we have a mask. 
5993b3a8eb9SGleb Smirnoff */ 6003b3a8eb9SGleb Smirnoff struct dn_sch_inst * 6013b3a8eb9SGleb Smirnoff ipdn_si_find(struct dn_schk *s, struct ipfw_flow_id *id) 6023b3a8eb9SGleb Smirnoff { 6033b3a8eb9SGleb Smirnoff 6043b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 6053b3a8eb9SGleb Smirnoff struct ipfw_flow_id id_t = *id; 6063b3a8eb9SGleb Smirnoff flow_id_mask(&s->sch.sched_mask, &id_t); 6073b3a8eb9SGleb Smirnoff return dn_ht_find(s->siht, (uintptr_t)&id_t, 6083b3a8eb9SGleb Smirnoff DNHT_INSERT, s); 6093b3a8eb9SGleb Smirnoff } 6103b3a8eb9SGleb Smirnoff if (!s->siht) 6113b3a8eb9SGleb Smirnoff s->siht = si_new(0, 0, s); 6123b3a8eb9SGleb Smirnoff return (struct dn_sch_inst *)s->siht; 6133b3a8eb9SGleb Smirnoff } 6143b3a8eb9SGleb Smirnoff 6153b3a8eb9SGleb Smirnoff /* callback to flush credit for the scheduler instance */ 6163b3a8eb9SGleb Smirnoff static int 6173b3a8eb9SGleb Smirnoff si_reset_credit(void *_si, void *arg) 6183b3a8eb9SGleb Smirnoff { 6193b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = _si; 6203b3a8eb9SGleb Smirnoff struct dn_link *p = &si->sched->link; 6213b3a8eb9SGleb Smirnoff 622fe3bcfbdSTom Jones si->credit = p->burst + (V_dn_cfg.io_fast ? p->bandwidth : 0); 6233b3a8eb9SGleb Smirnoff return 0; 6243b3a8eb9SGleb Smirnoff } 6253b3a8eb9SGleb Smirnoff 6263b3a8eb9SGleb Smirnoff static void 6273b3a8eb9SGleb Smirnoff schk_reset_credit(struct dn_schk *s) 6283b3a8eb9SGleb Smirnoff { 6293b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) 6303b3a8eb9SGleb Smirnoff dn_ht_scan(s->siht, si_reset_credit, NULL); 6313b3a8eb9SGleb Smirnoff else if (s->siht) 6323b3a8eb9SGleb Smirnoff si_reset_credit(s->siht, NULL); 6333b3a8eb9SGleb Smirnoff } 6343b3a8eb9SGleb Smirnoff /*---- end of sch_inst hashtable ---------------------*/ 6353b3a8eb9SGleb Smirnoff 6363b3a8eb9SGleb Smirnoff /*------------------------------------------------------- 6373b3a8eb9SGleb Smirnoff * flowset hash (fshash) support. Entries are hashed by fs_nr. 
6383b3a8eb9SGleb Smirnoff * New allocations are put in the fsunlinked list, from which 6393b3a8eb9SGleb Smirnoff * they are removed when they point to a specific scheduler. 6403b3a8eb9SGleb Smirnoff */ 6413b3a8eb9SGleb Smirnoff static uint32_t 6423b3a8eb9SGleb Smirnoff fsk_hash(uintptr_t key, int flags, void *arg) 6433b3a8eb9SGleb Smirnoff { 6443b3a8eb9SGleb Smirnoff uint32_t i = !(flags & DNHT_KEY_IS_OBJ) ? key : 6453b3a8eb9SGleb Smirnoff ((struct dn_fsk *)key)->fs.fs_nr; 6463b3a8eb9SGleb Smirnoff 6473b3a8eb9SGleb Smirnoff return ( (i>>8)^(i>>4)^i ); 6483b3a8eb9SGleb Smirnoff } 6493b3a8eb9SGleb Smirnoff 6503b3a8eb9SGleb Smirnoff static int 6513b3a8eb9SGleb Smirnoff fsk_match(void *obj, uintptr_t key, int flags, void *arg) 6523b3a8eb9SGleb Smirnoff { 6533b3a8eb9SGleb Smirnoff struct dn_fsk *fs = obj; 6543b3a8eb9SGleb Smirnoff int i = !(flags & DNHT_KEY_IS_OBJ) ? key : 6553b3a8eb9SGleb Smirnoff ((struct dn_fsk *)key)->fs.fs_nr; 6563b3a8eb9SGleb Smirnoff 6573b3a8eb9SGleb Smirnoff return (fs->fs.fs_nr == i); 6583b3a8eb9SGleb Smirnoff } 6593b3a8eb9SGleb Smirnoff 6603b3a8eb9SGleb Smirnoff static void * 6613b3a8eb9SGleb Smirnoff fsk_new(uintptr_t key, int flags, void *arg) 6623b3a8eb9SGleb Smirnoff { 6633b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 6643b3a8eb9SGleb Smirnoff 6653b3a8eb9SGleb Smirnoff fs = malloc(sizeof(*fs), M_DUMMYNET, M_NOWAIT | M_ZERO); 6663b3a8eb9SGleb Smirnoff if (fs) { 6673b3a8eb9SGleb Smirnoff set_oid(&fs->fs.oid, DN_FS, sizeof(fs->fs)); 668fe3bcfbdSTom Jones V_dn_cfg.fsk_count++; 6693b3a8eb9SGleb Smirnoff fs->drain_bucket = 0; 670fe3bcfbdSTom Jones SLIST_INSERT_HEAD(&V_dn_cfg.fsu, fs, sch_chain); 6713b3a8eb9SGleb Smirnoff } 6723b3a8eb9SGleb Smirnoff return fs; 6733b3a8eb9SGleb Smirnoff } 6743b3a8eb9SGleb Smirnoff 67591336b40SDon Lewis #ifdef NEW_AQM 67691336b40SDon Lewis /* callback function for cleaning up AQM queue status belongs to a flowset 67791336b40SDon Lewis * connected to scheduler instance '_si' (for !DN_MULTIQUEUE only). 
67891336b40SDon Lewis */ 67991336b40SDon Lewis static int 68091336b40SDon Lewis si_cleanup_q(void *_si, void *arg) 68191336b40SDon Lewis { 68291336b40SDon Lewis struct dn_sch_inst *si = _si; 68391336b40SDon Lewis 68491336b40SDon Lewis if (!(si->sched->fp->flags & DN_MULTIQUEUE)) { 68591336b40SDon Lewis if (si->sched->fs->aqmfp && si->sched->fs->aqmfp->cleanup) 68691336b40SDon Lewis si->sched->fs->aqmfp->cleanup((struct dn_queue *) (si+1)); 68791336b40SDon Lewis } 68891336b40SDon Lewis return 0; 68991336b40SDon Lewis } 69091336b40SDon Lewis 69191336b40SDon Lewis /* callback to clean up queue AQM status.*/ 69291336b40SDon Lewis static int 69391336b40SDon Lewis q_cleanup_q(void *_q, void *arg) 69491336b40SDon Lewis { 69591336b40SDon Lewis struct dn_queue *q = _q; 69691336b40SDon Lewis q->fs->aqmfp->cleanup(q); 69791336b40SDon Lewis return 0; 69891336b40SDon Lewis } 69991336b40SDon Lewis 70091336b40SDon Lewis /* Clean up all AQM queues status belongs to flowset 'fs' and then 70191336b40SDon Lewis * deconfig AQM for flowset 'fs' 70291336b40SDon Lewis */ 70391336b40SDon Lewis static void 70491336b40SDon Lewis aqm_cleanup_deconfig_fs(struct dn_fsk *fs) 70591336b40SDon Lewis { 70691336b40SDon Lewis struct dn_sch_inst *si; 70791336b40SDon Lewis 70891336b40SDon Lewis /* clean up AQM status for all queues for !DN_MULTIQUEUE sched*/ 70991336b40SDon Lewis if (fs->fs.fs_nr > DN_MAX_ID) { 71091336b40SDon Lewis if (fs->sched && !(fs->sched->fp->flags & DN_MULTIQUEUE)) { 71191336b40SDon Lewis if (fs->sched->sch.flags & DN_HAVE_MASK) 71291336b40SDon Lewis dn_ht_scan(fs->sched->siht, si_cleanup_q, NULL); 71391336b40SDon Lewis else { 71491336b40SDon Lewis /* single si i.e. 
no sched mask */ 71591336b40SDon Lewis si = (struct dn_sch_inst *) fs->sched->siht; 71691336b40SDon Lewis if (si && fs->aqmfp && fs->aqmfp->cleanup) 71791336b40SDon Lewis fs->aqmfp->cleanup((struct dn_queue *) (si+1)); 71891336b40SDon Lewis } 71991336b40SDon Lewis } 72091336b40SDon Lewis } 72191336b40SDon Lewis 72291336b40SDon Lewis /* clean up AQM status for all queues for DN_MULTIQUEUE sched*/ 72391336b40SDon Lewis if (fs->sched && fs->sched->fp->flags & DN_MULTIQUEUE && fs->qht) { 72491336b40SDon Lewis if (fs->fs.flags & DN_QHT_HASH) 72591336b40SDon Lewis dn_ht_scan(fs->qht, q_cleanup_q, NULL); 72691336b40SDon Lewis else 72791336b40SDon Lewis fs->aqmfp->cleanup((struct dn_queue *)(fs->qht)); 72891336b40SDon Lewis } 72991336b40SDon Lewis 73091336b40SDon Lewis /* deconfig AQM */ 73191336b40SDon Lewis if(fs->aqmcfg && fs->aqmfp && fs->aqmfp->deconfig) 73291336b40SDon Lewis fs->aqmfp->deconfig(fs); 73391336b40SDon Lewis } 73491336b40SDon Lewis #endif 73591336b40SDon Lewis 7363b3a8eb9SGleb Smirnoff /* 7373b3a8eb9SGleb Smirnoff * detach flowset from its current scheduler. Flags as follows: 7383b3a8eb9SGleb Smirnoff * DN_DETACH removes from the fsk_list 7393b3a8eb9SGleb Smirnoff * DN_DESTROY deletes individual queues 7403b3a8eb9SGleb Smirnoff * DN_DELETE_FS destroys the flowset (otherwise goes in unlinked). 7413b3a8eb9SGleb Smirnoff */ 7423b3a8eb9SGleb Smirnoff static void 7433b3a8eb9SGleb Smirnoff fsk_detach(struct dn_fsk *fs, int flags) 7443b3a8eb9SGleb Smirnoff { 7453b3a8eb9SGleb Smirnoff if (flags & DN_DELETE_FS) 7463b3a8eb9SGleb Smirnoff flags |= DN_DESTROY; 7473b3a8eb9SGleb Smirnoff ND("fs %d from sched %d flags %s %s %s", 7483b3a8eb9SGleb Smirnoff fs->fs.fs_nr, fs->fs.sched_nr, 7493b3a8eb9SGleb Smirnoff (flags & DN_DELETE_FS) ? "DEL_FS":"", 7503b3a8eb9SGleb Smirnoff (flags & DN_DESTROY) ? "DEL":"", 7513b3a8eb9SGleb Smirnoff (flags & DN_DETACH) ? 
"DET":""); 7523b3a8eb9SGleb Smirnoff if (flags & DN_DETACH) { /* detach from the list */ 7533b3a8eb9SGleb Smirnoff struct dn_fsk_head *h; 754fe3bcfbdSTom Jones h = fs->sched ? &fs->sched->fsk_list : &V_dn_cfg.fsu; 7553b3a8eb9SGleb Smirnoff SLIST_REMOVE(h, fs, dn_fsk, sch_chain); 7563b3a8eb9SGleb Smirnoff } 7573b3a8eb9SGleb Smirnoff /* Free the RED parameters, they will be recomputed on 7583b3a8eb9SGleb Smirnoff * subsequent attach if needed. 7593b3a8eb9SGleb Smirnoff */ 7603b3a8eb9SGleb Smirnoff free(fs->w_q_lookup, M_DUMMYNET); 7613b3a8eb9SGleb Smirnoff fs->w_q_lookup = NULL; 7623b3a8eb9SGleb Smirnoff qht_delete(fs, flags); 76391336b40SDon Lewis #ifdef NEW_AQM 76491336b40SDon Lewis aqm_cleanup_deconfig_fs(fs); 76591336b40SDon Lewis #endif 76691336b40SDon Lewis 7673b3a8eb9SGleb Smirnoff if (fs->sched && fs->sched->fp->free_fsk) 7683b3a8eb9SGleb Smirnoff fs->sched->fp->free_fsk(fs); 7693b3a8eb9SGleb Smirnoff fs->sched = NULL; 7703b3a8eb9SGleb Smirnoff if (flags & DN_DELETE_FS) { 771578acad3SEitan Adler bzero(fs, sizeof(*fs)); /* safety */ 7723b3a8eb9SGleb Smirnoff free(fs, M_DUMMYNET); 773fe3bcfbdSTom Jones V_dn_cfg.fsk_count--; 7743b3a8eb9SGleb Smirnoff } else { 775fe3bcfbdSTom Jones SLIST_INSERT_HEAD(&V_dn_cfg.fsu, fs, sch_chain); 7763b3a8eb9SGleb Smirnoff } 7773b3a8eb9SGleb Smirnoff } 7783b3a8eb9SGleb Smirnoff 7793b3a8eb9SGleb Smirnoff /* 7803b3a8eb9SGleb Smirnoff * Detach or destroy all flowsets in a list. 
7813b3a8eb9SGleb Smirnoff * flags specifies what to do: 7823b3a8eb9SGleb Smirnoff * DN_DESTROY: flush all queues 7833b3a8eb9SGleb Smirnoff * DN_DELETE_FS: DN_DESTROY + destroy flowset 7843b3a8eb9SGleb Smirnoff * DN_DELETE_FS implies DN_DESTROY 7853b3a8eb9SGleb Smirnoff */ 7863b3a8eb9SGleb Smirnoff static void 7873b3a8eb9SGleb Smirnoff fsk_detach_list(struct dn_fsk_head *h, int flags) 7883b3a8eb9SGleb Smirnoff { 7893b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 7903b3a8eb9SGleb Smirnoff int n = 0; /* only for stats */ 7913b3a8eb9SGleb Smirnoff 7923b3a8eb9SGleb Smirnoff ND("head %p flags %x", h, flags); 7933b3a8eb9SGleb Smirnoff while ((fs = SLIST_FIRST(h))) { 7943b3a8eb9SGleb Smirnoff SLIST_REMOVE_HEAD(h, sch_chain); 7953b3a8eb9SGleb Smirnoff n++; 7963b3a8eb9SGleb Smirnoff fsk_detach(fs, flags); 7973b3a8eb9SGleb Smirnoff } 7983b3a8eb9SGleb Smirnoff ND("done %d flowsets", n); 7993b3a8eb9SGleb Smirnoff } 8003b3a8eb9SGleb Smirnoff 8013b3a8eb9SGleb Smirnoff /* 8023b3a8eb9SGleb Smirnoff * called on 'queue X delete' -- removes the flowset from fshash, 8033b3a8eb9SGleb Smirnoff * deletes all queues for the flowset, and removes the flowset. 
8043b3a8eb9SGleb Smirnoff */ 8053b3a8eb9SGleb Smirnoff static int 8063b3a8eb9SGleb Smirnoff delete_fs(int i, int locked) 8073b3a8eb9SGleb Smirnoff { 8083b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 8093b3a8eb9SGleb Smirnoff int err = 0; 8103b3a8eb9SGleb Smirnoff 8113b3a8eb9SGleb Smirnoff if (!locked) 8123b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 813fe3bcfbdSTom Jones fs = dn_ht_find(V_dn_cfg.fshash, i, DNHT_REMOVE, NULL); 8143b3a8eb9SGleb Smirnoff ND("fs %d found %p", i, fs); 8153b3a8eb9SGleb Smirnoff if (fs) { 8163b3a8eb9SGleb Smirnoff fsk_detach(fs, DN_DETACH | DN_DELETE_FS); 8173b3a8eb9SGleb Smirnoff err = 0; 8183b3a8eb9SGleb Smirnoff } else 8193b3a8eb9SGleb Smirnoff err = EINVAL; 8203b3a8eb9SGleb Smirnoff if (!locked) 8213b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 8223b3a8eb9SGleb Smirnoff return err; 8233b3a8eb9SGleb Smirnoff } 8243b3a8eb9SGleb Smirnoff 8253b3a8eb9SGleb Smirnoff /*----- end of flowset hashtable support -------------*/ 8263b3a8eb9SGleb Smirnoff 8273b3a8eb9SGleb Smirnoff /*------------------------------------------------------------ 8283b3a8eb9SGleb Smirnoff * Scheduler hash. When searching by index we pass sched_nr, 8293b3a8eb9SGleb Smirnoff * otherwise we pass struct dn_sch * which is the first field in 8303b3a8eb9SGleb Smirnoff * struct dn_schk so we can cast between the two. We use this trick 8313b3a8eb9SGleb Smirnoff * because in the create phase (but it should be fixed). 8323b3a8eb9SGleb Smirnoff */ 8333b3a8eb9SGleb Smirnoff static uint32_t 8343b3a8eb9SGleb Smirnoff schk_hash(uintptr_t key, int flags, void *_arg) 8353b3a8eb9SGleb Smirnoff { 8363b3a8eb9SGleb Smirnoff uint32_t i = !(flags & DNHT_KEY_IS_OBJ) ? 
key : 8373b3a8eb9SGleb Smirnoff ((struct dn_schk *)key)->sch.sched_nr; 8383b3a8eb9SGleb Smirnoff return ( (i>>8)^(i>>4)^i ); 8393b3a8eb9SGleb Smirnoff } 8403b3a8eb9SGleb Smirnoff 8413b3a8eb9SGleb Smirnoff static int 8423b3a8eb9SGleb Smirnoff schk_match(void *obj, uintptr_t key, int flags, void *_arg) 8433b3a8eb9SGleb Smirnoff { 8443b3a8eb9SGleb Smirnoff struct dn_schk *s = (struct dn_schk *)obj; 8453b3a8eb9SGleb Smirnoff int i = !(flags & DNHT_KEY_IS_OBJ) ? key : 8463b3a8eb9SGleb Smirnoff ((struct dn_schk *)key)->sch.sched_nr; 8473b3a8eb9SGleb Smirnoff return (s->sch.sched_nr == i); 8483b3a8eb9SGleb Smirnoff } 8493b3a8eb9SGleb Smirnoff 8503b3a8eb9SGleb Smirnoff /* 8513b3a8eb9SGleb Smirnoff * Create the entry and intialize with the sched hash if needed. 8523b3a8eb9SGleb Smirnoff * Leave s->fp unset so we can tell whether a dn_ht_find() returns 8533b3a8eb9SGleb Smirnoff * a new object or a previously existing one. 8543b3a8eb9SGleb Smirnoff */ 8553b3a8eb9SGleb Smirnoff static void * 8563b3a8eb9SGleb Smirnoff schk_new(uintptr_t key, int flags, void *arg) 8573b3a8eb9SGleb Smirnoff { 8583b3a8eb9SGleb Smirnoff struct schk_new_arg *a = arg; 8593b3a8eb9SGleb Smirnoff struct dn_schk *s; 8603b3a8eb9SGleb Smirnoff int l = sizeof(*s) +a->fp->schk_datalen; 8613b3a8eb9SGleb Smirnoff 8623b3a8eb9SGleb Smirnoff s = malloc(l, M_DUMMYNET, M_NOWAIT | M_ZERO); 8633b3a8eb9SGleb Smirnoff if (s == NULL) 8643b3a8eb9SGleb Smirnoff return NULL; 8653b3a8eb9SGleb Smirnoff set_oid(&s->link.oid, DN_LINK, sizeof(s->link)); 8663b3a8eb9SGleb Smirnoff s->sch = *a->sch; // copy initial values 8673b3a8eb9SGleb Smirnoff s->link.link_nr = s->sch.sched_nr; 8683b3a8eb9SGleb Smirnoff SLIST_INIT(&s->fsk_list); 8693b3a8eb9SGleb Smirnoff /* initialize the hash table or create the single instance */ 8703b3a8eb9SGleb Smirnoff s->fp = a->fp; /* si_new needs this */ 8713b3a8eb9SGleb Smirnoff s->drain_bucket = 0; 8723b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 8733b3a8eb9SGleb Smirnoff s->siht = 
dn_ht_init(NULL, s->sch.buckets, 8743b3a8eb9SGleb Smirnoff offsetof(struct dn_sch_inst, si_next), 8753b3a8eb9SGleb Smirnoff si_hash, si_match, si_new); 8763b3a8eb9SGleb Smirnoff if (s->siht == NULL) { 8773b3a8eb9SGleb Smirnoff free(s, M_DUMMYNET); 8783b3a8eb9SGleb Smirnoff return NULL; 8793b3a8eb9SGleb Smirnoff } 8803b3a8eb9SGleb Smirnoff } 8813b3a8eb9SGleb Smirnoff s->fp = NULL; /* mark as a new scheduler */ 882fe3bcfbdSTom Jones V_dn_cfg.schk_count++; 8833b3a8eb9SGleb Smirnoff return s; 8843b3a8eb9SGleb Smirnoff } 8853b3a8eb9SGleb Smirnoff 8863b3a8eb9SGleb Smirnoff /* 8873b3a8eb9SGleb Smirnoff * Callback for sched delete. Notify all attached flowsets to 8883b3a8eb9SGleb Smirnoff * detach from the scheduler, destroy the internal flowset, and 8893b3a8eb9SGleb Smirnoff * all instances. The scheduler goes away too. 8903b3a8eb9SGleb Smirnoff * arg is 0 (only detach flowsets and destroy instances) 8913b3a8eb9SGleb Smirnoff * DN_DESTROY (detach & delete queues, delete schk) 8923b3a8eb9SGleb Smirnoff * or DN_DELETE_FS (delete queues and flowsets, delete schk) 8933b3a8eb9SGleb Smirnoff */ 8943b3a8eb9SGleb Smirnoff static int 8953b3a8eb9SGleb Smirnoff schk_delete_cb(void *obj, void *arg) 8963b3a8eb9SGleb Smirnoff { 8973b3a8eb9SGleb Smirnoff struct dn_schk *s = obj; 8983b3a8eb9SGleb Smirnoff #if 0 8993b3a8eb9SGleb Smirnoff int a = (int)arg; 9003b3a8eb9SGleb Smirnoff ND("sched %d arg %s%s", 9013b3a8eb9SGleb Smirnoff s->sch.sched_nr, 9023b3a8eb9SGleb Smirnoff a&DN_DESTROY ? "DEL ":"", 9033b3a8eb9SGleb Smirnoff a&DN_DELETE_FS ? "DEL_FS":""); 9043b3a8eb9SGleb Smirnoff #endif 9053b3a8eb9SGleb Smirnoff fsk_detach_list(&s->fsk_list, arg ? 
DN_DESTROY : 0); 9063b3a8eb9SGleb Smirnoff /* no more flowset pointing to us now */ 9073b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 9083b3a8eb9SGleb Smirnoff dn_ht_scan(s->siht, si_destroy, NULL); 9093b3a8eb9SGleb Smirnoff dn_ht_free(s->siht, 0); 9103b3a8eb9SGleb Smirnoff } else if (s->siht) 9113b3a8eb9SGleb Smirnoff si_destroy(s->siht, NULL); 912*1b2dbe37SKristof Provost 9133b3a8eb9SGleb Smirnoff free(s->profile, M_DUMMYNET); 9143b3a8eb9SGleb Smirnoff s->profile = NULL; 9153b3a8eb9SGleb Smirnoff s->siht = NULL; 9163b3a8eb9SGleb Smirnoff if (s->fp->destroy) 9173b3a8eb9SGleb Smirnoff s->fp->destroy(s); 9183b3a8eb9SGleb Smirnoff bzero(s, sizeof(*s)); // safety 9193b3a8eb9SGleb Smirnoff free(obj, M_DUMMYNET); 920fe3bcfbdSTom Jones V_dn_cfg.schk_count--; 9213b3a8eb9SGleb Smirnoff return DNHT_SCAN_DEL; 9223b3a8eb9SGleb Smirnoff } 9233b3a8eb9SGleb Smirnoff 9243b3a8eb9SGleb Smirnoff /* 9253b3a8eb9SGleb Smirnoff * called on a 'sched X delete' command. Deletes a single scheduler. 9263b3a8eb9SGleb Smirnoff * This is done by removing from the schedhash, unlinking all 9273b3a8eb9SGleb Smirnoff * flowsets and deleting their traffic. 
9283b3a8eb9SGleb Smirnoff */ 9293b3a8eb9SGleb Smirnoff static int 9303b3a8eb9SGleb Smirnoff delete_schk(int i) 9313b3a8eb9SGleb Smirnoff { 9323b3a8eb9SGleb Smirnoff struct dn_schk *s; 9333b3a8eb9SGleb Smirnoff 934fe3bcfbdSTom Jones s = dn_ht_find(V_dn_cfg.schedhash, i, DNHT_REMOVE, NULL); 9353b3a8eb9SGleb Smirnoff ND("%d %p", i, s); 9363b3a8eb9SGleb Smirnoff if (!s) 9373b3a8eb9SGleb Smirnoff return EINVAL; 9383b3a8eb9SGleb Smirnoff delete_fs(i + DN_MAX_ID, 1); /* first delete internal fs */ 9393b3a8eb9SGleb Smirnoff /* then detach flowsets, delete traffic */ 9403b3a8eb9SGleb Smirnoff schk_delete_cb(s, (void*)(uintptr_t)DN_DESTROY); 9413b3a8eb9SGleb Smirnoff return 0; 9423b3a8eb9SGleb Smirnoff } 9433b3a8eb9SGleb Smirnoff /*--- end of schk hashtable support ---*/ 9443b3a8eb9SGleb Smirnoff 9453b3a8eb9SGleb Smirnoff static int 9463b3a8eb9SGleb Smirnoff copy_obj(char **start, char *end, void *_o, const char *msg, int i) 9473b3a8eb9SGleb Smirnoff { 9480ac43d97SMarius Strobl struct dn_id o; 9490ac43d97SMarius Strobl union { 9500ac43d97SMarius Strobl struct dn_link l; 9510ac43d97SMarius Strobl struct dn_schk s; 9520ac43d97SMarius Strobl } dn; 9533b3a8eb9SGleb Smirnoff int have = end - *start; 9543b3a8eb9SGleb Smirnoff 9550ac43d97SMarius Strobl memcpy(&o, _o, sizeof(o)); 9560ac43d97SMarius Strobl if (have < o.len || o.len == 0 || o.type == 0) { 9573b3a8eb9SGleb Smirnoff D("(WARN) type %d %s %d have %d need %d", 9580ac43d97SMarius Strobl o.type, msg, i, have, o.len); 9593b3a8eb9SGleb Smirnoff return 1; 9603b3a8eb9SGleb Smirnoff } 9610ac43d97SMarius Strobl ND("type %d %s %d len %d", o.type, msg, i, o.len); 9620ac43d97SMarius Strobl if (o.type == DN_LINK) { 9630ac43d97SMarius Strobl memcpy(&dn.l, _o, sizeof(dn.l)); 9643b3a8eb9SGleb Smirnoff /* Adjust burst parameter for link */ 9650ac43d97SMarius Strobl dn.l.burst = div64(dn.l.burst, 8 * hz); 9660ac43d97SMarius Strobl dn.l.delay = dn.l.delay * 1000 / hz; 9670ac43d97SMarius Strobl memcpy(*start, &dn.l, sizeof(dn.l)); 
9680ac43d97SMarius Strobl } else if (o.type == DN_SCH) { 9690ac43d97SMarius Strobl /* Set dn.s.sch.oid.id to the number of instances */ 9700ac43d97SMarius Strobl memcpy(&dn.s, _o, sizeof(dn.s)); 9710ac43d97SMarius Strobl dn.s.sch.oid.id = (dn.s.sch.flags & DN_HAVE_MASK) ? 9720ac43d97SMarius Strobl dn_ht_entries(dn.s.siht) : (dn.s.siht ? 1 : 0); 9730ac43d97SMarius Strobl memcpy(*start, &dn.s, sizeof(dn.s)); 9740ac43d97SMarius Strobl } else 9750ac43d97SMarius Strobl memcpy(*start, _o, o.len); 9760ac43d97SMarius Strobl *start += o.len; 9773b3a8eb9SGleb Smirnoff return 0; 9783b3a8eb9SGleb Smirnoff } 9793b3a8eb9SGleb Smirnoff 9803b3a8eb9SGleb Smirnoff /* Specific function to copy a queue. 9813b3a8eb9SGleb Smirnoff * Copies only the user-visible part of a queue (which is in 9823b3a8eb9SGleb Smirnoff * a struct dn_flow), and sets len accordingly. 9833b3a8eb9SGleb Smirnoff */ 9843b3a8eb9SGleb Smirnoff static int 9853b3a8eb9SGleb Smirnoff copy_obj_q(char **start, char *end, void *_o, const char *msg, int i) 9863b3a8eb9SGleb Smirnoff { 9873b3a8eb9SGleb Smirnoff struct dn_id *o = _o; 9883b3a8eb9SGleb Smirnoff int have = end - *start; 9893b3a8eb9SGleb Smirnoff int len = sizeof(struct dn_flow); /* see above comment */ 9903b3a8eb9SGleb Smirnoff 9913b3a8eb9SGleb Smirnoff if (have < len || o->len == 0 || o->type != DN_QUEUE) { 9923b3a8eb9SGleb Smirnoff D("ERROR type %d %s %d have %d need %d", 9933b3a8eb9SGleb Smirnoff o->type, msg, i, have, len); 9943b3a8eb9SGleb Smirnoff return 1; 9953b3a8eb9SGleb Smirnoff } 9963b3a8eb9SGleb Smirnoff ND("type %d %s %d len %d", o->type, msg, i, len); 9970ac43d97SMarius Strobl memcpy(*start, _o, len); 9983b3a8eb9SGleb Smirnoff ((struct dn_id*)(*start))->len = len; 9993b3a8eb9SGleb Smirnoff *start += len; 10003b3a8eb9SGleb Smirnoff return 0; 10013b3a8eb9SGleb Smirnoff } 10023b3a8eb9SGleb Smirnoff 10033b3a8eb9SGleb Smirnoff static int 10043b3a8eb9SGleb Smirnoff copy_q_cb(void *obj, void *arg) 10053b3a8eb9SGleb Smirnoff { 10063b3a8eb9SGleb Smirnoff 
struct dn_queue *q = obj; 10073b3a8eb9SGleb Smirnoff struct copy_args *a = arg; 10083b3a8eb9SGleb Smirnoff struct dn_flow *ni = (struct dn_flow *)(*a->start); 10093b3a8eb9SGleb Smirnoff if (copy_obj_q(a->start, a->end, &q->ni, "queue", -1)) 10103b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 10113b3a8eb9SGleb Smirnoff ni->oid.type = DN_FLOW; /* override the DN_QUEUE */ 10123b3a8eb9SGleb Smirnoff ni->oid.id = si_hash((uintptr_t)&ni->fid, 0, NULL); 10133b3a8eb9SGleb Smirnoff return 0; 10143b3a8eb9SGleb Smirnoff } 10153b3a8eb9SGleb Smirnoff 10163b3a8eb9SGleb Smirnoff static int 10173b3a8eb9SGleb Smirnoff copy_q(struct copy_args *a, struct dn_fsk *fs, int flags) 10183b3a8eb9SGleb Smirnoff { 10193b3a8eb9SGleb Smirnoff if (!fs->qht) 10203b3a8eb9SGleb Smirnoff return 0; 10213b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) 10223b3a8eb9SGleb Smirnoff dn_ht_scan(fs->qht, copy_q_cb, a); 10233b3a8eb9SGleb Smirnoff else 10243b3a8eb9SGleb Smirnoff copy_q_cb(fs->qht, a); 10253b3a8eb9SGleb Smirnoff return 0; 10263b3a8eb9SGleb Smirnoff } 10273b3a8eb9SGleb Smirnoff 10283b3a8eb9SGleb Smirnoff /* 10293b3a8eb9SGleb Smirnoff * This routine only copies the initial part of a profile ? 
XXX 10303b3a8eb9SGleb Smirnoff */ 10313b3a8eb9SGleb Smirnoff static int 10323b3a8eb9SGleb Smirnoff copy_profile(struct copy_args *a, struct dn_profile *p) 10333b3a8eb9SGleb Smirnoff { 10343b3a8eb9SGleb Smirnoff int have = a->end - *a->start; 10353b3a8eb9SGleb Smirnoff /* XXX here we check for max length */ 10363b3a8eb9SGleb Smirnoff int profile_len = sizeof(struct dn_profile) - 10373b3a8eb9SGleb Smirnoff ED_MAX_SAMPLES_NO*sizeof(int); 10383b3a8eb9SGleb Smirnoff 10393b3a8eb9SGleb Smirnoff if (p == NULL) 10403b3a8eb9SGleb Smirnoff return 0; 10413b3a8eb9SGleb Smirnoff if (have < profile_len) { 10423b3a8eb9SGleb Smirnoff D("error have %d need %d", have, profile_len); 10433b3a8eb9SGleb Smirnoff return 1; 10443b3a8eb9SGleb Smirnoff } 10450ac43d97SMarius Strobl memcpy(*a->start, p, profile_len); 10463b3a8eb9SGleb Smirnoff ((struct dn_id *)(*a->start))->len = profile_len; 10473b3a8eb9SGleb Smirnoff *a->start += profile_len; 10483b3a8eb9SGleb Smirnoff return 0; 10493b3a8eb9SGleb Smirnoff } 10503b3a8eb9SGleb Smirnoff 10513b3a8eb9SGleb Smirnoff static int 10523b3a8eb9SGleb Smirnoff copy_flowset(struct copy_args *a, struct dn_fsk *fs, int flags) 10533b3a8eb9SGleb Smirnoff { 10543b3a8eb9SGleb Smirnoff struct dn_fs *ufs = (struct dn_fs *)(*a->start); 10553b3a8eb9SGleb Smirnoff if (!fs) 10563b3a8eb9SGleb Smirnoff return 0; 10573b3a8eb9SGleb Smirnoff ND("flowset %d", fs->fs.fs_nr); 10583b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, &fs->fs, "flowset", fs->fs.fs_nr)) 10593b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 10603b3a8eb9SGleb Smirnoff ufs->oid.id = (fs->fs.flags & DN_QHT_HASH) ? 10613b3a8eb9SGleb Smirnoff dn_ht_entries(fs->qht) : (fs->qht ? 
1 : 0); 10623b3a8eb9SGleb Smirnoff if (flags) { /* copy queues */ 10633b3a8eb9SGleb Smirnoff copy_q(a, fs, 0); 10643b3a8eb9SGleb Smirnoff } 10653b3a8eb9SGleb Smirnoff return 0; 10663b3a8eb9SGleb Smirnoff } 10673b3a8eb9SGleb Smirnoff 10683b3a8eb9SGleb Smirnoff static int 10693b3a8eb9SGleb Smirnoff copy_si_cb(void *obj, void *arg) 10703b3a8eb9SGleb Smirnoff { 10713b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = obj; 10723b3a8eb9SGleb Smirnoff struct copy_args *a = arg; 10733b3a8eb9SGleb Smirnoff struct dn_flow *ni = (struct dn_flow *)(*a->start); 10743b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, &si->ni, "inst", 10753b3a8eb9SGleb Smirnoff si->sched->sch.sched_nr)) 10763b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 10773b3a8eb9SGleb Smirnoff ni->oid.type = DN_FLOW; /* override the DN_SCH_I */ 10783b3a8eb9SGleb Smirnoff ni->oid.id = si_hash((uintptr_t)si, DNHT_KEY_IS_OBJ, NULL); 10793b3a8eb9SGleb Smirnoff return 0; 10803b3a8eb9SGleb Smirnoff } 10813b3a8eb9SGleb Smirnoff 10823b3a8eb9SGleb Smirnoff static int 10833b3a8eb9SGleb Smirnoff copy_si(struct copy_args *a, struct dn_schk *s, int flags) 10843b3a8eb9SGleb Smirnoff { 10853b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) 10863b3a8eb9SGleb Smirnoff dn_ht_scan(s->siht, copy_si_cb, a); 10873b3a8eb9SGleb Smirnoff else if (s->siht) 10883b3a8eb9SGleb Smirnoff copy_si_cb(s->siht, a); 10893b3a8eb9SGleb Smirnoff return 0; 10903b3a8eb9SGleb Smirnoff } 10913b3a8eb9SGleb Smirnoff 10923b3a8eb9SGleb Smirnoff /* 10933b3a8eb9SGleb Smirnoff * compute a list of children of a scheduler and copy up 10943b3a8eb9SGleb Smirnoff */ 10953b3a8eb9SGleb Smirnoff static int 10963b3a8eb9SGleb Smirnoff copy_fsk_list(struct copy_args *a, struct dn_schk *s, int flags) 10973b3a8eb9SGleb Smirnoff { 10983b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 10993b3a8eb9SGleb Smirnoff struct dn_id *o; 11003b3a8eb9SGleb Smirnoff uint32_t *p; 11013b3a8eb9SGleb Smirnoff 11023b3a8eb9SGleb Smirnoff int n = 0, space = sizeof(*o); 11033b3a8eb9SGleb Smirnoff 
SLIST_FOREACH(fs, &s->fsk_list, sch_chain) { 11043b3a8eb9SGleb Smirnoff if (fs->fs.fs_nr < DN_MAX_ID) 11053b3a8eb9SGleb Smirnoff n++; 11063b3a8eb9SGleb Smirnoff } 11073b3a8eb9SGleb Smirnoff space += n * sizeof(uint32_t); 11083b3a8eb9SGleb Smirnoff DX(3, "sched %d has %d flowsets", s->sch.sched_nr, n); 11093b3a8eb9SGleb Smirnoff if (a->end - *(a->start) < space) 11103b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11113b3a8eb9SGleb Smirnoff o = (struct dn_id *)(*(a->start)); 11123b3a8eb9SGleb Smirnoff o->len = space; 11133b3a8eb9SGleb Smirnoff *a->start += o->len; 11143b3a8eb9SGleb Smirnoff o->type = DN_TEXT; 11153b3a8eb9SGleb Smirnoff p = (uint32_t *)(o+1); 11163b3a8eb9SGleb Smirnoff SLIST_FOREACH(fs, &s->fsk_list, sch_chain) 11173b3a8eb9SGleb Smirnoff if (fs->fs.fs_nr < DN_MAX_ID) 11183b3a8eb9SGleb Smirnoff *p++ = fs->fs.fs_nr; 11193b3a8eb9SGleb Smirnoff return 0; 11203b3a8eb9SGleb Smirnoff } 11213b3a8eb9SGleb Smirnoff 11223b3a8eb9SGleb Smirnoff static int 11233b3a8eb9SGleb Smirnoff copy_data_helper(void *_o, void *_arg) 11243b3a8eb9SGleb Smirnoff { 11253b3a8eb9SGleb Smirnoff struct copy_args *a = _arg; 11263b3a8eb9SGleb Smirnoff uint32_t *r = a->extra->r; /* start of first range */ 11273b3a8eb9SGleb Smirnoff uint32_t *lim; /* first invalid pointer */ 11283b3a8eb9SGleb Smirnoff int n; 11293b3a8eb9SGleb Smirnoff 11303b3a8eb9SGleb Smirnoff lim = (uint32_t *)((char *)(a->extra) + a->extra->o.len); 11313b3a8eb9SGleb Smirnoff 11323b3a8eb9SGleb Smirnoff if (a->type == DN_LINK || a->type == DN_SCH) { 11333b3a8eb9SGleb Smirnoff /* pipe|sched show, we receive a dn_schk */ 11343b3a8eb9SGleb Smirnoff struct dn_schk *s = _o; 11353b3a8eb9SGleb Smirnoff 11363b3a8eb9SGleb Smirnoff n = s->sch.sched_nr; 11373b3a8eb9SGleb Smirnoff if (a->type == DN_SCH && n >= DN_MAX_ID) 11383b3a8eb9SGleb Smirnoff return 0; /* not a scheduler */ 11393b3a8eb9SGleb Smirnoff if (a->type == DN_LINK && n <= DN_MAX_ID) 11403b3a8eb9SGleb Smirnoff return 0; /* not a pipe */ 11413b3a8eb9SGleb Smirnoff 
11423b3a8eb9SGleb Smirnoff /* see if the object is within one of our ranges */ 11433b3a8eb9SGleb Smirnoff for (;r < lim; r += 2) { 11443b3a8eb9SGleb Smirnoff if (n < r[0] || n > r[1]) 11453b3a8eb9SGleb Smirnoff continue; 11463b3a8eb9SGleb Smirnoff /* Found a valid entry, copy and we are done */ 11473b3a8eb9SGleb Smirnoff if (a->flags & DN_C_LINK) { 11483b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, 11493b3a8eb9SGleb Smirnoff &s->link, "link", n)) 11503b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11513b3a8eb9SGleb Smirnoff if (copy_profile(a, s->profile)) 11523b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11533b3a8eb9SGleb Smirnoff if (copy_flowset(a, s->fs, 0)) 11543b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11553b3a8eb9SGleb Smirnoff } 11563b3a8eb9SGleb Smirnoff if (a->flags & DN_C_SCH) { 11573b3a8eb9SGleb Smirnoff if (copy_obj(a->start, a->end, 11583b3a8eb9SGleb Smirnoff &s->sch, "sched", n)) 11593b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11603b3a8eb9SGleb Smirnoff /* list all attached flowsets */ 11613b3a8eb9SGleb Smirnoff if (copy_fsk_list(a, s, 0)) 11623b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11633b3a8eb9SGleb Smirnoff } 11643b3a8eb9SGleb Smirnoff if (a->flags & DN_C_FLOW) 11653b3a8eb9SGleb Smirnoff copy_si(a, s, 0); 11663b3a8eb9SGleb Smirnoff break; 11673b3a8eb9SGleb Smirnoff } 11683b3a8eb9SGleb Smirnoff } else if (a->type == DN_FS) { 11693b3a8eb9SGleb Smirnoff /* queue show, skip internal flowsets */ 11703b3a8eb9SGleb Smirnoff struct dn_fsk *fs = _o; 11713b3a8eb9SGleb Smirnoff 11723b3a8eb9SGleb Smirnoff n = fs->fs.fs_nr; 11733b3a8eb9SGleb Smirnoff if (n >= DN_MAX_ID) 11743b3a8eb9SGleb Smirnoff return 0; 11753b3a8eb9SGleb Smirnoff /* see if the object is within one of our ranges */ 11763b3a8eb9SGleb Smirnoff for (;r < lim; r += 2) { 11773b3a8eb9SGleb Smirnoff if (n < r[0] || n > r[1]) 11783b3a8eb9SGleb Smirnoff continue; 11793b3a8eb9SGleb Smirnoff if (copy_flowset(a, fs, 0)) 11803b3a8eb9SGleb Smirnoff return DNHT_SCAN_END; 11813b3a8eb9SGleb 
Smirnoff copy_q(a, fs, 0); 11823b3a8eb9SGleb Smirnoff break; /* we are done */ 11833b3a8eb9SGleb Smirnoff } 11843b3a8eb9SGleb Smirnoff } 11853b3a8eb9SGleb Smirnoff return 0; 11863b3a8eb9SGleb Smirnoff } 11873b3a8eb9SGleb Smirnoff 11883b3a8eb9SGleb Smirnoff static inline struct dn_schk * 11893b3a8eb9SGleb Smirnoff locate_scheduler(int i) 11903b3a8eb9SGleb Smirnoff { 1191fe3bcfbdSTom Jones return dn_ht_find(V_dn_cfg.schedhash, i, 0, NULL); 11923b3a8eb9SGleb Smirnoff } 11933b3a8eb9SGleb Smirnoff 11943b3a8eb9SGleb Smirnoff /* 11953b3a8eb9SGleb Smirnoff * red parameters are in fixed point arithmetic. 11963b3a8eb9SGleb Smirnoff */ 11973b3a8eb9SGleb Smirnoff static int 11983b3a8eb9SGleb Smirnoff config_red(struct dn_fsk *fs) 11993b3a8eb9SGleb Smirnoff { 12003b3a8eb9SGleb Smirnoff int64_t s, idle, weight, w0; 12013b3a8eb9SGleb Smirnoff int t, i; 12023b3a8eb9SGleb Smirnoff 12033b3a8eb9SGleb Smirnoff fs->w_q = fs->fs.w_q; 12043b3a8eb9SGleb Smirnoff fs->max_p = fs->fs.max_p; 12053b3a8eb9SGleb Smirnoff ND("called"); 12063b3a8eb9SGleb Smirnoff /* Doing stuff that was in userland */ 12073b3a8eb9SGleb Smirnoff i = fs->sched->link.bandwidth; 12083b3a8eb9SGleb Smirnoff s = (i <= 0) ? 
0 : 1209fe3bcfbdSTom Jones hz * V_dn_cfg.red_avg_pkt_size * 8 * SCALE(1) / i; 12103b3a8eb9SGleb Smirnoff 12113b3a8eb9SGleb Smirnoff idle = div64((s * 3) , fs->w_q); /* s, fs->w_q scaled; idle not scaled */ 1212fe3bcfbdSTom Jones fs->lookup_step = div64(idle , V_dn_cfg.red_lookup_depth); 12133b3a8eb9SGleb Smirnoff /* fs->lookup_step not scaled, */ 12143b3a8eb9SGleb Smirnoff if (!fs->lookup_step) 12153b3a8eb9SGleb Smirnoff fs->lookup_step = 1; 12163b3a8eb9SGleb Smirnoff w0 = weight = SCALE(1) - fs->w_q; //fs->w_q scaled 12173b3a8eb9SGleb Smirnoff 12183b3a8eb9SGleb Smirnoff for (t = fs->lookup_step; t > 1; --t) 12193b3a8eb9SGleb Smirnoff weight = SCALE_MUL(weight, w0); 12203b3a8eb9SGleb Smirnoff fs->lookup_weight = (int)(weight); // scaled 12213b3a8eb9SGleb Smirnoff 12223b3a8eb9SGleb Smirnoff /* Now doing stuff that was in kerneland */ 12233b3a8eb9SGleb Smirnoff fs->min_th = SCALE(fs->fs.min_th); 12243b3a8eb9SGleb Smirnoff fs->max_th = SCALE(fs->fs.max_th); 12253b3a8eb9SGleb Smirnoff 1226fc5e1956SHiren Panchasara if (fs->fs.max_th == fs->fs.min_th) 1227fc5e1956SHiren Panchasara fs->c_1 = fs->max_p; 1228fc5e1956SHiren Panchasara else 1229fc5e1956SHiren Panchasara fs->c_1 = SCALE((int64_t)(fs->max_p)) / (fs->fs.max_th - fs->fs.min_th); 12303b3a8eb9SGleb Smirnoff fs->c_2 = SCALE_MUL(fs->c_1, SCALE(fs->fs.min_th)); 12313b3a8eb9SGleb Smirnoff 12323b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_IS_GENTLE_RED) { 12333b3a8eb9SGleb Smirnoff fs->c_3 = (SCALE(1) - fs->max_p) / fs->fs.max_th; 12343b3a8eb9SGleb Smirnoff fs->c_4 = SCALE(1) - 2 * fs->max_p; 12353b3a8eb9SGleb Smirnoff } 12363b3a8eb9SGleb Smirnoff 12373b3a8eb9SGleb Smirnoff /* If the lookup table already exist, free and create it again. 
*/ 12383b3a8eb9SGleb Smirnoff free(fs->w_q_lookup, M_DUMMYNET); 12393b3a8eb9SGleb Smirnoff fs->w_q_lookup = NULL; 1240fe3bcfbdSTom Jones if (V_dn_cfg.red_lookup_depth == 0) { 12413b3a8eb9SGleb Smirnoff printf("\ndummynet: net.inet.ip.dummynet.red_lookup_depth" 12423b3a8eb9SGleb Smirnoff "must be > 0\n"); 12433b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_RED; 12443b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_GENTLE_RED; 12453b3a8eb9SGleb Smirnoff return (EINVAL); 12463b3a8eb9SGleb Smirnoff } 1247fe3bcfbdSTom Jones fs->lookup_depth = V_dn_cfg.red_lookup_depth; 12483b3a8eb9SGleb Smirnoff fs->w_q_lookup = (u_int *)malloc(fs->lookup_depth * sizeof(int), 12493b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT); 12503b3a8eb9SGleb Smirnoff if (fs->w_q_lookup == NULL) { 12513b3a8eb9SGleb Smirnoff printf("dummynet: sorry, cannot allocate red lookup table\n"); 12523b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_RED; 12533b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_IS_GENTLE_RED; 12543b3a8eb9SGleb Smirnoff return(ENOSPC); 12553b3a8eb9SGleb Smirnoff } 12563b3a8eb9SGleb Smirnoff 12573b3a8eb9SGleb Smirnoff /* Fill the lookup table with (1 - w_q)^x */ 12583b3a8eb9SGleb Smirnoff fs->w_q_lookup[0] = SCALE(1) - fs->w_q; 12593b3a8eb9SGleb Smirnoff 12603b3a8eb9SGleb Smirnoff for (i = 1; i < fs->lookup_depth; i++) 12613b3a8eb9SGleb Smirnoff fs->w_q_lookup[i] = 12623b3a8eb9SGleb Smirnoff SCALE_MUL(fs->w_q_lookup[i - 1], fs->lookup_weight); 12633b3a8eb9SGleb Smirnoff 1264fe3bcfbdSTom Jones if (V_dn_cfg.red_avg_pkt_size < 1) 1265fe3bcfbdSTom Jones V_dn_cfg.red_avg_pkt_size = 512; 1266fe3bcfbdSTom Jones fs->avg_pkt_size = V_dn_cfg.red_avg_pkt_size; 1267fe3bcfbdSTom Jones if (V_dn_cfg.red_max_pkt_size < 1) 1268fe3bcfbdSTom Jones V_dn_cfg.red_max_pkt_size = 1500; 1269fe3bcfbdSTom Jones fs->max_pkt_size = V_dn_cfg.red_max_pkt_size; 12703b3a8eb9SGleb Smirnoff ND("exit"); 12713b3a8eb9SGleb Smirnoff return 0; 12723b3a8eb9SGleb Smirnoff } 12733b3a8eb9SGleb Smirnoff 12743b3a8eb9SGleb Smirnoff /* Scan all 
flowset attached to this scheduler and update red */ 12753b3a8eb9SGleb Smirnoff static void 12763b3a8eb9SGleb Smirnoff update_red(struct dn_schk *s) 12773b3a8eb9SGleb Smirnoff { 12783b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 12793b3a8eb9SGleb Smirnoff SLIST_FOREACH(fs, &s->fsk_list, sch_chain) { 12803b3a8eb9SGleb Smirnoff if (fs && (fs->fs.flags & DN_IS_RED)) 12813b3a8eb9SGleb Smirnoff config_red(fs); 12823b3a8eb9SGleb Smirnoff } 12833b3a8eb9SGleb Smirnoff } 12843b3a8eb9SGleb Smirnoff 12853b3a8eb9SGleb Smirnoff /* attach flowset to scheduler s, possibly requeue */ 12863b3a8eb9SGleb Smirnoff static void 12873b3a8eb9SGleb Smirnoff fsk_attach(struct dn_fsk *fs, struct dn_schk *s) 12883b3a8eb9SGleb Smirnoff { 12893b3a8eb9SGleb Smirnoff ND("remove fs %d from fsunlinked, link to sched %d", 12903b3a8eb9SGleb Smirnoff fs->fs.fs_nr, s->sch.sched_nr); 1291fe3bcfbdSTom Jones SLIST_REMOVE(&V_dn_cfg.fsu, fs, dn_fsk, sch_chain); 12923b3a8eb9SGleb Smirnoff fs->sched = s; 12933b3a8eb9SGleb Smirnoff SLIST_INSERT_HEAD(&s->fsk_list, fs, sch_chain); 12943b3a8eb9SGleb Smirnoff if (s->fp->new_fsk) 12953b3a8eb9SGleb Smirnoff s->fp->new_fsk(fs); 12963b3a8eb9SGleb Smirnoff /* XXX compute fsk_mask */ 12973b3a8eb9SGleb Smirnoff fs->fsk_mask = fs->fs.flow_mask; 12983b3a8eb9SGleb Smirnoff if (fs->sched->sch.flags & DN_HAVE_MASK) 12993b3a8eb9SGleb Smirnoff flow_id_or(&fs->sched->sch.sched_mask, &fs->fsk_mask); 13003b3a8eb9SGleb Smirnoff if (fs->qht) { 13013b3a8eb9SGleb Smirnoff /* 13023b3a8eb9SGleb Smirnoff * we must drain qht according to the old 13033b3a8eb9SGleb Smirnoff * type, and reinsert according to the new one. 13043b3a8eb9SGleb Smirnoff * The requeue is complex -- in general we need to 13053b3a8eb9SGleb Smirnoff * reclassify every single packet. 13063b3a8eb9SGleb Smirnoff * For the time being, let's hope qht is never set 13073b3a8eb9SGleb Smirnoff * when we reach this point. 
13083b3a8eb9SGleb Smirnoff */ 13093b3a8eb9SGleb Smirnoff D("XXX TODO requeue from fs %d to sch %d", 13103b3a8eb9SGleb Smirnoff fs->fs.fs_nr, s->sch.sched_nr); 13113b3a8eb9SGleb Smirnoff fs->qht = NULL; 13123b3a8eb9SGleb Smirnoff } 13133b3a8eb9SGleb Smirnoff /* set the new type for qht */ 13143b3a8eb9SGleb Smirnoff if (nonzero_mask(&fs->fsk_mask)) 13153b3a8eb9SGleb Smirnoff fs->fs.flags |= DN_QHT_HASH; 13163b3a8eb9SGleb Smirnoff else 13173b3a8eb9SGleb Smirnoff fs->fs.flags &= ~DN_QHT_HASH; 13183b3a8eb9SGleb Smirnoff 13193b3a8eb9SGleb Smirnoff /* XXX config_red() can fail... */ 13203b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_IS_RED) 13213b3a8eb9SGleb Smirnoff config_red(fs); 13223b3a8eb9SGleb Smirnoff } 13233b3a8eb9SGleb Smirnoff 13243b3a8eb9SGleb Smirnoff /* update all flowsets which may refer to this scheduler */ 13253b3a8eb9SGleb Smirnoff static void 13263b3a8eb9SGleb Smirnoff update_fs(struct dn_schk *s) 13273b3a8eb9SGleb Smirnoff { 13283b3a8eb9SGleb Smirnoff struct dn_fsk *fs, *tmp; 13293b3a8eb9SGleb Smirnoff 1330fe3bcfbdSTom Jones SLIST_FOREACH_SAFE(fs, &V_dn_cfg.fsu, sch_chain, tmp) { 13313b3a8eb9SGleb Smirnoff if (s->sch.sched_nr != fs->fs.sched_nr) { 13323b3a8eb9SGleb Smirnoff D("fs %d for sch %d not %d still unlinked", 13333b3a8eb9SGleb Smirnoff fs->fs.fs_nr, fs->fs.sched_nr, 13343b3a8eb9SGleb Smirnoff s->sch.sched_nr); 13353b3a8eb9SGleb Smirnoff continue; 13363b3a8eb9SGleb Smirnoff } 13373b3a8eb9SGleb Smirnoff fsk_attach(fs, s); 13383b3a8eb9SGleb Smirnoff } 13393b3a8eb9SGleb Smirnoff } 13403b3a8eb9SGleb Smirnoff 134191336b40SDon Lewis #ifdef NEW_AQM 134291336b40SDon Lewis /* Retrieve AQM configurations to ipfw userland 134391336b40SDon Lewis */ 134491336b40SDon Lewis static int 134591336b40SDon Lewis get_aqm_parms(struct sockopt *sopt) 134691336b40SDon Lewis { 134791336b40SDon Lewis struct dn_extra_parms *ep; 134891336b40SDon Lewis struct dn_fsk *fs; 134991336b40SDon Lewis size_t sopt_valsize; 135091336b40SDon Lewis int l, err = 0; 135191336b40SDon Lewis 
135291336b40SDon Lewis sopt_valsize = sopt->sopt_valsize; 135391336b40SDon Lewis l = sizeof(*ep); 135491336b40SDon Lewis if (sopt->sopt_valsize < l) { 135591336b40SDon Lewis D("bad len sopt->sopt_valsize %d len %d", 135691336b40SDon Lewis (int) sopt->sopt_valsize , l); 135791336b40SDon Lewis err = EINVAL; 135891336b40SDon Lewis return err; 135991336b40SDon Lewis } 136051d73df1SKristof Provost ep = malloc(l, M_DUMMYNET, M_NOWAIT); 136191336b40SDon Lewis if(!ep) { 136291336b40SDon Lewis err = ENOMEM ; 136391336b40SDon Lewis return err; 136491336b40SDon Lewis } 136591336b40SDon Lewis do { 136691336b40SDon Lewis err = sooptcopyin(sopt, ep, l, l); 136791336b40SDon Lewis if(err) 136891336b40SDon Lewis break; 136991336b40SDon Lewis sopt->sopt_valsize = sopt_valsize; 137091336b40SDon Lewis if (ep->oid.len < l) { 137191336b40SDon Lewis err = EINVAL; 137291336b40SDon Lewis break; 137391336b40SDon Lewis } 137491336b40SDon Lewis 1375fe3bcfbdSTom Jones fs = dn_ht_find(V_dn_cfg.fshash, ep->nr, 0, NULL); 137691336b40SDon Lewis if (!fs) { 137791336b40SDon Lewis D("fs %d not found", ep->nr); 137891336b40SDon Lewis err = EINVAL; 137991336b40SDon Lewis break; 138091336b40SDon Lewis } 138191336b40SDon Lewis 138291336b40SDon Lewis if (fs->aqmfp && fs->aqmfp->getconfig) { 138391336b40SDon Lewis if(fs->aqmfp->getconfig(fs, ep)) { 138491336b40SDon Lewis D("Error while trying to get AQM params"); 138591336b40SDon Lewis err = EINVAL; 138691336b40SDon Lewis break; 138791336b40SDon Lewis } 138891336b40SDon Lewis ep->oid.len = l; 138991336b40SDon Lewis err = sooptcopyout(sopt, ep, l); 139091336b40SDon Lewis } 139191336b40SDon Lewis }while(0); 139291336b40SDon Lewis 139391336b40SDon Lewis free(ep, M_DUMMYNET); 139491336b40SDon Lewis return err; 139591336b40SDon Lewis } 139691336b40SDon Lewis 139791336b40SDon Lewis /* Retrieve AQM configurations to ipfw userland 139891336b40SDon Lewis */ 139991336b40SDon Lewis static int 140091336b40SDon Lewis get_sched_parms(struct sockopt *sopt) 
140191336b40SDon Lewis { 140291336b40SDon Lewis struct dn_extra_parms *ep; 140391336b40SDon Lewis struct dn_schk *schk; 140491336b40SDon Lewis size_t sopt_valsize; 140591336b40SDon Lewis int l, err = 0; 140691336b40SDon Lewis 140791336b40SDon Lewis sopt_valsize = sopt->sopt_valsize; 140891336b40SDon Lewis l = sizeof(*ep); 140991336b40SDon Lewis if (sopt->sopt_valsize < l) { 141091336b40SDon Lewis D("bad len sopt->sopt_valsize %d len %d", 141191336b40SDon Lewis (int) sopt->sopt_valsize , l); 141291336b40SDon Lewis err = EINVAL; 141391336b40SDon Lewis return err; 141491336b40SDon Lewis } 141551d73df1SKristof Provost ep = malloc(l, M_DUMMYNET, M_NOWAIT); 141691336b40SDon Lewis if(!ep) { 141791336b40SDon Lewis err = ENOMEM ; 141891336b40SDon Lewis return err; 141991336b40SDon Lewis } 142091336b40SDon Lewis do { 142191336b40SDon Lewis err = sooptcopyin(sopt, ep, l, l); 142291336b40SDon Lewis if(err) 142391336b40SDon Lewis break; 142491336b40SDon Lewis sopt->sopt_valsize = sopt_valsize; 142591336b40SDon Lewis if (ep->oid.len < l) { 142691336b40SDon Lewis err = EINVAL; 142791336b40SDon Lewis break; 142891336b40SDon Lewis } 142991336b40SDon Lewis 143091336b40SDon Lewis schk = locate_scheduler(ep->nr); 143191336b40SDon Lewis if (!schk) { 143291336b40SDon Lewis D("sched %d not found", ep->nr); 143391336b40SDon Lewis err = EINVAL; 143491336b40SDon Lewis break; 143591336b40SDon Lewis } 143691336b40SDon Lewis 143791336b40SDon Lewis if (schk->fp && schk->fp->getconfig) { 143891336b40SDon Lewis if(schk->fp->getconfig(schk, ep)) { 143991336b40SDon Lewis D("Error while trying to get sched params"); 144091336b40SDon Lewis err = EINVAL; 144191336b40SDon Lewis break; 144291336b40SDon Lewis } 144391336b40SDon Lewis ep->oid.len = l; 144491336b40SDon Lewis err = sooptcopyout(sopt, ep, l); 144591336b40SDon Lewis } 144691336b40SDon Lewis }while(0); 144791336b40SDon Lewis free(ep, M_DUMMYNET); 144891336b40SDon Lewis 144991336b40SDon Lewis return err; 145091336b40SDon Lewis } 
145191336b40SDon Lewis 145291336b40SDon Lewis /* Configure AQM for flowset 'fs'. 145391336b40SDon Lewis * extra parameters are passed from userland. 145491336b40SDon Lewis */ 145591336b40SDon Lewis static int 145691336b40SDon Lewis config_aqm(struct dn_fsk *fs, struct dn_extra_parms *ep, int busy) 145791336b40SDon Lewis { 145891336b40SDon Lewis int err = 0; 145991336b40SDon Lewis 146051d73df1SKristof Provost NET_EPOCH_ASSERT(); 146151d73df1SKristof Provost 146291336b40SDon Lewis do { 146391336b40SDon Lewis /* no configurations */ 146491336b40SDon Lewis if (!ep) { 146591336b40SDon Lewis err = 0; 146691336b40SDon Lewis break; 146791336b40SDon Lewis } 146891336b40SDon Lewis 146991336b40SDon Lewis /* no AQM for this flowset*/ 147091336b40SDon Lewis if (!strcmp(ep->name,"")) { 147191336b40SDon Lewis err = 0; 147291336b40SDon Lewis break; 147391336b40SDon Lewis } 147491336b40SDon Lewis if (ep->oid.len < sizeof(*ep)) { 147591336b40SDon Lewis D("short aqm len %d", ep->oid.len); 147691336b40SDon Lewis err = EINVAL; 147791336b40SDon Lewis break; 147891336b40SDon Lewis } 147991336b40SDon Lewis 148091336b40SDon Lewis if (busy) { 148191336b40SDon Lewis D("Unable to configure flowset, flowset busy!"); 148291336b40SDon Lewis err = EINVAL; 148391336b40SDon Lewis break; 148491336b40SDon Lewis } 148591336b40SDon Lewis 148691336b40SDon Lewis /* deconfigure old aqm if exist */ 148791336b40SDon Lewis if (fs->aqmcfg && fs->aqmfp && fs->aqmfp->deconfig) { 148891336b40SDon Lewis aqm_cleanup_deconfig_fs(fs); 148991336b40SDon Lewis } 149091336b40SDon Lewis 149191336b40SDon Lewis if (!(fs->aqmfp = find_aqm_type(0, ep->name))) { 149291336b40SDon Lewis D("AQM functions not found for type %s!", ep->name); 149391336b40SDon Lewis fs->fs.flags &= ~DN_IS_AQM; 149491336b40SDon Lewis err = EINVAL; 149591336b40SDon Lewis break; 149691336b40SDon Lewis } else 149791336b40SDon Lewis fs->fs.flags |= DN_IS_AQM; 149891336b40SDon Lewis 149991336b40SDon Lewis if (ep->oid.subtype != DN_AQM_PARAMS) { 
150091336b40SDon Lewis D("Wrong subtype"); 150191336b40SDon Lewis err = EINVAL; 150291336b40SDon Lewis break; 150391336b40SDon Lewis } 150491336b40SDon Lewis 150591336b40SDon Lewis if (fs->aqmfp->config) { 150691336b40SDon Lewis err = fs->aqmfp->config(fs, ep, ep->oid.len); 150791336b40SDon Lewis if (err) { 150891336b40SDon Lewis D("Unable to configure AQM for FS %d", fs->fs.fs_nr ); 150991336b40SDon Lewis fs->fs.flags &= ~DN_IS_AQM; 151091336b40SDon Lewis fs->aqmfp = NULL; 151191336b40SDon Lewis break; 151291336b40SDon Lewis } 151391336b40SDon Lewis } 151491336b40SDon Lewis } while(0); 151591336b40SDon Lewis 151691336b40SDon Lewis return err; 151791336b40SDon Lewis } 151891336b40SDon Lewis #endif 151991336b40SDon Lewis 15203b3a8eb9SGleb Smirnoff /* 15213b3a8eb9SGleb Smirnoff * Configuration -- to preserve backward compatibility we use 15223b3a8eb9SGleb Smirnoff * the following scheme (N is 65536) 15233b3a8eb9SGleb Smirnoff * NUMBER SCHED LINK FLOWSET 15243b3a8eb9SGleb Smirnoff * 1 .. N-1 (1)WFQ (2)WFQ (3)queue 15253b3a8eb9SGleb Smirnoff * N+1 .. 2N-1 (4)FIFO (5)FIFO (6)FIFO for sched 1..N-1 15263b3a8eb9SGleb Smirnoff * 2N+1 .. 
3N-1 -- -- (7)FIFO for sched N+1..2N-1 15273b3a8eb9SGleb Smirnoff * 15283b3a8eb9SGleb Smirnoff * "pipe i config" configures #1, #2 and #3 15293b3a8eb9SGleb Smirnoff * "sched i config" configures #1 and possibly #6 15303b3a8eb9SGleb Smirnoff * "queue i config" configures #3 15313b3a8eb9SGleb Smirnoff * #1 is configured with 'pipe i config' or 'sched i config' 15323b3a8eb9SGleb Smirnoff * #2 is configured with 'pipe i config', and created if not 15333b3a8eb9SGleb Smirnoff * existing with 'sched i config' 15343b3a8eb9SGleb Smirnoff * #3 is configured with 'queue i config' 15353b3a8eb9SGleb Smirnoff * #4 is automatically configured after #1, can only be FIFO 15363b3a8eb9SGleb Smirnoff * #5 is automatically configured after #2 15373b3a8eb9SGleb Smirnoff * #6 is automatically created when #1 is !MULTIQUEUE, 15383b3a8eb9SGleb Smirnoff * and can be updated. 15393b3a8eb9SGleb Smirnoff * #7 is automatically configured after #2 15403b3a8eb9SGleb Smirnoff */ 15413b3a8eb9SGleb Smirnoff 15423b3a8eb9SGleb Smirnoff /* 15433b3a8eb9SGleb Smirnoff * configure a link (and its FIFO instance) 15443b3a8eb9SGleb Smirnoff */ 15453b3a8eb9SGleb Smirnoff static int 15463b3a8eb9SGleb Smirnoff config_link(struct dn_link *p, struct dn_id *arg) 15473b3a8eb9SGleb Smirnoff { 15483b3a8eb9SGleb Smirnoff int i; 15493b3a8eb9SGleb Smirnoff 15503b3a8eb9SGleb Smirnoff if (p->oid.len != sizeof(*p)) { 15513b3a8eb9SGleb Smirnoff D("invalid pipe len %d", p->oid.len); 15523b3a8eb9SGleb Smirnoff return EINVAL; 15533b3a8eb9SGleb Smirnoff } 15543b3a8eb9SGleb Smirnoff i = p->link_nr; 15553b3a8eb9SGleb Smirnoff if (i <= 0 || i >= DN_MAX_ID) 15563b3a8eb9SGleb Smirnoff return EINVAL; 15573b3a8eb9SGleb Smirnoff /* 15583b3a8eb9SGleb Smirnoff * The config program passes parameters as follows: 15593b3a8eb9SGleb Smirnoff * bw = bits/second (0 means no limits), 15603b3a8eb9SGleb Smirnoff * delay = ms, must be translated into ticks. 15613b3a8eb9SGleb Smirnoff * qsize = slots/bytes 15623b3a8eb9SGleb Smirnoff * burst ??? 
15633b3a8eb9SGleb Smirnoff */ 15643b3a8eb9SGleb Smirnoff p->delay = (p->delay * hz) / 1000; 15653b3a8eb9SGleb Smirnoff /* Scale burst size: bytes -> bits * hz */ 15663b3a8eb9SGleb Smirnoff p->burst *= 8 * hz; 15673b3a8eb9SGleb Smirnoff 15683b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 15693b3a8eb9SGleb Smirnoff /* do it twice, base link and FIFO link */ 15703b3a8eb9SGleb Smirnoff for (; i < 2*DN_MAX_ID; i += DN_MAX_ID) { 15713b3a8eb9SGleb Smirnoff struct dn_schk *s = locate_scheduler(i); 15723b3a8eb9SGleb Smirnoff if (s == NULL) { 15733b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 15743b3a8eb9SGleb Smirnoff D("sched %d not found", i); 15753b3a8eb9SGleb Smirnoff return EINVAL; 15763b3a8eb9SGleb Smirnoff } 15773b3a8eb9SGleb Smirnoff /* remove profile if exists */ 15783b3a8eb9SGleb Smirnoff free(s->profile, M_DUMMYNET); 15793b3a8eb9SGleb Smirnoff s->profile = NULL; 1580*1b2dbe37SKristof Provost 15813b3a8eb9SGleb Smirnoff /* copy all parameters */ 15823b3a8eb9SGleb Smirnoff s->link.oid = p->oid; 15833b3a8eb9SGleb Smirnoff s->link.link_nr = i; 15843b3a8eb9SGleb Smirnoff s->link.delay = p->delay; 15853b3a8eb9SGleb Smirnoff if (s->link.bandwidth != p->bandwidth) { 15863b3a8eb9SGleb Smirnoff /* XXX bandwidth changes, need to update red params */ 15873b3a8eb9SGleb Smirnoff s->link.bandwidth = p->bandwidth; 15883b3a8eb9SGleb Smirnoff update_red(s); 15893b3a8eb9SGleb Smirnoff } 15903b3a8eb9SGleb Smirnoff s->link.burst = p->burst; 15913b3a8eb9SGleb Smirnoff schk_reset_credit(s); 15923b3a8eb9SGleb Smirnoff } 1593fe3bcfbdSTom Jones V_dn_cfg.id++; 15943b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 15953b3a8eb9SGleb Smirnoff return 0; 15963b3a8eb9SGleb Smirnoff } 15973b3a8eb9SGleb Smirnoff 15983b3a8eb9SGleb Smirnoff /* 15993b3a8eb9SGleb Smirnoff * configure a flowset. 
Can be called from inside with locked=1, 16003b3a8eb9SGleb Smirnoff */ 16013b3a8eb9SGleb Smirnoff static struct dn_fsk * 16023b3a8eb9SGleb Smirnoff config_fs(struct dn_fs *nfs, struct dn_id *arg, int locked) 16033b3a8eb9SGleb Smirnoff { 16043b3a8eb9SGleb Smirnoff int i; 16053b3a8eb9SGleb Smirnoff struct dn_fsk *fs; 16060ac43d97SMarius Strobl #ifdef NEW_AQM 16070ac43d97SMarius Strobl struct dn_extra_parms *ep; 16080ac43d97SMarius Strobl #endif 16093b3a8eb9SGleb Smirnoff 16103b3a8eb9SGleb Smirnoff if (nfs->oid.len != sizeof(*nfs)) { 16113b3a8eb9SGleb Smirnoff D("invalid flowset len %d", nfs->oid.len); 16123b3a8eb9SGleb Smirnoff return NULL; 16133b3a8eb9SGleb Smirnoff } 16143b3a8eb9SGleb Smirnoff i = nfs->fs_nr; 16153b3a8eb9SGleb Smirnoff if (i <= 0 || i >= 3*DN_MAX_ID) 16163b3a8eb9SGleb Smirnoff return NULL; 16170ac43d97SMarius Strobl #ifdef NEW_AQM 16180ac43d97SMarius Strobl ep = NULL; 16190ac43d97SMarius Strobl if (arg != NULL) { 162051d73df1SKristof Provost ep = malloc(sizeof(*ep), M_TEMP, M_NOWAIT); 16210ac43d97SMarius Strobl if (ep == NULL) 16220ac43d97SMarius Strobl return (NULL); 16230ac43d97SMarius Strobl memcpy(ep, arg, sizeof(*ep)); 16240ac43d97SMarius Strobl } 16250ac43d97SMarius Strobl #endif 16263b3a8eb9SGleb Smirnoff ND("flowset %d", i); 16273b3a8eb9SGleb Smirnoff /* XXX other sanity checks */ 16283b3a8eb9SGleb Smirnoff if (nfs->flags & DN_QSIZE_BYTES) { 16293b3a8eb9SGleb Smirnoff ipdn_bound_var(&nfs->qsize, 16384, 1630fe3bcfbdSTom Jones 1500, V_dn_cfg.byte_limit, NULL); // "queue byte size"); 16313b3a8eb9SGleb Smirnoff } else { 16323b3a8eb9SGleb Smirnoff ipdn_bound_var(&nfs->qsize, 50, 1633fe3bcfbdSTom Jones 1, V_dn_cfg.slot_limit, NULL); // "queue slot size"); 16343b3a8eb9SGleb Smirnoff } 16353b3a8eb9SGleb Smirnoff if (nfs->flags & DN_HAVE_MASK) { 16363b3a8eb9SGleb Smirnoff /* make sure we have some buckets */ 1637fe3bcfbdSTom Jones ipdn_bound_var((int *)&nfs->buckets, V_dn_cfg.hash_size, 1638fe3bcfbdSTom Jones 1, V_dn_cfg.max_hash_size, "flowset 
buckets"); 16393b3a8eb9SGleb Smirnoff } else { 16403b3a8eb9SGleb Smirnoff nfs->buckets = 1; /* we only need 1 */ 16413b3a8eb9SGleb Smirnoff } 16423b3a8eb9SGleb Smirnoff if (!locked) 16433b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 16443b3a8eb9SGleb Smirnoff do { /* exit with break when done */ 16453b3a8eb9SGleb Smirnoff struct dn_schk *s; 16463b3a8eb9SGleb Smirnoff int flags = nfs->sched_nr ? DNHT_INSERT : 0; 16473b3a8eb9SGleb Smirnoff int j; 1648fe3bcfbdSTom Jones int oldc = V_dn_cfg.fsk_count; 1649fe3bcfbdSTom Jones fs = dn_ht_find(V_dn_cfg.fshash, i, flags, NULL); 16503b3a8eb9SGleb Smirnoff if (fs == NULL) { 16513b3a8eb9SGleb Smirnoff D("missing sched for flowset %d", i); 16523b3a8eb9SGleb Smirnoff break; 16533b3a8eb9SGleb Smirnoff } 16543b3a8eb9SGleb Smirnoff /* grab some defaults from the existing one */ 16553b3a8eb9SGleb Smirnoff if (nfs->sched_nr == 0) /* reuse */ 16563b3a8eb9SGleb Smirnoff nfs->sched_nr = fs->fs.sched_nr; 16573b3a8eb9SGleb Smirnoff for (j = 0; j < sizeof(nfs->par)/sizeof(nfs->par[0]); j++) { 16583b3a8eb9SGleb Smirnoff if (nfs->par[j] == -1) /* reuse */ 16593b3a8eb9SGleb Smirnoff nfs->par[j] = fs->fs.par[j]; 16603b3a8eb9SGleb Smirnoff } 16613b3a8eb9SGleb Smirnoff if (bcmp(&fs->fs, nfs, sizeof(*nfs)) == 0) { 16623b3a8eb9SGleb Smirnoff ND("flowset %d unchanged", i); 166391336b40SDon Lewis #ifdef NEW_AQM 16640ac43d97SMarius Strobl if (ep != NULL) { 16650ac43d97SMarius Strobl /* 16660ac43d97SMarius Strobl * Reconfigure AQM as the parameters can be changed. 16670ac43d97SMarius Strobl * We consider the flowset as busy if it has scheduler 16680ac43d97SMarius Strobl * instance(s). 
166991336b40SDon Lewis */ 167091336b40SDon Lewis s = locate_scheduler(nfs->sched_nr); 16710ac43d97SMarius Strobl config_aqm(fs, ep, s != NULL && s->siht != NULL); 16720ac43d97SMarius Strobl } 167391336b40SDon Lewis #endif 16743b3a8eb9SGleb Smirnoff break; /* no change, nothing to do */ 16753b3a8eb9SGleb Smirnoff } 1676fe3bcfbdSTom Jones if (oldc != V_dn_cfg.fsk_count) /* new item */ 1677fe3bcfbdSTom Jones V_dn_cfg.id++; 16783b3a8eb9SGleb Smirnoff s = locate_scheduler(nfs->sched_nr); 16793b3a8eb9SGleb Smirnoff /* detach from old scheduler if needed, preserving 16803b3a8eb9SGleb Smirnoff * queues if we need to reattach. Then update the 16813b3a8eb9SGleb Smirnoff * configuration, and possibly attach to the new sched. 16823b3a8eb9SGleb Smirnoff */ 16833b3a8eb9SGleb Smirnoff DX(2, "fs %d changed sched %d@%p to %d@%p", 16843b3a8eb9SGleb Smirnoff fs->fs.fs_nr, 16853b3a8eb9SGleb Smirnoff fs->fs.sched_nr, fs->sched, nfs->sched_nr, s); 16863b3a8eb9SGleb Smirnoff if (fs->sched) { 16873b3a8eb9SGleb Smirnoff int flags = s ? 
DN_DETACH : (DN_DETACH | DN_DESTROY); 16883b3a8eb9SGleb Smirnoff flags |= DN_DESTROY; /* XXX temporary */ 16893b3a8eb9SGleb Smirnoff fsk_detach(fs, flags); 16903b3a8eb9SGleb Smirnoff } 16913b3a8eb9SGleb Smirnoff fs->fs = *nfs; /* copy configuration */ 169291336b40SDon Lewis #ifdef NEW_AQM 169391336b40SDon Lewis fs->aqmfp = NULL; 16940ac43d97SMarius Strobl if (ep != NULL) 16950ac43d97SMarius Strobl config_aqm(fs, ep, s != NULL && 16960ac43d97SMarius Strobl s->siht != NULL); 169791336b40SDon Lewis #endif 16983b3a8eb9SGleb Smirnoff if (s != NULL) 16993b3a8eb9SGleb Smirnoff fsk_attach(fs, s); 17003b3a8eb9SGleb Smirnoff } while (0); 17013b3a8eb9SGleb Smirnoff if (!locked) 17023b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 17030ac43d97SMarius Strobl #ifdef NEW_AQM 17040ac43d97SMarius Strobl free(ep, M_TEMP); 17050ac43d97SMarius Strobl #endif 17063b3a8eb9SGleb Smirnoff return fs; 17073b3a8eb9SGleb Smirnoff } 17083b3a8eb9SGleb Smirnoff 17093b3a8eb9SGleb Smirnoff /* 17103b3a8eb9SGleb Smirnoff * config/reconfig a scheduler and its FIFO variant. 17113b3a8eb9SGleb Smirnoff * For !MULTIQUEUE schedulers, also set up the flowset. 17123b3a8eb9SGleb Smirnoff * 17133b3a8eb9SGleb Smirnoff * On reconfigurations (detected because s->fp is set), 17143b3a8eb9SGleb Smirnoff * detach existing flowsets preserving traffic, preserve link, 17153b3a8eb9SGleb Smirnoff * and delete the old scheduler creating a new one. 
17163b3a8eb9SGleb Smirnoff */ 17173b3a8eb9SGleb Smirnoff static int 17183b3a8eb9SGleb Smirnoff config_sched(struct dn_sch *_nsch, struct dn_id *arg) 17193b3a8eb9SGleb Smirnoff { 17203b3a8eb9SGleb Smirnoff struct dn_schk *s; 17213b3a8eb9SGleb Smirnoff struct schk_new_arg a; /* argument for schk_new */ 17223b3a8eb9SGleb Smirnoff int i; 17233b3a8eb9SGleb Smirnoff struct dn_link p; /* copy of oldlink */ 17243b3a8eb9SGleb Smirnoff struct dn_profile *pf = NULL; /* copy of old link profile */ 17253b3a8eb9SGleb Smirnoff /* Used to preserv mask parameter */ 17263b3a8eb9SGleb Smirnoff struct ipfw_flow_id new_mask; 17273b3a8eb9SGleb Smirnoff int new_buckets = 0; 17283b3a8eb9SGleb Smirnoff int new_flags = 0; 17293b3a8eb9SGleb Smirnoff int pipe_cmd; 17303b3a8eb9SGleb Smirnoff int err = ENOMEM; 17313b3a8eb9SGleb Smirnoff 173251d73df1SKristof Provost NET_EPOCH_ASSERT(); 173351d73df1SKristof Provost 17343b3a8eb9SGleb Smirnoff a.sch = _nsch; 17353b3a8eb9SGleb Smirnoff if (a.sch->oid.len != sizeof(*a.sch)) { 17363b3a8eb9SGleb Smirnoff D("bad sched len %d", a.sch->oid.len); 17373b3a8eb9SGleb Smirnoff return EINVAL; 17383b3a8eb9SGleb Smirnoff } 17393b3a8eb9SGleb Smirnoff i = a.sch->sched_nr; 17403b3a8eb9SGleb Smirnoff if (i <= 0 || i >= DN_MAX_ID) 17413b3a8eb9SGleb Smirnoff return EINVAL; 17423b3a8eb9SGleb Smirnoff /* make sure we have some buckets */ 17433b3a8eb9SGleb Smirnoff if (a.sch->flags & DN_HAVE_MASK) 1744fe3bcfbdSTom Jones ipdn_bound_var((int *)&a.sch->buckets, V_dn_cfg.hash_size, 1745fe3bcfbdSTom Jones 1, V_dn_cfg.max_hash_size, "sched buckets"); 17463b3a8eb9SGleb Smirnoff /* XXX other sanity checks */ 17473b3a8eb9SGleb Smirnoff bzero(&p, sizeof(p)); 17483b3a8eb9SGleb Smirnoff 17493b3a8eb9SGleb Smirnoff pipe_cmd = a.sch->flags & DN_PIPE_CMD; 17503b3a8eb9SGleb Smirnoff a.sch->flags &= ~DN_PIPE_CMD; //XXX do it even if is not set? 
17513b3a8eb9SGleb Smirnoff if (pipe_cmd) { 17523b3a8eb9SGleb Smirnoff /* Copy mask parameter */ 17533b3a8eb9SGleb Smirnoff new_mask = a.sch->sched_mask; 17543b3a8eb9SGleb Smirnoff new_buckets = a.sch->buckets; 17553b3a8eb9SGleb Smirnoff new_flags = a.sch->flags; 17563b3a8eb9SGleb Smirnoff } 17573b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 17583b3a8eb9SGleb Smirnoff again: /* run twice, for wfq and fifo */ 17593b3a8eb9SGleb Smirnoff /* 17603b3a8eb9SGleb Smirnoff * lookup the type. If not supplied, use the previous one 17613b3a8eb9SGleb Smirnoff * or default to WF2Q+. Otherwise, return an error. 17623b3a8eb9SGleb Smirnoff */ 1763fe3bcfbdSTom Jones V_dn_cfg.id++; 17643b3a8eb9SGleb Smirnoff a.fp = find_sched_type(a.sch->oid.subtype, a.sch->name); 17653b3a8eb9SGleb Smirnoff if (a.fp != NULL) { 17663b3a8eb9SGleb Smirnoff /* found. Lookup or create entry */ 1767fe3bcfbdSTom Jones s = dn_ht_find(V_dn_cfg.schedhash, i, DNHT_INSERT, &a); 17683b3a8eb9SGleb Smirnoff } else if (a.sch->oid.subtype == 0 && !a.sch->name[0]) { 17693b3a8eb9SGleb Smirnoff /* No type. search existing s* or retry with WF2Q+ */ 1770fe3bcfbdSTom Jones s = dn_ht_find(V_dn_cfg.schedhash, i, 0, &a); 17713b3a8eb9SGleb Smirnoff if (s != NULL) { 17723b3a8eb9SGleb Smirnoff a.fp = s->fp; 17733b3a8eb9SGleb Smirnoff /* Scheduler exists, skip to FIFO scheduler 17743b3a8eb9SGleb Smirnoff * if command was pipe config... 17753b3a8eb9SGleb Smirnoff */ 17763b3a8eb9SGleb Smirnoff if (pipe_cmd) 17773b3a8eb9SGleb Smirnoff goto next; 17783b3a8eb9SGleb Smirnoff } else { 17793b3a8eb9SGleb Smirnoff /* New scheduler, create a wf2q+ with no mask 17803b3a8eb9SGleb Smirnoff * if command was pipe config... 
17813b3a8eb9SGleb Smirnoff */ 17823b3a8eb9SGleb Smirnoff if (pipe_cmd) { 17833b3a8eb9SGleb Smirnoff /* clear mask parameter */ 17843b3a8eb9SGleb Smirnoff bzero(&a.sch->sched_mask, sizeof(new_mask)); 17853b3a8eb9SGleb Smirnoff a.sch->buckets = 0; 17863b3a8eb9SGleb Smirnoff a.sch->flags &= ~DN_HAVE_MASK; 17873b3a8eb9SGleb Smirnoff } 17883b3a8eb9SGleb Smirnoff a.sch->oid.subtype = DN_SCHED_WF2QP; 17893b3a8eb9SGleb Smirnoff goto again; 17903b3a8eb9SGleb Smirnoff } 17913b3a8eb9SGleb Smirnoff } else { 17923b3a8eb9SGleb Smirnoff D("invalid scheduler type %d %s", 17933b3a8eb9SGleb Smirnoff a.sch->oid.subtype, a.sch->name); 17943b3a8eb9SGleb Smirnoff err = EINVAL; 17953b3a8eb9SGleb Smirnoff goto error; 17963b3a8eb9SGleb Smirnoff } 17973b3a8eb9SGleb Smirnoff /* normalize name and subtype */ 17983b3a8eb9SGleb Smirnoff a.sch->oid.subtype = a.fp->type; 17993b3a8eb9SGleb Smirnoff bzero(a.sch->name, sizeof(a.sch->name)); 18003b3a8eb9SGleb Smirnoff strlcpy(a.sch->name, a.fp->name, sizeof(a.sch->name)); 18013b3a8eb9SGleb Smirnoff if (s == NULL) { 18023b3a8eb9SGleb Smirnoff D("cannot allocate scheduler %d", i); 18033b3a8eb9SGleb Smirnoff goto error; 18043b3a8eb9SGleb Smirnoff } 18053b3a8eb9SGleb Smirnoff /* restore existing link if any */ 18063b3a8eb9SGleb Smirnoff if (p.link_nr) { 18073b3a8eb9SGleb Smirnoff s->link = p; 18083b3a8eb9SGleb Smirnoff if (!pf || pf->link_nr != p.link_nr) { /* no saved value */ 18093b3a8eb9SGleb Smirnoff s->profile = NULL; /* XXX maybe not needed */ 18103b3a8eb9SGleb Smirnoff } else { 18113b3a8eb9SGleb Smirnoff s->profile = malloc(sizeof(struct dn_profile), 18123b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT | M_ZERO); 18133b3a8eb9SGleb Smirnoff if (s->profile == NULL) { 18143b3a8eb9SGleb Smirnoff D("cannot allocate profile"); 18153b3a8eb9SGleb Smirnoff goto error; //XXX 18163b3a8eb9SGleb Smirnoff } 18170ac43d97SMarius Strobl memcpy(s->profile, pf, sizeof(*pf)); 18183b3a8eb9SGleb Smirnoff } 18193b3a8eb9SGleb Smirnoff } 18203b3a8eb9SGleb Smirnoff p.link_nr = 
0; 18213b3a8eb9SGleb Smirnoff if (s->fp == NULL) { 18223b3a8eb9SGleb Smirnoff DX(2, "sched %d new type %s", i, a.fp->name); 18233b3a8eb9SGleb Smirnoff } else if (s->fp != a.fp || 18243b3a8eb9SGleb Smirnoff bcmp(a.sch, &s->sch, sizeof(*a.sch)) ) { 18253b3a8eb9SGleb Smirnoff /* already existing. */ 18263b3a8eb9SGleb Smirnoff DX(2, "sched %d type changed from %s to %s", 18273b3a8eb9SGleb Smirnoff i, s->fp->name, a.fp->name); 18283b3a8eb9SGleb Smirnoff DX(4, " type/sub %d/%d -> %d/%d", 18293b3a8eb9SGleb Smirnoff s->sch.oid.type, s->sch.oid.subtype, 18303b3a8eb9SGleb Smirnoff a.sch->oid.type, a.sch->oid.subtype); 18313b3a8eb9SGleb Smirnoff if (s->link.link_nr == 0) 18323b3a8eb9SGleb Smirnoff D("XXX WARNING link 0 for sched %d", i); 18333b3a8eb9SGleb Smirnoff p = s->link; /* preserve link */ 18343b3a8eb9SGleb Smirnoff if (s->profile) {/* preserve profile */ 18353b3a8eb9SGleb Smirnoff if (!pf) 18363b3a8eb9SGleb Smirnoff pf = malloc(sizeof(*pf), 18373b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT | M_ZERO); 18383b3a8eb9SGleb Smirnoff if (pf) /* XXX should issue a warning otherwise */ 18390ac43d97SMarius Strobl memcpy(pf, s->profile, sizeof(*pf)); 18403b3a8eb9SGleb Smirnoff } 18413b3a8eb9SGleb Smirnoff /* remove from the hash */ 1842fe3bcfbdSTom Jones dn_ht_find(V_dn_cfg.schedhash, i, DNHT_REMOVE, NULL); 18433b3a8eb9SGleb Smirnoff /* Detach flowsets, preserve queues. 
*/ 18443b3a8eb9SGleb Smirnoff // schk_delete_cb(s, NULL); 18453b3a8eb9SGleb Smirnoff // XXX temporarily, kill queues 18463b3a8eb9SGleb Smirnoff schk_delete_cb(s, (void *)DN_DESTROY); 18473b3a8eb9SGleb Smirnoff goto again; 18483b3a8eb9SGleb Smirnoff } else { 18493b3a8eb9SGleb Smirnoff DX(4, "sched %d unchanged type %s", i, a.fp->name); 18503b3a8eb9SGleb Smirnoff } 18513b3a8eb9SGleb Smirnoff /* complete initialization */ 18523b3a8eb9SGleb Smirnoff s->sch = *a.sch; 18533b3a8eb9SGleb Smirnoff s->fp = a.fp; 18543b3a8eb9SGleb Smirnoff s->cfg = arg; 18553b3a8eb9SGleb Smirnoff // XXX schk_reset_credit(s); 18563b3a8eb9SGleb Smirnoff /* create the internal flowset if needed, 18573b3a8eb9SGleb Smirnoff * trying to reuse existing ones if available 18583b3a8eb9SGleb Smirnoff */ 18593b3a8eb9SGleb Smirnoff if (!(s->fp->flags & DN_MULTIQUEUE) && !s->fs) { 1860fe3bcfbdSTom Jones s->fs = dn_ht_find(V_dn_cfg.fshash, i, 0, NULL); 18613b3a8eb9SGleb Smirnoff if (!s->fs) { 18623b3a8eb9SGleb Smirnoff struct dn_fs fs; 18633b3a8eb9SGleb Smirnoff bzero(&fs, sizeof(fs)); 18643b3a8eb9SGleb Smirnoff set_oid(&fs.oid, DN_FS, sizeof(fs)); 18653b3a8eb9SGleb Smirnoff fs.fs_nr = i + DN_MAX_ID; 18663b3a8eb9SGleb Smirnoff fs.sched_nr = i; 18673b3a8eb9SGleb Smirnoff s->fs = config_fs(&fs, NULL, 1 /* locked */); 18683b3a8eb9SGleb Smirnoff } 18693b3a8eb9SGleb Smirnoff if (!s->fs) { 18703b3a8eb9SGleb Smirnoff schk_delete_cb(s, (void *)DN_DESTROY); 18713b3a8eb9SGleb Smirnoff D("error creating internal fs for %d", i); 18723b3a8eb9SGleb Smirnoff goto error; 18733b3a8eb9SGleb Smirnoff } 18743b3a8eb9SGleb Smirnoff } 18753b3a8eb9SGleb Smirnoff /* call init function after the flowset is created */ 18763b3a8eb9SGleb Smirnoff if (s->fp->config) 18773b3a8eb9SGleb Smirnoff s->fp->config(s); 18783b3a8eb9SGleb Smirnoff update_fs(s); 18793b3a8eb9SGleb Smirnoff next: 18803b3a8eb9SGleb Smirnoff if (i < DN_MAX_ID) { /* now configure the FIFO instance */ 18813b3a8eb9SGleb Smirnoff i += DN_MAX_ID; 18823b3a8eb9SGleb Smirnoff 
if (pipe_cmd) { 18833b3a8eb9SGleb Smirnoff /* Restore mask parameter for FIFO */ 18843b3a8eb9SGleb Smirnoff a.sch->sched_mask = new_mask; 18853b3a8eb9SGleb Smirnoff a.sch->buckets = new_buckets; 18863b3a8eb9SGleb Smirnoff a.sch->flags = new_flags; 18873b3a8eb9SGleb Smirnoff } else { 18883b3a8eb9SGleb Smirnoff /* sched config shouldn't modify the FIFO scheduler */ 1889fe3bcfbdSTom Jones if (dn_ht_find(V_dn_cfg.schedhash, i, 0, &a) != NULL) { 18903b3a8eb9SGleb Smirnoff /* FIFO already exist, don't touch it */ 18913b3a8eb9SGleb Smirnoff err = 0; /* and this is not an error */ 18923b3a8eb9SGleb Smirnoff goto error; 18933b3a8eb9SGleb Smirnoff } 18943b3a8eb9SGleb Smirnoff } 18953b3a8eb9SGleb Smirnoff a.sch->sched_nr = i; 18963b3a8eb9SGleb Smirnoff a.sch->oid.subtype = DN_SCHED_FIFO; 18973b3a8eb9SGleb Smirnoff bzero(a.sch->name, sizeof(a.sch->name)); 18983b3a8eb9SGleb Smirnoff goto again; 18993b3a8eb9SGleb Smirnoff } 19003b3a8eb9SGleb Smirnoff err = 0; 19013b3a8eb9SGleb Smirnoff error: 19023b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 19033b3a8eb9SGleb Smirnoff free(pf, M_DUMMYNET); 19043b3a8eb9SGleb Smirnoff return err; 19053b3a8eb9SGleb Smirnoff } 19063b3a8eb9SGleb Smirnoff 19073b3a8eb9SGleb Smirnoff /* 19083b3a8eb9SGleb Smirnoff * attach a profile to a link 19093b3a8eb9SGleb Smirnoff */ 19103b3a8eb9SGleb Smirnoff static int 19113b3a8eb9SGleb Smirnoff config_profile(struct dn_profile *pf, struct dn_id *arg) 19123b3a8eb9SGleb Smirnoff { 19133b3a8eb9SGleb Smirnoff struct dn_schk *s; 19143b3a8eb9SGleb Smirnoff int i, olen, err = 0; 19153b3a8eb9SGleb Smirnoff 19163b3a8eb9SGleb Smirnoff if (pf->oid.len < sizeof(*pf)) { 19173b3a8eb9SGleb Smirnoff D("short profile len %d", pf->oid.len); 19183b3a8eb9SGleb Smirnoff return EINVAL; 19193b3a8eb9SGleb Smirnoff } 19203b3a8eb9SGleb Smirnoff i = pf->link_nr; 19213b3a8eb9SGleb Smirnoff if (i <= 0 || i >= DN_MAX_ID) 19223b3a8eb9SGleb Smirnoff return EINVAL; 19233b3a8eb9SGleb Smirnoff /* XXX other sanity checks */ 19243b3a8eb9SGleb Smirnoff 
DN_BH_WLOCK(); 19253b3a8eb9SGleb Smirnoff for (; i < 2*DN_MAX_ID; i += DN_MAX_ID) { 19263b3a8eb9SGleb Smirnoff s = locate_scheduler(i); 19273b3a8eb9SGleb Smirnoff 19283b3a8eb9SGleb Smirnoff if (s == NULL) { 19293b3a8eb9SGleb Smirnoff err = EINVAL; 19303b3a8eb9SGleb Smirnoff break; 19313b3a8eb9SGleb Smirnoff } 1932fe3bcfbdSTom Jones V_dn_cfg.id++; 19333b3a8eb9SGleb Smirnoff /* 19343b3a8eb9SGleb Smirnoff * If we had a profile and the new one does not fit, 19353b3a8eb9SGleb Smirnoff * or it is deleted, then we need to free memory. 19363b3a8eb9SGleb Smirnoff */ 19373b3a8eb9SGleb Smirnoff if (s->profile && (pf->samples_no == 0 || 19383b3a8eb9SGleb Smirnoff s->profile->oid.len < pf->oid.len)) { 19393b3a8eb9SGleb Smirnoff free(s->profile, M_DUMMYNET); 19403b3a8eb9SGleb Smirnoff s->profile = NULL; 19413b3a8eb9SGleb Smirnoff } 19423b3a8eb9SGleb Smirnoff if (pf->samples_no == 0) 19433b3a8eb9SGleb Smirnoff continue; 19443b3a8eb9SGleb Smirnoff /* 19453b3a8eb9SGleb Smirnoff * new profile, possibly allocate memory 19463b3a8eb9SGleb Smirnoff * and copy data. 
19473b3a8eb9SGleb Smirnoff */ 19483b3a8eb9SGleb Smirnoff if (s->profile == NULL) 19493b3a8eb9SGleb Smirnoff s->profile = malloc(pf->oid.len, 19503b3a8eb9SGleb Smirnoff M_DUMMYNET, M_NOWAIT | M_ZERO); 19513b3a8eb9SGleb Smirnoff if (s->profile == NULL) { 19523b3a8eb9SGleb Smirnoff D("no memory for profile %d", i); 19533b3a8eb9SGleb Smirnoff err = ENOMEM; 19543b3a8eb9SGleb Smirnoff break; 19553b3a8eb9SGleb Smirnoff } 19563b3a8eb9SGleb Smirnoff /* preserve larger length XXX double check */ 19573b3a8eb9SGleb Smirnoff olen = s->profile->oid.len; 19583b3a8eb9SGleb Smirnoff if (olen < pf->oid.len) 19593b3a8eb9SGleb Smirnoff olen = pf->oid.len; 19600ac43d97SMarius Strobl memcpy(s->profile, pf, pf->oid.len); 19613b3a8eb9SGleb Smirnoff s->profile->oid.len = olen; 19623b3a8eb9SGleb Smirnoff } 19633b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 19643b3a8eb9SGleb Smirnoff return err; 19653b3a8eb9SGleb Smirnoff } 19663b3a8eb9SGleb Smirnoff 19673b3a8eb9SGleb Smirnoff /* 19683b3a8eb9SGleb Smirnoff * Delete all objects: 19693b3a8eb9SGleb Smirnoff */ 19703b3a8eb9SGleb Smirnoff static void 19713b3a8eb9SGleb Smirnoff dummynet_flush(void) 19723b3a8eb9SGleb Smirnoff { 19733b3a8eb9SGleb Smirnoff 19743b3a8eb9SGleb Smirnoff /* delete all schedulers and related links/queues/flowsets */ 1975fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.schedhash, schk_delete_cb, 19763b3a8eb9SGleb Smirnoff (void *)(uintptr_t)DN_DELETE_FS); 19773b3a8eb9SGleb Smirnoff /* delete all remaining (unlinked) flowsets */ 1978fe3bcfbdSTom Jones DX(4, "still %d unlinked fs", V_dn_cfg.fsk_count); 1979fe3bcfbdSTom Jones dn_ht_free(V_dn_cfg.fshash, DNHT_REMOVE); 1980fe3bcfbdSTom Jones fsk_detach_list(&V_dn_cfg.fsu, DN_DELETE_FS); 19813b3a8eb9SGleb Smirnoff /* Reinitialize system heap... */ 1982fe3bcfbdSTom Jones heap_init(&V_dn_cfg.evheap, 16, offsetof(struct dn_id, id)); 19833b3a8eb9SGleb Smirnoff } 19843b3a8eb9SGleb Smirnoff 19853b3a8eb9SGleb Smirnoff /* 19863b3a8eb9SGleb Smirnoff * Main handler for configuration. 
We are guaranteed to be called 19873b3a8eb9SGleb Smirnoff * with an oid which is at least a dn_id. 19883b3a8eb9SGleb Smirnoff * - the first object is the command (config, delete, flush, ...) 19893b3a8eb9SGleb Smirnoff * - config_link must be issued after the corresponding config_sched 1990a4641f4eSPedro F. Giffuni * - parameters (DN_TXT) for an object must precede the object 19913b3a8eb9SGleb Smirnoff * processed on a config_sched. 19923b3a8eb9SGleb Smirnoff */ 19933b3a8eb9SGleb Smirnoff int 19943b3a8eb9SGleb Smirnoff do_config(void *p, int l) 19953b3a8eb9SGleb Smirnoff { 19960ac43d97SMarius Strobl struct dn_id o; 19970ac43d97SMarius Strobl union { 19980ac43d97SMarius Strobl struct dn_profile profile; 19990ac43d97SMarius Strobl struct dn_fs fs; 20000ac43d97SMarius Strobl struct dn_link link; 20010ac43d97SMarius Strobl struct dn_sch sched; 20020ac43d97SMarius Strobl } *dn; 20030ac43d97SMarius Strobl struct dn_id *arg; 20040ac43d97SMarius Strobl uintptr_t a; 20050ac43d97SMarius Strobl int err, err2, off; 20063b3a8eb9SGleb Smirnoff 20070ac43d97SMarius Strobl memcpy(&o, p, sizeof(o)); 20080ac43d97SMarius Strobl if (o.id != DN_API_VERSION) { 20090ac43d97SMarius Strobl D("invalid api version got %d need %d", o.id, DN_API_VERSION); 20103b3a8eb9SGleb Smirnoff return EINVAL; 20113b3a8eb9SGleb Smirnoff } 20120ac43d97SMarius Strobl arg = NULL; 20130ac43d97SMarius Strobl dn = NULL; 20140ac43d97SMarius Strobl for (off = 0; l >= sizeof(o); memcpy(&o, (char *)p + off, sizeof(o))) { 20150ac43d97SMarius Strobl if (o.len < sizeof(o) || l < o.len) { 20160ac43d97SMarius Strobl D("bad len o.len %d len %d", o.len, l); 20173b3a8eb9SGleb Smirnoff err = EINVAL; 20183b3a8eb9SGleb Smirnoff break; 20193b3a8eb9SGleb Smirnoff } 20200ac43d97SMarius Strobl l -= o.len; 20213b3a8eb9SGleb Smirnoff err = 0; 20220ac43d97SMarius Strobl switch (o.type) { 20233b3a8eb9SGleb Smirnoff default: 20240ac43d97SMarius Strobl D("cmd %d not implemented", o.type); 20253b3a8eb9SGleb Smirnoff break; 20263b3a8eb9SGleb 
Smirnoff 20273b3a8eb9SGleb Smirnoff #ifdef EMULATE_SYSCTL 20283b3a8eb9SGleb Smirnoff /* sysctl emulation. 20293b3a8eb9SGleb Smirnoff * if we recognize the command, jump to the correct 20303b3a8eb9SGleb Smirnoff * handler and return 20313b3a8eb9SGleb Smirnoff */ 20323b3a8eb9SGleb Smirnoff case DN_SYSCTL_SET: 20333b3a8eb9SGleb Smirnoff err = kesysctl_emu_set(p, l); 20343b3a8eb9SGleb Smirnoff return err; 20353b3a8eb9SGleb Smirnoff #endif 20363b3a8eb9SGleb Smirnoff 20373b3a8eb9SGleb Smirnoff case DN_CMD_CONFIG: /* simply a header */ 20383b3a8eb9SGleb Smirnoff break; 20393b3a8eb9SGleb Smirnoff 20403b3a8eb9SGleb Smirnoff case DN_CMD_DELETE: 20413b3a8eb9SGleb Smirnoff /* the argument is in the first uintptr_t after o */ 20420ac43d97SMarius Strobl if (o.len < sizeof(o) + sizeof(a)) { 20433b3a8eb9SGleb Smirnoff err = EINVAL; 20443b3a8eb9SGleb Smirnoff break; 20453b3a8eb9SGleb Smirnoff } 20460ac43d97SMarius Strobl memcpy(&a, (char *)p + off + sizeof(o), sizeof(a)); 20470ac43d97SMarius Strobl switch (o.subtype) { 20483b3a8eb9SGleb Smirnoff case DN_LINK: 20493b3a8eb9SGleb Smirnoff /* delete base and derived schedulers */ 20503b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 20510ac43d97SMarius Strobl err = delete_schk(a); 20520ac43d97SMarius Strobl err2 = delete_schk(a + DN_MAX_ID); 20533b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 20543b3a8eb9SGleb Smirnoff if (!err) 20553b3a8eb9SGleb Smirnoff err = err2; 20563b3a8eb9SGleb Smirnoff break; 20573b3a8eb9SGleb Smirnoff 20583b3a8eb9SGleb Smirnoff default: 20590ac43d97SMarius Strobl D("invalid delete type %d", o.subtype); 20603b3a8eb9SGleb Smirnoff err = EINVAL; 20613b3a8eb9SGleb Smirnoff break; 20623b3a8eb9SGleb Smirnoff 20633b3a8eb9SGleb Smirnoff case DN_FS: 20640ac43d97SMarius Strobl err = (a < 1 || a >= DN_MAX_ID) ? 
20650ac43d97SMarius Strobl EINVAL : delete_fs(a, 0) ; 20663b3a8eb9SGleb Smirnoff break; 20673b3a8eb9SGleb Smirnoff } 20683b3a8eb9SGleb Smirnoff break; 20693b3a8eb9SGleb Smirnoff 20703b3a8eb9SGleb Smirnoff case DN_CMD_FLUSH: 20713b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 20723b3a8eb9SGleb Smirnoff dummynet_flush(); 20733b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 20743b3a8eb9SGleb Smirnoff break; 20750ac43d97SMarius Strobl case DN_TEXT: /* store argument of next block */ 20760ac43d97SMarius Strobl free(arg, M_TEMP); 207751d73df1SKristof Provost arg = malloc(o.len, M_TEMP, M_NOWAIT); 207851d73df1SKristof Provost if (arg == NULL) { 207951d73df1SKristof Provost err = ENOMEM; 208051d73df1SKristof Provost break; 208151d73df1SKristof Provost } 20820ac43d97SMarius Strobl memcpy(arg, (char *)p + off, o.len); 20833b3a8eb9SGleb Smirnoff break; 20843b3a8eb9SGleb Smirnoff case DN_LINK: 20850ac43d97SMarius Strobl if (dn == NULL) 208651d73df1SKristof Provost dn = malloc(sizeof(*dn), M_TEMP, M_NOWAIT); 208751d73df1SKristof Provost if (dn == NULL) { 208851d73df1SKristof Provost err = ENOMEM; 208951d73df1SKristof Provost break; 209051d73df1SKristof Provost } 20910ac43d97SMarius Strobl memcpy(&dn->link, (char *)p + off, sizeof(dn->link)); 20920ac43d97SMarius Strobl err = config_link(&dn->link, arg); 20933b3a8eb9SGleb Smirnoff break; 20943b3a8eb9SGleb Smirnoff case DN_PROFILE: 20950ac43d97SMarius Strobl if (dn == NULL) 209651d73df1SKristof Provost dn = malloc(sizeof(*dn), M_TEMP, M_NOWAIT); 209751d73df1SKristof Provost if (dn == NULL) { 209851d73df1SKristof Provost err = ENOMEM; 209951d73df1SKristof Provost break; 210051d73df1SKristof Provost } 21010ac43d97SMarius Strobl memcpy(&dn->profile, (char *)p + off, 21020ac43d97SMarius Strobl sizeof(dn->profile)); 21030ac43d97SMarius Strobl err = config_profile(&dn->profile, arg); 21043b3a8eb9SGleb Smirnoff break; 21053b3a8eb9SGleb Smirnoff case DN_SCH: 21060ac43d97SMarius Strobl if (dn == NULL) 210751d73df1SKristof Provost dn = malloc(sizeof(*dn), 
M_TEMP, M_NOWAIT); 210851d73df1SKristof Provost if (dn == NULL) { 210951d73df1SKristof Provost err = ENOMEM; 211051d73df1SKristof Provost break; 211151d73df1SKristof Provost } 21120ac43d97SMarius Strobl memcpy(&dn->sched, (char *)p + off, 21130ac43d97SMarius Strobl sizeof(dn->sched)); 21140ac43d97SMarius Strobl err = config_sched(&dn->sched, arg); 21153b3a8eb9SGleb Smirnoff break; 21163b3a8eb9SGleb Smirnoff case DN_FS: 21170ac43d97SMarius Strobl if (dn == NULL) 211851d73df1SKristof Provost dn = malloc(sizeof(*dn), M_TEMP, M_NOWAIT); 211951d73df1SKristof Provost if (dn == NULL) { 212051d73df1SKristof Provost err = ENOMEM; 212151d73df1SKristof Provost break; 212251d73df1SKristof Provost } 21230ac43d97SMarius Strobl memcpy(&dn->fs, (char *)p + off, sizeof(dn->fs)); 21240ac43d97SMarius Strobl err = (NULL == config_fs(&dn->fs, arg, 0)); 21253b3a8eb9SGleb Smirnoff break; 21263b3a8eb9SGleb Smirnoff } 21273b3a8eb9SGleb Smirnoff if (err != 0) 21283b3a8eb9SGleb Smirnoff break; 21290ac43d97SMarius Strobl off += o.len; 21303b3a8eb9SGleb Smirnoff } 21310ac43d97SMarius Strobl free(arg, M_TEMP); 21320ac43d97SMarius Strobl free(dn, M_TEMP); 21333b3a8eb9SGleb Smirnoff return err; 21343b3a8eb9SGleb Smirnoff } 21353b3a8eb9SGleb Smirnoff 21363b3a8eb9SGleb Smirnoff static int 21373b3a8eb9SGleb Smirnoff compute_space(struct dn_id *cmd, struct copy_args *a) 21383b3a8eb9SGleb Smirnoff { 21393b3a8eb9SGleb Smirnoff int x = 0, need = 0; 21403b3a8eb9SGleb Smirnoff int profile_size = sizeof(struct dn_profile) - 21413b3a8eb9SGleb Smirnoff ED_MAX_SAMPLES_NO*sizeof(int); 21423b3a8eb9SGleb Smirnoff 21433b3a8eb9SGleb Smirnoff /* NOTE about compute space: 2144fe3bcfbdSTom Jones * NP = V_dn_cfg.schk_count 2145fe3bcfbdSTom Jones * NSI = V_dn_cfg.si_count 2146fe3bcfbdSTom Jones * NF = V_dn_cfg.fsk_count 2147fe3bcfbdSTom Jones * NQ = V_dn_cfg.queue_count 21483b3a8eb9SGleb Smirnoff * - ipfw pipe show 21493b3a8eb9SGleb Smirnoff * (NP/2)*(dn_link + dn_sch + dn_id + dn_fs) only half scheduler 
21503b3a8eb9SGleb Smirnoff * link, scheduler template, flowset 21513b3a8eb9SGleb Smirnoff * integrated in scheduler and header 21523b3a8eb9SGleb Smirnoff * for flowset list 21533b3a8eb9SGleb Smirnoff * (NSI)*(dn_flow) all scheduler instance (includes 21543b3a8eb9SGleb Smirnoff * the queue instance) 21553b3a8eb9SGleb Smirnoff * - ipfw sched show 21563b3a8eb9SGleb Smirnoff * (NP/2)*(dn_link + dn_sch + dn_id + dn_fs) only half scheduler 21573b3a8eb9SGleb Smirnoff * link, scheduler template, flowset 21583b3a8eb9SGleb Smirnoff * integrated in scheduler and header 21593b3a8eb9SGleb Smirnoff * for flowset list 21603b3a8eb9SGleb Smirnoff * (NSI * dn_flow) all scheduler instances 21613b3a8eb9SGleb Smirnoff * (NF * sizeof(uint_32)) space for flowset list linked to scheduler 21623b3a8eb9SGleb Smirnoff * (NQ * dn_queue) all queue [XXXfor now not listed] 21633b3a8eb9SGleb Smirnoff * - ipfw queue show 21643b3a8eb9SGleb Smirnoff * (NF * dn_fs) all flowset 21653b3a8eb9SGleb Smirnoff * (NQ * dn_queue) all queues 21663b3a8eb9SGleb Smirnoff */ 21673b3a8eb9SGleb Smirnoff switch (cmd->subtype) { 21683b3a8eb9SGleb Smirnoff default: 21693b3a8eb9SGleb Smirnoff return -1; 21703b3a8eb9SGleb Smirnoff /* XXX where do LINK and SCH differ ? */ 21713b3a8eb9SGleb Smirnoff /* 'ipfw sched show' could list all queues associated to 21723b3a8eb9SGleb Smirnoff * a scheduler. 
This feature for now is disabled 21733b3a8eb9SGleb Smirnoff */ 21743b3a8eb9SGleb Smirnoff case DN_LINK: /* pipe show */ 21753b3a8eb9SGleb Smirnoff x = DN_C_LINK | DN_C_SCH | DN_C_FLOW; 2176fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * 21773b3a8eb9SGleb Smirnoff (sizeof(struct dn_fs) + profile_size) / 2; 2178fe3bcfbdSTom Jones need += V_dn_cfg.fsk_count * sizeof(uint32_t); 21793b3a8eb9SGleb Smirnoff break; 21803b3a8eb9SGleb Smirnoff case DN_SCH: /* sched show */ 2181fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * 21823b3a8eb9SGleb Smirnoff (sizeof(struct dn_fs) + profile_size) / 2; 2183fe3bcfbdSTom Jones need += V_dn_cfg.fsk_count * sizeof(uint32_t); 21843b3a8eb9SGleb Smirnoff x = DN_C_SCH | DN_C_LINK | DN_C_FLOW; 21853b3a8eb9SGleb Smirnoff break; 21863b3a8eb9SGleb Smirnoff case DN_FS: /* queue show */ 21873b3a8eb9SGleb Smirnoff x = DN_C_FS | DN_C_QUEUE; 21883b3a8eb9SGleb Smirnoff break; 21893b3a8eb9SGleb Smirnoff case DN_GET_COMPAT: /* compatibility mode */ 21903b3a8eb9SGleb Smirnoff need = dn_compat_calc_size(); 21913b3a8eb9SGleb Smirnoff break; 21923b3a8eb9SGleb Smirnoff } 21933b3a8eb9SGleb Smirnoff a->flags = x; 21943b3a8eb9SGleb Smirnoff if (x & DN_C_SCH) { 2195fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * sizeof(struct dn_sch) / 2; 21963b3a8eb9SGleb Smirnoff /* NOT also, each fs might be attached to a sched */ 2197fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * sizeof(struct dn_id) / 2; 21983b3a8eb9SGleb Smirnoff } 21993b3a8eb9SGleb Smirnoff if (x & DN_C_FS) 2200fe3bcfbdSTom Jones need += V_dn_cfg.fsk_count * sizeof(struct dn_fs); 22013b3a8eb9SGleb Smirnoff if (x & DN_C_LINK) { 2202fe3bcfbdSTom Jones need += V_dn_cfg.schk_count * sizeof(struct dn_link) / 2; 22033b3a8eb9SGleb Smirnoff } 22043b3a8eb9SGleb Smirnoff /* 22053b3a8eb9SGleb Smirnoff * When exporting a queue to userland, only pass up the 22063b3a8eb9SGleb Smirnoff * struct dn_flow, which is the only visible part. 
22073b3a8eb9SGleb Smirnoff */ 22083b3a8eb9SGleb Smirnoff 22093b3a8eb9SGleb Smirnoff if (x & DN_C_QUEUE) 2210fe3bcfbdSTom Jones need += V_dn_cfg.queue_count * sizeof(struct dn_flow); 22113b3a8eb9SGleb Smirnoff if (x & DN_C_FLOW) 2212fe3bcfbdSTom Jones need += V_dn_cfg.si_count * (sizeof(struct dn_flow)); 22133b3a8eb9SGleb Smirnoff return need; 22143b3a8eb9SGleb Smirnoff } 22153b3a8eb9SGleb Smirnoff 22163b3a8eb9SGleb Smirnoff /* 22173b3a8eb9SGleb Smirnoff * If compat != NULL dummynet_get is called in compatibility mode. 22183b3a8eb9SGleb Smirnoff * *compat will be the pointer to the buffer to pass to ipfw 22193b3a8eb9SGleb Smirnoff */ 22203b3a8eb9SGleb Smirnoff int 22213b3a8eb9SGleb Smirnoff dummynet_get(struct sockopt *sopt, void **compat) 22223b3a8eb9SGleb Smirnoff { 22233b3a8eb9SGleb Smirnoff int have, i, need, error; 22243b3a8eb9SGleb Smirnoff char *start = NULL, *buf; 22253b3a8eb9SGleb Smirnoff size_t sopt_valsize; 22263b3a8eb9SGleb Smirnoff struct dn_id *cmd; 22273b3a8eb9SGleb Smirnoff struct copy_args a; 22283b3a8eb9SGleb Smirnoff struct copy_range r; 22293b3a8eb9SGleb Smirnoff int l = sizeof(struct dn_id); 22303b3a8eb9SGleb Smirnoff 22313b3a8eb9SGleb Smirnoff bzero(&a, sizeof(a)); 22323b3a8eb9SGleb Smirnoff bzero(&r, sizeof(r)); 22333b3a8eb9SGleb Smirnoff 22343b3a8eb9SGleb Smirnoff /* save and restore original sopt_valsize around copyin */ 22353b3a8eb9SGleb Smirnoff sopt_valsize = sopt->sopt_valsize; 22363b3a8eb9SGleb Smirnoff 22373b3a8eb9SGleb Smirnoff cmd = &r.o; 22383b3a8eb9SGleb Smirnoff 22393b3a8eb9SGleb Smirnoff if (!compat) { 22403b3a8eb9SGleb Smirnoff /* copy at least an oid, and possibly a full object */ 22413b3a8eb9SGleb Smirnoff error = sooptcopyin(sopt, cmd, sizeof(r), sizeof(*cmd)); 22423b3a8eb9SGleb Smirnoff sopt->sopt_valsize = sopt_valsize; 22433b3a8eb9SGleb Smirnoff if (error) 22443b3a8eb9SGleb Smirnoff goto done; 22453b3a8eb9SGleb Smirnoff l = cmd->len; 22463b3a8eb9SGleb Smirnoff #ifdef EMULATE_SYSCTL 22473b3a8eb9SGleb Smirnoff /* sysctl 
emulation. */ 22483b3a8eb9SGleb Smirnoff if (cmd->type == DN_SYSCTL_GET) 22493b3a8eb9SGleb Smirnoff return kesysctl_emu_get(sopt); 22503b3a8eb9SGleb Smirnoff #endif 22513b3a8eb9SGleb Smirnoff if (l > sizeof(r)) { 22523b3a8eb9SGleb Smirnoff /* request larger than default, allocate buffer */ 225351d73df1SKristof Provost cmd = malloc(l, M_DUMMYNET, M_NOWAIT); 225451d73df1SKristof Provost if (cmd == NULL) { 225551d73df1SKristof Provost error = ENOMEM; 225651d73df1SKristof Provost goto done; 225751d73df1SKristof Provost } 22583b3a8eb9SGleb Smirnoff error = sooptcopyin(sopt, cmd, l, l); 22593b3a8eb9SGleb Smirnoff sopt->sopt_valsize = sopt_valsize; 22603b3a8eb9SGleb Smirnoff if (error) 22613b3a8eb9SGleb Smirnoff goto done; 22623b3a8eb9SGleb Smirnoff } 22633b3a8eb9SGleb Smirnoff } else { /* compatibility */ 22643b3a8eb9SGleb Smirnoff error = 0; 22653b3a8eb9SGleb Smirnoff cmd->type = DN_CMD_GET; 22663b3a8eb9SGleb Smirnoff cmd->len = sizeof(struct dn_id); 22673b3a8eb9SGleb Smirnoff cmd->subtype = DN_GET_COMPAT; 22683b3a8eb9SGleb Smirnoff // cmd->id = sopt_valsize; 22693b3a8eb9SGleb Smirnoff D("compatibility mode"); 22703b3a8eb9SGleb Smirnoff } 227191336b40SDon Lewis 227291336b40SDon Lewis #ifdef NEW_AQM 227391336b40SDon Lewis /* get AQM params */ 227491336b40SDon Lewis if(cmd->subtype == DN_AQM_PARAMS) { 227591336b40SDon Lewis error = get_aqm_parms(sopt); 227691336b40SDon Lewis goto done; 227791336b40SDon Lewis /* get Scheduler params */ 227891336b40SDon Lewis } else if (cmd->subtype == DN_SCH_PARAMS) { 227991336b40SDon Lewis error = get_sched_parms(sopt); 228091336b40SDon Lewis goto done; 228191336b40SDon Lewis } 228291336b40SDon Lewis #endif 228391336b40SDon Lewis 22843b3a8eb9SGleb Smirnoff a.extra = (struct copy_range *)cmd; 22853b3a8eb9SGleb Smirnoff if (cmd->len == sizeof(*cmd)) { /* no range, create a default */ 22863b3a8eb9SGleb Smirnoff uint32_t *rp = (uint32_t *)(cmd + 1); 22873b3a8eb9SGleb Smirnoff cmd->len += 2* sizeof(uint32_t); 22883b3a8eb9SGleb Smirnoff rp[0] = 
1; 22893b3a8eb9SGleb Smirnoff rp[1] = DN_MAX_ID - 1; 22903b3a8eb9SGleb Smirnoff if (cmd->subtype == DN_LINK) { 22913b3a8eb9SGleb Smirnoff rp[0] += DN_MAX_ID; 22923b3a8eb9SGleb Smirnoff rp[1] += DN_MAX_ID; 22933b3a8eb9SGleb Smirnoff } 22943b3a8eb9SGleb Smirnoff } 22953b3a8eb9SGleb Smirnoff /* Count space (under lock) and allocate (outside lock). 22963b3a8eb9SGleb Smirnoff * Exit with lock held if we manage to get enough buffer. 22973b3a8eb9SGleb Smirnoff * Try a few times then give up. 22983b3a8eb9SGleb Smirnoff */ 22993b3a8eb9SGleb Smirnoff for (have = 0, i = 0; i < 10; i++) { 23003b3a8eb9SGleb Smirnoff DN_BH_WLOCK(); 23013b3a8eb9SGleb Smirnoff need = compute_space(cmd, &a); 23023b3a8eb9SGleb Smirnoff 23033b3a8eb9SGleb Smirnoff /* if there is a range, ignore value from compute_space() */ 23043b3a8eb9SGleb Smirnoff if (l > sizeof(*cmd)) 23053b3a8eb9SGleb Smirnoff need = sopt_valsize - sizeof(*cmd); 23063b3a8eb9SGleb Smirnoff 23073b3a8eb9SGleb Smirnoff if (need < 0) { 23083b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 23093b3a8eb9SGleb Smirnoff error = EINVAL; 23103b3a8eb9SGleb Smirnoff goto done; 23113b3a8eb9SGleb Smirnoff } 23123b3a8eb9SGleb Smirnoff need += sizeof(*cmd); 23133b3a8eb9SGleb Smirnoff cmd->id = need; 23143b3a8eb9SGleb Smirnoff if (have >= need) 23153b3a8eb9SGleb Smirnoff break; 23163b3a8eb9SGleb Smirnoff 23173b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 23183b3a8eb9SGleb Smirnoff free(start, M_DUMMYNET); 23193b3a8eb9SGleb Smirnoff start = NULL; 23203b3a8eb9SGleb Smirnoff if (need > sopt_valsize) 23213b3a8eb9SGleb Smirnoff break; 23223b3a8eb9SGleb Smirnoff 23233b3a8eb9SGleb Smirnoff have = need; 232451d73df1SKristof Provost start = malloc(have, M_DUMMYNET, M_NOWAIT | M_ZERO); 23253b3a8eb9SGleb Smirnoff } 23263b3a8eb9SGleb Smirnoff 23273b3a8eb9SGleb Smirnoff if (start == NULL) { 23283b3a8eb9SGleb Smirnoff if (compat) { 23293b3a8eb9SGleb Smirnoff *compat = NULL; 23303b3a8eb9SGleb Smirnoff error = 1; // XXX 23313b3a8eb9SGleb Smirnoff } else { 23323b3a8eb9SGleb 
Smirnoff error = sooptcopyout(sopt, cmd, sizeof(*cmd)); 23333b3a8eb9SGleb Smirnoff } 23343b3a8eb9SGleb Smirnoff goto done; 23353b3a8eb9SGleb Smirnoff } 23363b3a8eb9SGleb Smirnoff ND("have %d:%d sched %d, %d:%d links %d, %d:%d flowsets %d, " 23373b3a8eb9SGleb Smirnoff "%d:%d si %d, %d:%d queues %d", 2338fe3bcfbdSTom Jones V_dn_cfg.schk_count, sizeof(struct dn_sch), DN_SCH, 2339fe3bcfbdSTom Jones V_dn_cfg.schk_count, sizeof(struct dn_link), DN_LINK, 2340fe3bcfbdSTom Jones V_dn_cfg.fsk_count, sizeof(struct dn_fs), DN_FS, 2341fe3bcfbdSTom Jones V_dn_cfg.si_count, sizeof(struct dn_flow), DN_SCH_I, 2342fe3bcfbdSTom Jones V_dn_cfg.queue_count, sizeof(struct dn_queue), DN_QUEUE); 23433b3a8eb9SGleb Smirnoff sopt->sopt_valsize = sopt_valsize; 23443b3a8eb9SGleb Smirnoff a.type = cmd->subtype; 23453b3a8eb9SGleb Smirnoff 23463b3a8eb9SGleb Smirnoff if (compat == NULL) { 23470ac43d97SMarius Strobl memcpy(start, cmd, sizeof(*cmd)); 23483b3a8eb9SGleb Smirnoff ((struct dn_id*)(start))->len = sizeof(struct dn_id); 23493b3a8eb9SGleb Smirnoff buf = start + sizeof(*cmd); 23503b3a8eb9SGleb Smirnoff } else 23513b3a8eb9SGleb Smirnoff buf = start; 23523b3a8eb9SGleb Smirnoff a.start = &buf; 23533b3a8eb9SGleb Smirnoff a.end = start + have; 23543b3a8eb9SGleb Smirnoff /* start copying other objects */ 23553b3a8eb9SGleb Smirnoff if (compat) { 23563b3a8eb9SGleb Smirnoff a.type = DN_COMPAT_PIPE; 2357fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.schedhash, copy_data_helper_compat, &a); 23583b3a8eb9SGleb Smirnoff a.type = DN_COMPAT_QUEUE; 2359fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.fshash, copy_data_helper_compat, &a); 23603b3a8eb9SGleb Smirnoff } else if (a.type == DN_FS) { 2361fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.fshash, copy_data_helper, &a); 23623b3a8eb9SGleb Smirnoff } else { 2363fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.schedhash, copy_data_helper, &a); 23643b3a8eb9SGleb Smirnoff } 23653b3a8eb9SGleb Smirnoff DN_BH_WUNLOCK(); 23663b3a8eb9SGleb Smirnoff 23673b3a8eb9SGleb Smirnoff if (compat) { 
23683b3a8eb9SGleb Smirnoff *compat = start; 23693b3a8eb9SGleb Smirnoff sopt->sopt_valsize = buf - start; 23703b3a8eb9SGleb Smirnoff /* free() is done by ip_dummynet_compat() */ 23713b3a8eb9SGleb Smirnoff start = NULL; //XXX hack 23723b3a8eb9SGleb Smirnoff } else { 23733b3a8eb9SGleb Smirnoff error = sooptcopyout(sopt, start, buf - start); 23743b3a8eb9SGleb Smirnoff } 23753b3a8eb9SGleb Smirnoff done: 2376*1b2dbe37SKristof Provost if (cmd != &r.o) 23773b3a8eb9SGleb Smirnoff free(cmd, M_DUMMYNET); 23783b3a8eb9SGleb Smirnoff free(start, M_DUMMYNET); 23793b3a8eb9SGleb Smirnoff return error; 23803b3a8eb9SGleb Smirnoff } 23813b3a8eb9SGleb Smirnoff 23823b3a8eb9SGleb Smirnoff /* Callback called on scheduler instance to delete it if idle */ 23833b3a8eb9SGleb Smirnoff static int 23843b3a8eb9SGleb Smirnoff drain_scheduler_cb(void *_si, void *arg) 23853b3a8eb9SGleb Smirnoff { 23863b3a8eb9SGleb Smirnoff struct dn_sch_inst *si = _si; 23873b3a8eb9SGleb Smirnoff 23883b3a8eb9SGleb Smirnoff if ((si->kflags & DN_ACTIVE) || si->dline.mq.head != NULL) 23893b3a8eb9SGleb Smirnoff return 0; 23903b3a8eb9SGleb Smirnoff 23913b3a8eb9SGleb Smirnoff if (si->sched->fp->flags & DN_MULTIQUEUE) { 23923b3a8eb9SGleb Smirnoff if (si->q_count == 0) 23933b3a8eb9SGleb Smirnoff return si_destroy(si, NULL); 23943b3a8eb9SGleb Smirnoff else 23953b3a8eb9SGleb Smirnoff return 0; 23963b3a8eb9SGleb Smirnoff } else { /* !DN_MULTIQUEUE */ 23973b3a8eb9SGleb Smirnoff if ((si+1)->ni.length == 0) 23983b3a8eb9SGleb Smirnoff return si_destroy(si, NULL); 23993b3a8eb9SGleb Smirnoff else 24003b3a8eb9SGleb Smirnoff return 0; 24013b3a8eb9SGleb Smirnoff } 24023b3a8eb9SGleb Smirnoff return 0; /* unreachable */ 24033b3a8eb9SGleb Smirnoff } 24043b3a8eb9SGleb Smirnoff 24053b3a8eb9SGleb Smirnoff /* Callback called on scheduler to check if it has instances */ 24063b3a8eb9SGleb Smirnoff static int 24073b3a8eb9SGleb Smirnoff drain_scheduler_sch_cb(void *_s, void *arg) 24083b3a8eb9SGleb Smirnoff { 24093b3a8eb9SGleb Smirnoff struct 
dn_schk *s = _s; 24103b3a8eb9SGleb Smirnoff 24113b3a8eb9SGleb Smirnoff if (s->sch.flags & DN_HAVE_MASK) { 24123b3a8eb9SGleb Smirnoff dn_ht_scan_bucket(s->siht, &s->drain_bucket, 24133b3a8eb9SGleb Smirnoff drain_scheduler_cb, NULL); 24143b3a8eb9SGleb Smirnoff s->drain_bucket++; 24153b3a8eb9SGleb Smirnoff } else { 24163b3a8eb9SGleb Smirnoff if (s->siht) { 24173b3a8eb9SGleb Smirnoff if (drain_scheduler_cb(s->siht, NULL) == DNHT_SCAN_DEL) 24183b3a8eb9SGleb Smirnoff s->siht = NULL; 24193b3a8eb9SGleb Smirnoff } 24203b3a8eb9SGleb Smirnoff } 24213b3a8eb9SGleb Smirnoff return 0; 24223b3a8eb9SGleb Smirnoff } 24233b3a8eb9SGleb Smirnoff 24243b3a8eb9SGleb Smirnoff /* Called every tick, try to delete a 'bucket' of scheduler */ 24253b3a8eb9SGleb Smirnoff void 24263b3a8eb9SGleb Smirnoff dn_drain_scheduler(void) 24273b3a8eb9SGleb Smirnoff { 2428fe3bcfbdSTom Jones dn_ht_scan_bucket(V_dn_cfg.schedhash, &V_dn_cfg.drain_sch, 24293b3a8eb9SGleb Smirnoff drain_scheduler_sch_cb, NULL); 2430fe3bcfbdSTom Jones V_dn_cfg.drain_sch++; 24313b3a8eb9SGleb Smirnoff } 24323b3a8eb9SGleb Smirnoff 24333b3a8eb9SGleb Smirnoff /* Callback called on queue to delete if it is idle */ 24343b3a8eb9SGleb Smirnoff static int 24353b3a8eb9SGleb Smirnoff drain_queue_cb(void *_q, void *arg) 24363b3a8eb9SGleb Smirnoff { 24373b3a8eb9SGleb Smirnoff struct dn_queue *q = _q; 24383b3a8eb9SGleb Smirnoff 24393b3a8eb9SGleb Smirnoff if (q->ni.length == 0) { 24403b3a8eb9SGleb Smirnoff dn_delete_queue(q, DN_DESTROY); 24413b3a8eb9SGleb Smirnoff return DNHT_SCAN_DEL; /* queue is deleted */ 24423b3a8eb9SGleb Smirnoff } 24433b3a8eb9SGleb Smirnoff 24443b3a8eb9SGleb Smirnoff return 0; /* queue isn't deleted */ 24453b3a8eb9SGleb Smirnoff } 24463b3a8eb9SGleb Smirnoff 24473b3a8eb9SGleb Smirnoff /* Callback called on flowset used to check if it has queues */ 24483b3a8eb9SGleb Smirnoff static int 24493b3a8eb9SGleb Smirnoff drain_queue_fs_cb(void *_fs, void *arg) 24503b3a8eb9SGleb Smirnoff { 24513b3a8eb9SGleb Smirnoff struct dn_fsk *fs = 
_fs; 24523b3a8eb9SGleb Smirnoff 24533b3a8eb9SGleb Smirnoff if (fs->fs.flags & DN_QHT_HASH) { 24543b3a8eb9SGleb Smirnoff /* Flowset has a hash table for queues */ 24553b3a8eb9SGleb Smirnoff dn_ht_scan_bucket(fs->qht, &fs->drain_bucket, 24563b3a8eb9SGleb Smirnoff drain_queue_cb, NULL); 24573b3a8eb9SGleb Smirnoff fs->drain_bucket++; 24583b3a8eb9SGleb Smirnoff } else { 24593b3a8eb9SGleb Smirnoff /* No hash table for this flowset, null the pointer 24603b3a8eb9SGleb Smirnoff * if the queue is deleted 24613b3a8eb9SGleb Smirnoff */ 24623b3a8eb9SGleb Smirnoff if (fs->qht) { 24633b3a8eb9SGleb Smirnoff if (drain_queue_cb(fs->qht, NULL) == DNHT_SCAN_DEL) 24643b3a8eb9SGleb Smirnoff fs->qht = NULL; 24653b3a8eb9SGleb Smirnoff } 24663b3a8eb9SGleb Smirnoff } 24673b3a8eb9SGleb Smirnoff return 0; 24683b3a8eb9SGleb Smirnoff } 24693b3a8eb9SGleb Smirnoff 24703b3a8eb9SGleb Smirnoff /* Called every tick, try to delete a 'bucket' of queue */ 24713b3a8eb9SGleb Smirnoff void 24723b3a8eb9SGleb Smirnoff dn_drain_queue(void) 24733b3a8eb9SGleb Smirnoff { 24743b3a8eb9SGleb Smirnoff /* scan a bucket of flowset */ 2475fe3bcfbdSTom Jones dn_ht_scan_bucket(V_dn_cfg.fshash, &V_dn_cfg.drain_fs, 24763b3a8eb9SGleb Smirnoff drain_queue_fs_cb, NULL); 2477fe3bcfbdSTom Jones V_dn_cfg.drain_fs++; 24783b3a8eb9SGleb Smirnoff } 24793b3a8eb9SGleb Smirnoff 24803b3a8eb9SGleb Smirnoff /* 24813b3a8eb9SGleb Smirnoff * Handler for the various dummynet socket options 24823b3a8eb9SGleb Smirnoff */ 24833b3a8eb9SGleb Smirnoff static int 24843b3a8eb9SGleb Smirnoff ip_dn_ctl(struct sockopt *sopt) 24853b3a8eb9SGleb Smirnoff { 248651d73df1SKristof Provost struct epoch_tracker et; 24873b3a8eb9SGleb Smirnoff void *p = NULL; 24883b3a8eb9SGleb Smirnoff int error, l; 24893b3a8eb9SGleb Smirnoff 24903b3a8eb9SGleb Smirnoff error = priv_check(sopt->sopt_td, PRIV_NETINET_DUMMYNET); 24913b3a8eb9SGleb Smirnoff if (error) 24923b3a8eb9SGleb Smirnoff return (error); 24933b3a8eb9SGleb Smirnoff 24943b3a8eb9SGleb Smirnoff /* Disallow sets in 
really-really secure mode. */ 24953b3a8eb9SGleb Smirnoff if (sopt->sopt_dir == SOPT_SET) { 24963b3a8eb9SGleb Smirnoff error = securelevel_ge(sopt->sopt_td->td_ucred, 3); 24973b3a8eb9SGleb Smirnoff if (error) 24983b3a8eb9SGleb Smirnoff return (error); 24993b3a8eb9SGleb Smirnoff } 25003b3a8eb9SGleb Smirnoff 250151d73df1SKristof Provost NET_EPOCH_ENTER(et); 250251d73df1SKristof Provost 25033b3a8eb9SGleb Smirnoff switch (sopt->sopt_name) { 25043b3a8eb9SGleb Smirnoff default : 25053b3a8eb9SGleb Smirnoff D("dummynet: unknown option %d", sopt->sopt_name); 25063b3a8eb9SGleb Smirnoff error = EINVAL; 25073b3a8eb9SGleb Smirnoff break; 25083b3a8eb9SGleb Smirnoff 25093b3a8eb9SGleb Smirnoff case IP_DUMMYNET_FLUSH: 25103b3a8eb9SGleb Smirnoff case IP_DUMMYNET_CONFIGURE: 25113b3a8eb9SGleb Smirnoff case IP_DUMMYNET_DEL: /* remove a pipe or queue */ 25123b3a8eb9SGleb Smirnoff case IP_DUMMYNET_GET: 25133b3a8eb9SGleb Smirnoff D("dummynet: compat option %d", sopt->sopt_name); 25143b3a8eb9SGleb Smirnoff error = ip_dummynet_compat(sopt); 25153b3a8eb9SGleb Smirnoff break; 25163b3a8eb9SGleb Smirnoff 25173b3a8eb9SGleb Smirnoff case IP_DUMMYNET3 : 25183b3a8eb9SGleb Smirnoff if (sopt->sopt_dir == SOPT_GET) { 25193b3a8eb9SGleb Smirnoff error = dummynet_get(sopt, NULL); 25203b3a8eb9SGleb Smirnoff break; 25213b3a8eb9SGleb Smirnoff } 25223b3a8eb9SGleb Smirnoff l = sopt->sopt_valsize; 25233b3a8eb9SGleb Smirnoff if (l < sizeof(struct dn_id) || l > 12000) { 25243b3a8eb9SGleb Smirnoff D("argument len %d invalid", l); 25253b3a8eb9SGleb Smirnoff break; 25263b3a8eb9SGleb Smirnoff } 252751d73df1SKristof Provost p = malloc(l, M_TEMP, M_NOWAIT); 252851d73df1SKristof Provost if (p == NULL) { 252951d73df1SKristof Provost error = ENOMEM; 253051d73df1SKristof Provost break; 253151d73df1SKristof Provost } 25323b3a8eb9SGleb Smirnoff error = sooptcopyin(sopt, p, l, l); 25333b3a8eb9SGleb Smirnoff if (error) 25343b3a8eb9SGleb Smirnoff break ; 25353b3a8eb9SGleb Smirnoff error = do_config(p, l); 25363b3a8eb9SGleb 
Smirnoff break; 25373b3a8eb9SGleb Smirnoff } 25383b3a8eb9SGleb Smirnoff 25393b3a8eb9SGleb Smirnoff free(p, M_TEMP); 25403b3a8eb9SGleb Smirnoff 254151d73df1SKristof Provost NET_EPOCH_EXIT(et); 254251d73df1SKristof Provost 25433b3a8eb9SGleb Smirnoff return error ; 25443b3a8eb9SGleb Smirnoff } 25453b3a8eb9SGleb Smirnoff 25463b3a8eb9SGleb Smirnoff static void 2547fe3bcfbdSTom Jones ip_dn_vnet_init(void) 25483b3a8eb9SGleb Smirnoff { 2549fe3bcfbdSTom Jones if (V_dn_cfg.init_done) 25503b3a8eb9SGleb Smirnoff return; 2551fe3bcfbdSTom Jones V_dn_cfg.init_done = 1; 25523b3a8eb9SGleb Smirnoff /* Set defaults here. MSVC does not accept initializers, 25533b3a8eb9SGleb Smirnoff * and this is also useful for vimages 25543b3a8eb9SGleb Smirnoff */ 25553b3a8eb9SGleb Smirnoff /* queue limits */ 2556fe3bcfbdSTom Jones V_dn_cfg.slot_limit = 100; /* Foot shooting limit for queues. */ 2557fe3bcfbdSTom Jones V_dn_cfg.byte_limit = 1024 * 1024; 2558fe3bcfbdSTom Jones V_dn_cfg.expire = 1; 25593b3a8eb9SGleb Smirnoff 25603b3a8eb9SGleb Smirnoff /* RED parameters */ 2561fe3bcfbdSTom Jones V_dn_cfg.red_lookup_depth = 256; /* default lookup table depth */ 2562fe3bcfbdSTom Jones V_dn_cfg.red_avg_pkt_size = 512; /* default medium packet size */ 2563fe3bcfbdSTom Jones V_dn_cfg.red_max_pkt_size = 1500; /* default max packet size */ 25643b3a8eb9SGleb Smirnoff 25653b3a8eb9SGleb Smirnoff /* hash tables */ 2566fe3bcfbdSTom Jones V_dn_cfg.max_hash_size = 65536; /* max in the hash tables */ 2567fe3bcfbdSTom Jones V_dn_cfg.hash_size = 64; /* default hash size */ 25683b3a8eb9SGleb Smirnoff 25693b3a8eb9SGleb Smirnoff /* create hash tables for schedulers and flowsets. 25703b3a8eb9SGleb Smirnoff * In both we search by key and by pointer. 
/*
 * Tear down the dummynet state held in V_dn_cfg.
 * The order matters: objects are flushed while the lock still exists,
 * and the lock is destroyed last.
 */
static void
ip_dn_vnet_destroy(void)
{
	/* delete every configured object under the write lock */
	DN_BH_WLOCK();
	dummynet_flush();
	DN_BH_WUNLOCK();

	/* release the scheduler and flowset hash tables and the event heap */
	dn_ht_free(V_dn_cfg.schedhash, 0);
	dn_ht_free(V_dn_cfg.fshash, 0);
	heap_free(&V_dn_cfg.evheap);

	DN_LOCK_DESTROY();
}
NULL); 26165f4fc3dbSAlexander Motin dn_tq = taskqueue_create_fast("dummynet", M_WAITOK, 26173b3a8eb9SGleb Smirnoff taskqueue_thread_enqueue, &dn_tq); 26183b3a8eb9SGleb Smirnoff taskqueue_start_threads(&dn_tq, 1, PI_NET, "dummynet"); 26193b3a8eb9SGleb Smirnoff 262051d73df1SKristof Provost CK_LIST_INIT(&schedlist); 2621fd90e2edSJung-uk Kim callout_init(&dn_timeout, 1); 26225f4fc3dbSAlexander Motin dn_reschedule(); 26233b3a8eb9SGleb Smirnoff } 26243b3a8eb9SGleb Smirnoff 26253b3a8eb9SGleb Smirnoff static void 26263b3a8eb9SGleb Smirnoff ip_dn_destroy(int last) 26273b3a8eb9SGleb Smirnoff { 2628c8cfbc06SHans Petter Selasky /* ensure no more callouts are started */ 2629c8cfbc06SHans Petter Selasky dn_gone = 1; 2630c8cfbc06SHans Petter Selasky 2631c8cfbc06SHans Petter Selasky /* check for last */ 26323b3a8eb9SGleb Smirnoff if (last) { 26333b3a8eb9SGleb Smirnoff ND("removing last instance\n"); 26343b3a8eb9SGleb Smirnoff ip_dn_ctl_ptr = NULL; 26353b3a8eb9SGleb Smirnoff ip_dn_io_ptr = NULL; 26363b3a8eb9SGleb Smirnoff } 26373b3a8eb9SGleb Smirnoff 2638c8cfbc06SHans Petter Selasky callout_drain(&dn_timeout); 26393b3a8eb9SGleb Smirnoff taskqueue_drain(dn_tq, &dn_task); 26403b3a8eb9SGleb Smirnoff taskqueue_free(dn_tq); 26413b3a8eb9SGleb Smirnoff } 26423b3a8eb9SGleb Smirnoff 26433b3a8eb9SGleb Smirnoff static int 26443b3a8eb9SGleb Smirnoff dummynet_modevent(module_t mod, int type, void *data) 26453b3a8eb9SGleb Smirnoff { 26463b3a8eb9SGleb Smirnoff 26473b3a8eb9SGleb Smirnoff if (type == MOD_LOAD) { 26483b3a8eb9SGleb Smirnoff if (ip_dn_io_ptr) { 26493b3a8eb9SGleb Smirnoff printf("DUMMYNET already loaded\n"); 26503b3a8eb9SGleb Smirnoff return EEXIST ; 26513b3a8eb9SGleb Smirnoff } 26523b3a8eb9SGleb Smirnoff ip_dn_init(); 26533b3a8eb9SGleb Smirnoff ip_dn_ctl_ptr = ip_dn_ctl; 26543b3a8eb9SGleb Smirnoff ip_dn_io_ptr = dummynet_io; 26553b3a8eb9SGleb Smirnoff return 0; 26563b3a8eb9SGleb Smirnoff } else if (type == MOD_UNLOAD) { 26573b3a8eb9SGleb Smirnoff ip_dn_destroy(1 /* last */); 
26583b3a8eb9SGleb Smirnoff return 0; 26593b3a8eb9SGleb Smirnoff } else 26603b3a8eb9SGleb Smirnoff return EOPNOTSUPP; 26613b3a8eb9SGleb Smirnoff } 26623b3a8eb9SGleb Smirnoff 26633b3a8eb9SGleb Smirnoff /* modevent helpers for the modules */ 26643b3a8eb9SGleb Smirnoff static int 26653b3a8eb9SGleb Smirnoff load_dn_sched(struct dn_alg *d) 26663b3a8eb9SGleb Smirnoff { 26673b3a8eb9SGleb Smirnoff struct dn_alg *s; 26683b3a8eb9SGleb Smirnoff 26693b3a8eb9SGleb Smirnoff if (d == NULL) 26703b3a8eb9SGleb Smirnoff return 1; /* error */ 26713b3a8eb9SGleb Smirnoff ip_dn_init(); /* just in case, we need the lock */ 26723b3a8eb9SGleb Smirnoff 26733b3a8eb9SGleb Smirnoff /* Check that mandatory funcs exists */ 26743b3a8eb9SGleb Smirnoff if (d->enqueue == NULL || d->dequeue == NULL) { 26753b3a8eb9SGleb Smirnoff D("missing enqueue or dequeue for %s", d->name); 26763b3a8eb9SGleb Smirnoff return 1; 26773b3a8eb9SGleb Smirnoff } 26783b3a8eb9SGleb Smirnoff 26793b3a8eb9SGleb Smirnoff /* Search if scheduler already exists */ 268051d73df1SKristof Provost mtx_lock(&sched_mtx); 268151d73df1SKristof Provost CK_LIST_FOREACH(s, &schedlist, next) { 26823b3a8eb9SGleb Smirnoff if (strcmp(s->name, d->name) == 0) { 26833b3a8eb9SGleb Smirnoff D("%s already loaded", d->name); 26843b3a8eb9SGleb Smirnoff break; /* scheduler already exists */ 26853b3a8eb9SGleb Smirnoff } 26863b3a8eb9SGleb Smirnoff } 26873b3a8eb9SGleb Smirnoff if (s == NULL) 268851d73df1SKristof Provost CK_LIST_INSERT_HEAD(&schedlist, d, next); 268951d73df1SKristof Provost mtx_unlock(&sched_mtx); 26903b3a8eb9SGleb Smirnoff D("dn_sched %s %sloaded", d->name, s ? "not ":""); 26913b3a8eb9SGleb Smirnoff return s ? 
1 : 0; 26923b3a8eb9SGleb Smirnoff } 26933b3a8eb9SGleb Smirnoff 26943b3a8eb9SGleb Smirnoff static int 26953b3a8eb9SGleb Smirnoff unload_dn_sched(struct dn_alg *s) 26963b3a8eb9SGleb Smirnoff { 26973b3a8eb9SGleb Smirnoff struct dn_alg *tmp, *r; 26983b3a8eb9SGleb Smirnoff int err = EINVAL; 26993b3a8eb9SGleb Smirnoff 27003b3a8eb9SGleb Smirnoff ND("called for %s", s->name); 27013b3a8eb9SGleb Smirnoff 270251d73df1SKristof Provost mtx_lock(&sched_mtx); 270351d73df1SKristof Provost CK_LIST_FOREACH_SAFE(r, &schedlist, next, tmp) { 27043b3a8eb9SGleb Smirnoff if (strcmp(s->name, r->name) != 0) 27053b3a8eb9SGleb Smirnoff continue; 27063b3a8eb9SGleb Smirnoff ND("ref_count = %d", r->ref_count); 27073b3a8eb9SGleb Smirnoff err = (r->ref_count != 0) ? EBUSY : 0; 27083b3a8eb9SGleb Smirnoff if (err == 0) 270951d73df1SKristof Provost CK_LIST_REMOVE(r, next); 27103b3a8eb9SGleb Smirnoff break; 27113b3a8eb9SGleb Smirnoff } 271251d73df1SKristof Provost mtx_unlock(&sched_mtx); 271351d73df1SKristof Provost NET_EPOCH_WAIT(); 27143b3a8eb9SGleb Smirnoff D("dn_sched %s %sunloaded", s->name, err ? "not ":""); 27153b3a8eb9SGleb Smirnoff return err; 27163b3a8eb9SGleb Smirnoff } 27173b3a8eb9SGleb Smirnoff 27183b3a8eb9SGleb Smirnoff int 27193b3a8eb9SGleb Smirnoff dn_sched_modevent(module_t mod, int cmd, void *arg) 27203b3a8eb9SGleb Smirnoff { 27213b3a8eb9SGleb Smirnoff struct dn_alg *sch = arg; 27223b3a8eb9SGleb Smirnoff 27233b3a8eb9SGleb Smirnoff if (cmd == MOD_LOAD) 27243b3a8eb9SGleb Smirnoff return load_dn_sched(sch); 27253b3a8eb9SGleb Smirnoff else if (cmd == MOD_UNLOAD) 27263b3a8eb9SGleb Smirnoff return unload_dn_sched(sch); 27273b3a8eb9SGleb Smirnoff else 27283b3a8eb9SGleb Smirnoff return EINVAL; 27293b3a8eb9SGleb Smirnoff } 27303b3a8eb9SGleb Smirnoff 27313b3a8eb9SGleb Smirnoff static moduledata_t dummynet_mod = { 27323b3a8eb9SGleb Smirnoff "dummynet", dummynet_modevent, NULL 27333b3a8eb9SGleb Smirnoff }; 27343b3a8eb9SGleb Smirnoff 273589856f7eSBjoern A. 
Zeeb #define DN_SI_SUB SI_SUB_PROTO_FIREWALL 27363b3a8eb9SGleb Smirnoff #define DN_MODEV_ORD (SI_ORDER_ANY - 128) /* after ipfw */ 27373b3a8eb9SGleb Smirnoff DECLARE_MODULE(dummynet, dummynet_mod, DN_SI_SUB, DN_MODEV_ORD); 2738f9ab623bSAlexander V. Chernikov MODULE_DEPEND(dummynet, ipfw, 3, 3, 3); 27393b3a8eb9SGleb Smirnoff MODULE_VERSION(dummynet, 3); 27403b3a8eb9SGleb Smirnoff 27413b3a8eb9SGleb Smirnoff /* 27423b3a8eb9SGleb Smirnoff * Starting up. Done in order after dummynet_modevent() has been called. 27433b3a8eb9SGleb Smirnoff * VNET_SYSINIT is also called for each existing vnet and each new vnet. 27443b3a8eb9SGleb Smirnoff */ 2745fe3bcfbdSTom Jones VNET_SYSINIT(vnet_dn_init, DN_SI_SUB, DN_MODEV_ORD+2, ip_dn_vnet_init, NULL); 27463b3a8eb9SGleb Smirnoff 27473b3a8eb9SGleb Smirnoff /* 27483b3a8eb9SGleb Smirnoff * Shutdown handlers up shop. These are done in REVERSE ORDER, but still 27493b3a8eb9SGleb Smirnoff * after dummynet_modevent() has been called. Not called on reboot. 27503b3a8eb9SGleb Smirnoff * VNET_SYSUNINIT is also called for each exiting vnet as it exits. 27513b3a8eb9SGleb Smirnoff * or when the module is unloaded. 
27523b3a8eb9SGleb Smirnoff */ 2753fe3bcfbdSTom Jones VNET_SYSUNINIT(vnet_dn_uninit, DN_SI_SUB, DN_MODEV_ORD+2, ip_dn_vnet_destroy, NULL); 27543b3a8eb9SGleb Smirnoff 275591336b40SDon Lewis #ifdef NEW_AQM 275691336b40SDon Lewis 275791336b40SDon Lewis /* modevent helpers for the AQM modules */ 275891336b40SDon Lewis static int 275991336b40SDon Lewis load_dn_aqm(struct dn_aqm *d) 276091336b40SDon Lewis { 276191336b40SDon Lewis struct dn_aqm *aqm=NULL; 276291336b40SDon Lewis 276391336b40SDon Lewis if (d == NULL) 276491336b40SDon Lewis return 1; /* error */ 276591336b40SDon Lewis ip_dn_init(); /* just in case, we need the lock */ 276691336b40SDon Lewis 276791336b40SDon Lewis /* Check that mandatory funcs exists */ 276891336b40SDon Lewis if (d->enqueue == NULL || d->dequeue == NULL) { 276991336b40SDon Lewis D("missing enqueue or dequeue for %s", d->name); 277091336b40SDon Lewis return 1; 277191336b40SDon Lewis } 277291336b40SDon Lewis 277351d73df1SKristof Provost mtx_lock(&sched_mtx); 277451d73df1SKristof Provost 277591336b40SDon Lewis /* Search if AQM already exists */ 277651d73df1SKristof Provost CK_LIST_FOREACH(aqm, &aqmlist, next) { 277791336b40SDon Lewis if (strcmp(aqm->name, d->name) == 0) { 277891336b40SDon Lewis D("%s already loaded", d->name); 277991336b40SDon Lewis break; /* AQM already exists */ 278091336b40SDon Lewis } 278191336b40SDon Lewis } 278291336b40SDon Lewis if (aqm == NULL) 278351d73df1SKristof Provost CK_LIST_INSERT_HEAD(&aqmlist, d, next); 278451d73df1SKristof Provost 278551d73df1SKristof Provost mtx_unlock(&sched_mtx); 278651d73df1SKristof Provost 278791336b40SDon Lewis D("dn_aqm %s %sloaded", d->name, aqm ? "not ":""); 278891336b40SDon Lewis return aqm ? 1 : 0; 278991336b40SDon Lewis } 279091336b40SDon Lewis 279191336b40SDon Lewis /* Callback to clean up AQM status for queues connected to a flowset 279291336b40SDon Lewis * and then deconfigure the flowset. 
279391336b40SDon Lewis * This function is called before an AQM module is unloaded 279491336b40SDon Lewis */ 279591336b40SDon Lewis static int 279691336b40SDon Lewis fs_cleanup(void *_fs, void *arg) 279791336b40SDon Lewis { 279891336b40SDon Lewis struct dn_fsk *fs = _fs; 279991336b40SDon Lewis uint32_t type = *(uint32_t *)arg; 280091336b40SDon Lewis 280191336b40SDon Lewis if (fs->aqmfp && fs->aqmfp->type == type) 280291336b40SDon Lewis aqm_cleanup_deconfig_fs(fs); 280391336b40SDon Lewis 280491336b40SDon Lewis return 0; 280591336b40SDon Lewis } 280691336b40SDon Lewis 280791336b40SDon Lewis static int 280891336b40SDon Lewis unload_dn_aqm(struct dn_aqm *aqm) 280991336b40SDon Lewis { 281091336b40SDon Lewis struct dn_aqm *tmp, *r; 281191336b40SDon Lewis int err = EINVAL; 281291336b40SDon Lewis err = 0; 281391336b40SDon Lewis ND("called for %s", aqm->name); 281491336b40SDon Lewis 281591336b40SDon Lewis /* clean up AQM status and deconfig flowset */ 2816fe3bcfbdSTom Jones dn_ht_scan(V_dn_cfg.fshash, fs_cleanup, &aqm->type); 281791336b40SDon Lewis 281851d73df1SKristof Provost mtx_lock(&sched_mtx); 281951d73df1SKristof Provost 282051d73df1SKristof Provost CK_LIST_FOREACH_SAFE(r, &aqmlist, next, tmp) { 282191336b40SDon Lewis if (strcmp(aqm->name, r->name) != 0) 282291336b40SDon Lewis continue; 282391336b40SDon Lewis ND("ref_count = %d", r->ref_count); 282491336b40SDon Lewis err = (r->ref_count != 0 || r->cfg_ref_count != 0) ? EBUSY : 0; 282591336b40SDon Lewis if (err == 0) 282651d73df1SKristof Provost CK_LIST_REMOVE(r, next); 282791336b40SDon Lewis break; 282891336b40SDon Lewis } 282951d73df1SKristof Provost 283051d73df1SKristof Provost mtx_unlock(&sched_mtx); 283151d73df1SKristof Provost NET_EPOCH_WAIT(); 283251d73df1SKristof Provost 283391336b40SDon Lewis D("%s %sunloaded", aqm->name, err ? 
"not ":""); 283491336b40SDon Lewis if (err) 283591336b40SDon Lewis D("ref_count=%d, cfg_ref_count=%d", r->ref_count, r->cfg_ref_count); 283691336b40SDon Lewis return err; 283791336b40SDon Lewis } 283891336b40SDon Lewis 283991336b40SDon Lewis int 284091336b40SDon Lewis dn_aqm_modevent(module_t mod, int cmd, void *arg) 284191336b40SDon Lewis { 284291336b40SDon Lewis struct dn_aqm *aqm = arg; 284391336b40SDon Lewis 284491336b40SDon Lewis if (cmd == MOD_LOAD) 284591336b40SDon Lewis return load_dn_aqm(aqm); 284691336b40SDon Lewis else if (cmd == MOD_UNLOAD) 284791336b40SDon Lewis return unload_dn_aqm(aqm); 284891336b40SDon Lewis else 284991336b40SDon Lewis return EINVAL; 285091336b40SDon Lewis } 285191336b40SDon Lewis #endif 285291336b40SDon Lewis 28533b3a8eb9SGleb Smirnoff /* end of file */ 2854