/*-
 * Copyright (c) 2007-2008
 * 	Swinburne University of Technology, Melbourne, Australia.
 * Copyright (c) 2009-2010 Lawrence Stewart <lstewart@freebsd.org>
 * Copyright (c) 2010 The FreeBSD Foundation
 * All rights reserved.
 *
 * This software was developed at the Centre for Advanced Internet
 * Architectures, Swinburne University of Technology, by Lawrence Stewart and
 * James Healy, made possible in part by a grant from the Cisco University
 * Research Program Fund at Community Foundation Silicon Valley.
 *
 * Portions of this software were developed at the Centre for Advanced
 * Internet Architectures, Swinburne University of Technology, Melbourne,
 * Australia by David Hayes under sponsorship from the FreeBSD Foundation.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

/*
 * This software was first released in 2007 by James Healy and Lawrence Stewart
 * whilst working on the NewTCP research project at Swinburne University of
 * Technology's Centre for Advanced Internet Architectures, Melbourne,
 * Australia, which was made possible in part by a grant from the Cisco
 * University Research Program Fund at Community Foundation Silicon Valley.
 * More details are available at:
 *   http://caia.swin.edu.au/urp/newtcp/
 */

#ifndef _NETINET_CC_CC_H_
#define	_NETINET_CC_CC_H_

#ifdef _KERNEL

MALLOC_DECLARE(M_CC_MEM);

/* Global CC vars. */
extern	STAILQ_HEAD(cc_head, cc_algo) cc_list;
extern	const int tcprexmtthresh;

/* Per-netstack bits. */
VNET_DECLARE(struct cc_algo *, default_cc_ptr);
#define	V_default_cc_ptr		VNET(default_cc_ptr)

VNET_DECLARE(int, cc_do_abe);
#define	V_cc_do_abe			VNET(cc_do_abe)

VNET_DECLARE(int, cc_abe_frlossreduce);
#define	V_cc_abe_frlossreduce		VNET(cc_abe_frlossreduce)

/* Define the new net.inet.tcp.cc sysctl tree. */
#ifdef _SYS_SYSCTL_H_
SYSCTL_DECL(_net_inet_tcp_cc);
#endif

/* For CC modules that use hystart++ */
extern uint32_t hystart_lowcwnd;
extern uint32_t hystart_minrtt_thresh;
extern uint32_t hystart_maxrtt_thresh;
extern uint32_t hystart_n_rttsamples;
extern uint32_t hystart_css_growth_div;
extern uint32_t hystart_css_rounds;
extern uint32_t hystart_bblogs;

/* CC housekeeping functions. */
int	cc_register_algo(struct cc_algo *add_cc);
int	cc_deregister_algo(struct cc_algo *remove_cc);
#endif /* _KERNEL */

#if defined(_KERNEL) || defined(_WANT_TCPCB)
/*
 * State handed to every hook in struct cc_algo.  CC_DATA() below reaches
 * cc_data through the t_ccv member of a tcpcb.
 */
struct cc_var {
	void		*cc_data; /* Per-connection private CC algorithm data. */
	int		bytes_this_ack; /* # bytes acked by the current ACK. */
	tcp_seq		curack; /* Most recent ACK. */
	uint32_t	flags; /* Flags for cc_var (see below) */
	struct tcpcb	*tp; /* Pointer to tcpcb */
	uint16_t	nsegs; /* # segments coalesced into current chain. */
	uint8_t		labc;  /* Don't use system abc, use the passed-in value */
};

/* cc_var flags. */
#define	CCF_ABC_SENTAWND	0x0001	/* ABC counted cwnd worth of bytes? */
#define	CCF_CWND_LIMITED	0x0002	/* Are we currently cwnd limited? */
#define	CCF_USE_LOCAL_ABC	0x0004	/* Don't use the system l_abc val */
#define	CCF_ACKNOW		0x0008	/* Will this ack be sent now? */
#define	CCF_IPHDR_CE		0x0010	/* Does this packet set CE bit? */
#define	CCF_TCPHDR_CWR		0x0020	/* Does this packet set CWR bit? */
#define	CCF_UNUSED1		0x0040
#define	CCF_UNUSED2		0x0080
#define	CCF_UNUSED3		0x0100
#define	CCF_UNUSED4		0x0200
#define	CCF_HYSTART_ALLOWED	0x0400	/* If the CC supports it Hystart is allowed */
#define	CCF_HYSTART_CAN_SH_CWND	0x0800	/* Can hystart when going CSS -> CA slam the cwnd */
#define	CCF_HYSTART_CONS_SSTH	0x1000	/* Should hystart use the more conservative ssthresh */

#endif /* defined(_KERNEL) || defined(_WANT_TCPCB) */

/*
 * Signal type passed to the ack_received() and cong_signal() hooks.
 *
 * The typedef itself is always visible; only the ACK-type enumerators are
 * restricted to _KERNEL / _WANT_TCPCB consumers.
 */
typedef enum {
#if defined(_KERNEL) || defined(_WANT_TCPCB)
	/* ACK types passed to the ack_received() hook. */
	CC_ACK =	0x0001,	/* Regular in sequence ACK. */
	CC_DUPACK =	0x0002,	/* Duplicate ACK. */
	CC_PARTIALACK =	0x0004,	/* Not yet. */
	CC_SACK =	0x0008,	/* Not yet. */
#endif /* defined(_KERNEL) || defined(_WANT_TCPCB) */
	/* Congestion signal types passed to the cong_signal() hook. */
	CC_ECN =	0x0100,	/* ECN marked packet received. */
	CC_RTO =	0x0200,	/* RTO fired. */
	CC_RTO_ERR =	0x0400,	/* RTO fired in error. */
	CC_NDUPACK =	0x0800,	/* Threshold of dupacks reached. */
	/*
	 * The highest order 8 bits (0x01000000 - 0x80000000) are reserved
	 * for CC algos to declare their own congestion signal types.
	 *
	 * NOTE(review): 0xFF000000 is not representable in a 32-bit int, and
	 * ISO C before C23 requires enumerator values to fit in int, so this
	 * relies on the compiler accepting wider enumerators -- confirm when
	 * moving to a new toolchain or enabling -pedantic-errors.
	 */
	CC_SIGPRIVMASK = 0xFF000000	/* Mask to check if sig is private. */
} ccsignal_t;

#ifdef _KERNEL
/*
 * Structure to hold data and function pointers that together represent a
 * congestion control algorithm.
 */
struct cc_algo {
	char	name[TCP_CA_NAME_MAX];

	/* Init global module state on kldload. */
	int	(*mod_init)(void);

	/* Cleanup global module state on kldunload. */
	int	(*mod_destroy)(void);

	/* Return the size of the void pointer the CC needs for state */
	size_t  (*cc_data_sz)(void);

	/*
	 * Init CC state for a new control block. The CC
	 * module may be passed a NULL ptr indicating that
	 * it must allocate the memory. If it is passed a
	 * non-null pointer it is pre-allocated memory by
	 * the caller and the cb_init is expected to use that memory.
	 * It is not expected to fail if memory is passed in and
	 * all currently defined modules do not.
	 */
	int	(*cb_init)(struct cc_var *ccv, void *ptr);

	/* Cleanup CC state for a terminating control block. */
	void	(*cb_destroy)(struct cc_var *ccv);

	/* Init variables for a newly established connection. */
	void	(*conn_init)(struct cc_var *ccv);

	/* Called on receipt of an ack. */
	void	(*ack_received)(struct cc_var *ccv, ccsignal_t type);

	/* Called on detection of a congestion signal. */
	void	(*cong_signal)(struct cc_var *ccv, ccsignal_t type);

	/* Called after exiting congestion recovery. */
	void	(*post_recovery)(struct cc_var *ccv);

	/* Called when data transfer resumes after an idle period. */
	void	(*after_idle)(struct cc_var *ccv);

	/* Called for additional ECN processing apart from RFC3168. */
	void	(*ecnpkt_handler)(struct cc_var *ccv);

	/* Called when a new "round" begins, if the transport is tracking rounds. */
	void	(*newround)(struct cc_var *ccv, uint32_t round_cnt);

	/*
	 * Called when a RTT sample is made (fas = flight at send, if you don't
	 * have it send the cwnd in).
	 */
	void	(*rttsample)(struct cc_var *ccv, uint32_t usec_rtt, uint32_t rxtcnt, uint32_t fas);

	/* Called for {get|set}sockopt() on a TCP socket with TCP_CCALGOOPT. */
	int     (*ctl_output)(struct cc_var *, struct sockopt *, void *);

	STAILQ_ENTRY(cc_algo) entries;
	u_int	cc_refcount;
	uint8_t	flags;
};

#define	CC_MODULE_BEING_REMOVED		0x01	/* The module is being removed */

/* Macro to obtain the CC algo's struct ptr. */
#define	CC_ALGO(tp)	((tp)->t_cc)

/* Macro to obtain the CC algo's data ptr. */
#define	CC_DATA(tp)	((tp)->t_ccv.cc_data)

/* Macro to obtain the system default CC algo's struct ptr. */
#define	CC_DEFAULT_ALGO()	V_default_cc_ptr

/* Thin wrappers around the rwlock(9) calls on cc_list_lock. */
extern struct rwlock cc_list_lock;
#define	CC_LIST_LOCK_INIT()	rw_init(&cc_list_lock, "cc_list")
#define	CC_LIST_LOCK_DESTROY()	rw_destroy(&cc_list_lock)
#define	CC_LIST_RLOCK()		rw_rlock(&cc_list_lock)
#define	CC_LIST_RUNLOCK()	rw_runlock(&cc_list_lock)
#define	CC_LIST_WLOCK()		rw_wlock(&cc_list_lock)
#define	CC_LIST_WUNLOCK()	rw_wunlock(&cc_list_lock)
#define	CC_LIST_LOCK_ASSERT()	rw_assert(&cc_list_lock, RA_LOCKED)

#define	CC_ALGOOPT_LIMIT	2048

/*
 * These routines give NewReno behavior to the caller
 * they require no state and can be used by any other CC
 * module that wishes to use NewReno type behaviour (along
 * with anything else they may add on, pre or post call).
 */
void newreno_cc_post_recovery(struct cc_var *);
void newreno_cc_after_idle(struct cc_var *);
void newreno_cc_cong_signal(struct cc_var *, ccsignal_t);
void newreno_cc_ack_received(struct cc_var *, ccsignal_t);
u_int newreno_cc_cwnd_on_multiplicative_decrease(struct cc_var *ccv, uint32_t mss);
u_int newreno_cc_cwnd_in_cong_avoid(struct cc_var *ccv);
u_int newreno_cc_cwnd_in_slow_start(struct cc_var *ccv);

/* Called to temporarily keep an algo from going away during change */
void cc_refer(struct cc_algo *algo);
/* Called to release the temporary hold */
void cc_release(struct cc_algo *algo);

/* Called to attach a CC algorithm to a tcpcb */
void cc_attach(struct tcpcb *, struct cc_algo *);
/* Called to detach a CC algorithm from a tcpcb */
void cc_detach(struct tcpcb *);

#endif /* _KERNEL */
#endif /* _NETINET_CC_CC_H_ */