1c398230bSWarner Losh /*- 2df8bae1dSRodney W. Grimes * Copyright (c) 1980, 1986, 1991, 1993 3df8bae1dSRodney W. Grimes * The Regents of the University of California. All rights reserved. 4df8bae1dSRodney W. Grimes * 5df8bae1dSRodney W. Grimes * Redistribution and use in source and binary forms, with or without 6df8bae1dSRodney W. Grimes * modification, are permitted provided that the following conditions 7df8bae1dSRodney W. Grimes * are met: 8df8bae1dSRodney W. Grimes * 1. Redistributions of source code must retain the above copyright 9df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer. 10df8bae1dSRodney W. Grimes * 2. Redistributions in binary form must reproduce the above copyright 11df8bae1dSRodney W. Grimes * notice, this list of conditions and the following disclaimer in the 12df8bae1dSRodney W. Grimes * documentation and/or other materials provided with the distribution. 13df8bae1dSRodney W. Grimes * 4. Neither the name of the University nor the names of its contributors 14df8bae1dSRodney W. Grimes * may be used to endorse or promote products derived from this software 15df8bae1dSRodney W. Grimes * without specific prior written permission. 16df8bae1dSRodney W. Grimes * 17df8bae1dSRodney W. Grimes * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18df8bae1dSRodney W. Grimes * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19df8bae1dSRodney W. Grimes * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20df8bae1dSRodney W. Grimes * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21df8bae1dSRodney W. Grimes * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22df8bae1dSRodney W. Grimes * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23df8bae1dSRodney W. Grimes * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24df8bae1dSRodney W. 
Grimes * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25df8bae1dSRodney W. Grimes * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26df8bae1dSRodney W. Grimes * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27df8bae1dSRodney W. Grimes * SUCH DAMAGE. 28df8bae1dSRodney W. Grimes * 2942e9e16dSRuslan Ermilov * @(#)route.c 8.3.1.1 (Berkeley) 2/23/95 30c3aac50fSPeter Wemm * $FreeBSD$ 31df8bae1dSRodney W. Grimes */ 328b07e49aSJulian Elischer /************************************************************************ 338b07e49aSJulian Elischer * Note: In this file a 'fib' is a "forwarding information base" * 348b07e49aSJulian Elischer * Which is the new name for an in kernel routing (next hop) table. * 358b07e49aSJulian Elischer ***********************************************************************/ 36df8bae1dSRodney W. Grimes 371d5e9e22SEivind Eklund #include "opt_inet.h" 38096f2786SBjoern A. Zeeb #include "opt_inet6.h" 398b07e49aSJulian Elischer #include "opt_route.h" 404cbac30bSAlexander V. Chernikov #include "opt_sctp.h" 414bd49128SPeter Wemm #include "opt_mrouting.h" 42e440aed9SQing Li #include "opt_mpath.h" 434bd49128SPeter Wemm 44df8bae1dSRodney W. Grimes #include <sys/param.h> 45df8bae1dSRodney W. Grimes #include <sys/systm.h> 466e6b3f7cSQing Li #include <sys/syslog.h> 474d1d4912SBruce Evans #include <sys/malloc.h> 48df8bae1dSRodney W. Grimes #include <sys/mbuf.h> 49df8bae1dSRodney W. Grimes #include <sys/socket.h> 508b07e49aSJulian Elischer #include <sys/sysctl.h> 513120b9d4SKip Macy #include <sys/syslog.h> 528b07e49aSJulian Elischer #include <sys/sysproto.h> 538b07e49aSJulian Elischer #include <sys/proc.h> 54df8bae1dSRodney W. Grimes #include <sys/domain.h> 55cb64988fSLuoqi Chen #include <sys/kernel.h> 56df8bae1dSRodney W. Grimes 57df8bae1dSRodney W. 
#include <net/if.h>
#include <net/if_var.h>
#include <net/if_dl.h>
#include <net/route.h>
#include <net/vnet.h>
#include <net/flowtable.h>

#ifdef RADIX_MPATH
#include <net/radix_mpath.h>
#endif

#include <netinet/in.h>
#include <netinet/ip_mroute.h>

#include <vm/uma.h>

/* Hard upper bound on the number of FIBs; route_init() clamps to this. */
#define	RT_MAXFIBS	UINT16_MAX

/*
 * Kernel config default option.  ROUTETABLES, when defined, must lie in
 * the range 1..RT_MAXFIBS and becomes the compile-time default FIB count.
 */
#ifdef ROUTETABLES
#if ROUTETABLES <= 0
#error "ROUTETABLES defined too low"
#endif
#if ROUTETABLES > RT_MAXFIBS
#error "ROUTETABLES defined too big"
#endif
#define	RT_NUMFIBS	ROUTETABLES
#endif /* ROUTETABLES */
/* Initialize to default if not otherwise set. */
#ifndef	RT_NUMFIBS
#define	RT_NUMFIBS	1
#endif

#if defined(INET) || defined(INET6)
#ifdef SCTP
extern void sctp_addr_change(struct ifaddr *ifa, int cmd);
#endif /* SCTP */
#endif


/* Number of FIBs.  Exported read-only (CTLFLAG_RD) as the net.fibs sysctl. */
u_int rt_numfibs = RT_NUMFIBS;
SYSCTL_UINT(_net, OID_AUTO, fibs, CTLFLAG_RD, &rt_numfibs, 0, "");
/*
 * The net.fibs tunable can be set too big (or to 0); route_init() brings
 * it back into range before it is used.
 */
TUNABLE_INT("net.fibs", &rt_numfibs);

/*
 * By default add routes to all fibs for new interfaces.
 * Once this is set to 0 then only allocate routes on interface
 * changes for the FIB of the caller when adding a new set of addresses
 * to an interface.  XXX this is a shotgun approach to a problem that needs
 * a more fine grained solution.. that will come.
 * XXX also has the problems getting the FIB from curthread which will not
 * always work given the fib can be overridden and prefixes can be added
 * from the network stack context.
 */
u_int rt_add_addr_allfibs = 1;
SYSCTL_UINT(_net, OID_AUTO, add_addr_allfibs, CTLFLAG_RW,
    &rt_add_addr_allfibs, 0, "");
TUNABLE_INT("net.add_addr_allfibs", &rt_add_addr_allfibs);

/* Per-vnet routing statistics (e.g. rts_unreach, rts_badredirect). */
VNET_DEFINE(struct rtstat, rtstat);
#define	V_rtstat	VNET(rtstat)

/*
 * Per-vnet array of radix heads, allocated in vnet_route_init() and
 * indexed as [fib][address family] by rt_tables_get_rnh_ptr().
 */
VNET_DEFINE(struct radix_node_head *, rt_tables);
#define	V_rt_tables	VNET(rt_tables)

VNET_DEFINE(int, rttrash);		/* routes not in table but not freed */
#define	V_rttrash	VNET(rttrash)

Zeeb 127bfe1aba4SMarko Zec 128d6941ce9SLuigi Rizzo /* 129d6941ce9SLuigi Rizzo * Convert a 'struct radix_node *' to a 'struct rtentry *'. 130d6941ce9SLuigi Rizzo * The operation can be done safely (in this code) because a 131d6941ce9SLuigi Rizzo * 'struct rtentry' starts with two 'struct radix_node''s, the first 132d6941ce9SLuigi Rizzo * one representing leaf nodes in the routing tree, which is 133d6941ce9SLuigi Rizzo * what the code in radix.c passes us as a 'struct radix_node'. 134d6941ce9SLuigi Rizzo * 135d6941ce9SLuigi Rizzo * But because there are a lot of assumptions in this conversion, 136d6941ce9SLuigi Rizzo * do not cast explicitly, but always use the macro below. 137d6941ce9SLuigi Rizzo */ 138d6941ce9SLuigi Rizzo #define RNTORT(p) ((struct rtentry *)(p)) 139d6941ce9SLuigi Rizzo 1403e288e62SDimitry Andric static VNET_DEFINE(uma_zone_t, rtzone); /* Routing table UMA zone. */ 14182cea7e6SBjoern A. Zeeb #define V_rtzone VNET(rtzone) 14282cea7e6SBjoern A. Zeeb 143*c77462ddSAlexander V. Chernikov static int rtrequest1_fib_change(struct radix_node_head *, struct rt_addrinfo *, 144*c77462ddSAlexander V. Chernikov struct rtentry **, u_int); 145*c77462ddSAlexander V. Chernikov 1468b07e49aSJulian Elischer /* 1478b07e49aSJulian Elischer * handler for net.my_fibnum 1488b07e49aSJulian Elischer */ 1498b07e49aSJulian Elischer static int 1508b07e49aSJulian Elischer sysctl_my_fibnum(SYSCTL_HANDLER_ARGS) 151df8bae1dSRodney W. Grimes { 1528b07e49aSJulian Elischer int fibnum; 1538b07e49aSJulian Elischer int error; 1548b07e49aSJulian Elischer 1558b07e49aSJulian Elischer fibnum = curthread->td_proc->p_fibnum; 1568b07e49aSJulian Elischer error = sysctl_handle_int(oidp, &fibnum, 0, req); 1578b07e49aSJulian Elischer return (error); 158df8bae1dSRodney W. Grimes } 159df8bae1dSRodney W. 
Grimes 1608b07e49aSJulian Elischer SYSCTL_PROC(_net, OID_AUTO, my_fibnum, CTLTYPE_INT|CTLFLAG_RD, 1618b07e49aSJulian Elischer NULL, 0, &sysctl_my_fibnum, "I", "default FIB of caller"); 1622dc1d581SAndre Oppermann 163c2c2a7c1SBjoern A. Zeeb static __inline struct radix_node_head ** 164c2c2a7c1SBjoern A. Zeeb rt_tables_get_rnh_ptr(int table, int fam) 165c2c2a7c1SBjoern A. Zeeb { 166c2c2a7c1SBjoern A. Zeeb struct radix_node_head **rnh; 167c2c2a7c1SBjoern A. Zeeb 168c2c2a7c1SBjoern A. Zeeb KASSERT(table >= 0 && table < rt_numfibs, ("%s: table out of bounds.", 169c2c2a7c1SBjoern A. Zeeb __func__)); 170c2c2a7c1SBjoern A. Zeeb KASSERT(fam >= 0 && fam < (AF_MAX+1), ("%s: fam out of bounds.", 171c2c2a7c1SBjoern A. Zeeb __func__)); 172c2c2a7c1SBjoern A. Zeeb 173c2c2a7c1SBjoern A. Zeeb /* rnh is [fib=0][af=0]. */ 174c2c2a7c1SBjoern A. Zeeb rnh = (struct radix_node_head **)V_rt_tables; 175c2c2a7c1SBjoern A. Zeeb /* Get the offset to the requested table and fam. */ 176c2c2a7c1SBjoern A. Zeeb rnh += table * (AF_MAX+1) + fam; 177c2c2a7c1SBjoern A. Zeeb 178c2c2a7c1SBjoern A. Zeeb return (rnh); 179c2c2a7c1SBjoern A. Zeeb } 180c2c2a7c1SBjoern A. Zeeb 181c2c2a7c1SBjoern A. Zeeb struct radix_node_head * 182c2c2a7c1SBjoern A. Zeeb rt_tables_get_rnh(int table, int fam) 183c2c2a7c1SBjoern A. Zeeb { 184c2c2a7c1SBjoern A. Zeeb 185c2c2a7c1SBjoern A. Zeeb return (*rt_tables_get_rnh_ptr(table, fam)); 186c2c2a7c1SBjoern A. Zeeb } 187c2c2a7c1SBjoern A. Zeeb 188d0728d71SRobert Watson /* 189d0728d71SRobert Watson * route initialization must occur before ip6_init2(), which happenas at 190d0728d71SRobert Watson * SI_ORDER_MIDDLE. 191d0728d71SRobert Watson */ 1922eb5613fSLuigi Rizzo static void 1932eb5613fSLuigi Rizzo route_init(void) 194df8bae1dSRodney W. Grimes { 1958b07e49aSJulian Elischer 1966f95a5ebSJulian Elischer /* whack the tunable ints into line. 
*/ 1978b07e49aSJulian Elischer if (rt_numfibs > RT_MAXFIBS) 1988b07e49aSJulian Elischer rt_numfibs = RT_MAXFIBS; 1998b07e49aSJulian Elischer if (rt_numfibs == 0) 2008b07e49aSJulian Elischer rt_numfibs = 1; 2011ed81b73SMarko Zec } 202d0728d71SRobert Watson SYSINIT(route_init, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, route_init, 0); 2031ed81b73SMarko Zec 204e3a7aa6fSGleb Smirnoff static int 205e3a7aa6fSGleb Smirnoff rtentry_zinit(void *mem, int size, int how) 206e3a7aa6fSGleb Smirnoff { 207e3a7aa6fSGleb Smirnoff struct rtentry *rt = mem; 208e3a7aa6fSGleb Smirnoff 209e3a7aa6fSGleb Smirnoff rt->rt_pksent = counter_u64_alloc(how); 210e3a7aa6fSGleb Smirnoff if (rt->rt_pksent == NULL) 211e3a7aa6fSGleb Smirnoff return (ENOMEM); 212e3a7aa6fSGleb Smirnoff 213e3a7aa6fSGleb Smirnoff RT_LOCK_INIT(rt); 214e3a7aa6fSGleb Smirnoff 215e3a7aa6fSGleb Smirnoff return (0); 216e3a7aa6fSGleb Smirnoff } 217e3a7aa6fSGleb Smirnoff 218e3a7aa6fSGleb Smirnoff static void 219e3a7aa6fSGleb Smirnoff rtentry_zfini(void *mem, int size) 220e3a7aa6fSGleb Smirnoff { 221e3a7aa6fSGleb Smirnoff struct rtentry *rt = mem; 222e3a7aa6fSGleb Smirnoff 223e3a7aa6fSGleb Smirnoff RT_LOCK_DESTROY(rt); 224e3a7aa6fSGleb Smirnoff counter_u64_free(rt->rt_pksent); 225e3a7aa6fSGleb Smirnoff } 226e3a7aa6fSGleb Smirnoff 227e3a7aa6fSGleb Smirnoff static int 228e3a7aa6fSGleb Smirnoff rtentry_ctor(void *mem, int size, void *arg, int how) 229e3a7aa6fSGleb Smirnoff { 230e3a7aa6fSGleb Smirnoff struct rtentry *rt = mem; 231e3a7aa6fSGleb Smirnoff 232e3a7aa6fSGleb Smirnoff bzero(rt, offsetof(struct rtentry, rt_endzero)); 233e3a7aa6fSGleb Smirnoff counter_u64_zero(rt->rt_pksent); 234e3a7aa6fSGleb Smirnoff 235e3a7aa6fSGleb Smirnoff return (0); 236e3a7aa6fSGleb Smirnoff } 237e3a7aa6fSGleb Smirnoff 238d0728d71SRobert Watson static void 239256ea2abSGleb Smirnoff rtentry_dtor(void *mem, int size, void *arg) 240256ea2abSGleb Smirnoff { 241256ea2abSGleb Smirnoff struct rtentry *rt = mem; 242256ea2abSGleb Smirnoff 243256ea2abSGleb Smirnoff 
RT_UNLOCK_COND(rt); 244256ea2abSGleb Smirnoff } 245256ea2abSGleb Smirnoff 246256ea2abSGleb Smirnoff static void 247d0728d71SRobert Watson vnet_route_init(const void *unused __unused) 2481ed81b73SMarko Zec { 2491ed81b73SMarko Zec struct domain *dom; 250c2c2a7c1SBjoern A. Zeeb struct radix_node_head **rnh; 251c2c2a7c1SBjoern A. Zeeb int table; 2521ed81b73SMarko Zec int fam; 2531ed81b73SMarko Zec 254c2c2a7c1SBjoern A. Zeeb V_rt_tables = malloc(rt_numfibs * (AF_MAX+1) * 255c2c2a7c1SBjoern A. Zeeb sizeof(struct radix_node_head *), M_RTABLE, M_WAITOK|M_ZERO); 256c2c2a7c1SBjoern A. Zeeb 257e3a7aa6fSGleb Smirnoff V_rtzone = uma_zcreate("rtentry", sizeof(struct rtentry), 258256ea2abSGleb Smirnoff rtentry_ctor, rtentry_dtor, 259e3a7aa6fSGleb Smirnoff rtentry_zinit, rtentry_zfini, UMA_ALIGN_PTR, 0); 2608b07e49aSJulian Elischer for (dom = domains; dom; dom = dom->dom_next) { 261b680a383SBjoern A. Zeeb if (dom->dom_rtattach == NULL) 262b680a383SBjoern A. Zeeb continue; 263b680a383SBjoern A. Zeeb 2648b07e49aSJulian Elischer for (table = 0; table < rt_numfibs; table++) { 265b680a383SBjoern A. Zeeb fam = dom->dom_family; 266b680a383SBjoern A. Zeeb if (table != 0 && fam != AF_INET6 && fam != AF_INET) 267b680a383SBjoern A. Zeeb break; 268b680a383SBjoern A. Zeeb 269b680a383SBjoern A. Zeeb /* 270b680a383SBjoern A. Zeeb * XXX MRT rtattach will be also called from 271b680a383SBjoern A. Zeeb * vfs_export.c but the offset will be 0 (only for 272b680a383SBjoern A. Zeeb * AF_INET and AF_INET6 which don't need it anyhow). 2738b07e49aSJulian Elischer */ 274c2c2a7c1SBjoern A. Zeeb rnh = rt_tables_get_rnh_ptr(table, fam); 275c2c2a7c1SBjoern A. Zeeb if (rnh == NULL) 276c2c2a7c1SBjoern A. Zeeb panic("%s: rnh NULL", __func__); 277b680a383SBjoern A. 
Zeeb dom->dom_rtattach((void **)rnh, dom->dom_rtoffset); 2788b07e49aSJulian Elischer } 2798b07e49aSJulian Elischer } 2808b07e49aSJulian Elischer } 281d0728d71SRobert Watson VNET_SYSINIT(vnet_route_init, SI_SUB_PROTO_DOMAIN, SI_ORDER_FOURTH, 282d0728d71SRobert Watson vnet_route_init, 0); 2838b07e49aSJulian Elischer 284bc29160dSMarko Zec #ifdef VIMAGE 285d0728d71SRobert Watson static void 286d0728d71SRobert Watson vnet_route_uninit(const void *unused __unused) 287bc29160dSMarko Zec { 288bc29160dSMarko Zec int table; 289bc29160dSMarko Zec int fam; 290bc29160dSMarko Zec struct domain *dom; 291bc29160dSMarko Zec struct radix_node_head **rnh; 292bc29160dSMarko Zec 293bc29160dSMarko Zec for (dom = domains; dom; dom = dom->dom_next) { 294b680a383SBjoern A. Zeeb if (dom->dom_rtdetach == NULL) 295b680a383SBjoern A. Zeeb continue; 296b680a383SBjoern A. Zeeb 297bc29160dSMarko Zec for (table = 0; table < rt_numfibs; table++) { 298b680a383SBjoern A. Zeeb fam = dom->dom_family; 299b680a383SBjoern A. Zeeb 300b680a383SBjoern A. Zeeb if (table != 0 && fam != AF_INET6 && fam != AF_INET) 301b680a383SBjoern A. Zeeb break; 302b680a383SBjoern A. Zeeb 303bc29160dSMarko Zec rnh = rt_tables_get_rnh_ptr(table, fam); 304bc29160dSMarko Zec if (rnh == NULL) 305bc29160dSMarko Zec panic("%s: rnh NULL", __func__); 306b680a383SBjoern A. 
Zeeb dom->dom_rtdetach((void **)rnh, dom->dom_rtoffset); 307bc29160dSMarko Zec } 308bc29160dSMarko Zec } 3096274ce3eSCraig Rodrigues 3106274ce3eSCraig Rodrigues free(V_rt_tables, M_RTABLE); 3116274ce3eSCraig Rodrigues uma_zdestroy(V_rtzone); 312bc29160dSMarko Zec } 313d0728d71SRobert Watson VNET_SYSUNINIT(vnet_route_uninit, SI_SUB_PROTO_DOMAIN, SI_ORDER_THIRD, 314d0728d71SRobert Watson vnet_route_uninit, 0); 315bc29160dSMarko Zec #endif 316bc29160dSMarko Zec 3178b07e49aSJulian Elischer #ifndef _SYS_SYSPROTO_H_ 3188b07e49aSJulian Elischer struct setfib_args { 3198b07e49aSJulian Elischer int fibnum; 3208b07e49aSJulian Elischer }; 3218b07e49aSJulian Elischer #endif 3228b07e49aSJulian Elischer int 3238451d0ddSKip Macy sys_setfib(struct thread *td, struct setfib_args *uap) 3248b07e49aSJulian Elischer { 3258b07e49aSJulian Elischer if (uap->fibnum < 0 || uap->fibnum >= rt_numfibs) 3268b07e49aSJulian Elischer return EINVAL; 3278b07e49aSJulian Elischer td->td_proc->p_fibnum = uap->fibnum; 3288b07e49aSJulian Elischer return (0); 329df8bae1dSRodney W. Grimes } 330df8bae1dSRodney W. Grimes 331df8bae1dSRodney W. Grimes /* 332df8bae1dSRodney W. Grimes * Packet routing routines. 333df8bae1dSRodney W. Grimes */ 334df8bae1dSRodney W. Grimes void 335d1dd20beSSam Leffler rtalloc(struct route *ro) 336df8bae1dSRodney W. Grimes { 337a8498625SBjoern A. Zeeb 338a8498625SBjoern A. Zeeb rtalloc_ign_fib(ro, 0UL, RT_DEFAULT_FIB); 3398b07e49aSJulian Elischer } 3408b07e49aSJulian Elischer 3418b07e49aSJulian Elischer void 3428b07e49aSJulian Elischer rtalloc_fib(struct route *ro, u_int fibnum) 3438b07e49aSJulian Elischer { 3448b07e49aSJulian Elischer rtalloc_ign_fib(ro, 0UL, fibnum); 345df8bae1dSRodney W. Grimes } 346df8bae1dSRodney W. 
Grimes 347652082e6SGarrett Wollman void 348d1dd20beSSam Leffler rtalloc_ign(struct route *ro, u_long ignore) 349652082e6SGarrett Wollman { 35068f956b8SJohn Polstra struct rtentry *rt; 35168f956b8SJohn Polstra 35268f956b8SJohn Polstra if ((rt = ro->ro_rt) != NULL) { 35368f956b8SJohn Polstra if (rt->rt_ifp != NULL && rt->rt_flags & RTF_UP) 35468f956b8SJohn Polstra return; 35568f956b8SJohn Polstra RTFREE(rt); 35666810dd0SYoshinobu Inoue ro->ro_rt = NULL; 35768f956b8SJohn Polstra } 358a8498625SBjoern A. Zeeb ro->ro_rt = rtalloc1_fib(&ro->ro_dst, 1, ignore, RT_DEFAULT_FIB); 3598b07e49aSJulian Elischer if (ro->ro_rt) 3608b07e49aSJulian Elischer RT_UNLOCK(ro->ro_rt); 3618b07e49aSJulian Elischer } 3628b07e49aSJulian Elischer 3638b07e49aSJulian Elischer void 3648b07e49aSJulian Elischer rtalloc_ign_fib(struct route *ro, u_long ignore, u_int fibnum) 3658b07e49aSJulian Elischer { 3668b07e49aSJulian Elischer struct rtentry *rt; 3678b07e49aSJulian Elischer 3688b07e49aSJulian Elischer if ((rt = ro->ro_rt) != NULL) { 3698b07e49aSJulian Elischer if (rt->rt_ifp != NULL && rt->rt_flags & RTF_UP) 3708b07e49aSJulian Elischer return; 3718b07e49aSJulian Elischer RTFREE(rt); 3728b07e49aSJulian Elischer ro->ro_rt = NULL; 3738b07e49aSJulian Elischer } 3748b07e49aSJulian Elischer ro->ro_rt = rtalloc1_fib(&ro->ro_dst, 1, ignore, fibnum); 375d1dd20beSSam Leffler if (ro->ro_rt) 376d1dd20beSSam Leffler RT_UNLOCK(ro->ro_rt); 377652082e6SGarrett Wollman } 378652082e6SGarrett Wollman 379b0a76b88SJulian Elischer /* 380b0a76b88SJulian Elischer * Look up the route that matches the address given 381b0a76b88SJulian Elischer * Or, at least try.. Create a cloned route if needed. 382d1dd20beSSam Leffler * 383d1dd20beSSam Leffler * The returned route, if any, is locked. 384b0a76b88SJulian Elischer */ 385df8bae1dSRodney W. Grimes struct rtentry * 386d1dd20beSSam Leffler rtalloc1(struct sockaddr *dst, int report, u_long ignflags) 387df8bae1dSRodney W. Grimes { 388a8498625SBjoern A. Zeeb 389a8498625SBjoern A. 
Zeeb return (rtalloc1_fib(dst, report, ignflags, RT_DEFAULT_FIB)); 3908b07e49aSJulian Elischer } 3918b07e49aSJulian Elischer 3928b07e49aSJulian Elischer struct rtentry * 3938b07e49aSJulian Elischer rtalloc1_fib(struct sockaddr *dst, int report, u_long ignflags, 3948b07e49aSJulian Elischer u_int fibnum) 3958b07e49aSJulian Elischer { 3968b07e49aSJulian Elischer struct radix_node_head *rnh; 397d1dd20beSSam Leffler struct radix_node *rn; 398d1dd20beSSam Leffler struct rtentry *newrt; 399df8bae1dSRodney W. Grimes struct rt_addrinfo info; 4006e6b3f7cSQing Li int err = 0, msgtype = RTM_MISS; 4013120b9d4SKip Macy int needlock; 402df8bae1dSRodney W. Grimes 4038b07e49aSJulian Elischer KASSERT((fibnum < rt_numfibs), ("rtalloc1_fib: bad fibnum")); 404b680a383SBjoern A. Zeeb switch (dst->sa_family) { 405b680a383SBjoern A. Zeeb case AF_INET6: 406b680a383SBjoern A. Zeeb case AF_INET: 407b680a383SBjoern A. Zeeb /* We support multiple FIBs. */ 408b680a383SBjoern A. Zeeb break; 409b680a383SBjoern A. Zeeb default: 410b680a383SBjoern A. Zeeb fibnum = RT_DEFAULT_FIB; 411b680a383SBjoern A. Zeeb break; 412b680a383SBjoern A. Zeeb } 413c2c2a7c1SBjoern A. Zeeb rnh = rt_tables_get_rnh(fibnum, dst->sa_family); 414e579f1c1SDmitry Chagin newrt = NULL; 415523e6002SDmitry Chagin if (rnh == NULL) 416523e6002SDmitry Chagin goto miss; 417523e6002SDmitry Chagin 418b0a76b88SJulian Elischer /* 419b0a76b88SJulian Elischer * Look up the address in the table for that Address Family 420b0a76b88SJulian Elischer */ 4213120b9d4SKip Macy needlock = !(ignflags & RTF_RNH_LOCKED); 4223120b9d4SKip Macy if (needlock) 4233120b9d4SKip Macy RADIX_NODE_HEAD_RLOCK(rnh); 4243120b9d4SKip Macy #ifdef INVARIANTS 4253120b9d4SKip Macy else 4269b5f5edeSGeorge V. 
Neville-Neil RADIX_NODE_HEAD_LOCK_ASSERT(rnh); 4273120b9d4SKip Macy #endif 4283120b9d4SKip Macy rn = rnh->rnh_matchaddr(dst, rnh); 4293120b9d4SKip Macy if (rn && ((rn->rn_flags & RNF_ROOT) == 0)) { 4306a873ef7SDmitry Chagin newrt = RNTORT(rn); 4313120b9d4SKip Macy RT_LOCK(newrt); 4323120b9d4SKip Macy RT_ADDREF(newrt); 4333120b9d4SKip Macy if (needlock) 4343120b9d4SKip Macy RADIX_NODE_HEAD_RUNLOCK(rnh); 4353120b9d4SKip Macy goto done; 4366e6b3f7cSQing Li 4376e6b3f7cSQing Li } else if (needlock) 4383120b9d4SKip Macy RADIX_NODE_HEAD_RUNLOCK(rnh); 4393120b9d4SKip Macy 440b0a76b88SJulian Elischer /* 441b0a76b88SJulian Elischer * Either we hit the root or couldn't find any match, 442b0a76b88SJulian Elischer * Which basically means 443b0a76b88SJulian Elischer * "caint get there frm here" 444b0a76b88SJulian Elischer */ 445956b0b65SJeffrey Hsu miss: 446523e6002SDmitry Chagin V_rtstat.rts_unreach++; 447523e6002SDmitry Chagin 4486e6b3f7cSQing Li if (report) { 449b0a76b88SJulian Elischer /* 450b0a76b88SJulian Elischer * If required, report the failure to the supervising 451b0a76b88SJulian Elischer * Authorities. 452b0a76b88SJulian Elischer * For a delete, this is not an error. (report == 0) 453b0a76b88SJulian Elischer */ 4546f5967c0SBruce Evans bzero(&info, sizeof(info)); 455df8bae1dSRodney W. Grimes info.rti_info[RTAX_DST] = dst; 456528737fdSBjoern A. Zeeb rt_missmsg_fib(msgtype, &info, 0, err, fibnum); 457df8bae1dSRodney W. Grimes } 4583120b9d4SKip Macy done: 459d1dd20beSSam Leffler if (newrt) 460d1dd20beSSam Leffler RT_LOCK_ASSERT(newrt); 461df8bae1dSRodney W. Grimes return (newrt); 462df8bae1dSRodney W. Grimes } 463df8bae1dSRodney W. Grimes 464499676dfSJulian Elischer /* 465499676dfSJulian Elischer * Remove a reference count from an rtentry. 466499676dfSJulian Elischer * If the count gets low enough, take it out of the routing table 467499676dfSJulian Elischer */ 468df8bae1dSRodney W. Grimes void 469d1dd20beSSam Leffler rtfree(struct rtentry *rt) 470df8bae1dSRodney W. 
Grimes { 47185911824SLuigi Rizzo struct radix_node_head *rnh; 472df8bae1dSRodney W. Grimes 473a0c0e34bSGleb Smirnoff KASSERT(rt != NULL,("%s: NULL rt", __func__)); 474c2c2a7c1SBjoern A. Zeeb rnh = rt_tables_get_rnh(rt->rt_fibnum, rt_key(rt)->sa_family); 475a0c0e34bSGleb Smirnoff KASSERT(rnh != NULL,("%s: NULL rnh", __func__)); 476499676dfSJulian Elischer 477d1dd20beSSam Leffler RT_LOCK_ASSERT(rt); 478d1dd20beSSam Leffler 479499676dfSJulian Elischer /* 480a0c0e34bSGleb Smirnoff * The callers should use RTFREE_LOCKED() or RTFREE(), so 481a0c0e34bSGleb Smirnoff * we should come here exactly with the last reference. 482499676dfSJulian Elischer */ 4837138d65cSSam Leffler RT_REMREF(rt); 484a0c0e34bSGleb Smirnoff if (rt->rt_refcnt > 0) { 485a42ea597SQing Li log(LOG_DEBUG, "%s: %p has %d refs\n", __func__, rt, rt->rt_refcnt); 486d1dd20beSSam Leffler goto done; 487a0c0e34bSGleb Smirnoff } 4889c63e9dbSSam Leffler 4899c63e9dbSSam Leffler /* 4909c63e9dbSSam Leffler * On last reference give the "close method" a chance 4919c63e9dbSSam Leffler * to cleanup private state. This also permits (for 4929c63e9dbSSam Leffler * IPv4 and IPv6) a chance to decide if the routing table 4939c63e9dbSSam Leffler * entry should be purged immediately or at a later time. 4949c63e9dbSSam Leffler * When an immediate purge is to happen the close routine 4959c63e9dbSSam Leffler * typically calls rtexpunge which clears the RTF_UP flag 4969c63e9dbSSam Leffler * on the entry so that the code below reclaims the storage. 4979c63e9dbSSam Leffler */ 498d1dd20beSSam Leffler if (rt->rt_refcnt == 0 && rnh->rnh_close) 4995c2dae8eSGarrett Wollman rnh->rnh_close((struct radix_node *)rt, rnh); 500499676dfSJulian Elischer 501499676dfSJulian Elischer /* 502499676dfSJulian Elischer * If we are no longer "up" (and ref == 0) 503499676dfSJulian Elischer * then we can free the resources associated 504499676dfSJulian Elischer * with the route. 
505499676dfSJulian Elischer */ 506d1dd20beSSam Leffler if ((rt->rt_flags & RTF_UP) == 0) { 507df8bae1dSRodney W. Grimes if (rt->rt_nodes->rn_flags & (RNF_ACTIVE | RNF_ROOT)) 508df8bae1dSRodney W. Grimes panic("rtfree 2"); 509499676dfSJulian Elischer /* 510499676dfSJulian Elischer * the rtentry must have been removed from the routing table 511499676dfSJulian Elischer * so it is represented in rttrash.. remove that now. 512499676dfSJulian Elischer */ 513603724d3SBjoern A. Zeeb V_rttrash--; 514499676dfSJulian Elischer #ifdef DIAGNOSTIC 515df8bae1dSRodney W. Grimes if (rt->rt_refcnt < 0) { 516623ae52eSPoul-Henning Kamp printf("rtfree: %p not freed (neg refs)\n", rt); 517d1dd20beSSam Leffler goto done; 518df8bae1dSRodney W. Grimes } 519499676dfSJulian Elischer #endif 520499676dfSJulian Elischer /* 521499676dfSJulian Elischer * release references on items we hold them on.. 522499676dfSJulian Elischer * e.g other routes and ifaddrs. 523499676dfSJulian Elischer */ 52419fc74fbSJeffrey Hsu if (rt->rt_ifa) 5251099f828SRobert Watson ifa_free(rt->rt_ifa); 526499676dfSJulian Elischer /* 527499676dfSJulian Elischer * The key is separatly alloc'd so free it (see rt_setgate()). 528499676dfSJulian Elischer * This also frees the gateway, as they are always malloc'd 529499676dfSJulian Elischer * together. 530499676dfSJulian Elischer */ 531df8bae1dSRodney W. Grimes Free(rt_key(rt)); 532499676dfSJulian Elischer 533499676dfSJulian Elischer /* 534499676dfSJulian Elischer * and the rtentry itself of course 535499676dfSJulian Elischer */ 5361ed81b73SMarko Zec uma_zfree(V_rtzone, rt); 537d1dd20beSSam Leffler return; 538df8bae1dSRodney W. Grimes } 539d1dd20beSSam Leffler done: 540d1dd20beSSam Leffler RT_UNLOCK(rt); 541df8bae1dSRodney W. Grimes } 542df8bae1dSRodney W. Grimes 543df8bae1dSRodney W. Grimes 544df8bae1dSRodney W. Grimes /* 545df8bae1dSRodney W. Grimes * Force a routing table entry to the specified 546df8bae1dSRodney W. Grimes * destination to go through the given gateway. 
547df8bae1dSRodney W. Grimes * Normally called as a result of a routing redirect 548df8bae1dSRodney W. Grimes * message from the network layer. 549df8bae1dSRodney W. Grimes */ 55026f9a767SRodney W. Grimes void 551d1dd20beSSam Leffler rtredirect(struct sockaddr *dst, 552d1dd20beSSam Leffler struct sockaddr *gateway, 553d1dd20beSSam Leffler struct sockaddr *netmask, 554d1dd20beSSam Leffler int flags, 555d1dd20beSSam Leffler struct sockaddr *src) 556df8bae1dSRodney W. Grimes { 557a8498625SBjoern A. Zeeb 558a8498625SBjoern A. Zeeb rtredirect_fib(dst, gateway, netmask, flags, src, RT_DEFAULT_FIB); 5598b07e49aSJulian Elischer } 5608b07e49aSJulian Elischer 5618b07e49aSJulian Elischer void 5628b07e49aSJulian Elischer rtredirect_fib(struct sockaddr *dst, 5638b07e49aSJulian Elischer struct sockaddr *gateway, 5648b07e49aSJulian Elischer struct sockaddr *netmask, 5658b07e49aSJulian Elischer int flags, 5668b07e49aSJulian Elischer struct sockaddr *src, 5678b07e49aSJulian Elischer u_int fibnum) 5688b07e49aSJulian Elischer { 5698e7e854cSKip Macy struct rtentry *rt, *rt0 = NULL; 570df8bae1dSRodney W. Grimes int error = 0; 57185911824SLuigi Rizzo short *stat = NULL; 572df8bae1dSRodney W. Grimes struct rt_addrinfo info; 573df8bae1dSRodney W. Grimes struct ifaddr *ifa; 574c2c2a7c1SBjoern A. Zeeb struct radix_node_head *rnh; 575c2c2a7c1SBjoern A. Zeeb 5768c0fec80SRobert Watson ifa = NULL; 577c2c2a7c1SBjoern A. Zeeb rnh = rt_tables_get_rnh(fibnum, dst->sa_family); 578c2c2a7c1SBjoern A. Zeeb if (rnh == NULL) { 579c2c2a7c1SBjoern A. Zeeb error = EAFNOSUPPORT; 580c2c2a7c1SBjoern A. Zeeb goto out; 581c2c2a7c1SBjoern A. Zeeb } 582df8bae1dSRodney W. Grimes 583df8bae1dSRodney W. Grimes /* verify the gateway is directly reachable */ 5840cfee0c2SAlan Somers if ((ifa = ifa_ifwithnet(gateway, 0, fibnum)) == NULL) { 585df8bae1dSRodney W. Grimes error = ENETUNREACH; 586df8bae1dSRodney W. Grimes goto out; 587df8bae1dSRodney W. 
Grimes } 5888b07e49aSJulian Elischer rt = rtalloc1_fib(dst, 0, 0UL, fibnum); /* NB: rt is locked */ 589df8bae1dSRodney W. Grimes /* 590df8bae1dSRodney W. Grimes * If the redirect isn't from our current router for this dst, 591df8bae1dSRodney W. Grimes * it's either old or wrong. If it redirects us to ourselves, 592df8bae1dSRodney W. Grimes * we have a routing loop, perhaps as a result of an interface 593df8bae1dSRodney W. Grimes * going down recently. 594df8bae1dSRodney W. Grimes */ 595df8bae1dSRodney W. Grimes if (!(flags & RTF_DONE) && rt && 596956b0b65SJeffrey Hsu (!sa_equal(src, rt->rt_gateway) || rt->rt_ifa != ifa)) 597df8bae1dSRodney W. Grimes error = EINVAL; 5988896f83aSRobert Watson else if (ifa_ifwithaddr_check(gateway)) 599df8bae1dSRodney W. Grimes error = EHOSTUNREACH; 600df8bae1dSRodney W. Grimes if (error) 601df8bae1dSRodney W. Grimes goto done; 602df8bae1dSRodney W. Grimes /* 603df8bae1dSRodney W. Grimes * Create a new entry if we just got back a wildcard entry 6046bccea7cSRebecca Cran * or the lookup failed. This is necessary for hosts 605df8bae1dSRodney W. Grimes * which use routing redirects generated by smart gateways 606df8bae1dSRodney W. Grimes * to dynamically build the routing tables. 607df8bae1dSRodney W. Grimes */ 60885911824SLuigi Rizzo if (rt == NULL || (rt_mask(rt) && rt_mask(rt)->sa_len < 2)) 609df8bae1dSRodney W. Grimes goto create; 610df8bae1dSRodney W. Grimes /* 611df8bae1dSRodney W. Grimes * Don't listen to the redirect if it's 612df8bae1dSRodney W. Grimes * for a route to an interface. 613df8bae1dSRodney W. Grimes */ 614df8bae1dSRodney W. Grimes if (rt->rt_flags & RTF_GATEWAY) { 615df8bae1dSRodney W. Grimes if (((rt->rt_flags & RTF_HOST) == 0) && (flags & RTF_HOST)) { 616df8bae1dSRodney W. Grimes /* 617df8bae1dSRodney W. Grimes * Changing from route to net => route to host. 618df8bae1dSRodney W. Grimes * Create new route, rather than smashing route to net. 619df8bae1dSRodney W. Grimes */ 620df8bae1dSRodney W. 
Grimes create: 6218e7e854cSKip Macy rt0 = rt; 6228e7e854cSKip Macy rt = NULL; 6238e7e854cSKip Macy 624df8bae1dSRodney W. Grimes flags |= RTF_GATEWAY | RTF_DYNAMIC; 6258071913dSRuslan Ermilov bzero((caddr_t)&info, sizeof(info)); 6268071913dSRuslan Ermilov info.rti_info[RTAX_DST] = dst; 6278071913dSRuslan Ermilov info.rti_info[RTAX_GATEWAY] = gateway; 6288071913dSRuslan Ermilov info.rti_info[RTAX_NETMASK] = netmask; 6298071913dSRuslan Ermilov info.rti_ifa = ifa; 6308071913dSRuslan Ermilov info.rti_flags = flags; 6313120b9d4SKip Macy if (rt0 != NULL) 6323120b9d4SKip Macy RT_UNLOCK(rt0); /* drop lock to avoid LOR with RNH */ 6338b07e49aSJulian Elischer error = rtrequest1_fib(RTM_ADD, &info, &rt, fibnum); 634d1dd20beSSam Leffler if (rt != NULL) { 6354de5d90cSSam Leffler RT_LOCK(rt); 6363120b9d4SKip Macy if (rt0 != NULL) 63729910a5aSKip Macy EVENTHANDLER_INVOKE(route_redirect_event, rt0, rt, dst); 6388071913dSRuslan Ermilov flags = rt->rt_flags; 639d1dd20beSSam Leffler } 6403120b9d4SKip Macy if (rt0 != NULL) 6413120b9d4SKip Macy RTFREE(rt0); 6428e7e854cSKip Macy 643603724d3SBjoern A. Zeeb stat = &V_rtstat.rts_dynamic; 644df8bae1dSRodney W. Grimes } else { 6458e7e854cSKip Macy struct rtentry *gwrt; 6468e7e854cSKip Macy 647df8bae1dSRodney W. Grimes /* 648df8bae1dSRodney W. Grimes * Smash the current notion of the gateway to 649df8bae1dSRodney W. Grimes * this destination. Should check about netmask!!! 650df8bae1dSRodney W. Grimes */ 651df8bae1dSRodney W. Grimes rt->rt_flags |= RTF_MODIFIED; 652df8bae1dSRodney W. Grimes flags |= RTF_MODIFIED; 653603724d3SBjoern A. Zeeb stat = &V_rtstat.rts_newgateway; 654499676dfSJulian Elischer /* 655499676dfSJulian Elischer * add the key and gateway (in one malloc'd chunk). 656499676dfSJulian Elischer */ 6573120b9d4SKip Macy RT_UNLOCK(rt); 6583120b9d4SKip Macy RADIX_NODE_HEAD_LOCK(rnh); 6593120b9d4SKip Macy RT_LOCK(rt); 660df8bae1dSRodney W. 
Grimes rt_setgate(rt, rt_key(rt), gateway); 6613120b9d4SKip Macy gwrt = rtalloc1(gateway, 1, RTF_RNH_LOCKED); 6623120b9d4SKip Macy RADIX_NODE_HEAD_UNLOCK(rnh); 66329910a5aSKip Macy EVENTHANDLER_INVOKE(route_redirect_event, rt, gwrt, dst); 6648e7e854cSKip Macy RTFREE_LOCKED(gwrt); 665df8bae1dSRodney W. Grimes } 666df8bae1dSRodney W. Grimes } else 667df8bae1dSRodney W. Grimes error = EHOSTUNREACH; 668df8bae1dSRodney W. Grimes done: 669d1dd20beSSam Leffler if (rt) 6701951e633SJohn Baldwin RTFREE_LOCKED(rt); 671df8bae1dSRodney W. Grimes out: 672df8bae1dSRodney W. Grimes if (error) 673603724d3SBjoern A. Zeeb V_rtstat.rts_badredirect++; 674df8bae1dSRodney W. Grimes else if (stat != NULL) 675df8bae1dSRodney W. Grimes (*stat)++; 676df8bae1dSRodney W. Grimes bzero((caddr_t)&info, sizeof(info)); 677df8bae1dSRodney W. Grimes info.rti_info[RTAX_DST] = dst; 678df8bae1dSRodney W. Grimes info.rti_info[RTAX_GATEWAY] = gateway; 679df8bae1dSRodney W. Grimes info.rti_info[RTAX_NETMASK] = netmask; 680df8bae1dSRodney W. Grimes info.rti_info[RTAX_AUTHOR] = src; 681528737fdSBjoern A. Zeeb rt_missmsg_fib(RTM_REDIRECT, &info, flags, error, fibnum); 6828c0fec80SRobert Watson if (ifa != NULL) 6838c0fec80SRobert Watson ifa_free(ifa); 684df8bae1dSRodney W. Grimes } 685df8bae1dSRodney W. Grimes 6868b07e49aSJulian Elischer int 6878b07e49aSJulian Elischer rtioctl(u_long req, caddr_t data) 6888b07e49aSJulian Elischer { 689a8498625SBjoern A. Zeeb 690a8498625SBjoern A. Zeeb return (rtioctl_fib(req, data, RT_DEFAULT_FIB)); 6918b07e49aSJulian Elischer } 6928b07e49aSJulian Elischer 693df8bae1dSRodney W. Grimes /* 694df8bae1dSRodney W. Grimes * Routing table ioctl interface. 695df8bae1dSRodney W. Grimes */ 696df8bae1dSRodney W. Grimes int 6978b07e49aSJulian Elischer rtioctl_fib(u_long req, caddr_t data, u_int fibnum) 698df8bae1dSRodney W. Grimes { 6995090559bSChristian S.J. Peron 7005090559bSChristian S.J. Peron /* 7015090559bSChristian S.J. 
Peron * If more ioctl commands are added here, make sure the proper 7025090559bSChristian S.J. Peron * super-user checks are being performed because it is possible for 7035090559bSChristian S.J. Peron * prison-root to make it this far if raw sockets have been enabled 7045090559bSChristian S.J. Peron * in jails. 7055090559bSChristian S.J. Peron */ 706623ae52eSPoul-Henning Kamp #ifdef INET 707f0068c4aSGarrett Wollman /* Multicast goop, grrr... */ 7088b07e49aSJulian Elischer return mrt_ioctl ? mrt_ioctl(req, data, fibnum) : EOPNOTSUPP; 709623ae52eSPoul-Henning Kamp #else /* INET */ 710623ae52eSPoul-Henning Kamp return ENXIO; 711623ae52eSPoul-Henning Kamp #endif /* INET */ 712df8bae1dSRodney W. Grimes } 713df8bae1dSRodney W. Grimes 7148c0fec80SRobert Watson /* 7158c0fec80SRobert Watson * For both ifa_ifwithroute() routines, 'ifa' is returned referenced. 7168c0fec80SRobert Watson */ 717df8bae1dSRodney W. Grimes struct ifaddr * 718d1dd20beSSam Leffler ifa_ifwithroute(int flags, struct sockaddr *dst, struct sockaddr *gateway) 719df8bae1dSRodney W. Grimes { 720a8498625SBjoern A. Zeeb 721a8498625SBjoern A. Zeeb return (ifa_ifwithroute_fib(flags, dst, gateway, RT_DEFAULT_FIB)); 7228b07e49aSJulian Elischer } 7238b07e49aSJulian Elischer 7248b07e49aSJulian Elischer struct ifaddr * 7258b07e49aSJulian Elischer ifa_ifwithroute_fib(int flags, struct sockaddr *dst, struct sockaddr *gateway, 7268b07e49aSJulian Elischer u_int fibnum) 7278b07e49aSJulian Elischer { 728df8bae1dSRodney W. Grimes register struct ifaddr *ifa; 729e034e82cSQing Li int not_found = 0; 730d1dd20beSSam Leffler 731df8bae1dSRodney W. Grimes if ((flags & RTF_GATEWAY) == 0) { 732df8bae1dSRodney W. Grimes /* 733df8bae1dSRodney W. Grimes * If we are adding a route to an interface, 734df8bae1dSRodney W. Grimes * and the interface is a pt to pt link 735df8bae1dSRodney W. Grimes * we should search for the destination 736df8bae1dSRodney W. Grimes * as our clue to the interface. Otherwise 737df8bae1dSRodney W. 
Grimes * we can use the local address. 738df8bae1dSRodney W. Grimes */ 73985911824SLuigi Rizzo ifa = NULL; 74085911824SLuigi Rizzo if (flags & RTF_HOST) 7410cfee0c2SAlan Somers ifa = ifa_ifwithdstaddr(dst, fibnum); 74285911824SLuigi Rizzo if (ifa == NULL) 743df8bae1dSRodney W. Grimes ifa = ifa_ifwithaddr(gateway); 744df8bae1dSRodney W. Grimes } else { 745df8bae1dSRodney W. Grimes /* 746df8bae1dSRodney W. Grimes * If we are adding a route to a remote net 747df8bae1dSRodney W. Grimes * or host, the gateway may still be on the 748df8bae1dSRodney W. Grimes * other end of a pt to pt link. 749df8bae1dSRodney W. Grimes */ 7500cfee0c2SAlan Somers ifa = ifa_ifwithdstaddr(gateway, fibnum); 751df8bae1dSRodney W. Grimes } 75285911824SLuigi Rizzo if (ifa == NULL) 7530cfee0c2SAlan Somers ifa = ifa_ifwithnet(gateway, 0, fibnum); 75485911824SLuigi Rizzo if (ifa == NULL) { 7559b20205dSKip Macy struct rtentry *rt = rtalloc1_fib(gateway, 0, RTF_RNH_LOCKED, fibnum); 75685911824SLuigi Rizzo if (rt == NULL) 75785911824SLuigi Rizzo return (NULL); 758e034e82cSQing Li /* 759e034e82cSQing Li * dismiss a gateway that is reachable only 760e034e82cSQing Li * through the default router 761e034e82cSQing Li */ 762e034e82cSQing Li switch (gateway->sa_family) { 763e034e82cSQing Li case AF_INET: 764e034e82cSQing Li if (satosin(rt_key(rt))->sin_addr.s_addr == INADDR_ANY) 765e034e82cSQing Li not_found = 1; 766e034e82cSQing Li break; 767e034e82cSQing Li case AF_INET6: 768e034e82cSQing Li if (IN6_IS_ADDR_UNSPECIFIED(&satosin6(rt_key(rt))->sin6_addr)) 769e034e82cSQing Li not_found = 1; 770e034e82cSQing Li break; 771e034e82cSQing Li default: 772e034e82cSQing Li break; 773e034e82cSQing Li } 7748c0fec80SRobert Watson if (!not_found && rt->rt_ifa != NULL) { 7758c0fec80SRobert Watson ifa = rt->rt_ifa; 7768c0fec80SRobert Watson ifa_ref(ifa); 7778c0fec80SRobert Watson } 7787138d65cSSam Leffler RT_REMREF(rt); 779d1dd20beSSam Leffler RT_UNLOCK(rt); 7808c0fec80SRobert Watson if (not_found || ifa == NULL) 
78185911824SLuigi Rizzo return (NULL); 782df8bae1dSRodney W. Grimes } 783df8bae1dSRodney W. Grimes if (ifa->ifa_addr->sa_family != dst->sa_family) { 784df8bae1dSRodney W. Grimes struct ifaddr *oifa = ifa; 785df8bae1dSRodney W. Grimes ifa = ifaof_ifpforaddr(dst, ifa->ifa_ifp); 78685911824SLuigi Rizzo if (ifa == NULL) 787df8bae1dSRodney W. Grimes ifa = oifa; 7888c0fec80SRobert Watson else 7898c0fec80SRobert Watson ifa_free(oifa); 790df8bae1dSRodney W. Grimes } 791df8bae1dSRodney W. Grimes return (ifa); 792df8bae1dSRodney W. Grimes } 793df8bae1dSRodney W. Grimes 794b0a76b88SJulian Elischer /* 795b0a76b88SJulian Elischer * Do appropriate manipulations of a routing tree given 796b0a76b88SJulian Elischer * all the bits of info needed 797b0a76b88SJulian Elischer */ 798df8bae1dSRodney W. Grimes int 799d1dd20beSSam Leffler rtrequest(int req, 800d1dd20beSSam Leffler struct sockaddr *dst, 801d1dd20beSSam Leffler struct sockaddr *gateway, 802d1dd20beSSam Leffler struct sockaddr *netmask, 803d1dd20beSSam Leffler int flags, 804d1dd20beSSam Leffler struct rtentry **ret_nrt) 805df8bae1dSRodney W. Grimes { 806a8498625SBjoern A. Zeeb 807a8498625SBjoern A. Zeeb return (rtrequest_fib(req, dst, gateway, netmask, flags, ret_nrt, 808a8498625SBjoern A. Zeeb RT_DEFAULT_FIB)); 8098b07e49aSJulian Elischer } 8108b07e49aSJulian Elischer 8118b07e49aSJulian Elischer int 8128b07e49aSJulian Elischer rtrequest_fib(int req, 8138b07e49aSJulian Elischer struct sockaddr *dst, 8148b07e49aSJulian Elischer struct sockaddr *gateway, 8158b07e49aSJulian Elischer struct sockaddr *netmask, 8168b07e49aSJulian Elischer int flags, 8178b07e49aSJulian Elischer struct rtentry **ret_nrt, 8188b07e49aSJulian Elischer u_int fibnum) 8198b07e49aSJulian Elischer { 8208071913dSRuslan Ermilov struct rt_addrinfo info; 8218071913dSRuslan Ermilov 822ac4a76ebSBjoern A. Zeeb if (dst->sa_len == 0) 823ac4a76ebSBjoern A. Zeeb return(EINVAL); 824ac4a76ebSBjoern A. 
Zeeb 8258071913dSRuslan Ermilov bzero((caddr_t)&info, sizeof(info)); 8268071913dSRuslan Ermilov info.rti_flags = flags; 8278071913dSRuslan Ermilov info.rti_info[RTAX_DST] = dst; 8288071913dSRuslan Ermilov info.rti_info[RTAX_GATEWAY] = gateway; 8298071913dSRuslan Ermilov info.rti_info[RTAX_NETMASK] = netmask; 8308b07e49aSJulian Elischer return rtrequest1_fib(req, &info, ret_nrt, fibnum); 8318071913dSRuslan Ermilov } 8328071913dSRuslan Ermilov 8338071913dSRuslan Ermilov /* 8348071913dSRuslan Ermilov * These (questionable) definitions of apparent local variables apply 8358071913dSRuslan Ermilov * to the next two functions. XXXXXX!!! 8368071913dSRuslan Ermilov */ 8378071913dSRuslan Ermilov #define dst info->rti_info[RTAX_DST] 8388071913dSRuslan Ermilov #define gateway info->rti_info[RTAX_GATEWAY] 8398071913dSRuslan Ermilov #define netmask info->rti_info[RTAX_NETMASK] 8408071913dSRuslan Ermilov #define ifaaddr info->rti_info[RTAX_IFA] 8418071913dSRuslan Ermilov #define ifpaddr info->rti_info[RTAX_IFP] 8428071913dSRuslan Ermilov #define flags info->rti_flags 8438071913dSRuslan Ermilov 8448071913dSRuslan Ermilov int 845d1dd20beSSam Leffler rt_getifa(struct rt_addrinfo *info) 8468071913dSRuslan Ermilov { 847a8498625SBjoern A. Zeeb 848a8498625SBjoern A. Zeeb return (rt_getifa_fib(info, RT_DEFAULT_FIB)); 8498b07e49aSJulian Elischer } 8508b07e49aSJulian Elischer 8518c0fec80SRobert Watson /* 8528c0fec80SRobert Watson * Look up rt_addrinfo for a specific fib. Note that if rti_ifa is defined, 8538c0fec80SRobert Watson * it will be referenced so the caller must free it. 
8548c0fec80SRobert Watson */ 8558b07e49aSJulian Elischer int 8568b07e49aSJulian Elischer rt_getifa_fib(struct rt_addrinfo *info, u_int fibnum) 8578b07e49aSJulian Elischer { 8588071913dSRuslan Ermilov struct ifaddr *ifa; 8598071913dSRuslan Ermilov int error = 0; 8608071913dSRuslan Ermilov 8618071913dSRuslan Ermilov /* 8628071913dSRuslan Ermilov * ifp may be specified by sockaddr_dl 8638071913dSRuslan Ermilov * when protocol address is ambiguous. 8648071913dSRuslan Ermilov */ 8658071913dSRuslan Ermilov if (info->rti_ifp == NULL && ifpaddr != NULL && 8668071913dSRuslan Ermilov ifpaddr->sa_family == AF_LINK && 8670cfee0c2SAlan Somers (ifa = ifa_ifwithnet(ifpaddr, 0, fibnum)) != NULL) { 8688071913dSRuslan Ermilov info->rti_ifp = ifa->ifa_ifp; 8698c0fec80SRobert Watson ifa_free(ifa); 8708c0fec80SRobert Watson } 8718071913dSRuslan Ermilov if (info->rti_ifa == NULL && ifaaddr != NULL) 8728071913dSRuslan Ermilov info->rti_ifa = ifa_ifwithaddr(ifaaddr); 8738071913dSRuslan Ermilov if (info->rti_ifa == NULL) { 8748071913dSRuslan Ermilov struct sockaddr *sa; 8758071913dSRuslan Ermilov 8768071913dSRuslan Ermilov sa = ifaaddr != NULL ? ifaaddr : 8778071913dSRuslan Ermilov (gateway != NULL ? 
gateway : dst); 8788071913dSRuslan Ermilov if (sa != NULL && info->rti_ifp != NULL) 8798071913dSRuslan Ermilov info->rti_ifa = ifaof_ifpforaddr(sa, info->rti_ifp); 8808071913dSRuslan Ermilov else if (dst != NULL && gateway != NULL) 8818b07e49aSJulian Elischer info->rti_ifa = ifa_ifwithroute_fib(flags, dst, gateway, 8828b07e49aSJulian Elischer fibnum); 8838071913dSRuslan Ermilov else if (sa != NULL) 8848b07e49aSJulian Elischer info->rti_ifa = ifa_ifwithroute_fib(flags, sa, sa, 8858b07e49aSJulian Elischer fibnum); 8868071913dSRuslan Ermilov } 8878071913dSRuslan Ermilov if ((ifa = info->rti_ifa) != NULL) { 8888071913dSRuslan Ermilov if (info->rti_ifp == NULL) 8898071913dSRuslan Ermilov info->rti_ifp = ifa->ifa_ifp; 8908071913dSRuslan Ermilov } else 8918071913dSRuslan Ermilov error = ENETUNREACH; 8928071913dSRuslan Ermilov return (error); 8938071913dSRuslan Ermilov } 8948071913dSRuslan Ermilov 8959c63e9dbSSam Leffler /* 8969c63e9dbSSam Leffler * Expunges references to a route that's about to be reclaimed. 8979c63e9dbSSam Leffler * The route must be locked. 8989c63e9dbSSam Leffler */ 8999c63e9dbSSam Leffler int 9009c63e9dbSSam Leffler rtexpunge(struct rtentry *rt) 9019c63e9dbSSam Leffler { 902c7ea0aa6SQing Li #if !defined(RADIX_MPATH) 9039c63e9dbSSam Leffler struct radix_node *rn; 904c7ea0aa6SQing Li #else 905c7ea0aa6SQing Li struct rt_addrinfo info; 906c7ea0aa6SQing Li int fib; 907c7ea0aa6SQing Li struct rtentry *rt0; 908c7ea0aa6SQing Li #endif 9099c63e9dbSSam Leffler struct radix_node_head *rnh; 9109c63e9dbSSam Leffler struct ifaddr *ifa; 9119c63e9dbSSam Leffler int error = 0; 9129c63e9dbSSam Leffler 9136e6b3f7cSQing Li /* 9146e6b3f7cSQing Li * Find the correct routing tree to use for this Address Family 9156e6b3f7cSQing Li */ 916c2c2a7c1SBjoern A. 
Zeeb rnh = rt_tables_get_rnh(rt->rt_fibnum, rt_key(rt)->sa_family); 9179c63e9dbSSam Leffler RT_LOCK_ASSERT(rt); 9186e6b3f7cSQing Li if (rnh == NULL) 9196e6b3f7cSQing Li return (EAFNOSUPPORT); 9203120b9d4SKip Macy RADIX_NODE_HEAD_LOCK_ASSERT(rnh); 921c7ea0aa6SQing Li 922c7ea0aa6SQing Li #ifdef RADIX_MPATH 923c7ea0aa6SQing Li fib = rt->rt_fibnum; 924c7ea0aa6SQing Li bzero(&info, sizeof(info)); 925c7ea0aa6SQing Li info.rti_ifp = rt->rt_ifp; 926c7ea0aa6SQing Li info.rti_flags = RTF_RNH_LOCKED; 927c7ea0aa6SQing Li info.rti_info[RTAX_DST] = rt_key(rt); 928c7ea0aa6SQing Li info.rti_info[RTAX_GATEWAY] = rt->rt_ifa->ifa_addr; 929c7ea0aa6SQing Li 930c7ea0aa6SQing Li RT_UNLOCK(rt); 931c7ea0aa6SQing Li error = rtrequest1_fib(RTM_DELETE, &info, &rt0, fib); 932c7ea0aa6SQing Li 933c7ea0aa6SQing Li if (error == 0 && rt0 != NULL) { 934c7ea0aa6SQing Li rt = rt0; 935c7ea0aa6SQing Li RT_LOCK(rt); 936c7ea0aa6SQing Li } else if (error != 0) { 937c7ea0aa6SQing Li RT_LOCK(rt); 938c7ea0aa6SQing Li return (error); 939c7ea0aa6SQing Li } 940c7ea0aa6SQing Li #else 9419c63e9dbSSam Leffler /* 9429c63e9dbSSam Leffler * Remove the item from the tree; it should be there, 9439c63e9dbSSam Leffler * but when callers invoke us blindly it may not (sigh). 9449c63e9dbSSam Leffler */ 9459c63e9dbSSam Leffler rn = rnh->rnh_deladdr(rt_key(rt), rt_mask(rt), rnh); 94685911824SLuigi Rizzo if (rn == NULL) { 9479c63e9dbSSam Leffler error = ESRCH; 9489c63e9dbSSam Leffler goto bad; 9499c63e9dbSSam Leffler } 9509c63e9dbSSam Leffler KASSERT((rn->rn_flags & (RNF_ACTIVE | RNF_ROOT)) == 0, 9519c63e9dbSSam Leffler ("unexpected flags 0x%x", rn->rn_flags)); 952d6941ce9SLuigi Rizzo KASSERT(rt == RNTORT(rn), 9539c63e9dbSSam Leffler ("lookup mismatch, rt %p rn %p", rt, rn)); 954c7ea0aa6SQing Li #endif /* RADIX_MPATH */ 9559c63e9dbSSam Leffler 9569c63e9dbSSam Leffler rt->rt_flags &= ~RTF_UP; 9579c63e9dbSSam Leffler 9589c63e9dbSSam Leffler /* 9599c63e9dbSSam Leffler * Give the protocol a chance to keep things in sync. 
9609c63e9dbSSam Leffler */ 9619c63e9dbSSam Leffler if ((ifa = rt->rt_ifa) && ifa->ifa_rtrequest) { 9629c63e9dbSSam Leffler struct rt_addrinfo info; 9639c63e9dbSSam Leffler 9649c63e9dbSSam Leffler bzero((caddr_t)&info, sizeof(info)); 9659c63e9dbSSam Leffler info.rti_flags = rt->rt_flags; 9669c63e9dbSSam Leffler info.rti_info[RTAX_DST] = rt_key(rt); 9679c63e9dbSSam Leffler info.rti_info[RTAX_GATEWAY] = rt->rt_gateway; 9689c63e9dbSSam Leffler info.rti_info[RTAX_NETMASK] = rt_mask(rt); 9699c63e9dbSSam Leffler ifa->ifa_rtrequest(RTM_DELETE, rt, &info); 9709c63e9dbSSam Leffler } 9719c63e9dbSSam Leffler 9729c63e9dbSSam Leffler /* 9739c63e9dbSSam Leffler * one more rtentry floating around that is not 9749c63e9dbSSam Leffler * linked to the routing table. 9759c63e9dbSSam Leffler */ 976603724d3SBjoern A. Zeeb V_rttrash++; 977c7ea0aa6SQing Li #if !defined(RADIX_MPATH) 9789c63e9dbSSam Leffler bad: 979c7ea0aa6SQing Li #endif 9809c63e9dbSSam Leffler return (error); 9819c63e9dbSSam Leffler } 9829c63e9dbSSam Leffler 9835a2f4cbdSAlexander V. Chernikov #if 0 9845a2f4cbdSAlexander V. Chernikov int p_sockaddr(char *buf, int buflen, struct sockaddr *s); 9855a2f4cbdSAlexander V. Chernikov int rt_print(char *buf, int buflen, struct rtentry *rt); 9865a2f4cbdSAlexander V. Chernikov 9875a2f4cbdSAlexander V. Chernikov int 9885a2f4cbdSAlexander V. Chernikov p_sockaddr(char *buf, int buflen, struct sockaddr *s) 9895a2f4cbdSAlexander V. Chernikov { 9905a2f4cbdSAlexander V. Chernikov void *paddr = NULL; 9915a2f4cbdSAlexander V. Chernikov 9925a2f4cbdSAlexander V. Chernikov switch (s->sa_family) { 9935a2f4cbdSAlexander V. Chernikov case AF_INET: 9945a2f4cbdSAlexander V. Chernikov paddr = &((struct sockaddr_in *)s)->sin_addr; 9955a2f4cbdSAlexander V. Chernikov break; 9965a2f4cbdSAlexander V. Chernikov case AF_INET6: 9975a2f4cbdSAlexander V. Chernikov paddr = &((struct sockaddr_in6 *)s)->sin6_addr; 9985a2f4cbdSAlexander V. Chernikov break; 9995a2f4cbdSAlexander V. 
Chernikov } 10005a2f4cbdSAlexander V. Chernikov 10015a2f4cbdSAlexander V. Chernikov if (paddr == NULL) 10025a2f4cbdSAlexander V. Chernikov return (0); 10035a2f4cbdSAlexander V. Chernikov 10045a2f4cbdSAlexander V. Chernikov if (inet_ntop(s->sa_family, paddr, buf, buflen) == NULL) 10055a2f4cbdSAlexander V. Chernikov return (0); 10065a2f4cbdSAlexander V. Chernikov 10075a2f4cbdSAlexander V. Chernikov return (strlen(buf)); 10085a2f4cbdSAlexander V. Chernikov } 10095a2f4cbdSAlexander V. Chernikov 10105a2f4cbdSAlexander V. Chernikov int 10115a2f4cbdSAlexander V. Chernikov rt_print(char *buf, int buflen, struct rtentry *rt) 10125a2f4cbdSAlexander V. Chernikov { 10135a2f4cbdSAlexander V. Chernikov struct sockaddr *addr, *mask; 10145a2f4cbdSAlexander V. Chernikov int i = 0; 10155a2f4cbdSAlexander V. Chernikov 10165a2f4cbdSAlexander V. Chernikov addr = rt_key(rt); 10175a2f4cbdSAlexander V. Chernikov mask = rt_mask(rt); 10185a2f4cbdSAlexander V. Chernikov 10195a2f4cbdSAlexander V. Chernikov i = p_sockaddr(buf, buflen, addr); 10205a2f4cbdSAlexander V. Chernikov if (!(rt->rt_flags & RTF_HOST)) { 10215a2f4cbdSAlexander V. Chernikov buf[i++] = '/'; 10225a2f4cbdSAlexander V. Chernikov i += p_sockaddr(buf + i, buflen - i, mask); 10235a2f4cbdSAlexander V. Chernikov } 10245a2f4cbdSAlexander V. Chernikov 10255a2f4cbdSAlexander V. Chernikov if (rt->rt_flags & RTF_GATEWAY) { 10265a2f4cbdSAlexander V. Chernikov buf[i++] = '>'; 10275a2f4cbdSAlexander V. Chernikov i += p_sockaddr(buf + i, buflen - i, rt->rt_gateway); 10285a2f4cbdSAlexander V. Chernikov } 10295a2f4cbdSAlexander V. Chernikov 10305a2f4cbdSAlexander V. Chernikov return (i); 10315a2f4cbdSAlexander V. Chernikov } 10325a2f4cbdSAlexander V. Chernikov #endif 10335a2f4cbdSAlexander V. 
Chernikov 1034427ac07fSKip Macy #ifdef RADIX_MPATH 1035427ac07fSKip Macy static int 1036427ac07fSKip Macy rn_mpath_update(int req, struct rt_addrinfo *info, 1037427ac07fSKip Macy struct radix_node_head *rnh, struct rtentry **ret_nrt) 1038427ac07fSKip Macy { 1039427ac07fSKip Macy /* 1040427ac07fSKip Macy * if we got multipath routes, we require users to specify 1041427ac07fSKip Macy * a matching RTAX_GATEWAY. 1042427ac07fSKip Macy */ 1043427ac07fSKip Macy struct rtentry *rt, *rto = NULL; 10449b5f5edeSGeorge V. Neville-Neil register struct radix_node *rn; 1045427ac07fSKip Macy int error = 0; 1046427ac07fSKip Macy 10475a2f4cbdSAlexander V. Chernikov rn = rnh->rnh_lookup(dst, netmask, rnh); 1048427ac07fSKip Macy if (rn == NULL) 1049427ac07fSKip Macy return (ESRCH); 1050427ac07fSKip Macy rto = rt = RNTORT(rn); 10515a2f4cbdSAlexander V. Chernikov 1052427ac07fSKip Macy rt = rt_mpath_matchgate(rt, gateway); 1053427ac07fSKip Macy if (rt == NULL) 1054427ac07fSKip Macy return (ESRCH); 1055427ac07fSKip Macy /* 1056427ac07fSKip Macy * this is the first entry in the chain 1057427ac07fSKip Macy */ 1058427ac07fSKip Macy if (rto == rt) { 1059427ac07fSKip Macy rn = rn_mpath_next((struct radix_node *)rt); 1060427ac07fSKip Macy /* 1061427ac07fSKip Macy * there is another entry, now it's active 1062427ac07fSKip Macy */ 1063427ac07fSKip Macy if (rn) { 1064427ac07fSKip Macy rto = RNTORT(rn); 1065427ac07fSKip Macy RT_LOCK(rto); 1066427ac07fSKip Macy rto->rt_flags |= RTF_UP; 1067427ac07fSKip Macy RT_UNLOCK(rto); 1068427ac07fSKip Macy } else if (rt->rt_flags & RTF_GATEWAY) { 1069427ac07fSKip Macy /* 1070427ac07fSKip Macy * For gateway routes, we need to 1071427ac07fSKip Macy * make sure that we we are deleting 1072427ac07fSKip Macy * the correct gateway. 1073427ac07fSKip Macy * rt_mpath_matchgate() does not 1074427ac07fSKip Macy * check the case when there is only 1075427ac07fSKip Macy * one route in the chain. 
1076427ac07fSKip Macy */ 1077427ac07fSKip Macy if (gateway && 1078427ac07fSKip Macy (rt->rt_gateway->sa_len != gateway->sa_len || 1079427ac07fSKip Macy memcmp(rt->rt_gateway, gateway, gateway->sa_len))) 1080427ac07fSKip Macy error = ESRCH; 10816a7bff2cSKip Macy else { 10826a7bff2cSKip Macy /* 10836a7bff2cSKip Macy * remove from tree before returning it 10846a7bff2cSKip Macy * to the caller 10856a7bff2cSKip Macy */ 10866a7bff2cSKip Macy rn = rnh->rnh_deladdr(dst, netmask, rnh); 10876a7bff2cSKip Macy KASSERT(rt == RNTORT(rn), ("radix node disappeared")); 10886a7bff2cSKip Macy goto gwdelete; 10896a7bff2cSKip Macy } 10906a7bff2cSKip Macy 1091427ac07fSKip Macy } 1092427ac07fSKip Macy /* 1093427ac07fSKip Macy * use the normal delete code to remove 1094427ac07fSKip Macy * the first entry 1095427ac07fSKip Macy */ 1096427ac07fSKip Macy if (req != RTM_DELETE) 1097427ac07fSKip Macy goto nondelete; 1098427ac07fSKip Macy 1099427ac07fSKip Macy error = ENOENT; 1100427ac07fSKip Macy goto done; 1101427ac07fSKip Macy } 1102427ac07fSKip Macy 1103427ac07fSKip Macy /* 1104427ac07fSKip Macy * if the entry is 2nd and on up 1105427ac07fSKip Macy */ 1106427ac07fSKip Macy if ((req == RTM_DELETE) && !rt_mpath_deldup(rto, rt)) 1107427ac07fSKip Macy panic ("rtrequest1: rt_mpath_deldup"); 11086a7bff2cSKip Macy gwdelete: 1109427ac07fSKip Macy RT_LOCK(rt); 1110427ac07fSKip Macy RT_ADDREF(rt); 1111427ac07fSKip Macy if (req == RTM_DELETE) { 1112427ac07fSKip Macy rt->rt_flags &= ~RTF_UP; 1113427ac07fSKip Macy /* 1114427ac07fSKip Macy * One more rtentry floating around that is not 1115427ac07fSKip Macy * linked to the routing table. rttrash will be decremented 1116427ac07fSKip Macy * when RTFREE(rt) is eventually called. 
1117427ac07fSKip Macy */ 1118427ac07fSKip Macy V_rttrash++; 1119427ac07fSKip Macy } 1120427ac07fSKip Macy 1121427ac07fSKip Macy nondelete: 1122427ac07fSKip Macy if (req != RTM_DELETE) 1123427ac07fSKip Macy panic("unrecognized request %d", req); 1124427ac07fSKip Macy 1125427ac07fSKip Macy 1126427ac07fSKip Macy /* 1127427ac07fSKip Macy * If the caller wants it, then it can have it, 1128427ac07fSKip Macy * but it's up to it to free the rtentry as we won't be 1129427ac07fSKip Macy * doing it. 1130427ac07fSKip Macy */ 1131427ac07fSKip Macy if (ret_nrt) { 1132427ac07fSKip Macy *ret_nrt = rt; 1133427ac07fSKip Macy RT_UNLOCK(rt); 1134427ac07fSKip Macy } else 1135427ac07fSKip Macy RTFREE_LOCKED(rt); 1136427ac07fSKip Macy done: 1137427ac07fSKip Macy return (error); 1138427ac07fSKip Macy } 1139427ac07fSKip Macy #endif 1140427ac07fSKip Macy 11418071913dSRuslan Ermilov int 11428b07e49aSJulian Elischer rtrequest1_fib(int req, struct rt_addrinfo *info, struct rtentry **ret_nrt, 11438b07e49aSJulian Elischer u_int fibnum) 11448b07e49aSJulian Elischer { 11453120b9d4SKip Macy int error = 0, needlock = 0; 1146df8bae1dSRodney W. Grimes register struct rtentry *rt; 1147e5c610d6SQing Li #ifdef FLOWTABLE 1148e5c610d6SQing Li register struct rtentry *rt0; 1149e5c610d6SQing Li #endif 1150df8bae1dSRodney W. Grimes register struct radix_node *rn; 1151df8bae1dSRodney W. Grimes register struct radix_node_head *rnh; 1152df8bae1dSRodney W. Grimes struct ifaddr *ifa; 1153df8bae1dSRodney W. Grimes struct sockaddr *ndst; 115446a70de2SQing Li struct sockaddr_storage mdst; 1155df8bae1dSRodney W. Grimes #define senderr(x) { error = x ; goto bad; } 1156df8bae1dSRodney W. Grimes 11578b07e49aSJulian Elischer KASSERT((fibnum < rt_numfibs), ("rtrequest1_fib: bad fibnum")); 1158b680a383SBjoern A. Zeeb switch (dst->sa_family) { 1159b680a383SBjoern A. Zeeb case AF_INET6: 1160b680a383SBjoern A. Zeeb case AF_INET: 1161b680a383SBjoern A. Zeeb /* We support multiple FIBs. */ 1162b680a383SBjoern A. 
Zeeb break; 1163b680a383SBjoern A. Zeeb default: 1164b680a383SBjoern A. Zeeb fibnum = RT_DEFAULT_FIB; 1165b680a383SBjoern A. Zeeb break; 1166b680a383SBjoern A. Zeeb } 1167b680a383SBjoern A. Zeeb 1168b0a76b88SJulian Elischer /* 1169b0a76b88SJulian Elischer * Find the correct routing tree to use for this Address Family 1170b0a76b88SJulian Elischer */ 1171c2c2a7c1SBjoern A. Zeeb rnh = rt_tables_get_rnh(fibnum, dst->sa_family); 117285911824SLuigi Rizzo if (rnh == NULL) 1173983985c1SJeffrey Hsu return (EAFNOSUPPORT); 11743120b9d4SKip Macy needlock = ((flags & RTF_RNH_LOCKED) == 0); 11753120b9d4SKip Macy flags &= ~RTF_RNH_LOCKED; 11763120b9d4SKip Macy if (needlock) 1177956b0b65SJeffrey Hsu RADIX_NODE_HEAD_LOCK(rnh); 1178c96b8224SKip Macy else 1179c96b8224SKip Macy RADIX_NODE_HEAD_LOCK_ASSERT(rnh); 1180b0a76b88SJulian Elischer /* 1181b0a76b88SJulian Elischer * If we are adding a host route then we don't want to put 118266953138SRuslan Ermilov * a netmask in the tree, nor do we want to clone it. 1183b0a76b88SJulian Elischer */ 11846e6b3f7cSQing Li if (flags & RTF_HOST) 118585911824SLuigi Rizzo netmask = NULL; 11866e6b3f7cSQing Li 1187df8bae1dSRodney W. Grimes switch (req) { 1188df8bae1dSRodney W. Grimes case RTM_DELETE: 118946a70de2SQing Li if (netmask) { 119046a70de2SQing Li rt_maskedcopy(dst, (struct sockaddr *)&mdst, netmask); 119146a70de2SQing Li dst = (struct sockaddr *)&mdst; 119246a70de2SQing Li } 1193e440aed9SQing Li #ifdef RADIX_MPATH 1194e440aed9SQing Li if (rn_mpath_capable(rnh)) { 1195427ac07fSKip Macy error = rn_mpath_update(req, info, rnh, ret_nrt); 1196e440aed9SQing Li /* 1197427ac07fSKip Macy * "bad" holds true for the success case 1198427ac07fSKip Macy * as well 1199e440aed9SQing Li */ 1200427ac07fSKip Macy if (error != ENOENT) 1201427ac07fSKip Macy goto bad; 1202c7ea0aa6SQing Li error = 0; 1203e440aed9SQing Li } 1204ea9cd9f2SBjoern A. Zeeb #endif 12053034f43fSAlexander V. Chernikov if ((flags & RTF_PINNED) == 0) { 12063034f43fSAlexander V. 
Chernikov /* Check if target route can be deleted */ 12073034f43fSAlexander V. Chernikov rt = (struct rtentry *)rnh->rnh_lookup(dst, 12083034f43fSAlexander V. Chernikov netmask, rnh); 12093034f43fSAlexander V. Chernikov if ((rt != NULL) && (rt->rt_flags & RTF_PINNED)) 12103034f43fSAlexander V. Chernikov senderr(EADDRINUSE); 12113034f43fSAlexander V. Chernikov } 12123034f43fSAlexander V. Chernikov 1213b0a76b88SJulian Elischer /* 1214b0a76b88SJulian Elischer * Remove the item from the tree and return it. 1215b0a76b88SJulian Elischer * Complain if it is not there and do no more processing. 1216b0a76b88SJulian Elischer */ 1217d1dd20beSSam Leffler rn = rnh->rnh_deladdr(dst, netmask, rnh); 121885911824SLuigi Rizzo if (rn == NULL) 1219df8bae1dSRodney W. Grimes senderr(ESRCH); 1220df8bae1dSRodney W. Grimes if (rn->rn_flags & (RNF_ACTIVE | RNF_ROOT)) 1221df8bae1dSRodney W. Grimes panic ("rtrequest delete"); 1222d6941ce9SLuigi Rizzo rt = RNTORT(rn); 1223d1dd20beSSam Leffler RT_LOCK(rt); 12247138d65cSSam Leffler RT_ADDREF(rt); 122571eba915SRuslan Ermilov rt->rt_flags &= ~RTF_UP; 1226c2bed6a3SGarrett Wollman 1227c2bed6a3SGarrett Wollman /* 1228499676dfSJulian Elischer * give the protocol a chance to keep things in sync. 1229b0a76b88SJulian Elischer */ 1230df8bae1dSRodney W. Grimes if ((ifa = rt->rt_ifa) && ifa->ifa_rtrequest) 12318071913dSRuslan Ermilov ifa->ifa_rtrequest(RTM_DELETE, rt, info); 1232499676dfSJulian Elischer 1233b0a76b88SJulian Elischer /* 1234d6941ce9SLuigi Rizzo * One more rtentry floating around that is not 1235d6941ce9SLuigi Rizzo * linked to the routing table. rttrash will be decremented 1236d6941ce9SLuigi Rizzo * when RTFREE(rt) is eventually called. 1237499676dfSJulian Elischer */ 1238603724d3SBjoern A. 
Zeeb V_rttrash++; 1239499676dfSJulian Elischer 1240499676dfSJulian Elischer /* 1241499676dfSJulian Elischer * If the caller wants it, then it can have it, 1242499676dfSJulian Elischer * but it's up to it to free the rtentry as we won't be 1243499676dfSJulian Elischer * doing it. 1244b0a76b88SJulian Elischer */ 1245d1dd20beSSam Leffler if (ret_nrt) { 1246df8bae1dSRodney W. Grimes *ret_nrt = rt; 1247d1dd20beSSam Leffler RT_UNLOCK(rt); 1248d1dd20beSSam Leffler } else 1249d1dd20beSSam Leffler RTFREE_LOCKED(rt); 1250df8bae1dSRodney W. Grimes break; 1251df8bae1dSRodney W. Grimes case RTM_RESOLVE: 12526e6b3f7cSQing Li /* 12536e6b3f7cSQing Li * resolve was only used for route cloning 12546e6b3f7cSQing Li * here for compat 12556e6b3f7cSQing Li */ 12566e6b3f7cSQing Li break; 1257df8bae1dSRodney W. Grimes case RTM_ADD: 12585df72964SGarrett Wollman if ((flags & RTF_GATEWAY) && !gateway) 125916a2e0a6SQing Li senderr(EINVAL); 126016a2e0a6SQing Li if (dst && gateway && (dst->sa_family != gateway->sa_family) && 126116a2e0a6SQing Li (gateway->sa_family != AF_UNSPEC) && (gateway->sa_family != AF_LINK)) 126216a2e0a6SQing Li senderr(EINVAL); 12635df72964SGarrett Wollman 12648c0fec80SRobert Watson if (info->rti_ifa == NULL) { 12658c0fec80SRobert Watson error = rt_getifa_fib(info, fibnum); 12668c0fec80SRobert Watson if (error) 12678071913dSRuslan Ermilov senderr(error); 12688c0fec80SRobert Watson } else 12698c0fec80SRobert Watson ifa_ref(info->rti_ifa); 12708071913dSRuslan Ermilov ifa = info->rti_ifa; 1271e3a7aa6fSGleb Smirnoff rt = uma_zalloc(V_rtzone, M_NOWAIT); 12728c0fec80SRobert Watson if (rt == NULL) { 12738c0fec80SRobert Watson ifa_free(ifa); 1274df8bae1dSRodney W. Grimes senderr(ENOBUFS); 12758c0fec80SRobert Watson } 1276df8bae1dSRodney W. Grimes rt->rt_flags = RTF_UP | flags; 12778b07e49aSJulian Elischer rt->rt_fibnum = fibnum; 1278499676dfSJulian Elischer /* 1279a8498625SBjoern A. Zeeb * Add the gateway. Possibly re-malloc-ing the storage for it. 
1280499676dfSJulian Elischer */ 1281d1dd20beSSam Leffler RT_LOCK(rt); 1282831a80b0SMatthew Dillon if ((error = rt_setgate(rt, dst, gateway)) != 0) { 12838c0fec80SRobert Watson ifa_free(ifa); 12841ed81b73SMarko Zec uma_zfree(V_rtzone, rt); 1285704b0666SBill Fenner senderr(error); 1286df8bae1dSRodney W. Grimes } 1287499676dfSJulian Elischer 1288499676dfSJulian Elischer /* 1289499676dfSJulian Elischer * point to the (possibly newly malloc'd) dest address. 1290499676dfSJulian Elischer */ 1291d1dd20beSSam Leffler ndst = (struct sockaddr *)rt_key(rt); 1292499676dfSJulian Elischer 1293499676dfSJulian Elischer /* 1294499676dfSJulian Elischer * make sure it contains the value we want (masked if needed). 1295499676dfSJulian Elischer */ 1296df8bae1dSRodney W. Grimes if (netmask) { 1297df8bae1dSRodney W. Grimes rt_maskedcopy(dst, ndst, netmask); 1298df8bae1dSRodney W. Grimes } else 12991838a647SLuigi Rizzo bcopy(dst, ndst, dst->sa_len); 13008e718bb4SGarrett Wollman 13018e718bb4SGarrett Wollman /* 13028c0fec80SRobert Watson * We use the ifa reference returned by rt_getifa_fib(). 13038e718bb4SGarrett Wollman * This moved from below so that rnh->rnh_addaddr() can 1304499676dfSJulian Elischer * examine the ifa and ifa->ifa_ifp if it so desires. 
13058e718bb4SGarrett Wollman */ 13068e718bb4SGarrett Wollman rt->rt_ifa = ifa; 13078e718bb4SGarrett Wollman rt->rt_ifp = ifa->ifa_ifp; 1308e3a7aa6fSGleb Smirnoff rt->rt_weight = 1; 13098e718bb4SGarrett Wollman 1310e440aed9SQing Li #ifdef RADIX_MPATH 1311e440aed9SQing Li /* do not permit exactly the same dst/mask/gw pair */ 1312e440aed9SQing Li if (rn_mpath_capable(rnh) && 1313e440aed9SQing Li rt_mpath_conflict(rnh, rt, netmask)) { 13141099f828SRobert Watson ifa_free(rt->rt_ifa); 1315e440aed9SQing Li Free(rt_key(rt)); 13161ed81b73SMarko Zec uma_zfree(V_rtzone, rt); 1317e440aed9SQing Li senderr(EEXIST); 1318e440aed9SQing Li } 1319e440aed9SQing Li #endif 1320e440aed9SQing Li 1321e5c610d6SQing Li #ifdef FLOWTABLE 1322e5c610d6SQing Li rt0 = NULL; 1323096f2786SBjoern A. Zeeb /* "flow-table" only supports IPv6 and IPv4 at the moment. */ 1324096f2786SBjoern A. Zeeb switch (dst->sa_family) { 1325096f2786SBjoern A. Zeeb #ifdef INET6 1326096f2786SBjoern A. Zeeb case AF_INET6: 1327096f2786SBjoern A. Zeeb #endif 1328db44ff40SBjoern A. Zeeb #ifdef INET 1329096f2786SBjoern A. Zeeb case AF_INET: 1330096f2786SBjoern A. Zeeb #endif 1331096f2786SBjoern A. Zeeb #if defined(INET6) || defined(INET) 1332e5c610d6SQing Li rn = rnh->rnh_matchaddr(dst, rnh); 1333e5c610d6SQing Li if (rn && ((rn->rn_flags & RNF_ROOT) == 0)) { 1334e5c610d6SQing Li struct sockaddr *mask; 1335e5c610d6SQing Li u_char *m, *n; 1336e5c610d6SQing Li int len; 1337e5c610d6SQing Li 1338e5c610d6SQing Li /* 1339e5c610d6SQing Li * compare mask to see if the new route is 1340e5c610d6SQing Li * more specific than the existing one 1341e5c610d6SQing Li */ 1342e5c610d6SQing Li rt0 = RNTORT(rn); 1343e5c610d6SQing Li RT_LOCK(rt0); 1344e5c610d6SQing Li RT_ADDREF(rt0); 1345e5c610d6SQing Li RT_UNLOCK(rt0); 1346e5c610d6SQing Li /* 1347e5c610d6SQing Li * A host route is already present, so 1348e5c610d6SQing Li * leave the flow-table entries as is. 
1349e5c610d6SQing Li */ 1350e5c610d6SQing Li if (rt0->rt_flags & RTF_HOST) { 1351e5c610d6SQing Li RTFREE(rt0); 1352e5c610d6SQing Li rt0 = NULL; 1353e5c610d6SQing Li } else if (!(flags & RTF_HOST) && netmask) { 1354e5c610d6SQing Li mask = rt_mask(rt0); 1355e5c610d6SQing Li len = mask->sa_len; 1356e5c610d6SQing Li m = (u_char *)mask; 1357e5c610d6SQing Li n = (u_char *)netmask; 1358e5c610d6SQing Li while (len-- > 0) { 1359e5c610d6SQing Li if (*n != *m) 1360e5c610d6SQing Li break; 1361e5c610d6SQing Li n++; 1362e5c610d6SQing Li m++; 1363e5c610d6SQing Li } 1364e5c610d6SQing Li if (len == 0 || (*n < *m)) { 1365e5c610d6SQing Li RTFREE(rt0); 1366e5c610d6SQing Li rt0 = NULL; 1367e5c610d6SQing Li } 1368e5c610d6SQing Li } 1369e5c610d6SQing Li } 1370096f2786SBjoern A. Zeeb #endif/* INET6 || INET */ 1371e5c610d6SQing Li } 1372096f2786SBjoern A. Zeeb #endif /* FLOWTABLE */ 1373e5c610d6SQing Li 1374d1dd20beSSam Leffler /* XXX mtu manipulation will be done in rnh_addaddr -- itojun */ 1375d1dd20beSSam Leffler rn = rnh->rnh_addaddr(ndst, netmask, rnh, rt->rt_nodes); 1376499676dfSJulian Elischer /* 1377499676dfSJulian Elischer * If it still failed to go into the tree, 1378499676dfSJulian Elischer * then un-make it (this should be a function) 1379499676dfSJulian Elischer */ 138085911824SLuigi Rizzo if (rn == NULL) { 13811099f828SRobert Watson ifa_free(rt->rt_ifa); 1382df8bae1dSRodney W. Grimes Free(rt_key(rt)); 13831ed81b73SMarko Zec uma_zfree(V_rtzone, rt); 1384e5c610d6SQing Li #ifdef FLOWTABLE 1385e5c610d6SQing Li if (rt0 != NULL) 1386e5c610d6SQing Li RTFREE(rt0); 1387e5c610d6SQing Li #endif 1388df8bae1dSRodney W. Grimes senderr(EEXIST); 1389df8bae1dSRodney W. 
Grimes } 1390e5c610d6SQing Li #ifdef FLOWTABLE 1391e5c610d6SQing Li else if (rt0 != NULL) { 13925d6d7e75SGleb Smirnoff flowtable_route_flush(dst->sa_family, rt0); 1393e5c610d6SQing Li RTFREE(rt0); 1394e5c610d6SQing Li } 1395e5c610d6SQing Li #endif 1396499676dfSJulian Elischer 1397499676dfSJulian Elischer /* 1398a0c0e34bSGleb Smirnoff * If this protocol has something to add to this then 1399499676dfSJulian Elischer * allow it to do that as well. 1400499676dfSJulian Elischer */ 1401df8bae1dSRodney W. Grimes if (ifa->ifa_rtrequest) 14028071913dSRuslan Ermilov ifa->ifa_rtrequest(req, rt, info); 1403499676dfSJulian Elischer 1404cd02a0b7SGarrett Wollman /* 1405499676dfSJulian Elischer * actually return a resultant rtentry and 1406499676dfSJulian Elischer * give the caller a single reference. 1407499676dfSJulian Elischer */ 1408df8bae1dSRodney W. Grimes if (ret_nrt) { 1409df8bae1dSRodney W. Grimes *ret_nrt = rt; 14107138d65cSSam Leffler RT_ADDREF(rt); 1411df8bae1dSRodney W. Grimes } 1412d1dd20beSSam Leffler RT_UNLOCK(rt); 1413df8bae1dSRodney W. Grimes break; 1414*c77462ddSAlexander V. Chernikov case RTM_CHANGE: 1415*c77462ddSAlexander V. Chernikov error = rtrequest1_fib_change(rnh, info, ret_nrt, fibnum); 1416*c77462ddSAlexander V. Chernikov break; 14178071913dSRuslan Ermilov default: 14188071913dSRuslan Ermilov error = EOPNOTSUPP; 1419df8bae1dSRodney W. Grimes } 1420df8bae1dSRodney W. Grimes bad: 14213120b9d4SKip Macy if (needlock) 1422956b0b65SJeffrey Hsu RADIX_NODE_HEAD_UNLOCK(rnh); 1423df8bae1dSRodney W. Grimes return (error); 1424d1dd20beSSam Leffler #undef senderr 1425d1dd20beSSam Leffler } 1426d1dd20beSSam Leffler 14278071913dSRuslan Ermilov #undef dst 14288071913dSRuslan Ermilov #undef gateway 14298071913dSRuslan Ermilov #undef netmask 14308071913dSRuslan Ermilov #undef ifaaddr 14318071913dSRuslan Ermilov #undef ifpaddr 14328071913dSRuslan Ermilov #undef flags 1433df8bae1dSRodney W. Grimes 1434*c77462ddSAlexander V. 
Chernikov #define senderr(e) { error = e; goto bad; } 1435*c77462ddSAlexander V. Chernikov static int 1436*c77462ddSAlexander V. Chernikov rtrequest1_fib_change(struct radix_node_head *rnh, struct rt_addrinfo *info, 1437*c77462ddSAlexander V. Chernikov struct rtentry **ret_nrt, u_int fibnum) 1438*c77462ddSAlexander V. Chernikov { 1439*c77462ddSAlexander V. Chernikov struct rtentry *rt = NULL; 1440*c77462ddSAlexander V. Chernikov int error = 0; 1441*c77462ddSAlexander V. Chernikov int free_ifa = 0; 1442*c77462ddSAlexander V. Chernikov 1443*c77462ddSAlexander V. Chernikov rt = (struct rtentry *)rnh->rnh_lookup(info->rti_info[RTAX_DST], 1444*c77462ddSAlexander V. Chernikov info->rti_info[RTAX_NETMASK], rnh); 1445*c77462ddSAlexander V. Chernikov 1446*c77462ddSAlexander V. Chernikov if (rt == NULL) 1447*c77462ddSAlexander V. Chernikov return (ESRCH); 1448*c77462ddSAlexander V. Chernikov 1449*c77462ddSAlexander V. Chernikov #ifdef RADIX_MPATH 1450*c77462ddSAlexander V. Chernikov /* 1451*c77462ddSAlexander V. Chernikov * If we got multipath routes, 1452*c77462ddSAlexander V. Chernikov * we require users to specify a matching RTAX_GATEWAY. 1453*c77462ddSAlexander V. Chernikov */ 1454*c77462ddSAlexander V. Chernikov if (rn_mpath_capable(rnh)) { 1455*c77462ddSAlexander V. Chernikov rt = rt_mpath_matchgate(rt, info->rti_info[RTAX_GATEWAY]); 1456*c77462ddSAlexander V. Chernikov if (rt == NULL) 1457*c77462ddSAlexander V. Chernikov return (ESRCH); 1458*c77462ddSAlexander V. Chernikov } 1459*c77462ddSAlexander V. Chernikov #endif 1460*c77462ddSAlexander V. Chernikov 1461*c77462ddSAlexander V. Chernikov RT_LOCK(rt); 1462*c77462ddSAlexander V. Chernikov 1463*c77462ddSAlexander V. Chernikov /* 1464*c77462ddSAlexander V. Chernikov * New gateway could require new ifaddr, ifp; 1465*c77462ddSAlexander V. Chernikov * flags may also be different; ifp may be specified 1466*c77462ddSAlexander V. Chernikov * by ll sockaddr when protocol address is ambiguous 1467*c77462ddSAlexander V. 
Chernikov */ 1468*c77462ddSAlexander V. Chernikov if (((rt->rt_flags & RTF_GATEWAY) && 1469*c77462ddSAlexander V. Chernikov info->rti_info[RTAX_GATEWAY] != NULL) || 1470*c77462ddSAlexander V. Chernikov info->rti_info[RTAX_IFP] != NULL || 1471*c77462ddSAlexander V. Chernikov (info->rti_info[RTAX_IFA] != NULL && 1472*c77462ddSAlexander V. Chernikov !sa_equal(info->rti_info[RTAX_IFA], rt->rt_ifa->ifa_addr))) { 1473*c77462ddSAlexander V. Chernikov 1474*c77462ddSAlexander V. Chernikov error = rt_getifa_fib(info, fibnum); 1475*c77462ddSAlexander V. Chernikov if (info->rti_ifa != NULL) 1476*c77462ddSAlexander V. Chernikov free_ifa = 1; 1477*c77462ddSAlexander V. Chernikov 1478*c77462ddSAlexander V. Chernikov if (error != 0) 1479*c77462ddSAlexander V. Chernikov senderr(error); 1480*c77462ddSAlexander V. Chernikov } 1481*c77462ddSAlexander V. Chernikov 1482*c77462ddSAlexander V. Chernikov /* Check if outgoing interface has changed */ 1483*c77462ddSAlexander V. Chernikov if (info->rti_ifa != NULL && info->rti_ifa != rt->rt_ifa && 1484*c77462ddSAlexander V. Chernikov rt->rt_ifa != NULL && rt->rt_ifa->ifa_rtrequest != NULL) { 1485*c77462ddSAlexander V. Chernikov rt->rt_ifa->ifa_rtrequest(RTM_DELETE, rt, info); 1486*c77462ddSAlexander V. Chernikov ifa_free(rt->rt_ifa); 1487*c77462ddSAlexander V. Chernikov } 1488*c77462ddSAlexander V. Chernikov /* Update gateway address */ 1489*c77462ddSAlexander V. Chernikov if (info->rti_info[RTAX_GATEWAY] != NULL) { 1490*c77462ddSAlexander V. Chernikov error = rt_setgate(rt, rt_key(rt), info->rti_info[RTAX_GATEWAY]); 1491*c77462ddSAlexander V. Chernikov if (error != 0) 1492*c77462ddSAlexander V. Chernikov senderr(error); 1493*c77462ddSAlexander V. Chernikov 1494*c77462ddSAlexander V. Chernikov rt->rt_flags &= ~RTF_GATEWAY; 1495*c77462ddSAlexander V. Chernikov rt->rt_flags |= (RTF_GATEWAY & info->rti_flags); 1496*c77462ddSAlexander V. Chernikov } 1497*c77462ddSAlexander V. Chernikov 1498*c77462ddSAlexander V. 
Chernikov if (info->rti_ifa != NULL && info->rti_ifa != rt->rt_ifa) { 1499*c77462ddSAlexander V. Chernikov ifa_ref(info->rti_ifa); 1500*c77462ddSAlexander V. Chernikov rt->rt_ifa = info->rti_ifa; 1501*c77462ddSAlexander V. Chernikov rt->rt_ifp = info->rti_ifp; 1502*c77462ddSAlexander V. Chernikov } 1503*c77462ddSAlexander V. Chernikov /* Allow some flags to be toggled on change. */ 1504*c77462ddSAlexander V. Chernikov rt->rt_flags &= ~RTF_FMASK; 1505*c77462ddSAlexander V. Chernikov rt->rt_flags |= info->rti_flags & RTF_FMASK; 1506*c77462ddSAlexander V. Chernikov 1507*c77462ddSAlexander V. Chernikov if (rt->rt_ifa && rt->rt_ifa->ifa_rtrequest != NULL) 1508*c77462ddSAlexander V. Chernikov rt->rt_ifa->ifa_rtrequest(RTM_ADD, rt, info); 1509*c77462ddSAlexander V. Chernikov 1510*c77462ddSAlexander V. Chernikov if (ret_nrt) { 1511*c77462ddSAlexander V. Chernikov *ret_nrt = rt; 1512*c77462ddSAlexander V. Chernikov RT_ADDREF(rt); 1513*c77462ddSAlexander V. Chernikov } 1514*c77462ddSAlexander V. Chernikov bad: 1515*c77462ddSAlexander V. Chernikov RT_UNLOCK(rt); 1516*c77462ddSAlexander V. Chernikov if (free_ifa != 0) 1517*c77462ddSAlexander V. Chernikov ifa_free(info->rti_ifa); 1518*c77462ddSAlexander V. Chernikov return (error); 1519*c77462ddSAlexander V. Chernikov } 1520*c77462ddSAlexander V. Chernikov #undef senderr 1521*c77462ddSAlexander V. Chernikov 1522*c77462ddSAlexander V. Chernikov 1523df8bae1dSRodney W. Grimes int 1524d1dd20beSSam Leffler rt_setgate(struct rtentry *rt, struct sockaddr *dst, struct sockaddr *gate) 1525df8bae1dSRodney W. Grimes { 1526d1dd20beSSam Leffler /* XXX dst may be overwritten, can we move this to below */ 15276e6b3f7cSQing Li int dlen = SA_SIZE(dst), glen = SA_SIZE(gate); 15286e6b3f7cSQing Li #ifdef INVARIANTS 1529c2c2a7c1SBjoern A. Zeeb struct radix_node_head *rnh; 1530c2c2a7c1SBjoern A. Zeeb 1531c2c2a7c1SBjoern A. 
Zeeb rnh = rt_tables_get_rnh(rt->rt_fibnum, dst->sa_family); 15326e6b3f7cSQing Li #endif 1533d1dd20beSSam Leffler 1534d1dd20beSSam Leffler RT_LOCK_ASSERT(rt); 15353120b9d4SKip Macy RADIX_NODE_HEAD_LOCK_ASSERT(rnh); 1536df8bae1dSRodney W. Grimes 15371db1fffaSBill Fenner /* 153885911824SLuigi Rizzo * Prepare to store the gateway in rt->rt_gateway. 153985911824SLuigi Rizzo * Both dst and gateway are stored one after the other in the same 154085911824SLuigi Rizzo * malloc'd chunk. If we have room, we can reuse the old buffer, 154185911824SLuigi Rizzo * rt_gateway already points to the right place. 154285911824SLuigi Rizzo * Otherwise, malloc a new block and update the 'dst' address. 1543499676dfSJulian Elischer */ 154485911824SLuigi Rizzo if (rt->rt_gateway == NULL || glen > SA_SIZE(rt->rt_gateway)) { 154585911824SLuigi Rizzo caddr_t new; 154685911824SLuigi Rizzo 1547df8bae1dSRodney W. Grimes R_Malloc(new, caddr_t, dlen + glen); 154885911824SLuigi Rizzo if (new == NULL) 15491db1fffaSBill Fenner return ENOBUFS; 1550499676dfSJulian Elischer /* 155185911824SLuigi Rizzo * XXX note, we copy from *dst and not *rt_key(rt) because 155285911824SLuigi Rizzo * rt_setgate() can be called to initialize a newly 155385911824SLuigi Rizzo * allocated route entry, in which case rt_key(rt) == NULL 155485911824SLuigi Rizzo * (and also rt->rt_gateway == NULL). 155585911824SLuigi Rizzo * Free()/free() handle a NULL argument just fine. 1556499676dfSJulian Elischer */ 15571838a647SLuigi Rizzo bcopy(dst, new, dlen); 155885911824SLuigi Rizzo Free(rt_key(rt)); /* free old block, if any */ 1559445e045bSAlexander Kabaev rt_key(rt) = (struct sockaddr *)new; 156085911824SLuigi Rizzo rt->rt_gateway = (struct sockaddr *)(new + dlen); 1561df8bae1dSRodney W. Grimes } 1562499676dfSJulian Elischer 1563499676dfSJulian Elischer /* 156485911824SLuigi Rizzo * Copy the new gateway value into the memory chunk. 
156585911824SLuigi Rizzo */ 156685911824SLuigi Rizzo bcopy(gate, rt->rt_gateway, glen); 156785911824SLuigi Rizzo 15686e6b3f7cSQing Li return (0); 1569df8bae1dSRodney W. Grimes } 1570df8bae1dSRodney W. Grimes 1571c7ab6602SQing Li void 1572d1dd20beSSam Leffler rt_maskedcopy(struct sockaddr *src, struct sockaddr *dst, struct sockaddr *netmask) 1573df8bae1dSRodney W. Grimes { 1574df8bae1dSRodney W. Grimes register u_char *cp1 = (u_char *)src; 1575df8bae1dSRodney W. Grimes register u_char *cp2 = (u_char *)dst; 1576df8bae1dSRodney W. Grimes register u_char *cp3 = (u_char *)netmask; 1577df8bae1dSRodney W. Grimes u_char *cplim = cp2 + *cp3; 1578df8bae1dSRodney W. Grimes u_char *cplim2 = cp2 + *cp1; 1579df8bae1dSRodney W. Grimes 1580df8bae1dSRodney W. Grimes *cp2++ = *cp1++; *cp2++ = *cp1++; /* copies sa_len & sa_family */ 1581df8bae1dSRodney W. Grimes cp3 += 2; 1582df8bae1dSRodney W. Grimes if (cplim > cplim2) 1583df8bae1dSRodney W. Grimes cplim = cplim2; 1584df8bae1dSRodney W. Grimes while (cp2 < cplim) 1585df8bae1dSRodney W. Grimes *cp2++ = *cp1++ & *cp3++; 1586df8bae1dSRodney W. Grimes if (cp2 < cplim2) 1587df8bae1dSRodney W. Grimes bzero((caddr_t)cp2, (unsigned)(cplim2 - cp2)); 1588df8bae1dSRodney W. Grimes } 1589df8bae1dSRodney W. Grimes 1590df8bae1dSRodney W. Grimes /* 1591df8bae1dSRodney W. Grimes * Set up a routing table entry, normally 1592df8bae1dSRodney W. Grimes * for an interface. 1593df8bae1dSRodney W. Grimes */ 15948b07e49aSJulian Elischer #define _SOCKADDR_TMPSIZE 128 /* Not too big.. kernel stack size is limited */ 15958b07e49aSJulian Elischer static inline int 15968b07e49aSJulian Elischer rtinit1(struct ifaddr *ifa, int cmd, int flags, int fibnum) 1597df8bae1dSRodney W. 
Grimes { 15985aca0b30SLuigi Rizzo struct sockaddr *dst; 15998071913dSRuslan Ermilov struct sockaddr *netmask; 160085911824SLuigi Rizzo struct rtentry *rt = NULL; 16018071913dSRuslan Ermilov struct rt_addrinfo info; 1602e440aed9SQing Li int error = 0; 16038b07e49aSJulian Elischer int startfib, endfib; 16048b07e49aSJulian Elischer char tempbuf[_SOCKADDR_TMPSIZE]; 16058b07e49aSJulian Elischer int didwork = 0; 16068b07e49aSJulian Elischer int a_failure = 0; 16076e6b3f7cSQing Li static struct sockaddr_dl null_sdl = {sizeof(null_sdl), AF_LINK}; 16083034f43fSAlexander V. Chernikov struct radix_node_head *rnh; 1609df8bae1dSRodney W. Grimes 16108071913dSRuslan Ermilov if (flags & RTF_HOST) { 16118071913dSRuslan Ermilov dst = ifa->ifa_dstaddr; 16128071913dSRuslan Ermilov netmask = NULL; 16138071913dSRuslan Ermilov } else { 16148071913dSRuslan Ermilov dst = ifa->ifa_addr; 16158071913dSRuslan Ermilov netmask = ifa->ifa_netmask; 16168071913dSRuslan Ermilov } 1617b3dd0771SBjoern A. Zeeb if (dst->sa_len == 0) 1618b3dd0771SBjoern A. Zeeb return(EINVAL); 1619b680a383SBjoern A. Zeeb switch (dst->sa_family) { 1620b680a383SBjoern A. Zeeb case AF_INET6: 1621b680a383SBjoern A. Zeeb case AF_INET: 1622b680a383SBjoern A. Zeeb /* We support multiple FIBs. */ 1623b680a383SBjoern A. Zeeb break; 1624b680a383SBjoern A. Zeeb default: 1625b680a383SBjoern A. Zeeb fibnum = RT_DEFAULT_FIB; 1626b680a383SBjoern A. Zeeb break; 1627b680a383SBjoern A. Zeeb } 16287d9b6df1SAlexander V. 
Chernikov if (fibnum == RT_ALL_FIBS) { 162966e8505fSJulian Elischer if (rt_add_addr_allfibs == 0 && cmd == (int)RTM_ADD) { 16300489b891SAlan Somers startfib = endfib = ifa->ifa_ifp->if_fib; 163166e8505fSJulian Elischer } else { 16328b07e49aSJulian Elischer startfib = 0; 16338b07e49aSJulian Elischer endfib = rt_numfibs - 1; 163466e8505fSJulian Elischer } 16358b07e49aSJulian Elischer } else { 16368b07e49aSJulian Elischer KASSERT((fibnum < rt_numfibs), ("rtinit1: bad fibnum")); 16378b07e49aSJulian Elischer startfib = fibnum; 16388b07e49aSJulian Elischer endfib = fibnum; 16398b07e49aSJulian Elischer } 1640ac4a76ebSBjoern A. Zeeb 1641b0a76b88SJulian Elischer /* 16428b07e49aSJulian Elischer * If it's a delete, check that if it exists, 16438b07e49aSJulian Elischer * it's on the correct interface or we might scrub 16448b07e49aSJulian Elischer * a route to another ifa which would 1645b0a76b88SJulian Elischer * be confusing at best and possibly worse. 1646b0a76b88SJulian Elischer */ 1647df8bae1dSRodney W. Grimes if (cmd == RTM_DELETE) { 1648b0a76b88SJulian Elischer /* 1649b0a76b88SJulian Elischer * It's a delete, so it should already exist.. 1650b0a76b88SJulian Elischer * If it's a net, mask off the host bits 1651b0a76b88SJulian Elischer * (Assuming we have a mask) 16528b07e49aSJulian Elischer * XXX this is kinda inet specific.. 1653b0a76b88SJulian Elischer */ 16548071913dSRuslan Ermilov if (netmask != NULL) { 16558b07e49aSJulian Elischer rt_maskedcopy(dst, (struct sockaddr *)tempbuf, netmask); 16568b07e49aSJulian Elischer dst = (struct sockaddr *)tempbuf; 1657df8bae1dSRodney W. Grimes } 16588b07e49aSJulian Elischer } 16598b07e49aSJulian Elischer /* 16608b07e49aSJulian Elischer * Now go through all the requested tables (fibs) and do the 16618b07e49aSJulian Elischer * requested action. Realistically, this will either be fib 0 16628b07e49aSJulian Elischer * for protocols that don't do multiple tables or all the 1663a8498625SBjoern A. Zeeb * tables for those that do. 
16648b07e49aSJulian Elischer */ 16658b07e49aSJulian Elischer for ( fibnum = startfib; fibnum <= endfib; fibnum++) { 16668b07e49aSJulian Elischer if (cmd == RTM_DELETE) { 16678b07e49aSJulian Elischer struct radix_node *rn; 1668b0a76b88SJulian Elischer /* 16698071913dSRuslan Ermilov * Look up an rtentry that is in the routing tree and 16708071913dSRuslan Ermilov * contains the correct info. 1671b0a76b88SJulian Elischer */ 1672c2c2a7c1SBjoern A. Zeeb rnh = rt_tables_get_rnh(fibnum, dst->sa_family); 1673c2c2a7c1SBjoern A. Zeeb if (rnh == NULL) 16748b07e49aSJulian Elischer /* this table doesn't exist but others might */ 16758b07e49aSJulian Elischer continue; 167614126522SAlexander V. Chernikov RADIX_NODE_HEAD_RLOCK(rnh); 1677034c09ffSAlexander V. Chernikov rn = rnh->rnh_lookup(dst, netmask, rnh); 1678e440aed9SQing Li #ifdef RADIX_MPATH 1679e440aed9SQing Li if (rn_mpath_capable(rnh)) { 1680e440aed9SQing Li 1681e440aed9SQing Li if (rn == NULL) 1682e440aed9SQing Li error = ESRCH; 1683e440aed9SQing Li else { 1684e440aed9SQing Li rt = RNTORT(rn); 1685e440aed9SQing Li /* 16868b07e49aSJulian Elischer * for interface route the 16878b07e49aSJulian Elischer * rt->rt_gateway is sockaddr_intf 16888b07e49aSJulian Elischer * for cloning ARP entries, so 16898b07e49aSJulian Elischer * rt_mpath_matchgate must use the 16908b07e49aSJulian Elischer * interface address 1691e440aed9SQing Li */ 16928b07e49aSJulian Elischer rt = rt_mpath_matchgate(rt, 16938b07e49aSJulian Elischer ifa->ifa_addr); 1694034c09ffSAlexander V. Chernikov if (rt == NULL) 1695e440aed9SQing Li error = ESRCH; 1696e440aed9SQing Li } 1697e440aed9SQing Li } 1698e440aed9SQing Li #endif 16998b07e49aSJulian Elischer error = (rn == NULL || 17008071913dSRuslan Ermilov (rn->rn_flags & RNF_ROOT) || 17015a2f4cbdSAlexander V. Chernikov RNTORT(rn)->rt_ifa != ifa); 170214126522SAlexander V. 
Chernikov RADIX_NODE_HEAD_RUNLOCK(rnh); 1703956b0b65SJeffrey Hsu if (error) { 17048b07e49aSJulian Elischer /* this is only an error if bad on ALL tables */ 17058b07e49aSJulian Elischer continue; 1706df8bae1dSRodney W. Grimes } 1707b0a76b88SJulian Elischer } 1708b0a76b88SJulian Elischer /* 1709b0a76b88SJulian Elischer * Do the actual request 1710b0a76b88SJulian Elischer */ 17118071913dSRuslan Ermilov bzero((caddr_t)&info, sizeof(info)); 17128071913dSRuslan Ermilov info.rti_ifa = ifa; 17133034f43fSAlexander V. Chernikov info.rti_flags = flags | 17143034f43fSAlexander V. Chernikov (ifa->ifa_flags & ~IFA_RTSELF) | RTF_PINNED; 17158071913dSRuslan Ermilov info.rti_info[RTAX_DST] = dst; 17166e6b3f7cSQing Li /* 17176e6b3f7cSQing Li * doing this for compatibility reasons 17186e6b3f7cSQing Li */ 17196e6b3f7cSQing Li if (cmd == RTM_ADD) 17206e6b3f7cSQing Li info.rti_info[RTAX_GATEWAY] = 17216e6b3f7cSQing Li (struct sockaddr *)&null_sdl; 17226e6b3f7cSQing Li else 17238071913dSRuslan Ermilov info.rti_info[RTAX_GATEWAY] = ifa->ifa_addr; 17248071913dSRuslan Ermilov info.rti_info[RTAX_NETMASK] = netmask; 17258b07e49aSJulian Elischer error = rtrequest1_fib(cmd, &info, &rt, fibnum); 17263034f43fSAlexander V. Chernikov 17273034f43fSAlexander V. Chernikov if ((error == EEXIST) && (cmd == RTM_ADD)) { 17283034f43fSAlexander V. Chernikov /* 17293034f43fSAlexander V. Chernikov * Interface route addition failed. 17303034f43fSAlexander V. Chernikov * Atomically delete current prefix generating 17313034f43fSAlexander V. Chernikov * RTM_DELETE message, and retry adding 17323034f43fSAlexander V. Chernikov * interface prefix. 17333034f43fSAlexander V. Chernikov */ 17343034f43fSAlexander V. Chernikov rnh = rt_tables_get_rnh(fibnum, dst->sa_family); 17353034f43fSAlexander V. Chernikov RADIX_NODE_HEAD_LOCK(rnh); 17363034f43fSAlexander V. Chernikov 17373034f43fSAlexander V. Chernikov /* Delete old prefix */ 17383034f43fSAlexander V. Chernikov info.rti_ifa = NULL; 17393034f43fSAlexander V. 
Chernikov info.rti_flags = RTF_RNH_LOCKED; 17403034f43fSAlexander V. Chernikov 1741d54455b0SAlexander V. Chernikov error = rtrequest1_fib(RTM_DELETE, &info, NULL, fibnum); 17423034f43fSAlexander V. Chernikov if (error == 0) { 17433034f43fSAlexander V. Chernikov info.rti_ifa = ifa; 17443034f43fSAlexander V. Chernikov info.rti_flags = flags | RTF_RNH_LOCKED | 17453034f43fSAlexander V. Chernikov (ifa->ifa_flags & ~IFA_RTSELF) | RTF_PINNED; 17463034f43fSAlexander V. Chernikov error = rtrequest1_fib(cmd, &info, &rt, fibnum); 17473034f43fSAlexander V. Chernikov } 17483034f43fSAlexander V. Chernikov 17493034f43fSAlexander V. Chernikov RADIX_NODE_HEAD_UNLOCK(rnh); 17503034f43fSAlexander V. Chernikov } 17513034f43fSAlexander V. Chernikov 17523034f43fSAlexander V. Chernikov 17535aca0b30SLuigi Rizzo if (error == 0 && rt != NULL) { 17548071913dSRuslan Ermilov /* 17556f99b44cSBrian Somers * notify any listening routing agents of the change 17568071913dSRuslan Ermilov */ 1757d1dd20beSSam Leffler RT_LOCK(rt); 1758e440aed9SQing Li #ifdef RADIX_MPATH 1759e440aed9SQing Li /* 1760e440aed9SQing Li * in case address alias finds the first address 17618d74af36SBjoern A. Zeeb * e.g. ifconfig bge0 192.0.2.246/24 17628d74af36SBjoern A. Zeeb * e.g. ifconfig bge0 192.0.2.247/24 17638d74af36SBjoern A. Zeeb * the address set in the route is 192.0.2.246 17648d74af36SBjoern A. 
Zeeb * so we need to replace it with 192.0.2.247 1765e440aed9SQing Li */ 17668b07e49aSJulian Elischer if (memcmp(rt->rt_ifa->ifa_addr, 17678b07e49aSJulian Elischer ifa->ifa_addr, ifa->ifa_addr->sa_len)) { 17681099f828SRobert Watson ifa_free(rt->rt_ifa); 17691099f828SRobert Watson ifa_ref(ifa); 1770e440aed9SQing Li rt->rt_ifp = ifa->ifa_ifp; 1771e440aed9SQing Li rt->rt_ifa = ifa; 1772e440aed9SQing Li } 1773e440aed9SQing Li #endif 17746e6b3f7cSQing Li /* 17756e6b3f7cSQing Li * doing this for compatibility reasons 17766e6b3f7cSQing Li */ 17776e6b3f7cSQing Li if (cmd == RTM_ADD) { 17786e6b3f7cSQing Li ((struct sockaddr_dl *)rt->rt_gateway)->sdl_type = 17796e6b3f7cSQing Li rt->rt_ifp->if_type; 17806e6b3f7cSQing Li ((struct sockaddr_dl *)rt->rt_gateway)->sdl_index = 17816e6b3f7cSQing Li rt->rt_ifp->if_index; 17826e6b3f7cSQing Li } 17837f279720SMichael Tuexen RT_ADDREF(rt); 17847f279720SMichael Tuexen RT_UNLOCK(rt); 1785528737fdSBjoern A. Zeeb rt_newaddrmsg_fib(cmd, ifa, error, rt, fibnum); 17867f279720SMichael Tuexen RT_LOCK(rt); 17877f279720SMichael Tuexen RT_REMREF(rt); 17888071913dSRuslan Ermilov if (cmd == RTM_DELETE) { 1789b0a76b88SJulian Elischer /* 17908b07e49aSJulian Elischer * If we are deleting, and we found an entry, 17918b07e49aSJulian Elischer * then it's been removed from the tree.. 17928b07e49aSJulian Elischer * now throw it away. 1793b0a76b88SJulian Elischer */ 1794d1dd20beSSam Leffler RTFREE_LOCKED(rt); 1795d1dd20beSSam Leffler } else { 1796d1dd20beSSam Leffler if (cmd == RTM_ADD) { 1797b0a76b88SJulian Elischer /* 17988b07e49aSJulian Elischer * We just wanted to add it.. 17998b07e49aSJulian Elischer * we don't actually need a reference. 1800b0a76b88SJulian Elischer */ 18017138d65cSSam Leffler RT_REMREF(rt); 1802df8bae1dSRodney W. Grimes } 1803d1dd20beSSam Leffler RT_UNLOCK(rt); 1804d1dd20beSSam Leffler } 18058b07e49aSJulian Elischer didwork = 1; 1806df8bae1dSRodney W. 
Grimes } 18078b07e49aSJulian Elischer if (error) 18088b07e49aSJulian Elischer a_failure = error; 18098b07e49aSJulian Elischer } 18108b07e49aSJulian Elischer if (cmd == RTM_DELETE) { 18118b07e49aSJulian Elischer if (didwork) { 18128b07e49aSJulian Elischer error = 0; 18138b07e49aSJulian Elischer } else { 18148b07e49aSJulian Elischer /* we only give an error if it wasn't in any table */ 18158b07e49aSJulian Elischer error = ((flags & RTF_HOST) ? 18168b07e49aSJulian Elischer EHOSTUNREACH : ENETUNREACH); 18178b07e49aSJulian Elischer } 18188b07e49aSJulian Elischer } else { 18198b07e49aSJulian Elischer if (a_failure) { 18208b07e49aSJulian Elischer /* return an error if any of them failed */ 18218b07e49aSJulian Elischer error = a_failure; 18228b07e49aSJulian Elischer } 18238b07e49aSJulian Elischer } 18243ec66d6cSDavid Greenman return (error); 18253ec66d6cSDavid Greenman } 1826cb64988fSLuoqi Chen 18278b07e49aSJulian Elischer /* 18288b07e49aSJulian Elischer * Set up a routing table entry, normally 18298b07e49aSJulian Elischer * for an interface. 18308b07e49aSJulian Elischer */ 18318b07e49aSJulian Elischer int 18328b07e49aSJulian Elischer rtinit(struct ifaddr *ifa, int cmd, int flags) 18338b07e49aSJulian Elischer { 18348b07e49aSJulian Elischer struct sockaddr *dst; 1835a8498625SBjoern A. Zeeb int fib = RT_DEFAULT_FIB; 18368b07e49aSJulian Elischer 18378b07e49aSJulian Elischer if (flags & RTF_HOST) { 18388b07e49aSJulian Elischer dst = ifa->ifa_dstaddr; 18398b07e49aSJulian Elischer } else { 18408b07e49aSJulian Elischer dst = ifa->ifa_addr; 18418b07e49aSJulian Elischer } 18428b07e49aSJulian Elischer 1843b680a383SBjoern A. Zeeb switch (dst->sa_family) { 1844b680a383SBjoern A. Zeeb case AF_INET6: 1845b680a383SBjoern A. Zeeb case AF_INET: 1846b680a383SBjoern A. Zeeb /* We do support multiple FIBs. */ 18477d9b6df1SAlexander V. Chernikov fib = RT_ALL_FIBS; 1848b680a383SBjoern A. Zeeb break; 1849b680a383SBjoern A. 
Zeeb } 18508b07e49aSJulian Elischer return (rtinit1(ifa, cmd, flags, fib)); 18518b07e49aSJulian Elischer } 18524cbac30bSAlexander V. Chernikov 18534cbac30bSAlexander V. Chernikov /* 18544cbac30bSAlexander V. Chernikov * Announce interface address arrival/withdraw 18554cbac30bSAlexander V. Chernikov * Returns 0 on success. 18564cbac30bSAlexander V. Chernikov */ 18574cbac30bSAlexander V. Chernikov int 18584cbac30bSAlexander V. Chernikov rt_addrmsg(int cmd, struct ifaddr *ifa, int fibnum) 18594cbac30bSAlexander V. Chernikov { 18604cbac30bSAlexander V. Chernikov 18614cbac30bSAlexander V. Chernikov KASSERT(cmd == RTM_ADD || cmd == RTM_DELETE, 1862d375edc9SAlexander V. Chernikov ("unexpected cmd %d", cmd)); 18634cbac30bSAlexander V. Chernikov 1864d375edc9SAlexander V. Chernikov KASSERT(fibnum == RT_ALL_FIBS || (fibnum >= 0 && fibnum < rt_numfibs), 1865d375edc9SAlexander V. Chernikov ("%s: fib out of range 0 <=%d<%d", __func__, fibnum, rt_numfibs)); 18664cbac30bSAlexander V. Chernikov 18677f946da0SMichael Tuexen #if defined(INET) || defined(INET6) 18687f946da0SMichael Tuexen #ifdef SCTP 18697f946da0SMichael Tuexen /* 18707f946da0SMichael Tuexen * notify the SCTP stack 18717f946da0SMichael Tuexen * this will only get called when an address is added/deleted 18727f946da0SMichael Tuexen * XXX pass the ifaddr struct instead if ifa->ifa_addr... 18737f946da0SMichael Tuexen */ 18747f946da0SMichael Tuexen sctp_addr_change(ifa, cmd); 18757f946da0SMichael Tuexen #endif /* SCTP */ 18767f946da0SMichael Tuexen #endif 18774cbac30bSAlexander V. Chernikov return (rtsock_addrmsg(cmd, ifa, fibnum)); 18784cbac30bSAlexander V. Chernikov } 18794cbac30bSAlexander V. Chernikov 18804cbac30bSAlexander V. Chernikov /* 1881d375edc9SAlexander V. Chernikov * Announce route addition/removal. 18824cbac30bSAlexander V. Chernikov * Users of this function MUST validate input data BEFORE calling. 18834cbac30bSAlexander V. 
Chernikov * However we have to be able to handle invalid data: 18844cbac30bSAlexander V. Chernikov * if some userland app sends us "invalid" route message (invalid mask, 1885d375edc9SAlexander V. Chernikov * no dst, wrong address families, etc...) we need to pass it back 18864cbac30bSAlexander V. Chernikov * to app (and any other rtsock consumers) with rtm_errno field set to 18874cbac30bSAlexander V. Chernikov * non-zero value. 18884cbac30bSAlexander V. Chernikov * Returns 0 on success. 18894cbac30bSAlexander V. Chernikov */ 18904cbac30bSAlexander V. Chernikov int 18914cbac30bSAlexander V. Chernikov rt_routemsg(int cmd, struct ifnet *ifp, int error, struct rtentry *rt, 18924cbac30bSAlexander V. Chernikov int fibnum) 18934cbac30bSAlexander V. Chernikov { 18944cbac30bSAlexander V. Chernikov 18954cbac30bSAlexander V. Chernikov KASSERT(cmd == RTM_ADD || cmd == RTM_DELETE, 1896d375edc9SAlexander V. Chernikov ("unexpected cmd %d", cmd)); 18974cbac30bSAlexander V. Chernikov 1898d375edc9SAlexander V. Chernikov KASSERT(fibnum == RT_ALL_FIBS || (fibnum >= 0 && fibnum < rt_numfibs), 1899d375edc9SAlexander V. Chernikov ("%s: fib out of range 0 <=%d<%d", __func__, fibnum, rt_numfibs)); 19004cbac30bSAlexander V. Chernikov 19014cbac30bSAlexander V. Chernikov KASSERT(rt_key(rt) != NULL, (":%s: rt_key must be supplied", __func__)); 19024cbac30bSAlexander V. Chernikov 19034cbac30bSAlexander V. Chernikov return (rtsock_routemsg(cmd, ifp, error, rt, fibnum)); 19044cbac30bSAlexander V. Chernikov } 19054cbac30bSAlexander V. Chernikov 19064cbac30bSAlexander V. Chernikov void 19074cbac30bSAlexander V. Chernikov rt_newaddrmsg(int cmd, struct ifaddr *ifa, int error, struct rtentry *rt) 19084cbac30bSAlexander V. Chernikov { 19094cbac30bSAlexander V. Chernikov 19104cbac30bSAlexander V. Chernikov rt_newaddrmsg_fib(cmd, ifa, error, rt, RT_ALL_FIBS); 19114cbac30bSAlexander V. Chernikov } 19124cbac30bSAlexander V. Chernikov 19134cbac30bSAlexander V. Chernikov /* 19144cbac30bSAlexander V. 
Chernikov * This is called to generate messages from the routing socket 19154cbac30bSAlexander V. Chernikov * indicating a network interface has had addresses associated with it. 19164cbac30bSAlexander V. Chernikov */ 19174cbac30bSAlexander V. Chernikov void 19184cbac30bSAlexander V. Chernikov rt_newaddrmsg_fib(int cmd, struct ifaddr *ifa, int error, struct rtentry *rt, 19194cbac30bSAlexander V. Chernikov int fibnum) 19204cbac30bSAlexander V. Chernikov { 19214cbac30bSAlexander V. Chernikov 19224cbac30bSAlexander V. Chernikov KASSERT(cmd == RTM_ADD || cmd == RTM_DELETE, 19234cbac30bSAlexander V. Chernikov ("unexpected cmd %u", cmd)); 1924d375edc9SAlexander V. Chernikov KASSERT(fibnum == RT_ALL_FIBS || (fibnum >= 0 && fibnum < rt_numfibs), 1925d375edc9SAlexander V. Chernikov ("%s: fib out of range 0 <=%d<%d", __func__, fibnum, rt_numfibs)); 19264cbac30bSAlexander V. Chernikov 19274cbac30bSAlexander V. Chernikov if (cmd == RTM_ADD) { 19284cbac30bSAlexander V. Chernikov rt_addrmsg(cmd, ifa, fibnum); 19294cbac30bSAlexander V. Chernikov if (rt != NULL) 19304cbac30bSAlexander V. Chernikov rt_routemsg(cmd, ifa->ifa_ifp, error, rt, fibnum); 19314cbac30bSAlexander V. Chernikov } else { 19324cbac30bSAlexander V. Chernikov if (rt != NULL) 19334cbac30bSAlexander V. Chernikov rt_routemsg(cmd, ifa->ifa_ifp, error, rt, fibnum); 19344cbac30bSAlexander V. Chernikov rt_addrmsg(cmd, ifa, fibnum); 19354cbac30bSAlexander V. Chernikov } 19364cbac30bSAlexander V. Chernikov } 19374cbac30bSAlexander V. Chernikov 1938