1*65ff3638SAlexander V. Chernikov /*- 2*65ff3638SAlexander V. Chernikov * Copyright (c) 2015 3*65ff3638SAlexander V. Chernikov * Alexander V. Chernikov <melifaro@FreeBSD.org> 4*65ff3638SAlexander V. Chernikov * 5*65ff3638SAlexander V. Chernikov * Redistribution and use in source and binary forms, with or without 6*65ff3638SAlexander V. Chernikov * modification, are permitted provided that the following conditions 7*65ff3638SAlexander V. Chernikov * are met: 8*65ff3638SAlexander V. Chernikov * 1. Redistributions of source code must retain the above copyright 9*65ff3638SAlexander V. Chernikov * notice, this list of conditions and the following disclaimer. 10*65ff3638SAlexander V. Chernikov * 2. Redistributions in binary form must reproduce the above copyright 11*65ff3638SAlexander V. Chernikov * notice, this list of conditions and the following disclaimer in the 12*65ff3638SAlexander V. Chernikov * documentation and/or other materials provided with the distribution. 13*65ff3638SAlexander V. Chernikov * 4. Neither the name of the University nor the names of its contributors 14*65ff3638SAlexander V. Chernikov * may be used to endorse or promote products derived from this software 15*65ff3638SAlexander V. Chernikov * without specific prior written permission. 16*65ff3638SAlexander V. Chernikov * 17*65ff3638SAlexander V. Chernikov * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18*65ff3638SAlexander V. Chernikov * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19*65ff3638SAlexander V. Chernikov * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20*65ff3638SAlexander V. Chernikov * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21*65ff3638SAlexander V. Chernikov * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22*65ff3638SAlexander V. Chernikov * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23*65ff3638SAlexander V. Chernikov * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24*65ff3638SAlexander V. Chernikov * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25*65ff3638SAlexander V. Chernikov * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26*65ff3638SAlexander V. Chernikov * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27*65ff3638SAlexander V. Chernikov * SUCH DAMAGE. 28*65ff3638SAlexander V. Chernikov */ 29*65ff3638SAlexander V. Chernikov 30*65ff3638SAlexander V. Chernikov #include <sys/cdefs.h> 31*65ff3638SAlexander V. Chernikov __FBSDID("$FreeBSD$"); 32*65ff3638SAlexander V. Chernikov 33*65ff3638SAlexander V. Chernikov #include "opt_inet.h" 34*65ff3638SAlexander V. Chernikov #include "opt_inet6.h" 35*65ff3638SAlexander V. Chernikov #include "opt_route.h" 36*65ff3638SAlexander V. Chernikov #include "opt_mpath.h" 37*65ff3638SAlexander V. Chernikov 38*65ff3638SAlexander V. Chernikov #include <sys/param.h> 39*65ff3638SAlexander V. Chernikov #include <sys/systm.h> 40*65ff3638SAlexander V. Chernikov #include <sys/lock.h> 41*65ff3638SAlexander V. Chernikov #include <sys/rwlock.h> 42*65ff3638SAlexander V. Chernikov #include <sys/malloc.h> 43*65ff3638SAlexander V. Chernikov #include <sys/mbuf.h> 44*65ff3638SAlexander V. Chernikov #include <sys/socket.h> 45*65ff3638SAlexander V. Chernikov #include <sys/sysctl.h> 46*65ff3638SAlexander V. Chernikov #include <sys/kernel.h> 47*65ff3638SAlexander V. Chernikov 48*65ff3638SAlexander V. Chernikov #include <net/if.h> 49*65ff3638SAlexander V. Chernikov #include <net/if_var.h> 50*65ff3638SAlexander V. Chernikov #include <net/if_dl.h> 51*65ff3638SAlexander V. Chernikov #include <net/route.h> 52*65ff3638SAlexander V. Chernikov #include <net/vnet.h> 53*65ff3638SAlexander V. Chernikov 54*65ff3638SAlexander V. Chernikov #ifdef RADIX_MPATH 55*65ff3638SAlexander V. Chernikov #include <net/radix_mpath.h> 56*65ff3638SAlexander V. Chernikov #endif 57*65ff3638SAlexander V. Chernikov 58*65ff3638SAlexander V. Chernikov #include <netinet/in.h> 59*65ff3638SAlexander V. Chernikov #include <netinet/in_var.h> 60*65ff3638SAlexander V. Chernikov #include <netinet/ip_mroute.h> 61*65ff3638SAlexander V. Chernikov #include <netinet/ip6.h> 62*65ff3638SAlexander V. Chernikov #include <netinet6/in6_fib.h> 63*65ff3638SAlexander V. Chernikov #include <netinet6/in6_var.h> 64*65ff3638SAlexander V. Chernikov #include <netinet6/nd6.h> 65*65ff3638SAlexander V. Chernikov #include <netinet6/scope6_var.h> 66*65ff3638SAlexander V. Chernikov 67*65ff3638SAlexander V. Chernikov #include <net/if_types.h> 68*65ff3638SAlexander V. Chernikov 69*65ff3638SAlexander V. Chernikov #ifdef INET6 70*65ff3638SAlexander V. Chernikov static void fib6_rte_to_nh_extended(struct rtentry *rte, 71*65ff3638SAlexander V. Chernikov const struct in6_addr *dst, uint32_t flags, struct nhop6_extended *pnh6); 72*65ff3638SAlexander V. Chernikov static void fib6_rte_to_nh_basic(struct rtentry *rte, const struct in6_addr *dst, 73*65ff3638SAlexander V. Chernikov uint32_t flags, struct nhop6_basic *pnh6); 74*65ff3638SAlexander V. Chernikov static struct ifnet *fib6_get_ifaifp(struct rtentry *rte); 75*65ff3638SAlexander V. Chernikov #define RNTORT(p) ((struct rtentry *)(p)) 76*65ff3638SAlexander V. Chernikov 77*65ff3638SAlexander V. Chernikov /* 78*65ff3638SAlexander V. Chernikov * Gets real interface for the @rte. 79*65ff3638SAlexander V. Chernikov * Returns rt_ifp for !IFF_LOOPBACK routers. 80*65ff3638SAlexander V. Chernikov * Extracts "real" address interface from interface address 81*65ff3638SAlexander V. Chernikov * loopback routes. 82*65ff3638SAlexander V. Chernikov */ 83*65ff3638SAlexander V. Chernikov static struct ifnet * 84*65ff3638SAlexander V. Chernikov fib6_get_ifaifp(struct rtentry *rte) 85*65ff3638SAlexander V. Chernikov { 86*65ff3638SAlexander V. Chernikov struct ifnet *ifp; 87*65ff3638SAlexander V. Chernikov struct sockaddr_dl *sdl; 88*65ff3638SAlexander V. Chernikov 89*65ff3638SAlexander V. Chernikov ifp = rte->rt_ifp; 90*65ff3638SAlexander V. Chernikov if ((ifp->if_flags & IFF_LOOPBACK) && 91*65ff3638SAlexander V. Chernikov rte->rt_gateway->sa_family == AF_LINK) { 92*65ff3638SAlexander V. Chernikov sdl = (struct sockaddr_dl *)rte->rt_gateway; 93*65ff3638SAlexander V. Chernikov return (ifnet_byindex(sdl->sdl_index)); 94*65ff3638SAlexander V. Chernikov } 95*65ff3638SAlexander V. Chernikov 96*65ff3638SAlexander V. Chernikov return (ifp); 97*65ff3638SAlexander V. Chernikov } 98*65ff3638SAlexander V. Chernikov 99*65ff3638SAlexander V. Chernikov static void 100*65ff3638SAlexander V. Chernikov fib6_rte_to_nh_basic(struct rtentry *rte, const struct in6_addr *dst, 101*65ff3638SAlexander V. Chernikov uint32_t flags, struct nhop6_basic *pnh6) 102*65ff3638SAlexander V. Chernikov { 103*65ff3638SAlexander V. Chernikov struct sockaddr_in6 *gw; 104*65ff3638SAlexander V. Chernikov 105*65ff3638SAlexander V. Chernikov /* Do explicit nexthop zero unless we're copying it */ 106*65ff3638SAlexander V. Chernikov memset(pnh6, 0, sizeof(*pnh6)); 107*65ff3638SAlexander V. Chernikov 108*65ff3638SAlexander V. Chernikov if ((flags & NHR_IFAIF) != 0) 109*65ff3638SAlexander V. Chernikov pnh6->nh_ifp = fib6_get_ifaifp(rte); 110*65ff3638SAlexander V. Chernikov else 111*65ff3638SAlexander V. Chernikov pnh6->nh_ifp = rte->rt_ifp; 112*65ff3638SAlexander V. Chernikov 113*65ff3638SAlexander V. Chernikov pnh6->nh_mtu = min(rte->rt_mtu, IN6_LINKMTU(rte->rt_ifp)); 114*65ff3638SAlexander V. Chernikov if (rte->rt_flags & RTF_GATEWAY) { 115*65ff3638SAlexander V. Chernikov gw = (struct sockaddr_in6 *)rte->rt_gateway; 116*65ff3638SAlexander V. Chernikov pnh6->nh_addr = gw->sin6_addr; 117*65ff3638SAlexander V. Chernikov in6_clearscope(&pnh6->nh_addr); 118*65ff3638SAlexander V. Chernikov } else 119*65ff3638SAlexander V. Chernikov pnh6->nh_addr = *dst; 120*65ff3638SAlexander V. Chernikov /* Set flags */ 121*65ff3638SAlexander V. Chernikov pnh6->nh_flags = fib_rte_to_nh_flags(rte->rt_flags); 122*65ff3638SAlexander V. Chernikov gw = (struct sockaddr_in6 *)rt_key(rte); 123*65ff3638SAlexander V. Chernikov if (IN6_IS_ADDR_UNSPECIFIED(&gw->sin6_addr)) 124*65ff3638SAlexander V. Chernikov pnh6->nh_flags |= NHF_DEFAULT; 125*65ff3638SAlexander V. Chernikov } 126*65ff3638SAlexander V. Chernikov 127*65ff3638SAlexander V. Chernikov static void 128*65ff3638SAlexander V. Chernikov fib6_rte_to_nh_extended(struct rtentry *rte, const struct in6_addr *dst, 129*65ff3638SAlexander V. Chernikov uint32_t flags, struct nhop6_extended *pnh6) 130*65ff3638SAlexander V. Chernikov { 131*65ff3638SAlexander V. Chernikov struct sockaddr_in6 *gw; 132*65ff3638SAlexander V. Chernikov 133*65ff3638SAlexander V. Chernikov /* Do explicit nexthop zero unless we're copying it */ 134*65ff3638SAlexander V. Chernikov memset(pnh6, 0, sizeof(*pnh6)); 135*65ff3638SAlexander V. Chernikov 136*65ff3638SAlexander V. Chernikov if ((flags & NHR_IFAIF) != 0) 137*65ff3638SAlexander V. Chernikov pnh6->nh_ifp = fib6_get_ifaifp(rte); 138*65ff3638SAlexander V. Chernikov else 139*65ff3638SAlexander V. Chernikov pnh6->nh_ifp = rte->rt_ifp; 140*65ff3638SAlexander V. Chernikov 141*65ff3638SAlexander V. Chernikov pnh6->nh_mtu = min(rte->rt_mtu, IN6_LINKMTU(rte->rt_ifp)); 142*65ff3638SAlexander V. Chernikov if (rte->rt_flags & RTF_GATEWAY) { 143*65ff3638SAlexander V. Chernikov gw = (struct sockaddr_in6 *)rte->rt_gateway; 144*65ff3638SAlexander V. Chernikov pnh6->nh_addr = gw->sin6_addr; 145*65ff3638SAlexander V. Chernikov in6_clearscope(&pnh6->nh_addr); 146*65ff3638SAlexander V. Chernikov } else 147*65ff3638SAlexander V. Chernikov pnh6->nh_addr = *dst; 148*65ff3638SAlexander V. Chernikov /* Set flags */ 149*65ff3638SAlexander V. Chernikov pnh6->nh_flags = fib_rte_to_nh_flags(rte->rt_flags); 150*65ff3638SAlexander V. Chernikov gw = (struct sockaddr_in6 *)rt_key(rte); 151*65ff3638SAlexander V. Chernikov if (IN6_IS_ADDR_UNSPECIFIED(&gw->sin6_addr)) 152*65ff3638SAlexander V. Chernikov pnh6->nh_flags |= NHF_DEFAULT; 153*65ff3638SAlexander V. Chernikov } 154*65ff3638SAlexander V. Chernikov 155*65ff3638SAlexander V. Chernikov /* 156*65ff3638SAlexander V. Chernikov * Performs IPv6 route table lookup on @dst. Returns 0 on success. 157*65ff3638SAlexander V. Chernikov * Stores basic nexthop info into provided @pnh6 structure. 158*65ff3638SAlexander V. Chernikov * Note that 159*65ff3638SAlexander V. Chernikov * - nh_ifp represents logical transmit interface (rt_ifp) by default 160*65ff3638SAlexander V. Chernikov * - nh_ifp represents "address" interface if NHR_IFAIF flag is passed 161*65ff3638SAlexander V. Chernikov * - mtu from logical transmit interface will be returned. 162*65ff3638SAlexander V. Chernikov * - nh_ifp cannot be safely dereferenced 163*65ff3638SAlexander V. Chernikov * - nh_ifp represents rt_ifp (e.g. if looking up address on 164*65ff3638SAlexander V. Chernikov * interface "ix0" pointer to "ix0" interface will be returned instead 165*65ff3638SAlexander V. Chernikov * of "lo0") 166*65ff3638SAlexander V. Chernikov * - howewer mtu from "transmit" interface will be returned. 167*65ff3638SAlexander V. Chernikov */ 168*65ff3638SAlexander V. Chernikov int 169*65ff3638SAlexander V. Chernikov fib6_lookup_nh_basic(uint32_t fibnum, const struct in6_addr *dst, uint32_t scopeid, 170*65ff3638SAlexander V. Chernikov uint32_t flags, uint32_t flowid, struct nhop6_basic *pnh6) 171*65ff3638SAlexander V. Chernikov { 172*65ff3638SAlexander V. Chernikov struct radix_node_head *rh; 173*65ff3638SAlexander V. Chernikov struct radix_node *rn; 174*65ff3638SAlexander V. Chernikov struct sockaddr_in6 sin6; 175*65ff3638SAlexander V. Chernikov struct rtentry *rte; 176*65ff3638SAlexander V. Chernikov 177*65ff3638SAlexander V. Chernikov KASSERT((fibnum < rt_numfibs), ("fib6_lookup_nh_basic: bad fibnum")); 178*65ff3638SAlexander V. Chernikov rh = rt_tables_get_rnh(fibnum, AF_INET6); 179*65ff3638SAlexander V. Chernikov if (rh == NULL) 180*65ff3638SAlexander V. Chernikov return (ENOENT); 181*65ff3638SAlexander V. Chernikov 182*65ff3638SAlexander V. Chernikov /* Prepare lookup key */ 183*65ff3638SAlexander V. Chernikov memset(&sin6, 0, sizeof(sin6)); 184*65ff3638SAlexander V. Chernikov sin6.sin6_addr = *dst; 185*65ff3638SAlexander V. Chernikov /* Assume scopeid is valid and embed it directly */ 186*65ff3638SAlexander V. Chernikov if (IN6_IS_SCOPE_LINKLOCAL(dst)) 187*65ff3638SAlexander V. Chernikov sin6.sin6_addr.s6_addr16[1] = htons(scopeid & 0xffff); 188*65ff3638SAlexander V. Chernikov 189*65ff3638SAlexander V. Chernikov RADIX_NODE_HEAD_RLOCK(rh); 190*65ff3638SAlexander V. Chernikov rn = rh->rnh_matchaddr((void *)&sin6, rh); 191*65ff3638SAlexander V. Chernikov if (rn != NULL && ((rn->rn_flags & RNF_ROOT) == 0)) { 192*65ff3638SAlexander V. Chernikov rte = RNTORT(rn); 193*65ff3638SAlexander V. Chernikov /* Ensure route & ifp is UP */ 194*65ff3638SAlexander V. Chernikov if (RT_LINK_IS_UP(rte->rt_ifp)) { 195*65ff3638SAlexander V. Chernikov fib6_rte_to_nh_basic(rte, dst, flags, pnh6); 196*65ff3638SAlexander V. Chernikov RADIX_NODE_HEAD_RUNLOCK(rh); 197*65ff3638SAlexander V. Chernikov return (0); 198*65ff3638SAlexander V. Chernikov } 199*65ff3638SAlexander V. Chernikov } 200*65ff3638SAlexander V. Chernikov RADIX_NODE_HEAD_RUNLOCK(rh); 201*65ff3638SAlexander V. Chernikov 202*65ff3638SAlexander V. Chernikov return (ENOENT); 203*65ff3638SAlexander V. Chernikov } 204*65ff3638SAlexander V. Chernikov 205*65ff3638SAlexander V. Chernikov /* 206*65ff3638SAlexander V. Chernikov * Performs IPv6 route table lookup on @dst. Returns 0 on success. 207*65ff3638SAlexander V. Chernikov * Stores extended nexthop info into provided @pnh6 structure. 208*65ff3638SAlexander V. Chernikov * Note that 209*65ff3638SAlexander V. Chernikov * - nh_ifp cannot be safely dereferenced unless NHR_REF is specified. 210*65ff3638SAlexander V. Chernikov * - in that case you need to call fib6_free_nh_ext() 211*65ff3638SAlexander V. Chernikov * - nh_ifp represents logical transmit interface (rt_ifp) by default 212*65ff3638SAlexander V. Chernikov * - nh_ifp represents "address" interface if NHR_IFAIF flag is passed 213*65ff3638SAlexander V. Chernikov * - mtu from logical transmit interface will be returned. 214*65ff3638SAlexander V. Chernikov */ 215*65ff3638SAlexander V. Chernikov int 216*65ff3638SAlexander V. Chernikov fib6_lookup_nh_ext(uint32_t fibnum, const struct in6_addr *dst,uint32_t scopeid, 217*65ff3638SAlexander V. Chernikov uint32_t flags, uint32_t flowid, struct nhop6_extended *pnh6) 218*65ff3638SAlexander V. Chernikov { 219*65ff3638SAlexander V. Chernikov struct radix_node_head *rh; 220*65ff3638SAlexander V. Chernikov struct radix_node *rn; 221*65ff3638SAlexander V. Chernikov struct sockaddr_in6 sin6; 222*65ff3638SAlexander V. Chernikov struct rtentry *rte; 223*65ff3638SAlexander V. Chernikov 224*65ff3638SAlexander V. Chernikov KASSERT((fibnum < rt_numfibs), ("fib6_lookup_nh_ext: bad fibnum")); 225*65ff3638SAlexander V. Chernikov rh = rt_tables_get_rnh(fibnum, AF_INET6); 226*65ff3638SAlexander V. Chernikov if (rh == NULL) 227*65ff3638SAlexander V. Chernikov return (ENOENT); 228*65ff3638SAlexander V. Chernikov 229*65ff3638SAlexander V. Chernikov /* Prepare lookup key */ 230*65ff3638SAlexander V. Chernikov memset(&sin6, 0, sizeof(sin6)); 231*65ff3638SAlexander V. Chernikov sin6.sin6_len = sizeof(struct sockaddr_in6); 232*65ff3638SAlexander V. Chernikov sin6.sin6_addr = *dst; 233*65ff3638SAlexander V. Chernikov /* Assume scopeid is valid and embed it directly */ 234*65ff3638SAlexander V. Chernikov if (IN6_IS_SCOPE_LINKLOCAL(dst)) 235*65ff3638SAlexander V. Chernikov sin6.sin6_addr.s6_addr16[1] = htons(scopeid & 0xffff); 236*65ff3638SAlexander V. Chernikov 237*65ff3638SAlexander V. Chernikov RADIX_NODE_HEAD_RLOCK(rh); 238*65ff3638SAlexander V. Chernikov rn = rh->rnh_matchaddr((void *)&sin6, rh); 239*65ff3638SAlexander V. Chernikov if (rn != NULL && ((rn->rn_flags & RNF_ROOT) == 0)) { 240*65ff3638SAlexander V. Chernikov rte = RNTORT(rn); 241*65ff3638SAlexander V. Chernikov /* Ensure route & ifp is UP */ 242*65ff3638SAlexander V. Chernikov if (RT_LINK_IS_UP(rte->rt_ifp)) { 243*65ff3638SAlexander V. Chernikov fib6_rte_to_nh_extended(rte, dst, flags, pnh6); 244*65ff3638SAlexander V. Chernikov if ((flags & NHR_REF) != 0) { 245*65ff3638SAlexander V. Chernikov /* TODO: Do lwref on egress ifp's */ 246*65ff3638SAlexander V. Chernikov } 247*65ff3638SAlexander V. Chernikov RADIX_NODE_HEAD_RUNLOCK(rh); 248*65ff3638SAlexander V. Chernikov 249*65ff3638SAlexander V. Chernikov return (0); 250*65ff3638SAlexander V. Chernikov } 251*65ff3638SAlexander V. Chernikov } 252*65ff3638SAlexander V. Chernikov RADIX_NODE_HEAD_RUNLOCK(rh); 253*65ff3638SAlexander V. Chernikov 254*65ff3638SAlexander V. Chernikov return (ENOENT); 255*65ff3638SAlexander V. Chernikov } 256*65ff3638SAlexander V. Chernikov 257*65ff3638SAlexander V. Chernikov void 258*65ff3638SAlexander V. Chernikov fib6_free_nh_ext(uint32_t fibnum, struct nhop6_extended *pnh6) 259*65ff3638SAlexander V. Chernikov { 260*65ff3638SAlexander V. Chernikov 261*65ff3638SAlexander V. Chernikov } 262*65ff3638SAlexander V. Chernikov 263*65ff3638SAlexander V. Chernikov #endif 264*65ff3638SAlexander V. Chernikov 265