1 /*- 2 * Copyright (c) 2015 3 * Alexander V. Chernikov <melifaro@FreeBSD.org> 4 * 5 * Redistribution and use in source and binary forms, with or without 6 * modification, are permitted provided that the following conditions 7 * are met: 8 * 1. Redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer. 10 * 2. Redistributions in binary form must reproduce the above copyright 11 * notice, this list of conditions and the following disclaimer in the 12 * documentation and/or other materials provided with the distribution. 13 * 4. Neither the name of the University nor the names of its contributors 14 * may be used to endorse or promote products derived from this software 15 * without specific prior written permission. 16 * 17 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27 * SUCH DAMAGE. 28 */ 29 30 #include <sys/cdefs.h> 31 __FBSDID("$FreeBSD$"); 32 33 #include "opt_inet.h" 34 #include "opt_route.h" 35 #include "opt_mpath.h" 36 37 #include <sys/param.h> 38 #include <sys/systm.h> 39 #include <sys/lock.h> 40 #include <sys/rwlock.h> 41 #include <sys/malloc.h> 42 #include <sys/mbuf.h> 43 #include <sys/socket.h> 44 #include <sys/sysctl.h> 45 #include <sys/kernel.h> 46 47 #include <net/if.h> 48 #include <net/if_var.h> 49 #include <net/if_dl.h> 50 #include <net/route.h> 51 #include <net/route_var.h> 52 #include <net/vnet.h> 53 54 #ifdef RADIX_MPATH 55 #include <net/radix_mpath.h> 56 #endif 57 58 #include <netinet/in.h> 59 #include <netinet/in_var.h> 60 #include <netinet/in_fib.h> 61 62 #ifdef INET 63 static void fib4_rte_to_nh_basic(struct rtentry *rte, struct in_addr dst, 64 uint32_t flags, struct nhop4_basic *pnh4); 65 static void fib4_rte_to_nh_extended(struct rtentry *rte, struct in_addr dst, 66 uint32_t flags, struct nhop4_extended *pnh4); 67 68 #define RNTORT(p) ((struct rtentry *)(p)) 69 70 static void 71 fib4_rte_to_nh_basic(struct rtentry *rte, struct in_addr dst, 72 uint32_t flags, struct nhop4_basic *pnh4) 73 { 74 struct sockaddr_in *gw; 75 76 if ((flags & NHR_IFAIF) != 0) 77 pnh4->nh_ifp = rte->rt_ifa->ifa_ifp; 78 else 79 pnh4->nh_ifp = rte->rt_ifp; 80 pnh4->nh_mtu = min(rte->rt_mtu, rte->rt_ifp->if_mtu); 81 if (rte->rt_flags & RTF_GATEWAY) { 82 gw = (struct sockaddr_in *)rte->rt_gateway; 83 pnh4->nh_addr = gw->sin_addr; 84 } else 85 pnh4->nh_addr = dst; 86 /* Set flags */ 87 pnh4->nh_flags = fib_rte_to_nh_flags(rte->rt_flags); 88 gw = (struct sockaddr_in *)rt_key(rte); 89 if (gw->sin_addr.s_addr == 0) 90 pnh4->nh_flags |= NHF_DEFAULT; 91 /* TODO: Handle RTF_BROADCAST here */ 92 } 93 94 static void 95 fib4_rte_to_nh_extended(struct rtentry *rte, struct in_addr dst, 96 uint32_t flags, struct nhop4_extended *pnh4) 97 { 98 struct sockaddr_in *gw; 99 struct in_ifaddr *ia; 100 101 if ((flags & NHR_IFAIF) != 0) 102 pnh4->nh_ifp = rte->rt_ifa->ifa_ifp; 103 else 104 pnh4->nh_ifp = rte->rt_ifp; 105 pnh4->nh_mtu = min(rte->rt_mtu, rte->rt_ifp->if_mtu); 106 if (rte->rt_flags & RTF_GATEWAY) { 107 gw = (struct sockaddr_in *)rte->rt_gateway; 108 pnh4->nh_addr = gw->sin_addr; 109 } else 110 pnh4->nh_addr = dst; 111 /* Set flags */ 112 pnh4->nh_flags = fib_rte_to_nh_flags(rte->rt_flags); 113 gw = (struct sockaddr_in *)rt_key(rte); 114 if (gw->sin_addr.s_addr == 0) 115 pnh4->nh_flags |= NHF_DEFAULT; 116 /* XXX: Set RTF_BROADCAST if GW address is broadcast */ 117 118 ia = ifatoia(rte->rt_ifa); 119 pnh4->nh_src = IA_SIN(ia)->sin_addr; 120 } 121 122 /* 123 * Performs IPv4 route table lookup on @dst. Returns 0 on success. 124 * Stores nexthop info provided @pnh4 structure. 125 * Note that 126 * - nh_ifp cannot be safely dereferenced 127 * - nh_ifp represents logical transmit interface (rt_ifp) (e.g. if 128 * looking up address on interface "ix0" pointer to "lo0" interface 129 * will be returned instead of "ix0") 130 * - nh_ifp represents "address" interface if NHR_IFAIF flag is passed 131 * - howewer mtu from "transmit" interface will be returned. 132 */ 133 int 134 fib4_lookup_nh_basic(uint32_t fibnum, struct in_addr dst, uint32_t flags, 135 uint32_t flowid, struct nhop4_basic *pnh4) 136 { 137 struct rib_head *rh; 138 struct radix_node *rn; 139 struct sockaddr_in sin; 140 struct rtentry *rte; 141 142 KASSERT((fibnum < rt_numfibs), ("fib4_lookup_nh_basic: bad fibnum")); 143 rh = rt_tables_get_rnh(fibnum, AF_INET); 144 if (rh == NULL) 145 return (ENOENT); 146 147 /* Prepare lookup key */ 148 memset(&sin, 0, sizeof(sin)); 149 sin.sin_len = sizeof(struct sockaddr_in); 150 sin.sin_addr = dst; 151 152 RIB_RLOCK(rh); 153 rn = rh->rnh_matchaddr((void *)&sin, &rh->head); 154 if (rn != NULL && ((rn->rn_flags & RNF_ROOT) == 0)) { 155 rte = RNTORT(rn); 156 /* Ensure route & ifp is UP */ 157 if (RT_LINK_IS_UP(rte->rt_ifp)) { 158 fib4_rte_to_nh_basic(rte, dst, flags, pnh4); 159 RIB_RUNLOCK(rh); 160 161 return (0); 162 } 163 } 164 RIB_RUNLOCK(rh); 165 166 return (ENOENT); 167 } 168 169 /* 170 * Performs IPv4 route table lookup on @dst. Returns 0 on success. 171 * Stores extende nexthop info provided @pnh4 structure. 172 * Note that 173 * - nh_ifp cannot be safely dereferenced unless NHR_REF is specified. 174 * - in that case you need to call fib4_free_nh_ext() 175 * - nh_ifp represents logical transmit interface (rt_ifp) (e.g. if 176 * looking up address of interface "ix0" pointer to "lo0" interface 177 * will be returned instead of "ix0") 178 * - nh_ifp represents "address" interface if NHR_IFAIF flag is passed 179 * - howewer mtu from "transmit" interface will be returned. 180 */ 181 int 182 fib4_lookup_nh_ext(uint32_t fibnum, struct in_addr dst, uint32_t flags, 183 uint32_t flowid, struct nhop4_extended *pnh4) 184 { 185 struct rib_head *rh; 186 struct radix_node *rn; 187 struct sockaddr_in sin; 188 struct rtentry *rte; 189 190 KASSERT((fibnum < rt_numfibs), ("fib4_lookup_nh_ext: bad fibnum")); 191 rh = rt_tables_get_rnh(fibnum, AF_INET); 192 if (rh == NULL) 193 return (ENOENT); 194 195 /* Prepare lookup key */ 196 memset(&sin, 0, sizeof(sin)); 197 sin.sin_len = sizeof(struct sockaddr_in); 198 sin.sin_addr = dst; 199 200 RIB_RLOCK(rh); 201 rn = rh->rnh_matchaddr((void *)&sin, &rh->head); 202 if (rn != NULL && ((rn->rn_flags & RNF_ROOT) == 0)) { 203 rte = RNTORT(rn); 204 #ifdef RADIX_MPATH 205 rte = rt_mpath_select(rte, flowid); 206 if (rte == NULL) { 207 RIB_RUNLOCK(rh); 208 return (ENOENT); 209 } 210 #endif 211 /* Ensure route & ifp is UP */ 212 if (RT_LINK_IS_UP(rte->rt_ifp)) { 213 fib4_rte_to_nh_extended(rte, dst, flags, pnh4); 214 if ((flags & NHR_REF) != 0) { 215 /* TODO: lwref on egress ifp's ? */ 216 } 217 RIB_RUNLOCK(rh); 218 219 return (0); 220 } 221 } 222 RIB_RUNLOCK(rh); 223 224 return (ENOENT); 225 } 226 227 void 228 fib4_free_nh_ext(uint32_t fibnum, struct nhop4_extended *pnh4) 229 { 230 231 } 232 233 #endif 234