1caf43b02SWarner Losh /*- 2686cdd19SJun-ichiro itojun Hagino * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project. 3686cdd19SJun-ichiro itojun Hagino * All rights reserved. 4686cdd19SJun-ichiro itojun Hagino * 5686cdd19SJun-ichiro itojun Hagino * Redistribution and use in source and binary forms, with or without 6686cdd19SJun-ichiro itojun Hagino * modification, are permitted provided that the following conditions 7686cdd19SJun-ichiro itojun Hagino * are met: 8686cdd19SJun-ichiro itojun Hagino * 1. Redistributions of source code must retain the above copyright 9686cdd19SJun-ichiro itojun Hagino * notice, this list of conditions and the following disclaimer. 10686cdd19SJun-ichiro itojun Hagino * 2. Redistributions in binary form must reproduce the above copyright 11686cdd19SJun-ichiro itojun Hagino * notice, this list of conditions and the following disclaimer in the 12686cdd19SJun-ichiro itojun Hagino * documentation and/or other materials provided with the distribution. 13686cdd19SJun-ichiro itojun Hagino * 3. Neither the name of the project nor the names of its contributors 14686cdd19SJun-ichiro itojun Hagino * may be used to endorse or promote products derived from this software 15686cdd19SJun-ichiro itojun Hagino * without specific prior written permission. 16686cdd19SJun-ichiro itojun Hagino * 17686cdd19SJun-ichiro itojun Hagino * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 18686cdd19SJun-ichiro itojun Hagino * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 19686cdd19SJun-ichiro itojun Hagino * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 20686cdd19SJun-ichiro itojun Hagino * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 21686cdd19SJun-ichiro itojun Hagino * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 22686cdd19SJun-ichiro itojun Hagino * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 23686cdd19SJun-ichiro itojun Hagino * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 24686cdd19SJun-ichiro itojun Hagino * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 25686cdd19SJun-ichiro itojun Hagino * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 26686cdd19SJun-ichiro itojun Hagino * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 27686cdd19SJun-ichiro itojun Hagino * SUCH DAMAGE. 28b48287a3SDavid E. O'Brien * 29b48287a3SDavid E. O'Brien * $KAME: in6_src.c,v 1.132 2003/08/26 04:42:27 keiichi Exp $ 30686cdd19SJun-ichiro itojun Hagino */ 31686cdd19SJun-ichiro itojun Hagino 32caf43b02SWarner Losh /*- 33686cdd19SJun-ichiro itojun Hagino * Copyright (c) 1982, 1986, 1991, 1993 34686cdd19SJun-ichiro itojun Hagino * The Regents of the University of California. All rights reserved. 35686cdd19SJun-ichiro itojun Hagino * 36686cdd19SJun-ichiro itojun Hagino * Redistribution and use in source and binary forms, with or without 37686cdd19SJun-ichiro itojun Hagino * modification, are permitted provided that the following conditions 38686cdd19SJun-ichiro itojun Hagino * are met: 39686cdd19SJun-ichiro itojun Hagino * 1. Redistributions of source code must retain the above copyright 40686cdd19SJun-ichiro itojun Hagino * notice, this list of conditions and the following disclaimer. 41686cdd19SJun-ichiro itojun Hagino * 2. Redistributions in binary form must reproduce the above copyright 42686cdd19SJun-ichiro itojun Hagino * notice, this list of conditions and the following disclaimer in the 43686cdd19SJun-ichiro itojun Hagino * documentation and/or other materials provided with the distribution. 44686cdd19SJun-ichiro itojun Hagino * 4. Neither the name of the University nor the names of its contributors 45686cdd19SJun-ichiro itojun Hagino * may be used to endorse or promote products derived from this software 46686cdd19SJun-ichiro itojun Hagino * without specific prior written permission. 47686cdd19SJun-ichiro itojun Hagino * 48686cdd19SJun-ichiro itojun Hagino * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 49686cdd19SJun-ichiro itojun Hagino * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 50686cdd19SJun-ichiro itojun Hagino * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 51686cdd19SJun-ichiro itojun Hagino * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 52686cdd19SJun-ichiro itojun Hagino * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 53686cdd19SJun-ichiro itojun Hagino * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 54686cdd19SJun-ichiro itojun Hagino * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 55686cdd19SJun-ichiro itojun Hagino * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 56686cdd19SJun-ichiro itojun Hagino * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 57686cdd19SJun-ichiro itojun Hagino * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 58686cdd19SJun-ichiro itojun Hagino * SUCH DAMAGE. 59686cdd19SJun-ichiro itojun Hagino * 60686cdd19SJun-ichiro itojun Hagino * @(#)in_pcb.c 8.2 (Berkeley) 1/4/94 61686cdd19SJun-ichiro itojun Hagino */ 62686cdd19SJun-ichiro itojun Hagino 63b48287a3SDavid E. O'Brien #include <sys/cdefs.h> 64b48287a3SDavid E. O'Brien __FBSDID("$FreeBSD$"); 65b48287a3SDavid E. O'Brien 66686cdd19SJun-ichiro itojun Hagino #include "opt_inet.h" 67686cdd19SJun-ichiro itojun Hagino #include "opt_inet6.h" 68e440aed9SQing Li #include "opt_mpath.h" 69686cdd19SJun-ichiro itojun Hagino 70686cdd19SJun-ichiro itojun Hagino #include <sys/param.h> 71686cdd19SJun-ichiro itojun Hagino #include <sys/systm.h> 724e7f640dSJohn Baldwin #include <sys/lock.h> 7333841545SHajimu UMEMOTO #include <sys/malloc.h> 74686cdd19SJun-ichiro itojun Hagino #include <sys/mbuf.h> 75acd3428bSRobert Watson #include <sys/priv.h> 76686cdd19SJun-ichiro itojun Hagino #include <sys/protosw.h> 77686cdd19SJun-ichiro itojun Hagino #include <sys/socket.h> 78686cdd19SJun-ichiro itojun Hagino #include <sys/socketvar.h> 797fc91b3fSHajimu UMEMOTO #include <sys/sockio.h> 807fc91b3fSHajimu UMEMOTO #include <sys/sysctl.h> 81686cdd19SJun-ichiro itojun Hagino #include <sys/errno.h> 82686cdd19SJun-ichiro itojun Hagino #include <sys/time.h> 834a201dfcSHajimu UMEMOTO #include <sys/kernel.h> 845d525653SHajimu UMEMOTO #include <sys/sx.h> 85603724d3SBjoern A. Zeeb #include <sys/vimage.h> 86686cdd19SJun-ichiro itojun Hagino 87686cdd19SJun-ichiro itojun Hagino #include <net/if.h> 88686cdd19SJun-ichiro itojun Hagino #include <net/route.h> 89e440aed9SQing Li #ifdef RADIX_MPATH 90e440aed9SQing Li #include <net/radix_mpath.h> 91e440aed9SQing Li #endif 92686cdd19SJun-ichiro itojun Hagino 93686cdd19SJun-ichiro itojun Hagino #include <netinet/in.h> 94686cdd19SJun-ichiro itojun Hagino #include <netinet/in_var.h> 95686cdd19SJun-ichiro itojun Hagino #include <netinet/in_systm.h> 96686cdd19SJun-ichiro itojun Hagino #include <netinet/ip.h> 97686cdd19SJun-ichiro itojun Hagino #include <netinet/in_pcb.h> 98686cdd19SJun-ichiro itojun Hagino #include <netinet6/in6_var.h> 99686cdd19SJun-ichiro itojun Hagino #include <netinet/ip6.h> 100686cdd19SJun-ichiro itojun Hagino #include <netinet6/in6_pcb.h> 101686cdd19SJun-ichiro itojun Hagino #include <netinet6/ip6_var.h> 102a1f7e5f8SHajimu UMEMOTO #include <netinet6/scope6_var.h> 103686cdd19SJun-ichiro itojun Hagino #include <netinet6/nd6.h> 104686cdd19SJun-ichiro itojun Hagino 1057fc91b3fSHajimu UMEMOTO static struct mtx addrsel_lock; 1067fc91b3fSHajimu UMEMOTO #define ADDRSEL_LOCK_INIT() mtx_init(&addrsel_lock, "addrsel_lock", NULL, MTX_DEF) 1077fc91b3fSHajimu UMEMOTO #define ADDRSEL_LOCK() mtx_lock(&addrsel_lock) 1087fc91b3fSHajimu UMEMOTO #define ADDRSEL_UNLOCK() mtx_unlock(&addrsel_lock) 1097fc91b3fSHajimu UMEMOTO #define ADDRSEL_LOCK_ASSERT() mtx_assert(&addrsel_lock, MA_OWNED) 1107fc91b3fSHajimu UMEMOTO 1115d525653SHajimu UMEMOTO static struct sx addrsel_sxlock; 1125d525653SHajimu UMEMOTO #define ADDRSEL_SXLOCK_INIT() sx_init(&addrsel_sxlock, "addrsel_sxlock") 1135d525653SHajimu UMEMOTO #define ADDRSEL_SLOCK() sx_slock(&addrsel_sxlock) 1145d525653SHajimu UMEMOTO #define ADDRSEL_SUNLOCK() sx_sunlock(&addrsel_sxlock) 1155d525653SHajimu UMEMOTO #define ADDRSEL_XLOCK() sx_xlock(&addrsel_sxlock) 1165d525653SHajimu UMEMOTO #define ADDRSEL_XUNLOCK() sx_xunlock(&addrsel_sxlock) 1175d525653SHajimu UMEMOTO 1187fc91b3fSHajimu UMEMOTO #define ADDR_LABEL_NOTAPP (-1) 1197fc91b3fSHajimu UMEMOTO struct in6_addrpolicy defaultaddrpolicy; 1207fc91b3fSHajimu UMEMOTO 121d6385b1cSHajimu UMEMOTO int ip6_prefer_tempaddr = 0; 122d6385b1cSHajimu UMEMOTO 123a1f7e5f8SHajimu UMEMOTO static int selectroute __P((struct sockaddr_in6 *, struct ip6_pktopts *, 124a1f7e5f8SHajimu UMEMOTO struct ip6_moptions *, struct route_in6 *, struct ifnet **, 125a1f7e5f8SHajimu UMEMOTO struct rtentry **, int, int)); 126d6385b1cSHajimu UMEMOTO static int in6_selectif __P((struct sockaddr_in6 *, struct ip6_pktopts *, 12768efda09SHajimu UMEMOTO struct ip6_moptions *, struct route_in6 *ro, struct ifnet **)); 128d6385b1cSHajimu UMEMOTO 1299233d8f3SDavid E. O'Brien static struct in6_addrpolicy *lookup_addrsel_policy(struct sockaddr_in6 *); 130d6385b1cSHajimu UMEMOTO 1319233d8f3SDavid E. O'Brien static void init_policy_queue(void); 1329233d8f3SDavid E. O'Brien static int add_addrsel_policyent(struct in6_addrpolicy *); 1339233d8f3SDavid E. O'Brien static int delete_addrsel_policyent(struct in6_addrpolicy *); 1347fc91b3fSHajimu UMEMOTO static int walk_addrsel_policy __P((int (*)(struct in6_addrpolicy *, void *), 1357fc91b3fSHajimu UMEMOTO void *)); 1369233d8f3SDavid E. O'Brien static int dump_addrsel_policyent(struct in6_addrpolicy *, void *); 1379233d8f3SDavid E. O'Brien static struct in6_addrpolicy *match_addrsel_policy(struct sockaddr_in6 *); 1387fc91b3fSHajimu UMEMOTO 139686cdd19SJun-ichiro itojun Hagino /* 14033841545SHajimu UMEMOTO * Return an IPv6 address, which is the most appropriate for a given 141686cdd19SJun-ichiro itojun Hagino * destination and user specified options. 14233841545SHajimu UMEMOTO * If necessary, this function lookups the routing table and returns 143686cdd19SJun-ichiro itojun Hagino * an entry to the caller for later use. 144686cdd19SJun-ichiro itojun Hagino */ 145d6385b1cSHajimu UMEMOTO #define REPLACE(r) do {\ 146603724d3SBjoern A. Zeeb if ((r) < sizeof(V_ip6stat.ip6s_sources_rule) / \ 147603724d3SBjoern A. Zeeb sizeof(V_ip6stat.ip6s_sources_rule[0])) /* check for safety */ \ 148603724d3SBjoern A. Zeeb V_ip6stat.ip6s_sources_rule[(r)]++; \ 149ab569b9cSBjoern A. Zeeb /* { \ 150ab569b9cSBjoern A. Zeeb char ip6buf[INET6_ADDRSTRLEN], ip6b[INET6_ADDRSTRLEN]; \ 151ab569b9cSBjoern A. Zeeb printf("in6_selectsrc: replace %s with %s by %d\n", ia_best ? ip6_sprintf(ip6buf, &ia_best->ia_addr.sin6_addr) : "none", ip6_sprintf(ip6b, &ia->ia_addr.sin6_addr), (r)); \ 152ab569b9cSBjoern A. Zeeb } */ \ 153d6385b1cSHajimu UMEMOTO goto replace; \ 154d6385b1cSHajimu UMEMOTO } while(0) 155d6385b1cSHajimu UMEMOTO #define NEXT(r) do {\ 156603724d3SBjoern A. Zeeb if ((r) < sizeof(V_ip6stat.ip6s_sources_rule) / \ 157603724d3SBjoern A. Zeeb sizeof(V_ip6stat.ip6s_sources_rule[0])) /* check for safety */ \ 158603724d3SBjoern A. Zeeb V_ip6stat.ip6s_sources_rule[(r)]++; \ 159ab569b9cSBjoern A. Zeeb /* { \ 160ab569b9cSBjoern A. Zeeb char ip6buf[INET6_ADDRSTRLEN], ip6b[INET6_ADDRSTRLEN]; \ 161ab569b9cSBjoern A. Zeeb printf("in6_selectsrc: keep %s against %s by %d\n", ia_best ? ip6_sprintf(ip6buf, &ia_best->ia_addr.sin6_addr) : "none", ip6_sprintf(ip6b, &ia->ia_addr.sin6_addr), (r)); \ 162ab569b9cSBjoern A. Zeeb } */ \ 163d6385b1cSHajimu UMEMOTO goto next; /* XXX: we can't use 'continue' here */ \ 164d6385b1cSHajimu UMEMOTO } while(0) 165d6385b1cSHajimu UMEMOTO #define BREAK(r) do { \ 166603724d3SBjoern A. Zeeb if ((r) < sizeof(V_ip6stat.ip6s_sources_rule) / \ 167603724d3SBjoern A. Zeeb sizeof(V_ip6stat.ip6s_sources_rule[0])) /* check for safety */ \ 168603724d3SBjoern A. Zeeb V_ip6stat.ip6s_sources_rule[(r)]++; \ 169d6385b1cSHajimu UMEMOTO goto out; /* XXX: we can't use 'break' here */ \ 170d6385b1cSHajimu UMEMOTO } while(0) 171d6385b1cSHajimu UMEMOTO 172686cdd19SJun-ichiro itojun Hagino struct in6_addr * 1731272577eSXin LI in6_selectsrc(struct sockaddr_in6 *dstsock, struct ip6_pktopts *opts, 174f2f877d3SBjoern A. Zeeb struct inpcb *inp, struct route_in6 *ro, struct ucred *cred, 175f2f877d3SBjoern A. Zeeb struct ifnet **ifpp, int *errorp) 176686cdd19SJun-ichiro itojun Hagino { 177a1f7e5f8SHajimu UMEMOTO struct in6_addr dst; 178d6385b1cSHajimu UMEMOTO struct ifnet *ifp = NULL; 179d6385b1cSHajimu UMEMOTO struct in6_ifaddr *ia = NULL, *ia_best = NULL; 180686cdd19SJun-ichiro itojun Hagino struct in6_pktinfo *pi = NULL; 181d6385b1cSHajimu UMEMOTO int dst_scope = -1, best_scope = -1, best_matchlen = -1; 182d6385b1cSHajimu UMEMOTO struct in6_addrpolicy *dst_policy = NULL, *best_policy = NULL; 183d6385b1cSHajimu UMEMOTO u_int32_t odstzone; 184d6385b1cSHajimu UMEMOTO int prefer_tempaddr; 185f2f877d3SBjoern A. Zeeb struct ip6_moptions *mopts; 186e6a27350SHajimu UMEMOTO 187a1f7e5f8SHajimu UMEMOTO dst = dstsock->sin6_addr; /* make a copy for local operation */ 188686cdd19SJun-ichiro itojun Hagino *errorp = 0; 189a1f7e5f8SHajimu UMEMOTO if (ifpp) 190a1f7e5f8SHajimu UMEMOTO *ifpp = NULL; 191686cdd19SJun-ichiro itojun Hagino 192a55b8b20SBjoern A. Zeeb if (inp != NULL) { 193a55b8b20SBjoern A. Zeeb INP_LOCK_ASSERT(inp); 194f2f877d3SBjoern A. Zeeb mopts = inp->in6p_moptions; 195a55b8b20SBjoern A. Zeeb } else { 196f2f877d3SBjoern A. Zeeb mopts = NULL; 197a55b8b20SBjoern A. Zeeb } 198f2f877d3SBjoern A. Zeeb 199686cdd19SJun-ichiro itojun Hagino /* 200686cdd19SJun-ichiro itojun Hagino * If the source address is explicitly specified by the caller, 201d6385b1cSHajimu UMEMOTO * check if the requested source address is indeed a unicast address 202d6385b1cSHajimu UMEMOTO * assigned to the node, and can be used as the packet's source 203d6385b1cSHajimu UMEMOTO * address. If everything is okay, use the address as source. 204686cdd19SJun-ichiro itojun Hagino */ 205686cdd19SJun-ichiro itojun Hagino if (opts && (pi = opts->ip6po_pktinfo) && 206d6385b1cSHajimu UMEMOTO !IN6_IS_ADDR_UNSPECIFIED(&pi->ipi6_addr)) { 207d6385b1cSHajimu UMEMOTO struct sockaddr_in6 srcsock; 208d6385b1cSHajimu UMEMOTO struct in6_ifaddr *ia6; 209d6385b1cSHajimu UMEMOTO 210d6385b1cSHajimu UMEMOTO /* get the outgoing interface */ 211d6385b1cSHajimu UMEMOTO if ((*errorp = in6_selectif(dstsock, opts, mopts, ro, &ifp)) 212d6385b1cSHajimu UMEMOTO != 0) { 213d6385b1cSHajimu UMEMOTO return (NULL); 214d6385b1cSHajimu UMEMOTO } 21568efda09SHajimu UMEMOTO 216686cdd19SJun-ichiro itojun Hagino /* 217d6385b1cSHajimu UMEMOTO * determine the appropriate zone id of the source based on 218d6385b1cSHajimu UMEMOTO * the zone of the destination and the outgoing interface. 219a1f7e5f8SHajimu UMEMOTO * If the specified address is ambiguous wrt the scope zone, 220a1f7e5f8SHajimu UMEMOTO * the interface must be specified; otherwise, ifa_ifwithaddr() 221a1f7e5f8SHajimu UMEMOTO * will fail matching the address. 222d6385b1cSHajimu UMEMOTO */ 223d6385b1cSHajimu UMEMOTO bzero(&srcsock, sizeof(srcsock)); 224d6385b1cSHajimu UMEMOTO srcsock.sin6_family = AF_INET6; 225d6385b1cSHajimu UMEMOTO srcsock.sin6_len = sizeof(srcsock); 226d6385b1cSHajimu UMEMOTO srcsock.sin6_addr = pi->ipi6_addr; 227d6385b1cSHajimu UMEMOTO if (ifp) { 228a1f7e5f8SHajimu UMEMOTO *errorp = in6_setscope(&srcsock.sin6_addr, ifp, NULL); 229a1f7e5f8SHajimu UMEMOTO if (*errorp != 0) 230d6385b1cSHajimu UMEMOTO return (NULL); 231d6385b1cSHajimu UMEMOTO } 232a1f7e5f8SHajimu UMEMOTO 233d6385b1cSHajimu UMEMOTO ia6 = (struct in6_ifaddr *)ifa_ifwithaddr((struct sockaddr *)(&srcsock)); 234d6385b1cSHajimu UMEMOTO if (ia6 == NULL || 235d6385b1cSHajimu UMEMOTO (ia6->ia6_flags & (IN6_IFF_ANYCAST | IN6_IFF_NOTREADY))) { 236d6385b1cSHajimu UMEMOTO *errorp = EADDRNOTAVAIL; 237d6385b1cSHajimu UMEMOTO return (NULL); 238d6385b1cSHajimu UMEMOTO } 239d6385b1cSHajimu UMEMOTO pi->ipi6_addr = srcsock.sin6_addr; /* XXX: this overrides pi */ 240a1f7e5f8SHajimu UMEMOTO if (ifpp) 241a1f7e5f8SHajimu UMEMOTO *ifpp = ifp; 242d6385b1cSHajimu UMEMOTO return (&ia6->ia_addr.sin6_addr); 243d6385b1cSHajimu UMEMOTO } 244d6385b1cSHajimu UMEMOTO 245d6385b1cSHajimu UMEMOTO /* 246d6385b1cSHajimu UMEMOTO * Otherwise, if the socket has already bound the source, just use it. 247686cdd19SJun-ichiro itojun Hagino */ 248f2f877d3SBjoern A. Zeeb if (inp != NULL && !IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) { 249f2f877d3SBjoern A. Zeeb return (&inp->in6p_laddr); 250f2f877d3SBjoern A. Zeeb } 251686cdd19SJun-ichiro itojun Hagino 252686cdd19SJun-ichiro itojun Hagino /* 253d6385b1cSHajimu UMEMOTO * If the address is not specified, choose the best one based on 254d6385b1cSHajimu UMEMOTO * the outgoing interface and the destination address. 255686cdd19SJun-ichiro itojun Hagino */ 256d6385b1cSHajimu UMEMOTO /* get the outgoing interface */ 257d6385b1cSHajimu UMEMOTO if ((*errorp = in6_selectif(dstsock, opts, mopts, ro, &ifp)) != 0) 258d6385b1cSHajimu UMEMOTO return (NULL); 259686cdd19SJun-ichiro itojun Hagino 260d6385b1cSHajimu UMEMOTO #ifdef DIAGNOSTIC 261d6385b1cSHajimu UMEMOTO if (ifp == NULL) /* this should not happen */ 262d6385b1cSHajimu UMEMOTO panic("in6_selectsrc: NULL ifp"); 263d6385b1cSHajimu UMEMOTO #endif 264a1f7e5f8SHajimu UMEMOTO *errorp = in6_setscope(&dst, ifp, &odstzone); 265a1f7e5f8SHajimu UMEMOTO if (*errorp != 0) 266d6385b1cSHajimu UMEMOTO return (NULL); 267a1f7e5f8SHajimu UMEMOTO 268603724d3SBjoern A. Zeeb for (ia = V_in6_ifaddr; ia; ia = ia->ia_next) { 269d6385b1cSHajimu UMEMOTO int new_scope = -1, new_matchlen = -1; 270d6385b1cSHajimu UMEMOTO struct in6_addrpolicy *new_policy = NULL; 271d6385b1cSHajimu UMEMOTO u_int32_t srczone, osrczone, dstzone; 272a1f7e5f8SHajimu UMEMOTO struct in6_addr src; 273d6385b1cSHajimu UMEMOTO struct ifnet *ifp1 = ia->ia_ifp; 274d6385b1cSHajimu UMEMOTO 275d6385b1cSHajimu UMEMOTO /* 276d6385b1cSHajimu UMEMOTO * We'll never take an address that breaks the scope zone 277d6385b1cSHajimu UMEMOTO * of the destination. We also skip an address if its zone 278d6385b1cSHajimu UMEMOTO * does not contain the outgoing interface. 279d6385b1cSHajimu UMEMOTO * XXX: we should probably use sin6_scope_id here. 280d6385b1cSHajimu UMEMOTO */ 281a1f7e5f8SHajimu UMEMOTO if (in6_setscope(&dst, ifp1, &dstzone) || 282d6385b1cSHajimu UMEMOTO odstzone != dstzone) { 283d6385b1cSHajimu UMEMOTO continue; 284d6385b1cSHajimu UMEMOTO } 285a1f7e5f8SHajimu UMEMOTO src = ia->ia_addr.sin6_addr; 286a1f7e5f8SHajimu UMEMOTO if (in6_setscope(&src, ifp, &osrczone) || 287a1f7e5f8SHajimu UMEMOTO in6_setscope(&src, ifp1, &srczone) || 288d6385b1cSHajimu UMEMOTO osrczone != srczone) { 289d6385b1cSHajimu UMEMOTO continue; 290686cdd19SJun-ichiro itojun Hagino } 291686cdd19SJun-ichiro itojun Hagino 292d6385b1cSHajimu UMEMOTO /* avoid unusable addresses */ 293d6385b1cSHajimu UMEMOTO if ((ia->ia6_flags & 294d6385b1cSHajimu UMEMOTO (IN6_IFF_NOTREADY | IN6_IFF_ANYCAST | IN6_IFF_DETACHED))) { 295d6385b1cSHajimu UMEMOTO continue; 296d6385b1cSHajimu UMEMOTO } 297603724d3SBjoern A. Zeeb if (!V_ip6_use_deprecated && IFA6_IS_DEPRECATED(ia)) 298d6385b1cSHajimu UMEMOTO continue; 299d6385b1cSHajimu UMEMOTO 300d6385b1cSHajimu UMEMOTO /* Rule 1: Prefer same address */ 301a1f7e5f8SHajimu UMEMOTO if (IN6_ARE_ADDR_EQUAL(&dst, &ia->ia_addr.sin6_addr)) { 302d6385b1cSHajimu UMEMOTO ia_best = ia; 303d6385b1cSHajimu UMEMOTO BREAK(1); /* there should be no better candidate */ 304d6385b1cSHajimu UMEMOTO } 305d6385b1cSHajimu UMEMOTO 306d6385b1cSHajimu UMEMOTO if (ia_best == NULL) 307d6385b1cSHajimu UMEMOTO REPLACE(0); 308d6385b1cSHajimu UMEMOTO 309d6385b1cSHajimu UMEMOTO /* Rule 2: Prefer appropriate scope */ 310d6385b1cSHajimu UMEMOTO if (dst_scope < 0) 311a1f7e5f8SHajimu UMEMOTO dst_scope = in6_addrscope(&dst); 312d6385b1cSHajimu UMEMOTO new_scope = in6_addrscope(&ia->ia_addr.sin6_addr); 313d6385b1cSHajimu UMEMOTO if (IN6_ARE_SCOPE_CMP(best_scope, new_scope) < 0) { 314d6385b1cSHajimu UMEMOTO if (IN6_ARE_SCOPE_CMP(best_scope, dst_scope) < 0) 315d6385b1cSHajimu UMEMOTO REPLACE(2); 316d6385b1cSHajimu UMEMOTO NEXT(2); 317d6385b1cSHajimu UMEMOTO } else if (IN6_ARE_SCOPE_CMP(new_scope, best_scope) < 0) { 318d6385b1cSHajimu UMEMOTO if (IN6_ARE_SCOPE_CMP(new_scope, dst_scope) < 0) 319d6385b1cSHajimu UMEMOTO NEXT(2); 320d6385b1cSHajimu UMEMOTO REPLACE(2); 321d6385b1cSHajimu UMEMOTO } 322d6385b1cSHajimu UMEMOTO 323d6385b1cSHajimu UMEMOTO /* 324d6385b1cSHajimu UMEMOTO * Rule 3: Avoid deprecated addresses. Note that the case of 325d6385b1cSHajimu UMEMOTO * !ip6_use_deprecated is already rejected above. 326d6385b1cSHajimu UMEMOTO */ 327d6385b1cSHajimu UMEMOTO if (!IFA6_IS_DEPRECATED(ia_best) && IFA6_IS_DEPRECATED(ia)) 328d6385b1cSHajimu UMEMOTO NEXT(3); 329d6385b1cSHajimu UMEMOTO if (IFA6_IS_DEPRECATED(ia_best) && !IFA6_IS_DEPRECATED(ia)) 330d6385b1cSHajimu UMEMOTO REPLACE(3); 331d6385b1cSHajimu UMEMOTO 332d6385b1cSHajimu UMEMOTO /* Rule 4: Prefer home addresses */ 333d6385b1cSHajimu UMEMOTO /* 334d6385b1cSHajimu UMEMOTO * XXX: This is a TODO. We should probably merge the MIP6 335d6385b1cSHajimu UMEMOTO * case above. 336d6385b1cSHajimu UMEMOTO */ 337d6385b1cSHajimu UMEMOTO 338d6385b1cSHajimu UMEMOTO /* Rule 5: Prefer outgoing interface */ 339d6385b1cSHajimu UMEMOTO if (ia_best->ia_ifp == ifp && ia->ia_ifp != ifp) 340d6385b1cSHajimu UMEMOTO NEXT(5); 341d6385b1cSHajimu UMEMOTO if (ia_best->ia_ifp != ifp && ia->ia_ifp == ifp) 342d6385b1cSHajimu UMEMOTO REPLACE(5); 343d6385b1cSHajimu UMEMOTO 344d6385b1cSHajimu UMEMOTO /* 345d6385b1cSHajimu UMEMOTO * Rule 6: Prefer matching label 346d6385b1cSHajimu UMEMOTO * Note that best_policy should be non-NULL here. 347d6385b1cSHajimu UMEMOTO */ 348d6385b1cSHajimu UMEMOTO if (dst_policy == NULL) 349d6385b1cSHajimu UMEMOTO dst_policy = lookup_addrsel_policy(dstsock); 350d6385b1cSHajimu UMEMOTO if (dst_policy->label != ADDR_LABEL_NOTAPP) { 351d6385b1cSHajimu UMEMOTO new_policy = lookup_addrsel_policy(&ia->ia_addr); 352d6385b1cSHajimu UMEMOTO if (dst_policy->label == best_policy->label && 353d6385b1cSHajimu UMEMOTO dst_policy->label != new_policy->label) 354d6385b1cSHajimu UMEMOTO NEXT(6); 355d6385b1cSHajimu UMEMOTO if (dst_policy->label != best_policy->label && 356d6385b1cSHajimu UMEMOTO dst_policy->label == new_policy->label) 357d6385b1cSHajimu UMEMOTO REPLACE(6); 358d6385b1cSHajimu UMEMOTO } 359d6385b1cSHajimu UMEMOTO 360d6385b1cSHajimu UMEMOTO /* 361d6385b1cSHajimu UMEMOTO * Rule 7: Prefer public addresses. 362d6385b1cSHajimu UMEMOTO * We allow users to reverse the logic by configuring 363d6385b1cSHajimu UMEMOTO * a sysctl variable, so that privacy conscious users can 364d6385b1cSHajimu UMEMOTO * always prefer temporary addresses. 365d6385b1cSHajimu UMEMOTO */ 366d6385b1cSHajimu UMEMOTO if (opts == NULL || 367d6385b1cSHajimu UMEMOTO opts->ip6po_prefer_tempaddr == IP6PO_TEMPADDR_SYSTEM) { 368603724d3SBjoern A. Zeeb prefer_tempaddr = V_ip6_prefer_tempaddr; 369d6385b1cSHajimu UMEMOTO } else if (opts->ip6po_prefer_tempaddr == 370d6385b1cSHajimu UMEMOTO IP6PO_TEMPADDR_NOTPREFER) { 371d6385b1cSHajimu UMEMOTO prefer_tempaddr = 0; 372d6385b1cSHajimu UMEMOTO } else 373d6385b1cSHajimu UMEMOTO prefer_tempaddr = 1; 374d6385b1cSHajimu UMEMOTO if (!(ia_best->ia6_flags & IN6_IFF_TEMPORARY) && 375d6385b1cSHajimu UMEMOTO (ia->ia6_flags & IN6_IFF_TEMPORARY)) { 376d6385b1cSHajimu UMEMOTO if (prefer_tempaddr) 377d6385b1cSHajimu UMEMOTO REPLACE(7); 378d6385b1cSHajimu UMEMOTO else 379d6385b1cSHajimu UMEMOTO NEXT(7); 380d6385b1cSHajimu UMEMOTO } 381d6385b1cSHajimu UMEMOTO if ((ia_best->ia6_flags & IN6_IFF_TEMPORARY) && 382d6385b1cSHajimu UMEMOTO !(ia->ia6_flags & IN6_IFF_TEMPORARY)) { 383d6385b1cSHajimu UMEMOTO if (prefer_tempaddr) 384d6385b1cSHajimu UMEMOTO NEXT(7); 385d6385b1cSHajimu UMEMOTO else 386d6385b1cSHajimu UMEMOTO REPLACE(7); 387d6385b1cSHajimu UMEMOTO } 388d6385b1cSHajimu UMEMOTO 389d6385b1cSHajimu UMEMOTO /* 390d6385b1cSHajimu UMEMOTO * Rule 8: prefer addresses on alive interfaces. 391d6385b1cSHajimu UMEMOTO * This is a KAME specific rule. 392d6385b1cSHajimu UMEMOTO */ 393d6385b1cSHajimu UMEMOTO if ((ia_best->ia_ifp->if_flags & IFF_UP) && 394d6385b1cSHajimu UMEMOTO !(ia->ia_ifp->if_flags & IFF_UP)) 395d6385b1cSHajimu UMEMOTO NEXT(8); 396d6385b1cSHajimu UMEMOTO if (!(ia_best->ia_ifp->if_flags & IFF_UP) && 397d6385b1cSHajimu UMEMOTO (ia->ia_ifp->if_flags & IFF_UP)) 398d6385b1cSHajimu UMEMOTO REPLACE(8); 399d6385b1cSHajimu UMEMOTO 400d6385b1cSHajimu UMEMOTO /* 401d6385b1cSHajimu UMEMOTO * Rule 14: Use longest matching prefix. 402d6385b1cSHajimu UMEMOTO * Note: in the address selection draft, this rule is 403d6385b1cSHajimu UMEMOTO * documented as "Rule 8". However, since it is also 404d6385b1cSHajimu UMEMOTO * documented that this rule can be overridden, we assign 405d6385b1cSHajimu UMEMOTO * a large number so that it is easy to assign smaller numbers 406d6385b1cSHajimu UMEMOTO * to more preferred rules. 407d6385b1cSHajimu UMEMOTO */ 408a1f7e5f8SHajimu UMEMOTO new_matchlen = in6_matchlen(&ia->ia_addr.sin6_addr, &dst); 409d6385b1cSHajimu UMEMOTO if (best_matchlen < new_matchlen) 410d6385b1cSHajimu UMEMOTO REPLACE(14); 411d6385b1cSHajimu UMEMOTO if (new_matchlen < best_matchlen) 412d6385b1cSHajimu UMEMOTO NEXT(14); 413d6385b1cSHajimu UMEMOTO 414d6385b1cSHajimu UMEMOTO /* Rule 15 is reserved. */ 415d6385b1cSHajimu UMEMOTO 416d6385b1cSHajimu UMEMOTO /* 417d6385b1cSHajimu UMEMOTO * Last resort: just keep the current candidate. 418d6385b1cSHajimu UMEMOTO * Or, do we need more rules? 419d6385b1cSHajimu UMEMOTO */ 420d6385b1cSHajimu UMEMOTO continue; 421d6385b1cSHajimu UMEMOTO 422d6385b1cSHajimu UMEMOTO replace: 423d6385b1cSHajimu UMEMOTO ia_best = ia; 424d6385b1cSHajimu UMEMOTO best_scope = (new_scope >= 0 ? new_scope : 425d6385b1cSHajimu UMEMOTO in6_addrscope(&ia_best->ia_addr.sin6_addr)); 426d6385b1cSHajimu UMEMOTO best_policy = (new_policy ? new_policy : 427d6385b1cSHajimu UMEMOTO lookup_addrsel_policy(&ia_best->ia_addr)); 428d6385b1cSHajimu UMEMOTO best_matchlen = (new_matchlen >= 0 ? new_matchlen : 429d6385b1cSHajimu UMEMOTO in6_matchlen(&ia_best->ia_addr.sin6_addr, 430a1f7e5f8SHajimu UMEMOTO &dst)); 431d6385b1cSHajimu UMEMOTO 432d6385b1cSHajimu UMEMOTO next: 433d6385b1cSHajimu UMEMOTO continue; 434d6385b1cSHajimu UMEMOTO 435d6385b1cSHajimu UMEMOTO out: 436d6385b1cSHajimu UMEMOTO break; 437d6385b1cSHajimu UMEMOTO } 438d6385b1cSHajimu UMEMOTO 439d6385b1cSHajimu UMEMOTO if ((ia = ia_best) == NULL) { 440686cdd19SJun-ichiro itojun Hagino *errorp = EADDRNOTAVAIL; 441d6385b1cSHajimu UMEMOTO return (NULL); 442686cdd19SJun-ichiro itojun Hagino } 443686cdd19SJun-ichiro itojun Hagino 444a1f7e5f8SHajimu UMEMOTO if (ifpp) 445a1f7e5f8SHajimu UMEMOTO *ifpp = ifp; 446a1f7e5f8SHajimu UMEMOTO 447d6385b1cSHajimu UMEMOTO return (&ia->ia_addr.sin6_addr); 448d6385b1cSHajimu UMEMOTO } 449d6385b1cSHajimu UMEMOTO 4501272577eSXin LI /* 4511272577eSXin LI * clone - meaningful only for bsdi and freebsd 4521272577eSXin LI */ 453d6385b1cSHajimu UMEMOTO static int 4541272577eSXin LI selectroute(struct sockaddr_in6 *dstsock, struct ip6_pktopts *opts, 4551272577eSXin LI struct ip6_moptions *mopts, struct route_in6 *ro, 4561272577eSXin LI struct ifnet **retifp, struct rtentry **retrt, int clone, 4571272577eSXin LI int norouteok) 458d6385b1cSHajimu UMEMOTO { 459d6385b1cSHajimu UMEMOTO int error = 0; 460d6385b1cSHajimu UMEMOTO struct ifnet *ifp = NULL; 461d6385b1cSHajimu UMEMOTO struct rtentry *rt = NULL; 462d6385b1cSHajimu UMEMOTO struct sockaddr_in6 *sin6_next; 463d6385b1cSHajimu UMEMOTO struct in6_pktinfo *pi = NULL; 464d6385b1cSHajimu UMEMOTO struct in6_addr *dst = &dstsock->sin6_addr; 465d6385b1cSHajimu UMEMOTO #if 0 4661d54aa3bSBjoern A. Zeeb char ip6buf[INET6_ADDRSTRLEN]; 4671d54aa3bSBjoern A. Zeeb 468d6385b1cSHajimu UMEMOTO if (dstsock->sin6_addr.s6_addr32[0] == 0 && 469d6385b1cSHajimu UMEMOTO dstsock->sin6_addr.s6_addr32[1] == 0 && 470d6385b1cSHajimu UMEMOTO !IN6_IS_ADDR_LOOPBACK(&dstsock->sin6_addr)) { 471d6385b1cSHajimu UMEMOTO printf("in6_selectroute: strange destination %s\n", 4721d54aa3bSBjoern A. Zeeb ip6_sprintf(ip6buf, &dstsock->sin6_addr)); 473d6385b1cSHajimu UMEMOTO } else { 474d6385b1cSHajimu UMEMOTO printf("in6_selectroute: destination = %s%%%d\n", 4751d54aa3bSBjoern A. Zeeb ip6_sprintf(ip6buf, &dstsock->sin6_addr), 476d6385b1cSHajimu UMEMOTO dstsock->sin6_scope_id); /* for debug */ 477d6385b1cSHajimu UMEMOTO } 478d6385b1cSHajimu UMEMOTO #endif 479d6385b1cSHajimu UMEMOTO 480d6385b1cSHajimu UMEMOTO /* If the caller specify the outgoing interface explicitly, use it. */ 481d6385b1cSHajimu UMEMOTO if (opts && (pi = opts->ip6po_pktinfo) != NULL && pi->ipi6_ifindex) { 482d6385b1cSHajimu UMEMOTO /* XXX boundary check is assumed to be already done. */ 483d6385b1cSHajimu UMEMOTO ifp = ifnet_byindex(pi->ipi6_ifindex); 484d6385b1cSHajimu UMEMOTO if (ifp != NULL && 485a1f7e5f8SHajimu UMEMOTO (norouteok || retrt == NULL || 486a1f7e5f8SHajimu UMEMOTO IN6_IS_ADDR_MULTICAST(dst))) { 487d6385b1cSHajimu UMEMOTO /* 488cd0fdcf7SHajimu UMEMOTO * we do not have to check or get the route for 489d6385b1cSHajimu UMEMOTO * multicast. 490d6385b1cSHajimu UMEMOTO */ 491d6385b1cSHajimu UMEMOTO goto done; 492d6385b1cSHajimu UMEMOTO } else 493d6385b1cSHajimu UMEMOTO goto getroute; 494d6385b1cSHajimu UMEMOTO } 495d6385b1cSHajimu UMEMOTO 496d6385b1cSHajimu UMEMOTO /* 497d6385b1cSHajimu UMEMOTO * If the destination address is a multicast address and the outgoing 498d6385b1cSHajimu UMEMOTO * interface for the address is specified by the caller, use it. 499d6385b1cSHajimu UMEMOTO */ 500d6385b1cSHajimu UMEMOTO if (IN6_IS_ADDR_MULTICAST(dst) && 501d6385b1cSHajimu UMEMOTO mopts != NULL && (ifp = mopts->im6o_multicast_ifp) != NULL) { 502d6385b1cSHajimu UMEMOTO goto done; /* we do not need a route for multicast. */ 503d6385b1cSHajimu UMEMOTO } 504d6385b1cSHajimu UMEMOTO 505d6385b1cSHajimu UMEMOTO getroute: 506d6385b1cSHajimu UMEMOTO /* 507d6385b1cSHajimu UMEMOTO * If the next hop address for the packet is specified by the caller, 508d6385b1cSHajimu UMEMOTO * use it as the gateway. 509d6385b1cSHajimu UMEMOTO */ 510d6385b1cSHajimu UMEMOTO if (opts && opts->ip6po_nexthop) { 511d6385b1cSHajimu UMEMOTO struct route_in6 *ron; 512d6385b1cSHajimu UMEMOTO 513d6385b1cSHajimu UMEMOTO sin6_next = satosin6(opts->ip6po_nexthop); 514d6385b1cSHajimu UMEMOTO 515d6385b1cSHajimu UMEMOTO /* at this moment, we only support AF_INET6 next hops */ 516d6385b1cSHajimu UMEMOTO if (sin6_next->sin6_family != AF_INET6) { 517d6385b1cSHajimu UMEMOTO error = EAFNOSUPPORT; /* or should we proceed? */ 518d6385b1cSHajimu UMEMOTO goto done; 519d6385b1cSHajimu UMEMOTO } 520d6385b1cSHajimu UMEMOTO 521d6385b1cSHajimu UMEMOTO /* 522d6385b1cSHajimu UMEMOTO * If the next hop is an IPv6 address, then the node identified 523d6385b1cSHajimu UMEMOTO * by that address must be a neighbor of the sending host. 524d6385b1cSHajimu UMEMOTO */ 525d6385b1cSHajimu UMEMOTO ron = &opts->ip6po_nextroute; 526d6385b1cSHajimu UMEMOTO if ((ron->ro_rt && 527d6385b1cSHajimu UMEMOTO (ron->ro_rt->rt_flags & (RTF_UP | RTF_LLINFO)) != 528d6385b1cSHajimu UMEMOTO (RTF_UP | RTF_LLINFO)) || 529c1a049acSSUZUKI Shinsuke !IN6_ARE_ADDR_EQUAL(&satosin6(&ron->ro_dst)->sin6_addr, 530c1a049acSSUZUKI Shinsuke &sin6_next->sin6_addr)) { 531d6385b1cSHajimu UMEMOTO if (ron->ro_rt) { 532d6385b1cSHajimu UMEMOTO RTFREE(ron->ro_rt); 533d6385b1cSHajimu UMEMOTO ron->ro_rt = NULL; 534d6385b1cSHajimu UMEMOTO } 535d6385b1cSHajimu UMEMOTO *satosin6(&ron->ro_dst) = *sin6_next; 536d6385b1cSHajimu UMEMOTO } 537d6385b1cSHajimu UMEMOTO if (ron->ro_rt == NULL) { 538d6385b1cSHajimu UMEMOTO rtalloc((struct route *)ron); /* multi path case? */ 539d6385b1cSHajimu UMEMOTO if (ron->ro_rt == NULL || 540d6385b1cSHajimu UMEMOTO !(ron->ro_rt->rt_flags & RTF_LLINFO)) { 541d6385b1cSHajimu UMEMOTO if (ron->ro_rt) { 542d6385b1cSHajimu UMEMOTO RTFREE(ron->ro_rt); 543d6385b1cSHajimu UMEMOTO ron->ro_rt = NULL; 544d6385b1cSHajimu UMEMOTO } 545d6385b1cSHajimu UMEMOTO error = EHOSTUNREACH; 546d6385b1cSHajimu UMEMOTO goto done; 547d6385b1cSHajimu UMEMOTO } 548d6385b1cSHajimu UMEMOTO } 549d6385b1cSHajimu UMEMOTO rt = ron->ro_rt; 550d6385b1cSHajimu UMEMOTO ifp = rt->rt_ifp; 551d6385b1cSHajimu UMEMOTO 552d6385b1cSHajimu UMEMOTO /* 553d6385b1cSHajimu UMEMOTO * When cloning is required, try to allocate a route to the 554d6385b1cSHajimu UMEMOTO * destination so that the caller can store path MTU 555d6385b1cSHajimu UMEMOTO * information. 556d6385b1cSHajimu UMEMOTO */ 557d6385b1cSHajimu UMEMOTO if (!clone) 558d6385b1cSHajimu UMEMOTO goto done; 559d6385b1cSHajimu UMEMOTO } 560d6385b1cSHajimu UMEMOTO 561d6385b1cSHajimu UMEMOTO /* 562d6385b1cSHajimu UMEMOTO * Use a cached route if it exists and is valid, else try to allocate 563d6385b1cSHajimu UMEMOTO * a new one. Note that we should check the address family of the 564d6385b1cSHajimu UMEMOTO * cached destination, in case of sharing the cache with IPv4. 565686cdd19SJun-ichiro itojun Hagino */ 566686cdd19SJun-ichiro itojun Hagino if (ro) { 567686cdd19SJun-ichiro itojun Hagino if (ro->ro_rt && 56854c1b882SHajimu UMEMOTO (!(ro->ro_rt->rt_flags & RTF_UP) || 569d6385b1cSHajimu UMEMOTO ((struct sockaddr *)(&ro->ro_dst))->sa_family != AF_INET6 || 57054c1b882SHajimu UMEMOTO !IN6_ARE_ADDR_EQUAL(&satosin6(&ro->ro_dst)->sin6_addr, 57154c1b882SHajimu UMEMOTO dst))) { 572686cdd19SJun-ichiro itojun Hagino RTFREE(ro->ro_rt); 573d6385b1cSHajimu UMEMOTO ro->ro_rt = (struct rtentry *)NULL; 574686cdd19SJun-ichiro itojun Hagino } 575d6385b1cSHajimu UMEMOTO if (ro->ro_rt == (struct rtentry *)NULL) { 57633841545SHajimu UMEMOTO struct sockaddr_in6 *sa6; 57733841545SHajimu UMEMOTO 578686cdd19SJun-ichiro itojun Hagino /* No route yet, so try to acquire one */ 579686cdd19SJun-ichiro itojun Hagino bzero(&ro->ro_dst, sizeof(struct sockaddr_in6)); 58033841545SHajimu UMEMOTO sa6 = (struct sockaddr_in6 *)&ro->ro_dst; 581d6385b1cSHajimu UMEMOTO *sa6 = *dstsock; 582e6a27350SHajimu UMEMOTO sa6->sin6_scope_id = 0; 58397d8d152SAndre Oppermann 584d6385b1cSHajimu UMEMOTO if (clone) { 585e440aed9SQing Li #ifdef RADIX_MPATH 586e440aed9SQing Li rtalloc_mpath((struct route *)ro, 587e440aed9SQing Li ntohl(sa6->sin6_addr.s6_addr32[3])); 588e440aed9SQing Li #else 589d6385b1cSHajimu UMEMOTO rtalloc((struct route *)ro); 590e440aed9SQing Li #endif 591d6385b1cSHajimu UMEMOTO } else { 592686cdd19SJun-ichiro itojun Hagino ro->ro_rt = rtalloc1(&((struct route *)ro) 593a89ec05eSPeter Wemm ->ro_dst, 0, 0UL); 59437bdc280SSam Leffler if (ro->ro_rt) 595d1dd20beSSam Leffler RT_UNLOCK(ro->ro_rt); 596686cdd19SJun-ichiro itojun Hagino } 597686cdd19SJun-ichiro itojun Hagino } 598686cdd19SJun-ichiro itojun Hagino 599686cdd19SJun-ichiro itojun Hagino /* 600d6385b1cSHajimu UMEMOTO * do not care about the result if we have the nexthop 601d6385b1cSHajimu UMEMOTO * explicitly specified. 602686cdd19SJun-ichiro itojun Hagino */ 603d6385b1cSHajimu UMEMOTO if (opts && opts->ip6po_nexthop) 604d6385b1cSHajimu UMEMOTO goto done; 605686cdd19SJun-ichiro itojun Hagino 606686cdd19SJun-ichiro itojun Hagino if (ro->ro_rt) { 607d6385b1cSHajimu UMEMOTO ifp = ro->ro_rt->rt_ifp; 608d6385b1cSHajimu UMEMOTO 609d6385b1cSHajimu UMEMOTO if (ifp == NULL) { /* can this really happen? */ 610d6385b1cSHajimu UMEMOTO RTFREE(ro->ro_rt); 611d6385b1cSHajimu UMEMOTO ro->ro_rt = NULL; 612686cdd19SJun-ichiro itojun Hagino } 613686cdd19SJun-ichiro itojun Hagino } 614d6385b1cSHajimu UMEMOTO if (ro->ro_rt == NULL) 615d6385b1cSHajimu UMEMOTO error = EHOSTUNREACH; 616d6385b1cSHajimu UMEMOTO rt = ro->ro_rt; 617d6385b1cSHajimu UMEMOTO 618d6385b1cSHajimu UMEMOTO /* 619d6385b1cSHajimu UMEMOTO * Check if the outgoing interface conflicts with 620d6385b1cSHajimu UMEMOTO * the interface specified by ipi6_ifindex (if specified). 621d6385b1cSHajimu UMEMOTO * Note that loopback interface is always okay. 622d6385b1cSHajimu UMEMOTO * (this may happen when we are sending a packet to one of 623d6385b1cSHajimu UMEMOTO * our own addresses.) 624d6385b1cSHajimu UMEMOTO */ 625403cbcf5SGeorge V. Neville-Neil if (ifp && opts && opts->ip6po_pktinfo && 62668efda09SHajimu UMEMOTO opts->ip6po_pktinfo->ipi6_ifindex) { 627d6385b1cSHajimu UMEMOTO if (!(ifp->if_flags & IFF_LOOPBACK) && 628d6385b1cSHajimu UMEMOTO ifp->if_index != 629d6385b1cSHajimu UMEMOTO opts->ip6po_pktinfo->ipi6_ifindex) { 630d6385b1cSHajimu UMEMOTO error = EHOSTUNREACH; 631d6385b1cSHajimu UMEMOTO goto done; 632d6385b1cSHajimu UMEMOTO } 633d6385b1cSHajimu UMEMOTO } 634686cdd19SJun-ichiro itojun Hagino } 635686cdd19SJun-ichiro itojun Hagino 636d6385b1cSHajimu UMEMOTO done: 637d6385b1cSHajimu UMEMOTO if (ifp == NULL && rt == NULL) { 638d6385b1cSHajimu UMEMOTO /* 639d6385b1cSHajimu UMEMOTO * This can happen if the caller did not pass a cached route 640d6385b1cSHajimu UMEMOTO * nor any other hints. We treat this case an error. 641d6385b1cSHajimu UMEMOTO */ 642d6385b1cSHajimu UMEMOTO error = EHOSTUNREACH; 643d6385b1cSHajimu UMEMOTO } 644d6385b1cSHajimu UMEMOTO if (error == EHOSTUNREACH) 645603724d3SBjoern A. Zeeb V_ip6stat.ip6s_noroute++; 646d6385b1cSHajimu UMEMOTO 647d6385b1cSHajimu UMEMOTO if (retifp != NULL) 648d6385b1cSHajimu UMEMOTO *retifp = ifp; 649d6385b1cSHajimu UMEMOTO if (retrt != NULL) 650d6385b1cSHajimu UMEMOTO *retrt = rt; /* rt may be NULL */ 651d6385b1cSHajimu UMEMOTO 652d6385b1cSHajimu UMEMOTO return (error); 653686cdd19SJun-ichiro itojun Hagino } 654686cdd19SJun-ichiro itojun Hagino 655a1f7e5f8SHajimu UMEMOTO static int 6561272577eSXin LI in6_selectif(struct sockaddr_in6 *dstsock, struct ip6_pktopts *opts, 6571272577eSXin LI struct ip6_moptions *mopts, struct route_in6 *ro, struct ifnet **retifp) 658a1f7e5f8SHajimu UMEMOTO { 659a1f7e5f8SHajimu UMEMOTO int error; 660a1f7e5f8SHajimu UMEMOTO struct route_in6 sro; 661a1f7e5f8SHajimu UMEMOTO struct rtentry *rt = NULL; 662a1f7e5f8SHajimu UMEMOTO 663a1f7e5f8SHajimu UMEMOTO if (ro == NULL) { 664a1f7e5f8SHajimu UMEMOTO bzero(&sro, sizeof(sro)); 665a1f7e5f8SHajimu UMEMOTO ro = &sro; 666a1f7e5f8SHajimu UMEMOTO } 667a1f7e5f8SHajimu UMEMOTO 668a1f7e5f8SHajimu UMEMOTO if ((error = selectroute(dstsock, opts, mopts, ro, retifp, 669a1f7e5f8SHajimu UMEMOTO &rt, 0, 1)) != 0) { 670f8366b03SSeigo Tanimura if (ro == &sro && rt && rt == sro.ro_rt) 671a1f7e5f8SHajimu UMEMOTO RTFREE(rt); 672a1f7e5f8SHajimu UMEMOTO return (error); 673a1f7e5f8SHajimu UMEMOTO } 674a1f7e5f8SHajimu UMEMOTO 675a1f7e5f8SHajimu UMEMOTO /* 676a1f7e5f8SHajimu UMEMOTO * do not use a rejected or black hole route. 677a1f7e5f8SHajimu UMEMOTO * XXX: this check should be done in the L2 output routine. 678a1f7e5f8SHajimu UMEMOTO * However, if we skipped this check here, we'd see the following 679a1f7e5f8SHajimu UMEMOTO * scenario: 680a1f7e5f8SHajimu UMEMOTO * - install a rejected route for a scoped address prefix 681a1f7e5f8SHajimu UMEMOTO * (like fe80::/10) 682a1f7e5f8SHajimu UMEMOTO * - send a packet to a destination that matches the scoped prefix, 683a1f7e5f8SHajimu UMEMOTO * with ambiguity about the scope zone. 684a1f7e5f8SHajimu UMEMOTO * - pick the outgoing interface from the route, and disambiguate the 685a1f7e5f8SHajimu UMEMOTO * scope zone with the interface. 686a1f7e5f8SHajimu UMEMOTO * - ip6_output() would try to get another route with the "new" 687a1f7e5f8SHajimu UMEMOTO * destination, which may be valid. 688a1f7e5f8SHajimu UMEMOTO * - we'd see no error on output. 689a1f7e5f8SHajimu UMEMOTO * Although this may not be very harmful, it should still be confusing. 690a1f7e5f8SHajimu UMEMOTO * We thus reject the case here. 691a1f7e5f8SHajimu UMEMOTO */ 692a1f7e5f8SHajimu UMEMOTO if (rt && (rt->rt_flags & (RTF_REJECT | RTF_BLACKHOLE))) { 693a1f7e5f8SHajimu UMEMOTO int flags = (rt->rt_flags & RTF_HOST ? EHOSTUNREACH : ENETUNREACH); 694a1f7e5f8SHajimu UMEMOTO 695f8366b03SSeigo Tanimura if (ro == &sro && rt && rt == sro.ro_rt) 696a1f7e5f8SHajimu UMEMOTO RTFREE(rt); 697a1f7e5f8SHajimu UMEMOTO return (flags); 698a1f7e5f8SHajimu UMEMOTO } 699a1f7e5f8SHajimu UMEMOTO 700a1f7e5f8SHajimu UMEMOTO /* 701a1f7e5f8SHajimu UMEMOTO * Adjust the "outgoing" interface. If we're going to loop the packet 702a1f7e5f8SHajimu UMEMOTO * back to ourselves, the ifp would be the loopback interface. 703a1f7e5f8SHajimu UMEMOTO * However, we'd rather know the interface associated to the 704a1f7e5f8SHajimu UMEMOTO * destination address (which should probably be one of our own 705a1f7e5f8SHajimu UMEMOTO * addresses.) 706a1f7e5f8SHajimu UMEMOTO */ 707a1f7e5f8SHajimu UMEMOTO if (rt && rt->rt_ifa && rt->rt_ifa->ifa_ifp) 708a1f7e5f8SHajimu UMEMOTO *retifp = rt->rt_ifa->ifa_ifp; 709a1f7e5f8SHajimu UMEMOTO 710f8366b03SSeigo Tanimura if (ro == &sro && rt && rt == sro.ro_rt) 711a1f7e5f8SHajimu UMEMOTO RTFREE(rt); 712a1f7e5f8SHajimu UMEMOTO return (0); 713a1f7e5f8SHajimu UMEMOTO } 714a1f7e5f8SHajimu UMEMOTO 7151272577eSXin LI /* 7161272577eSXin LI * clone - meaningful only for bsdi and freebsd 7171272577eSXin LI */ 718a1f7e5f8SHajimu UMEMOTO int 7191272577eSXin LI in6_selectroute(struct sockaddr_in6 *dstsock, struct ip6_pktopts *opts, 7201272577eSXin LI struct ip6_moptions *mopts, struct route_in6 *ro, 7211272577eSXin LI struct ifnet **retifp, struct rtentry **retrt, int clone) 722a1f7e5f8SHajimu UMEMOTO { 7231272577eSXin LI 724a1f7e5f8SHajimu UMEMOTO return (selectroute(dstsock, opts, mopts, ro, retifp, 725a1f7e5f8SHajimu UMEMOTO retrt, clone, 0)); 726a1f7e5f8SHajimu UMEMOTO } 727a1f7e5f8SHajimu UMEMOTO 728686cdd19SJun-ichiro itojun Hagino /* 729686cdd19SJun-ichiro itojun Hagino * Default hop limit selection. The precedence is as follows: 730686cdd19SJun-ichiro itojun Hagino * 1. Hoplimit value specified via ioctl. 731686cdd19SJun-ichiro itojun Hagino * 2. (If the outgoing interface is detected) the current 732686cdd19SJun-ichiro itojun Hagino * hop limit of the interface specified by router advertisement. 733686cdd19SJun-ichiro itojun Hagino * 3. The system default hoplimit. 734686cdd19SJun-ichiro itojun Hagino */ 735686cdd19SJun-ichiro itojun Hagino int 7361272577eSXin LI in6_selecthlim(struct in6pcb *in6p, struct ifnet *ifp) 737686cdd19SJun-ichiro itojun Hagino { 7381272577eSXin LI 739686cdd19SJun-ichiro itojun Hagino if (in6p && in6p->in6p_hops >= 0) 740686cdd19SJun-ichiro itojun Hagino return (in6p->in6p_hops); 741686cdd19SJun-ichiro itojun Hagino else if (ifp) 74231b1bfe1SHajimu UMEMOTO return (ND_IFINFO(ifp)->chlim); 74397d8d152SAndre Oppermann else if (in6p && !IN6_IS_ADDR_UNSPECIFIED(&in6p->in6p_faddr)) { 74497d8d152SAndre Oppermann struct route_in6 ro6; 74597d8d152SAndre Oppermann struct ifnet *lifp; 74697d8d152SAndre Oppermann 74797d8d152SAndre Oppermann bzero(&ro6, sizeof(ro6)); 74897d8d152SAndre Oppermann ro6.ro_dst.sin6_family = AF_INET6; 74997d8d152SAndre Oppermann ro6.ro_dst.sin6_len = sizeof(struct sockaddr_in6); 75097d8d152SAndre Oppermann ro6.ro_dst.sin6_addr = in6p->in6p_faddr; 75197d8d152SAndre Oppermann rtalloc((struct route *)&ro6); 75297d8d152SAndre Oppermann if (ro6.ro_rt) { 75397d8d152SAndre Oppermann lifp = ro6.ro_rt->rt_ifp; 75497d8d152SAndre Oppermann RTFREE(ro6.ro_rt); 75597d8d152SAndre Oppermann if (lifp) 75697d8d152SAndre Oppermann return (ND_IFINFO(lifp)->chlim); 75797d8d152SAndre Oppermann } else 758603724d3SBjoern A. Zeeb return (V_ip6_defhlim); 75997d8d152SAndre Oppermann } 760603724d3SBjoern A. Zeeb return (V_ip6_defhlim); 761686cdd19SJun-ichiro itojun Hagino } 762686cdd19SJun-ichiro itojun Hagino 763686cdd19SJun-ichiro itojun Hagino /* 764686cdd19SJun-ichiro itojun Hagino * XXX: this is borrowed from in6_pcbbind(). If possible, we should 765686cdd19SJun-ichiro itojun Hagino * share this function by all *bsd*... 766686cdd19SJun-ichiro itojun Hagino */ 767686cdd19SJun-ichiro itojun Hagino int 7681272577eSXin LI in6_pcbsetport(struct in6_addr *laddr, struct inpcb *inp, struct ucred *cred) 769686cdd19SJun-ichiro itojun Hagino { 770686cdd19SJun-ichiro itojun Hagino struct socket *so = inp->inp_socket; 771686cdd19SJun-ichiro itojun Hagino u_int16_t lport = 0, first, last, *lastport; 772686cdd19SJun-ichiro itojun Hagino int count, error = 0, wild = 0; 773686cdd19SJun-ichiro itojun Hagino struct inpcbinfo *pcbinfo = inp->inp_pcbinfo; 774686cdd19SJun-ichiro itojun Hagino 7758deea4a8SRobert Watson INP_INFO_WLOCK_ASSERT(pcbinfo); 7768501a69cSRobert Watson INP_WLOCK_ASSERT(inp); 7778deea4a8SRobert Watson 778686cdd19SJun-ichiro itojun Hagino /* XXX: this is redundant when called from in6_pcbbind */ 779686cdd19SJun-ichiro itojun Hagino if ((so->so_options & (SO_REUSEADDR|SO_REUSEPORT)) == 0) 780686cdd19SJun-ichiro itojun Hagino wild = INPLOOKUP_WILDCARD; 781686cdd19SJun-ichiro itojun Hagino 782686cdd19SJun-ichiro itojun Hagino inp->inp_flags |= INP_ANONPORT; 783686cdd19SJun-ichiro itojun Hagino 784686cdd19SJun-ichiro itojun Hagino if (inp->inp_flags & INP_HIGHPORT) { 785603724d3SBjoern A. Zeeb first = V_ipport_hifirstauto; /* sysctl */ 786603724d3SBjoern A. Zeeb last = V_ipport_hilastauto; 787712fc218SRobert Watson lastport = &pcbinfo->ipi_lasthi; 788686cdd19SJun-ichiro itojun Hagino } else if (inp->inp_flags & INP_LOWPORT) { 78932f9753cSRobert Watson error = priv_check_cred(cred, PRIV_NETINET_RESERVEDPORT, 0); 790acd3428bSRobert Watson if (error) 791686cdd19SJun-ichiro itojun Hagino return error; 792603724d3SBjoern A. Zeeb first = V_ipport_lowfirstauto; /* 1023 */ 793603724d3SBjoern A. Zeeb last = V_ipport_lowlastauto; /* 600 */ 794712fc218SRobert Watson lastport = &pcbinfo->ipi_lastlow; 795686cdd19SJun-ichiro itojun Hagino } else { 796603724d3SBjoern A. Zeeb first = V_ipport_firstauto; /* sysctl */ 797603724d3SBjoern A. Zeeb last = V_ipport_lastauto; 798712fc218SRobert Watson lastport = &pcbinfo->ipi_lastport; 799686cdd19SJun-ichiro itojun Hagino } 800686cdd19SJun-ichiro itojun Hagino /* 801686cdd19SJun-ichiro itojun Hagino * Simple check to ensure all ports are not used up causing 802686cdd19SJun-ichiro itojun Hagino * a deadlock here. 803686cdd19SJun-ichiro itojun Hagino * 804686cdd19SJun-ichiro itojun Hagino * We split the two cases (up and down) so that the direction 805686cdd19SJun-ichiro itojun Hagino * is not being tested on each round of the loop. 806686cdd19SJun-ichiro itojun Hagino */ 807686cdd19SJun-ichiro itojun Hagino if (first > last) { 808686cdd19SJun-ichiro itojun Hagino /* 809686cdd19SJun-ichiro itojun Hagino * counting down 810686cdd19SJun-ichiro itojun Hagino */ 811686cdd19SJun-ichiro itojun Hagino count = first - last; 812686cdd19SJun-ichiro itojun Hagino 813686cdd19SJun-ichiro itojun Hagino do { 814686cdd19SJun-ichiro itojun Hagino if (count-- < 0) { /* completely used? */ 815686cdd19SJun-ichiro itojun Hagino /* 816686cdd19SJun-ichiro itojun Hagino * Undo any address bind that may have 817686cdd19SJun-ichiro itojun Hagino * occurred above. 818686cdd19SJun-ichiro itojun Hagino */ 819686cdd19SJun-ichiro itojun Hagino inp->in6p_laddr = in6addr_any; 820686cdd19SJun-ichiro itojun Hagino return (EAGAIN); 821686cdd19SJun-ichiro itojun Hagino } 822686cdd19SJun-ichiro itojun Hagino --*lastport; 823686cdd19SJun-ichiro itojun Hagino if (*lastport > first || *lastport < last) 824686cdd19SJun-ichiro itojun Hagino *lastport = first; 825686cdd19SJun-ichiro itojun Hagino lport = htons(*lastport); 82668efda09SHajimu UMEMOTO } while (in6_pcblookup_local(pcbinfo, &inp->in6p_laddr, 827078b7042SBjoern A. Zeeb lport, wild, cred)); 828686cdd19SJun-ichiro itojun Hagino } else { 829686cdd19SJun-ichiro itojun Hagino /* 830686cdd19SJun-ichiro itojun Hagino * counting up 831686cdd19SJun-ichiro itojun Hagino */ 832686cdd19SJun-ichiro itojun Hagino count = last - first; 833686cdd19SJun-ichiro itojun Hagino 834686cdd19SJun-ichiro itojun Hagino do { 835686cdd19SJun-ichiro itojun Hagino if (count-- < 0) { /* completely used? */ 836686cdd19SJun-ichiro itojun Hagino /* 837686cdd19SJun-ichiro itojun Hagino * Undo any address bind that may have 838686cdd19SJun-ichiro itojun Hagino * occurred above. 839686cdd19SJun-ichiro itojun Hagino */ 840686cdd19SJun-ichiro itojun Hagino inp->in6p_laddr = in6addr_any; 841686cdd19SJun-ichiro itojun Hagino return (EAGAIN); 842686cdd19SJun-ichiro itojun Hagino } 843686cdd19SJun-ichiro itojun Hagino ++*lastport; 844686cdd19SJun-ichiro itojun Hagino if (*lastport < first || *lastport > last) 845686cdd19SJun-ichiro itojun Hagino *lastport = first; 846686cdd19SJun-ichiro itojun Hagino lport = htons(*lastport); 847078b7042SBjoern A. Zeeb } while (in6_pcblookup_local(pcbinfo, &inp->in6p_laddr, 848078b7042SBjoern A. Zeeb lport, wild, cred)); 849686cdd19SJun-ichiro itojun Hagino } 850686cdd19SJun-ichiro itojun Hagino 851686cdd19SJun-ichiro itojun Hagino inp->inp_lport = lport; 852686cdd19SJun-ichiro itojun Hagino if (in_pcbinshash(inp) != 0) { 853686cdd19SJun-ichiro itojun Hagino inp->in6p_laddr = in6addr_any; 854686cdd19SJun-ichiro itojun Hagino inp->inp_lport = 0; 855686cdd19SJun-ichiro itojun Hagino return (EAGAIN); 856686cdd19SJun-ichiro itojun Hagino } 857686cdd19SJun-ichiro itojun Hagino 858686cdd19SJun-ichiro itojun Hagino return (0); 859686cdd19SJun-ichiro itojun Hagino } 860686cdd19SJun-ichiro itojun Hagino 8617fc91b3fSHajimu UMEMOTO void 8621272577eSXin LI addrsel_policy_init(void) 8637fc91b3fSHajimu UMEMOTO { 8647fc91b3fSHajimu UMEMOTO ADDRSEL_LOCK_INIT(); 8655d525653SHajimu UMEMOTO ADDRSEL_SXLOCK_INIT(); 8667fc91b3fSHajimu UMEMOTO 8677fc91b3fSHajimu UMEMOTO init_policy_queue(); 8687fc91b3fSHajimu UMEMOTO 8697fc91b3fSHajimu UMEMOTO /* initialize the "last resort" policy */ 870603724d3SBjoern A. Zeeb bzero(&V_defaultaddrpolicy, sizeof(V_defaultaddrpolicy)); 871603724d3SBjoern A. Zeeb V_defaultaddrpolicy.label = ADDR_LABEL_NOTAPP; 8727fc91b3fSHajimu UMEMOTO } 8737fc91b3fSHajimu UMEMOTO 874d6385b1cSHajimu UMEMOTO static struct in6_addrpolicy * 8751272577eSXin LI lookup_addrsel_policy(struct sockaddr_in6 *key) 876d6385b1cSHajimu UMEMOTO { 877d6385b1cSHajimu UMEMOTO struct in6_addrpolicy *match = NULL; 878d6385b1cSHajimu UMEMOTO 879d6385b1cSHajimu UMEMOTO ADDRSEL_LOCK(); 880d6385b1cSHajimu UMEMOTO match = match_addrsel_policy(key); 881d6385b1cSHajimu UMEMOTO 882d6385b1cSHajimu UMEMOTO if (match == NULL) 883603724d3SBjoern A. Zeeb match = &V_defaultaddrpolicy; 884d6385b1cSHajimu UMEMOTO else 885d6385b1cSHajimu UMEMOTO match->use++; 886d6385b1cSHajimu UMEMOTO ADDRSEL_UNLOCK(); 887d6385b1cSHajimu UMEMOTO 888d6385b1cSHajimu UMEMOTO return (match); 889d6385b1cSHajimu UMEMOTO } 890d6385b1cSHajimu UMEMOTO 8917fc91b3fSHajimu UMEMOTO /* 8927fc91b3fSHajimu UMEMOTO * Subroutines to manage the address selection policy table via sysctl. 8937fc91b3fSHajimu UMEMOTO */ 8947fc91b3fSHajimu UMEMOTO struct walkarg { 8957fc91b3fSHajimu UMEMOTO struct sysctl_req *w_req; 8967fc91b3fSHajimu UMEMOTO }; 8977fc91b3fSHajimu UMEMOTO 8987fc91b3fSHajimu UMEMOTO static int in6_src_sysctl(SYSCTL_HANDLER_ARGS); 8997fc91b3fSHajimu UMEMOTO SYSCTL_DECL(_net_inet6_ip6); 9007fc91b3fSHajimu UMEMOTO SYSCTL_NODE(_net_inet6_ip6, IPV6CTL_ADDRCTLPOLICY, addrctlpolicy, 9017fc91b3fSHajimu UMEMOTO CTLFLAG_RD, in6_src_sysctl, ""); 9027fc91b3fSHajimu UMEMOTO 9037fc91b3fSHajimu UMEMOTO static int 9047fc91b3fSHajimu UMEMOTO in6_src_sysctl(SYSCTL_HANDLER_ARGS) 9057fc91b3fSHajimu UMEMOTO { 9067fc91b3fSHajimu UMEMOTO struct walkarg w; 9077fc91b3fSHajimu UMEMOTO 9087fc91b3fSHajimu UMEMOTO if (req->newptr) 9097fc91b3fSHajimu UMEMOTO return EPERM; 9107fc91b3fSHajimu UMEMOTO 9117fc91b3fSHajimu UMEMOTO bzero(&w, sizeof(w)); 9127fc91b3fSHajimu UMEMOTO w.w_req = req; 9137fc91b3fSHajimu UMEMOTO 9147fc91b3fSHajimu UMEMOTO return (walk_addrsel_policy(dump_addrsel_policyent, &w)); 9157fc91b3fSHajimu UMEMOTO } 9167fc91b3fSHajimu UMEMOTO 9177fc91b3fSHajimu UMEMOTO int 9181272577eSXin LI in6_src_ioctl(u_long cmd, caddr_t data) 9197fc91b3fSHajimu UMEMOTO { 9207fc91b3fSHajimu UMEMOTO int i; 9217fc91b3fSHajimu UMEMOTO struct in6_addrpolicy ent0; 9227fc91b3fSHajimu UMEMOTO 9237fc91b3fSHajimu UMEMOTO if (cmd != SIOCAADDRCTL_POLICY && cmd != SIOCDADDRCTL_POLICY) 9247fc91b3fSHajimu UMEMOTO return (EOPNOTSUPP); /* check for safety */ 9257fc91b3fSHajimu UMEMOTO 9267fc91b3fSHajimu UMEMOTO ent0 = *(struct in6_addrpolicy *)data; 9277fc91b3fSHajimu UMEMOTO 9287fc91b3fSHajimu UMEMOTO if (ent0.label == ADDR_LABEL_NOTAPP) 9297fc91b3fSHajimu UMEMOTO return (EINVAL); 9307fc91b3fSHajimu UMEMOTO /* check if the prefix mask is consecutive. */ 9317fc91b3fSHajimu UMEMOTO if (in6_mask2len(&ent0.addrmask.sin6_addr, NULL) < 0) 9327fc91b3fSHajimu UMEMOTO return (EINVAL); 9337fc91b3fSHajimu UMEMOTO /* clear trailing garbages (if any) of the prefix address. */ 9347fc91b3fSHajimu UMEMOTO for (i = 0; i < 4; i++) { 9357fc91b3fSHajimu UMEMOTO ent0.addr.sin6_addr.s6_addr32[i] &= 9367fc91b3fSHajimu UMEMOTO ent0.addrmask.sin6_addr.s6_addr32[i]; 9377fc91b3fSHajimu UMEMOTO } 9387fc91b3fSHajimu UMEMOTO ent0.use = 0; 9397fc91b3fSHajimu UMEMOTO 9407fc91b3fSHajimu UMEMOTO switch (cmd) { 9417fc91b3fSHajimu UMEMOTO case SIOCAADDRCTL_POLICY: 9427fc91b3fSHajimu UMEMOTO return (add_addrsel_policyent(&ent0)); 9437fc91b3fSHajimu UMEMOTO case SIOCDADDRCTL_POLICY: 9447fc91b3fSHajimu UMEMOTO return (delete_addrsel_policyent(&ent0)); 9457fc91b3fSHajimu UMEMOTO } 9467fc91b3fSHajimu UMEMOTO 9477fc91b3fSHajimu UMEMOTO return (0); /* XXX: compromise compilers */ 9487fc91b3fSHajimu UMEMOTO } 9497fc91b3fSHajimu UMEMOTO 9507fc91b3fSHajimu UMEMOTO /* 9517fc91b3fSHajimu UMEMOTO * The followings are implementation of the policy table using a 9527fc91b3fSHajimu UMEMOTO * simple tail queue. 9537fc91b3fSHajimu UMEMOTO * XXX such details should be hidden. 9547fc91b3fSHajimu UMEMOTO * XXX implementation using binary tree should be more efficient. 9557fc91b3fSHajimu UMEMOTO */ 9567fc91b3fSHajimu UMEMOTO struct addrsel_policyent { 9577fc91b3fSHajimu UMEMOTO TAILQ_ENTRY(addrsel_policyent) ape_entry; 9587fc91b3fSHajimu UMEMOTO struct in6_addrpolicy ape_policy; 9597fc91b3fSHajimu UMEMOTO }; 9607fc91b3fSHajimu UMEMOTO 9617fc91b3fSHajimu UMEMOTO TAILQ_HEAD(addrsel_policyhead, addrsel_policyent); 9627fc91b3fSHajimu UMEMOTO 9637fc91b3fSHajimu UMEMOTO struct addrsel_policyhead addrsel_policytab; 9647fc91b3fSHajimu UMEMOTO 9657fc91b3fSHajimu UMEMOTO static void 9661272577eSXin LI init_policy_queue(void) 9677fc91b3fSHajimu UMEMOTO { 9681272577eSXin LI 969603724d3SBjoern A. Zeeb TAILQ_INIT(&V_addrsel_policytab); 9707fc91b3fSHajimu UMEMOTO } 9717fc91b3fSHajimu UMEMOTO 9727fc91b3fSHajimu UMEMOTO static int 9731272577eSXin LI add_addrsel_policyent(struct in6_addrpolicy *newpolicy) 9747fc91b3fSHajimu UMEMOTO { 9757fc91b3fSHajimu UMEMOTO struct addrsel_policyent *new, *pol; 9767fc91b3fSHajimu UMEMOTO 977349b668aSHajimu UMEMOTO MALLOC(new, struct addrsel_policyent *, sizeof(*new), M_IFADDR, 978349b668aSHajimu UMEMOTO M_WAITOK); 9795d525653SHajimu UMEMOTO ADDRSEL_XLOCK(); 9807fc91b3fSHajimu UMEMOTO ADDRSEL_LOCK(); 9817fc91b3fSHajimu UMEMOTO 9827fc91b3fSHajimu UMEMOTO /* duplication check */ 983603724d3SBjoern A. Zeeb TAILQ_FOREACH(pol, &V_addrsel_policytab, ape_entry) { 984c1a049acSSUZUKI Shinsuke if (IN6_ARE_ADDR_EQUAL(&newpolicy->addr.sin6_addr, 985c1a049acSSUZUKI Shinsuke &pol->ape_policy.addr.sin6_addr) && 986c1a049acSSUZUKI Shinsuke IN6_ARE_ADDR_EQUAL(&newpolicy->addrmask.sin6_addr, 987c1a049acSSUZUKI Shinsuke &pol->ape_policy.addrmask.sin6_addr)) { 988349b668aSHajimu UMEMOTO ADDRSEL_UNLOCK(); 9895d525653SHajimu UMEMOTO ADDRSEL_XUNLOCK(); 990349b668aSHajimu UMEMOTO FREE(new, M_IFADDR); 9917fc91b3fSHajimu UMEMOTO return (EEXIST); /* or override it? */ 9927fc91b3fSHajimu UMEMOTO } 9937fc91b3fSHajimu UMEMOTO } 9947fc91b3fSHajimu UMEMOTO 9957fc91b3fSHajimu UMEMOTO bzero(new, sizeof(*new)); 9967fc91b3fSHajimu UMEMOTO 9977fc91b3fSHajimu UMEMOTO /* XXX: should validate entry */ 9987fc91b3fSHajimu UMEMOTO new->ape_policy = *newpolicy; 9997fc91b3fSHajimu UMEMOTO 1000603724d3SBjoern A. Zeeb TAILQ_INSERT_TAIL(&V_addrsel_policytab, new, ape_entry); 10017fc91b3fSHajimu UMEMOTO ADDRSEL_UNLOCK(); 10025d525653SHajimu UMEMOTO ADDRSEL_XUNLOCK(); 10037fc91b3fSHajimu UMEMOTO 10047fc91b3fSHajimu UMEMOTO return (0); 10057fc91b3fSHajimu UMEMOTO } 10067fc91b3fSHajimu UMEMOTO 10077fc91b3fSHajimu UMEMOTO static int 10081272577eSXin LI delete_addrsel_policyent(struct in6_addrpolicy *key) 10097fc91b3fSHajimu UMEMOTO { 10107fc91b3fSHajimu UMEMOTO struct addrsel_policyent *pol; 10117fc91b3fSHajimu UMEMOTO 10125d525653SHajimu UMEMOTO ADDRSEL_XLOCK(); 10137fc91b3fSHajimu UMEMOTO ADDRSEL_LOCK(); 10147fc91b3fSHajimu UMEMOTO 10157fc91b3fSHajimu UMEMOTO /* search for the entry in the table */ 1016603724d3SBjoern A. Zeeb TAILQ_FOREACH(pol, &V_addrsel_policytab, ape_entry) { 1017c1a049acSSUZUKI Shinsuke if (IN6_ARE_ADDR_EQUAL(&key->addr.sin6_addr, 1018c1a049acSSUZUKI Shinsuke &pol->ape_policy.addr.sin6_addr) && 1019c1a049acSSUZUKI Shinsuke IN6_ARE_ADDR_EQUAL(&key->addrmask.sin6_addr, 1020c1a049acSSUZUKI Shinsuke &pol->ape_policy.addrmask.sin6_addr)) { 10217fc91b3fSHajimu UMEMOTO break; 10227fc91b3fSHajimu UMEMOTO } 10237fc91b3fSHajimu UMEMOTO } 1024349b668aSHajimu UMEMOTO if (pol == NULL) { 1025349b668aSHajimu UMEMOTO ADDRSEL_UNLOCK(); 10265d525653SHajimu UMEMOTO ADDRSEL_XUNLOCK(); 10277fc91b3fSHajimu UMEMOTO return (ESRCH); 1028349b668aSHajimu UMEMOTO } 10297fc91b3fSHajimu UMEMOTO 1030603724d3SBjoern A. Zeeb TAILQ_REMOVE(&V_addrsel_policytab, pol, ape_entry); 10317fc91b3fSHajimu UMEMOTO ADDRSEL_UNLOCK(); 10325d525653SHajimu UMEMOTO ADDRSEL_XUNLOCK(); 10337fc91b3fSHajimu UMEMOTO 10347fc91b3fSHajimu UMEMOTO return (0); 10357fc91b3fSHajimu UMEMOTO } 10367fc91b3fSHajimu UMEMOTO 10377fc91b3fSHajimu UMEMOTO static int 10389233d8f3SDavid E. O'Brien walk_addrsel_policy(int (*callback)(struct in6_addrpolicy *, void *), 10391272577eSXin LI void *w) 10407fc91b3fSHajimu UMEMOTO { 10417fc91b3fSHajimu UMEMOTO struct addrsel_policyent *pol; 10427fc91b3fSHajimu UMEMOTO int error = 0; 10437fc91b3fSHajimu UMEMOTO 10445d525653SHajimu UMEMOTO ADDRSEL_SLOCK(); 1045603724d3SBjoern A. Zeeb TAILQ_FOREACH(pol, &V_addrsel_policytab, ape_entry) { 10465d525653SHajimu UMEMOTO if ((error = (*callback)(&pol->ape_policy, w)) != 0) { 10475d525653SHajimu UMEMOTO ADDRSEL_SUNLOCK(); 10487fc91b3fSHajimu UMEMOTO return (error); 1049349b668aSHajimu UMEMOTO } 10505d525653SHajimu UMEMOTO } 10515d525653SHajimu UMEMOTO ADDRSEL_SUNLOCK(); 10527fc91b3fSHajimu UMEMOTO return (error); 10537fc91b3fSHajimu UMEMOTO } 10547fc91b3fSHajimu UMEMOTO 10557fc91b3fSHajimu UMEMOTO static int 10561272577eSXin LI dump_addrsel_policyent(struct in6_addrpolicy *pol, void *arg) 10577fc91b3fSHajimu UMEMOTO { 10587fc91b3fSHajimu UMEMOTO int error = 0; 10597fc91b3fSHajimu UMEMOTO struct walkarg *w = arg; 10607fc91b3fSHajimu UMEMOTO 10617fc91b3fSHajimu UMEMOTO error = SYSCTL_OUT(w->w_req, pol, sizeof(*pol)); 10627fc91b3fSHajimu UMEMOTO 10637fc91b3fSHajimu UMEMOTO return (error); 10647fc91b3fSHajimu UMEMOTO } 1065d6385b1cSHajimu UMEMOTO 1066d6385b1cSHajimu UMEMOTO static struct in6_addrpolicy * 10671272577eSXin LI match_addrsel_policy(struct sockaddr_in6 *key) 1068d6385b1cSHajimu UMEMOTO { 1069d6385b1cSHajimu UMEMOTO struct addrsel_policyent *pent; 1070d6385b1cSHajimu UMEMOTO struct in6_addrpolicy *bestpol = NULL, *pol; 1071d6385b1cSHajimu UMEMOTO int matchlen, bestmatchlen = -1; 1072d6385b1cSHajimu UMEMOTO u_char *mp, *ep, *k, *p, m; 1073d6385b1cSHajimu UMEMOTO 1074603724d3SBjoern A. Zeeb TAILQ_FOREACH(pent, &V_addrsel_policytab, ape_entry) { 1075d6385b1cSHajimu UMEMOTO matchlen = 0; 1076d6385b1cSHajimu UMEMOTO 1077d6385b1cSHajimu UMEMOTO pol = &pent->ape_policy; 1078d6385b1cSHajimu UMEMOTO mp = (u_char *)&pol->addrmask.sin6_addr; 1079d6385b1cSHajimu UMEMOTO ep = mp + 16; /* XXX: scope field? */ 1080d6385b1cSHajimu UMEMOTO k = (u_char *)&key->sin6_addr; 1081d6385b1cSHajimu UMEMOTO p = (u_char *)&pol->addr.sin6_addr; 1082d6385b1cSHajimu UMEMOTO for (; mp < ep && *mp; mp++, k++, p++) { 1083d6385b1cSHajimu UMEMOTO m = *mp; 1084d6385b1cSHajimu UMEMOTO if ((*k & m) != *p) 1085d6385b1cSHajimu UMEMOTO goto next; /* not match */ 1086d6385b1cSHajimu UMEMOTO if (m == 0xff) /* short cut for a typical case */ 1087d6385b1cSHajimu UMEMOTO matchlen += 8; 1088d6385b1cSHajimu UMEMOTO else { 1089d6385b1cSHajimu UMEMOTO while (m >= 0x80) { 1090d6385b1cSHajimu UMEMOTO matchlen++; 1091d6385b1cSHajimu UMEMOTO m <<= 1; 1092d6385b1cSHajimu UMEMOTO } 1093d6385b1cSHajimu UMEMOTO } 1094d6385b1cSHajimu UMEMOTO } 1095d6385b1cSHajimu UMEMOTO 1096d6385b1cSHajimu UMEMOTO /* matched. check if this is better than the current best. */ 1097d6385b1cSHajimu UMEMOTO if (bestpol == NULL || 1098d6385b1cSHajimu UMEMOTO matchlen > bestmatchlen) { 1099d6385b1cSHajimu UMEMOTO bestpol = pol; 1100d6385b1cSHajimu UMEMOTO bestmatchlen = matchlen; 1101d6385b1cSHajimu UMEMOTO } 1102d6385b1cSHajimu UMEMOTO 1103d6385b1cSHajimu UMEMOTO next: 1104d6385b1cSHajimu UMEMOTO continue; 1105d6385b1cSHajimu UMEMOTO } 1106d6385b1cSHajimu UMEMOTO 1107d6385b1cSHajimu UMEMOTO return (bestpol); 1108d6385b1cSHajimu UMEMOTO } 1109