xref: /freebsd/sys/netinet6/ip6_output.c (revision 53af690381641290d252455b3c227c8a0920811b)
1caf43b02SWarner Losh /*-
251369649SPedro F. Giffuni  * SPDX-License-Identifier: BSD-3-Clause
351369649SPedro F. Giffuni  *
482cd038dSYoshinobu Inoue  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
582cd038dSYoshinobu Inoue  * All rights reserved.
682cd038dSYoshinobu Inoue  *
782cd038dSYoshinobu Inoue  * Redistribution and use in source and binary forms, with or without
882cd038dSYoshinobu Inoue  * modification, are permitted provided that the following conditions
982cd038dSYoshinobu Inoue  * are met:
1082cd038dSYoshinobu Inoue  * 1. Redistributions of source code must retain the above copyright
1182cd038dSYoshinobu Inoue  *    notice, this list of conditions and the following disclaimer.
1282cd038dSYoshinobu Inoue  * 2. Redistributions in binary form must reproduce the above copyright
1382cd038dSYoshinobu Inoue  *    notice, this list of conditions and the following disclaimer in the
1482cd038dSYoshinobu Inoue  *    documentation and/or other materials provided with the distribution.
1582cd038dSYoshinobu Inoue  * 3. Neither the name of the project nor the names of its contributors
1682cd038dSYoshinobu Inoue  *    may be used to endorse or promote products derived from this software
1782cd038dSYoshinobu Inoue  *    without specific prior written permission.
1882cd038dSYoshinobu Inoue  *
1982cd038dSYoshinobu Inoue  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
2082cd038dSYoshinobu Inoue  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
2182cd038dSYoshinobu Inoue  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2282cd038dSYoshinobu Inoue  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
2382cd038dSYoshinobu Inoue  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2482cd038dSYoshinobu Inoue  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2582cd038dSYoshinobu Inoue  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2682cd038dSYoshinobu Inoue  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2782cd038dSYoshinobu Inoue  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2882cd038dSYoshinobu Inoue  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
2982cd038dSYoshinobu Inoue  * SUCH DAMAGE.
30b48287a3SDavid E. O'Brien  *
31b48287a3SDavid E. O'Brien  *	$KAME: ip6_output.c,v 1.279 2002/01/26 06:12:30 jinmei Exp $
3282cd038dSYoshinobu Inoue  */
3382cd038dSYoshinobu Inoue 
34caf43b02SWarner Losh /*-
3582cd038dSYoshinobu Inoue  * Copyright (c) 1982, 1986, 1988, 1990, 1993
3682cd038dSYoshinobu Inoue  *	The Regents of the University of California.  All rights reserved.
3782cd038dSYoshinobu Inoue  *
3882cd038dSYoshinobu Inoue  * Redistribution and use in source and binary forms, with or without
3982cd038dSYoshinobu Inoue  * modification, are permitted provided that the following conditions
4082cd038dSYoshinobu Inoue  * are met:
4182cd038dSYoshinobu Inoue  * 1. Redistributions of source code must retain the above copyright
4282cd038dSYoshinobu Inoue  *    notice, this list of conditions and the following disclaimer.
4382cd038dSYoshinobu Inoue  * 2. Redistributions in binary form must reproduce the above copyright
4482cd038dSYoshinobu Inoue  *    notice, this list of conditions and the following disclaimer in the
4582cd038dSYoshinobu Inoue  *    documentation and/or other materials provided with the distribution.
46fbbd9655SWarner Losh  * 3. Neither the name of the University nor the names of its contributors
4782cd038dSYoshinobu Inoue  *    may be used to endorse or promote products derived from this software
4882cd038dSYoshinobu Inoue  *    without specific prior written permission.
4982cd038dSYoshinobu Inoue  *
5082cd038dSYoshinobu Inoue  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
5182cd038dSYoshinobu Inoue  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
5282cd038dSYoshinobu Inoue  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
5382cd038dSYoshinobu Inoue  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
5482cd038dSYoshinobu Inoue  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
5582cd038dSYoshinobu Inoue  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
5682cd038dSYoshinobu Inoue  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
5782cd038dSYoshinobu Inoue  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
5882cd038dSYoshinobu Inoue  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
5982cd038dSYoshinobu Inoue  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
6082cd038dSYoshinobu Inoue  * SUCH DAMAGE.
6182cd038dSYoshinobu Inoue  *
6282cd038dSYoshinobu Inoue  *	@(#)ip_output.c	8.3 (Berkeley) 1/21/94
6382cd038dSYoshinobu Inoue  */
6482cd038dSYoshinobu Inoue 
65b48287a3SDavid E. O'Brien #include <sys/cdefs.h>
66b48287a3SDavid E. O'Brien __FBSDID("$FreeBSD$");
67b48287a3SDavid E. O'Brien 
68686cdd19SJun-ichiro itojun Hagino #include "opt_inet.h"
69686cdd19SJun-ichiro itojun Hagino #include "opt_inet6.h"
70686cdd19SJun-ichiro itojun Hagino #include "opt_ipsec.h"
71b2e60773SJohn Baldwin #include "opt_kern_tls.h"
7277a01441SJohn Baldwin #include "opt_ratelimit.h"
7377931dd5SKip Macy #include "opt_route.h"
74c7c0d948SAdrian Chadd #include "opt_rss.h"
7577a01441SJohn Baldwin #include "opt_sctp.h"
7682cd038dSYoshinobu Inoue 
7782cd038dSYoshinobu Inoue #include <sys/param.h>
78c26fe973SBjoern A. Zeeb #include <sys/kernel.h>
79b2e60773SJohn Baldwin #include <sys/ktls.h>
8082cd038dSYoshinobu Inoue #include <sys/malloc.h>
8182cd038dSYoshinobu Inoue #include <sys/mbuf.h>
8282cd038dSYoshinobu Inoue #include <sys/errno.h>
83c2259ba4SRobert Watson #include <sys/priv.h>
84c26fe973SBjoern A. Zeeb #include <sys/proc.h>
8582cd038dSYoshinobu Inoue #include <sys/protosw.h>
8682cd038dSYoshinobu Inoue #include <sys/socket.h>
8782cd038dSYoshinobu Inoue #include <sys/socketvar.h>
881263305fSBjoern A. Zeeb #include <sys/syslog.h>
89c26fe973SBjoern A. Zeeb #include <sys/ucred.h>
9082cd038dSYoshinobu Inoue 
91e7b92e27SBjoern A. Zeeb #include <machine/in_cksum.h>
92e7b92e27SBjoern A. Zeeb 
9382cd038dSYoshinobu Inoue #include <net/if.h>
9476039bc8SGleb Smirnoff #include <net/if_var.h>
95868aabb4SRichard Scheffenegger #include <net/if_vlan_var.h>
960f5687f2SMike Karels #include <net/if_llatbl.h>
97868aabb4SRichard Scheffenegger #include <net/ethernet.h>
988195404bSBrooks Davis #include <net/netisr.h>
9982cd038dSYoshinobu Inoue #include <net/route.h>
100983066f0SAlexander V. Chernikov #include <net/route/nhop.h>
101c4ac87eaSDarren Reed #include <net/pfil.h>
102b2bdc62aSAdrian Chadd #include <net/rss_config.h>
1034b79449eSBjoern A. Zeeb #include <net/vnet.h>
10482cd038dSYoshinobu Inoue 
10582cd038dSYoshinobu Inoue #include <netinet/in.h>
10682cd038dSYoshinobu Inoue #include <netinet/in_var.h>
1078a006adbSBjoern A. Zeeb #include <netinet/ip_var.h>
108bacf6684SAlexander V. Chernikov #include <netinet6/in6_fib.h>
10933841545SHajimu UMEMOTO #include <netinet6/in6_var.h>
110686cdd19SJun-ichiro itojun Hagino #include <netinet/ip6.h>
111686cdd19SJun-ichiro itojun Hagino #include <netinet/icmp6.h>
11282cd038dSYoshinobu Inoue #include <netinet6/ip6_var.h>
113686cdd19SJun-ichiro itojun Hagino #include <netinet/in_pcb.h>
11497d8d152SAndre Oppermann #include <netinet/tcp_var.h>
11582cd038dSYoshinobu Inoue #include <netinet6/nd6.h>
116b2bdc62aSAdrian Chadd #include <netinet6/in6_rss.h>
11782cd038dSYoshinobu Inoue 
118fcf59617SAndrey V. Elsukov #include <netipsec/ipsec_support.h>
11995033af9SMark Johnston #if defined(SCTP) || defined(SCTP_SUPPORT)
1209b03990aSRandall Stewart #include <netinet/sctp.h>
1219b03990aSRandall Stewart #include <netinet/sctp_crc32.h>
1229b03990aSRandall Stewart #endif
123b9234fafSSam Leffler 
124a1f7e5f8SHajimu UMEMOTO #include <netinet6/scope6_var.h>
1251469c434SHajimu UMEMOTO 
/* External variable; no definition is visible in this part of the file. */
extern int in6_mcast_loop;
12782cd038dSYoshinobu Inoue 
/*
 * The mbufs that make up the header part of an outgoing packet: the IPv6
 * header itself plus one mbuf per extension header built from the caller's
 * packet options.  ip6_output() zeroes the structure before use, so a NULL
 * member means "this header is not present".
 */
struct ip6_exthdrs {
	struct mbuf *ip6e_ip6;		/* IPv6 header, read back after ip6_splithdr() */
	struct mbuf *ip6e_hbh;		/* Hop-by-Hop options header */
	struct mbuf *ip6e_dest1;	/* Destination options header (1st part) */
	struct mbuf *ip6e_rthdr;	/* Routing header */
	struct mbuf *ip6e_dest2;	/* Destination options header (2nd part) */
};
13582cd038dSYoshinobu Inoue 
1365e0a6f31SMark Johnston static MALLOC_DEFINE(M_IP6OPT, "ip6opt", "IPv6 options");
1375e0a6f31SMark Johnston 
1386f56329aSXin LI static int ip6_pcbopt(int, u_char *, int, struct ip6_pktopts **,
1396f56329aSXin LI 			   struct ucred *, int);
1406f56329aSXin LI static int ip6_pcbopts(struct ip6_pktopts **, struct mbuf *,
1416f56329aSXin LI 	struct socket *, struct sockopt *);
14206b479a6SSean Bruno static int ip6_getpcbopt(struct inpcb *, int, struct sockopt *);
1436f56329aSXin LI static int ip6_setpktopt(int, u_char *, int, struct ip6_pktopts *,
1446f56329aSXin LI 	struct ucred *, int, int, int);
145f95d4633SHajimu UMEMOTO 
1469233d8f3SDavid E. O'Brien static int ip6_copyexthdr(struct mbuf **, caddr_t, int);
1476f56329aSXin LI static int ip6_insertfraghdr(struct mbuf *, struct mbuf *, int,
1486f56329aSXin LI 	struct ip6_frag **);
1499233d8f3SDavid E. O'Brien static int ip6_insert_jumboopt(struct ip6_exthdrs *, u_int32_t);
1509233d8f3SDavid E. O'Brien static int ip6_splithdr(struct mbuf *, struct ip6_exthdrs *);
1510d4df029SAlexander V. Chernikov static int ip6_getpmtu(struct route_in6 *, int,
152d4c22202SAndrew Gallatin 	struct ifnet *, const struct in6_addr *, u_long *, int *, u_int,
153d4c22202SAndrew Gallatin 	u_int);
1540d4df029SAlexander V. Chernikov static int ip6_calcmtu(struct ifnet *, const struct in6_addr *, u_long,
155d4c22202SAndrew Gallatin 	u_long *, int *, u_int);
156f0937b2cSAndrey V. Elsukov static int ip6_getpmtu_ctl(u_int, const struct in6_addr *, u_long *);
1579233d8f3SDavid E. O'Brien static int copypktopts(struct ip6_pktopts *, struct ip6_pktopts *, int);
15882cd038dSYoshinobu Inoue 
/*
 * Make an extension header from option data.  hp is the source,
 * mp is the destination, and _ol is the optlen.
 *
 * Nothing happens when hp is NULL.  Otherwise the header is copied with
 * ip6_copyexthdr(); its size in bytes is (ip6e_len + 1) * 8, taken from the
 * ip6e_len field at the start of the option data.  On success the m_len of
 * the resulting mbuf (*mp) is added to _ol.
 *
 * The expansion site must provide an `error' variable and a `freehdrs'
 * label; the macro stores the ip6_copyexthdr() result in `error' and jumps
 * to `freehdrs' when it is non-zero.
 */
#define	MAKE_EXTHDR(hp, mp, _ol)					\
    do {								\
	if (hp) {							\
		struct ip6_ext *eh = (struct ip6_ext *)(hp);		\
		error = ip6_copyexthdr((mp), (caddr_t)(hp),		\
		    ((eh)->ip6e_len + 1) << 3);				\
		if (error)						\
			goto freehdrs;					\
		(_ol) += (*(mp))->m_len;				\
	}								\
    } while (/*CONSTCOND*/ 0)
1742cb64cb2SGeorge V. Neville-Neil 
/*
 * Form a chain of extension headers.
 * m is the extension header mbuf
 * mp is the previous mbuf in the chain
 * p is the next header
 * i is the type of option.
 *
 * Nothing happens when m is NULL.  Otherwise:
 *  - the first byte of m receives the value currently stored at *p,
 *  - *p is overwritten with i,
 *  - p is re-pointed at the first byte of m,
 *  - m is linked in directly after mp, and mp is advanced to m.
 * Both p and mp are therefore modified and must be assignable lvalues.
 *
 * The expansion site must have `hdrsplit' and `exthdrs' in scope; the macro
 * panics when a header mbuf is supplied while hdrsplit is false.
 */
#define MAKE_CHAIN(m, mp, p, i)\
    do {\
	if (m) {\
		if (!hdrsplit) \
			panic("%s:%d: assumption failed: "\
			    "hdr not split: hdrsplit %d exthdrs %p",\
			    __func__, __LINE__, hdrsplit, &exthdrs);\
		*mtod((m), u_char *) = *(p);\
		*(p) = (i);\
		p = mtod((m), u_char *);\
		(m)->m_next = (mp)->m_next;\
		(mp)->m_next = (m);\
		(mp) = (m);\
	}\
    } while (/*CONSTCOND*/ 0)
1972cb64cb2SGeorge V. Neville-Neil 
198aaf2cfc0SVANHULLEBUS Yvan void
199e7b92e27SBjoern A. Zeeb in6_delayed_cksum(struct mbuf *m, uint32_t plen, u_short offset)
200e7b92e27SBjoern A. Zeeb {
201e7b92e27SBjoern A. Zeeb 	u_short csum;
202e7b92e27SBjoern A. Zeeb 
203c69baa7eSBjoern A. Zeeb 	csum = in_cksum_skip(m, offset + plen, offset);
204356ab07eSBjoern A. Zeeb 	if (m->m_pkthdr.csum_flags & CSUM_UDP_IPV6 && csum == 0)
205e7b92e27SBjoern A. Zeeb 		csum = 0xffff;
206e7b92e27SBjoern A. Zeeb 	offset += m->m_pkthdr.csum_data;	/* checksum offset */
207e7b92e27SBjoern A. Zeeb 
2084a089e6bSAndrey V. Elsukov 	if (offset + sizeof(csum) > m->m_len)
2094a089e6bSAndrey V. Elsukov 		m_copyback(m, offset, sizeof(csum), (caddr_t)&csum);
2104a089e6bSAndrey V. Elsukov 	else
2114a089e6bSAndrey V. Elsukov 		*(u_short *)mtodo(m, offset) = csum;
212e7b92e27SBjoern A. Zeeb }
213e7b92e27SBjoern A. Zeeb 
21444775b16SMark Johnston static void
2153459050cSBjoern A. Zeeb ip6_output_delayed_csum(struct mbuf *m, struct ifnet *ifp, int csum_flags,
21644775b16SMark Johnston     int plen, int optlen)
2173459050cSBjoern A. Zeeb {
2183459050cSBjoern A. Zeeb 
2193459050cSBjoern A. Zeeb 	KASSERT((plen >= optlen), ("%s:%d: plen %d < optlen %d, m %p, ifp %p "
22044775b16SMark Johnston 	    "csum_flags %#x",
22144775b16SMark Johnston 	    __func__, __LINE__, plen, optlen, m, ifp, csum_flags));
2223459050cSBjoern A. Zeeb 
2233459050cSBjoern A. Zeeb 	if (csum_flags & CSUM_DELAY_DATA_IPV6) {
2243459050cSBjoern A. Zeeb 		in6_delayed_cksum(m, plen - optlen,
2253459050cSBjoern A. Zeeb 		    sizeof(struct ip6_hdr) + optlen);
2263459050cSBjoern A. Zeeb 		m->m_pkthdr.csum_flags &= ~CSUM_DELAY_DATA_IPV6;
2273459050cSBjoern A. Zeeb 	}
22895033af9SMark Johnston #if defined(SCTP) || defined(SCTP_SUPPORT)
2293459050cSBjoern A. Zeeb 	if (csum_flags & CSUM_SCTP_IPV6) {
2303459050cSBjoern A. Zeeb 		sctp_delayed_cksum(m, sizeof(struct ip6_hdr) + optlen);
2313459050cSBjoern A. Zeeb 		m->m_pkthdr.csum_flags &= ~CSUM_SCTP_IPV6;
2323459050cSBjoern A. Zeeb 	}
2333459050cSBjoern A. Zeeb #endif
2343459050cSBjoern A. Zeeb }
2353459050cSBjoern A. Zeeb 
2366c269f69SGleb Smirnoff int
2376c269f69SGleb Smirnoff ip6_fragment(struct ifnet *ifp, struct mbuf *m0, int hlen, u_char nextproto,
238d78c0804SKristof Provost     int fraglen , uint32_t id)
2396c269f69SGleb Smirnoff {
2406c269f69SGleb Smirnoff 	struct mbuf *m, **mnext, *m_frgpart;
2416c269f69SGleb Smirnoff 	struct ip6_hdr *ip6, *mhip6;
2426c269f69SGleb Smirnoff 	struct ip6_frag *ip6f;
2436c269f69SGleb Smirnoff 	int off;
2446c269f69SGleb Smirnoff 	int error;
2456c269f69SGleb Smirnoff 	int tlen = m0->m_pkthdr.len;
2466c269f69SGleb Smirnoff 
247d78c0804SKristof Provost 	KASSERT((fraglen % 8 == 0), ("Fragment length must be a multiple of 8"));
24800eab743SKristof Provost 
2496c269f69SGleb Smirnoff 	m = m0;
2506c269f69SGleb Smirnoff 	ip6 = mtod(m, struct ip6_hdr *);
2516c269f69SGleb Smirnoff 	mnext = &m->m_nextpkt;
2526c269f69SGleb Smirnoff 
253d78c0804SKristof Provost 	for (off = hlen; off < tlen; off += fraglen) {
2546c269f69SGleb Smirnoff 		m = m_gethdr(M_NOWAIT, MT_DATA);
2556c269f69SGleb Smirnoff 		if (!m) {
2566c269f69SGleb Smirnoff 			IP6STAT_INC(ip6s_odropped);
2576c269f69SGleb Smirnoff 			return (ENOBUFS);
2586c269f69SGleb Smirnoff 		}
259c9d33708SJohn Baldwin 
260c9d33708SJohn Baldwin 		/*
261c9d33708SJohn Baldwin 		 * Make sure the complete packet header gets copied
262c9d33708SJohn Baldwin 		 * from the originating mbuf to the newly created
263c9d33708SJohn Baldwin 		 * mbuf. This also ensures that existing firewall
264c9d33708SJohn Baldwin 		 * classification(s), VLAN tags and so on get copied
265c9d33708SJohn Baldwin 		 * to the resulting fragmented packet(s):
266c9d33708SJohn Baldwin 		 */
267c9d33708SJohn Baldwin 		if (m_dup_pkthdr(m, m0, M_NOWAIT) == 0) {
268c9d33708SJohn Baldwin 			m_free(m);
269c9d33708SJohn Baldwin 			IP6STAT_INC(ip6s_odropped);
270c9d33708SJohn Baldwin 			return (ENOBUFS);
271c9d33708SJohn Baldwin 		}
272c9d33708SJohn Baldwin 
2736c269f69SGleb Smirnoff 		*mnext = m;
2746c269f69SGleb Smirnoff 		mnext = &m->m_nextpkt;
2756c269f69SGleb Smirnoff 		m->m_data += max_linkhdr;
2766c269f69SGleb Smirnoff 		mhip6 = mtod(m, struct ip6_hdr *);
2776c269f69SGleb Smirnoff 		*mhip6 = *ip6;
2786c269f69SGleb Smirnoff 		m->m_len = sizeof(*mhip6);
2796c269f69SGleb Smirnoff 		error = ip6_insertfraghdr(m0, m, hlen, &ip6f);
2806c269f69SGleb Smirnoff 		if (error) {
2816c269f69SGleb Smirnoff 			IP6STAT_INC(ip6s_odropped);
2826c269f69SGleb Smirnoff 			return (error);
2836c269f69SGleb Smirnoff 		}
2846c269f69SGleb Smirnoff 		ip6f->ip6f_offlg = htons((u_short)((off - hlen) & ~7));
285d78c0804SKristof Provost 		if (off + fraglen >= tlen)
286d78c0804SKristof Provost 			fraglen = tlen - off;
2876c269f69SGleb Smirnoff 		else
2886c269f69SGleb Smirnoff 			ip6f->ip6f_offlg |= IP6F_MORE_FRAG;
289d78c0804SKristof Provost 		mhip6->ip6_plen = htons((u_short)(fraglen + hlen +
2906c269f69SGleb Smirnoff 		    sizeof(*ip6f) - sizeof(struct ip6_hdr)));
291d78c0804SKristof Provost 		if ((m_frgpart = m_copym(m0, off, fraglen, M_NOWAIT)) == NULL) {
2926c269f69SGleb Smirnoff 			IP6STAT_INC(ip6s_odropped);
2936c269f69SGleb Smirnoff 			return (ENOBUFS);
2946c269f69SGleb Smirnoff 		}
2956c269f69SGleb Smirnoff 		m_cat(m, m_frgpart);
296d78c0804SKristof Provost 		m->m_pkthdr.len = fraglen + hlen + sizeof(*ip6f);
2976c269f69SGleb Smirnoff 		ip6f->ip6f_reserved = 0;
2986c269f69SGleb Smirnoff 		ip6f->ip6f_ident = id;
2996c269f69SGleb Smirnoff 		ip6f->ip6f_nxt = nextproto;
3006c269f69SGleb Smirnoff 		IP6STAT_INC(ip6s_ofragments);
3016c269f69SGleb Smirnoff 		in6_ifstat_inc(ifp, ifs6_out_fragcreat);
3026c269f69SGleb Smirnoff 	}
3036c269f69SGleb Smirnoff 
3046c269f69SGleb Smirnoff 	return (0);
3056c269f69SGleb Smirnoff }
3066c269f69SGleb Smirnoff 
307fb3bc596SJohn Baldwin static int
308fb3bc596SJohn Baldwin ip6_output_send(struct inpcb *inp, struct ifnet *ifp, struct ifnet *origifp,
309d7452d89SAndrew Gallatin     struct mbuf *m, struct sockaddr_in6 *dst, struct route_in6 *ro,
310d7452d89SAndrew Gallatin     bool stamp_tag)
311fb3bc596SJohn Baldwin {
312b2e60773SJohn Baldwin #ifdef KERN_TLS
313b2e60773SJohn Baldwin 	struct ktls_session *tls = NULL;
314b2e60773SJohn Baldwin #endif
315fb3bc596SJohn Baldwin 	struct m_snd_tag *mst;
316fb3bc596SJohn Baldwin 	int error;
317fb3bc596SJohn Baldwin 
318fb3bc596SJohn Baldwin 	MPASS((m->m_pkthdr.csum_flags & CSUM_SND_TAG) == 0);
319fb3bc596SJohn Baldwin 	mst = NULL;
320fb3bc596SJohn Baldwin 
321b2e60773SJohn Baldwin #ifdef KERN_TLS
322b2e60773SJohn Baldwin 	/*
323b2e60773SJohn Baldwin 	 * If this is an unencrypted TLS record, save a reference to
324b2e60773SJohn Baldwin 	 * the record.  This local reference is used to call
325b2e60773SJohn Baldwin 	 * ktls_output_eagain after the mbuf has been freed (thus
326b2e60773SJohn Baldwin 	 * dropping the mbuf's reference) in if_output.
327b2e60773SJohn Baldwin 	 */
328b2e60773SJohn Baldwin 	if (m->m_next != NULL && mbuf_has_tls_session(m->m_next)) {
3297b6c99d0SGleb Smirnoff 		tls = ktls_hold(m->m_next->m_epg_tls);
330b2e60773SJohn Baldwin 		mst = tls->snd_tag;
331b2e60773SJohn Baldwin 
332b2e60773SJohn Baldwin 		/*
333b2e60773SJohn Baldwin 		 * If a TLS session doesn't have a valid tag, it must
334b2e60773SJohn Baldwin 		 * have had an earlier ifp mismatch, so drop this
335b2e60773SJohn Baldwin 		 * packet.
336b2e60773SJohn Baldwin 		 */
337b2e60773SJohn Baldwin 		if (mst == NULL) {
3389ba11796SAndrew Gallatin 			m_freem(m);
339b2e60773SJohn Baldwin 			error = EAGAIN;
340b2e60773SJohn Baldwin 			goto done;
341b2e60773SJohn Baldwin 		}
342d7452d89SAndrew Gallatin 		/*
343d7452d89SAndrew Gallatin 		 * Always stamp tags that include NIC ktls.
344d7452d89SAndrew Gallatin 		 */
345d7452d89SAndrew Gallatin 		stamp_tag = true;
346b2e60773SJohn Baldwin 	}
347b2e60773SJohn Baldwin #endif
348fb3bc596SJohn Baldwin #ifdef RATELIMIT
349b2e60773SJohn Baldwin 	if (inp != NULL && mst == NULL) {
350fb3bc596SJohn Baldwin 		if ((inp->inp_flags2 & INP_RATE_LIMIT_CHANGED) != 0 ||
351fb3bc596SJohn Baldwin 		    (inp->inp_snd_tag != NULL &&
352fb3bc596SJohn Baldwin 		    inp->inp_snd_tag->ifp != ifp))
353fb3bc596SJohn Baldwin 			in_pcboutput_txrtlmt(inp, ifp, m);
354fb3bc596SJohn Baldwin 
355fb3bc596SJohn Baldwin 		if (inp->inp_snd_tag != NULL)
356fb3bc596SJohn Baldwin 			mst = inp->inp_snd_tag;
357fb3bc596SJohn Baldwin 	}
358fb3bc596SJohn Baldwin #endif
359d7452d89SAndrew Gallatin 	if (stamp_tag && mst != NULL) {
360fb3bc596SJohn Baldwin 		KASSERT(m->m_pkthdr.rcvif == NULL,
361fb3bc596SJohn Baldwin 		    ("trying to add a send tag to a forwarded packet"));
362fb3bc596SJohn Baldwin 		if (mst->ifp != ifp) {
3639ba11796SAndrew Gallatin 			m_freem(m);
364fb3bc596SJohn Baldwin 			error = EAGAIN;
365fb3bc596SJohn Baldwin 			goto done;
366fb3bc596SJohn Baldwin 		}
367fb3bc596SJohn Baldwin 
368fb3bc596SJohn Baldwin 		/* stamp send tag on mbuf */
369fb3bc596SJohn Baldwin 		m->m_pkthdr.snd_tag = m_snd_tag_ref(mst);
370fb3bc596SJohn Baldwin 		m->m_pkthdr.csum_flags |= CSUM_SND_TAG;
371fb3bc596SJohn Baldwin 	}
372fb3bc596SJohn Baldwin 
373fb3bc596SJohn Baldwin 	error = nd6_output_ifp(ifp, origifp, m, dst, (struct route *)ro);
374fb3bc596SJohn Baldwin 
375fb3bc596SJohn Baldwin done:
376fb3bc596SJohn Baldwin 	/* Check for route change invalidating send tags. */
377b2e60773SJohn Baldwin #ifdef KERN_TLS
378b2e60773SJohn Baldwin 	if (tls != NULL) {
379b2e60773SJohn Baldwin 		if (error == EAGAIN)
380b2e60773SJohn Baldwin 			error = ktls_output_eagain(inp, tls);
381b2e60773SJohn Baldwin 		ktls_free(tls);
382b2e60773SJohn Baldwin 	}
383b2e60773SJohn Baldwin #endif
384fb3bc596SJohn Baldwin #ifdef RATELIMIT
385fb3bc596SJohn Baldwin 	if (error == EAGAIN)
386fb3bc596SJohn Baldwin 		in_pcboutput_eagain(inp);
387fb3bc596SJohn Baldwin #endif
388fb3bc596SJohn Baldwin 	return (error);
389fb3bc596SJohn Baldwin }
390fb3bc596SJohn Baldwin 
/*
 * IP6 output.
 * The packet in mbuf chain m contains a skeletal IP6 header (with pri, len,
 * nxt, hlim, src, dst).
 * This function may modify ver and hlim only.
 * The mbuf chain containing the packet will be freed.
 * The mbuf opt, if present, will not be freed.
 * If route_in6 ro is present and has ro_nh initialized, the route lookup is
 * skipped and ro->ro_nh is used.  If ro is present but ro->ro_nh is NULL,
 * the result of the route lookup is stored in ro->ro_nh.
 *
 * Type of "mtu": rt_mtu is u_long, ifnet.ifr_mtu is int, and nd_ifinfo.linkmtu
 * is uint32_t.  So we use u_long to hold the largest one, which is rt_mtu.
 *
 * ifpp - XXX: just for statistics
 */
40782cd038dSYoshinobu Inoue int
4081272577eSXin LI ip6_output(struct mbuf *m0, struct ip6_pktopts *opt,
4091272577eSXin LI     struct route_in6 *ro, int flags, struct ip6_moptions *im6o,
4101272577eSXin LI     struct ifnet **ifpp, struct inpcb *inp)
41182cd038dSYoshinobu Inoue {
4126c269f69SGleb Smirnoff 	struct ip6_hdr *ip6;
413686cdd19SJun-ichiro itojun Hagino 	struct ifnet *ifp, *origifp;
41482cd038dSYoshinobu Inoue 	struct mbuf *m = m0;
415a1a6c01eSBjoern A. Zeeb 	struct mbuf *mprev;
416000c42faSBjoern A. Zeeb 	struct route_in6 *ro_pmtu;
417983066f0SAlexander V. Chernikov 	struct nhop_object *nh;
418000c42faSBjoern A. Zeeb 	struct sockaddr_in6 *dst, sin6, src_sa, dst_sa;
4198195404bSBrooks Davis 	struct in6_addr odst;
420a1a6c01eSBjoern A. Zeeb 	u_char *nexthdrp;
421000c42faSBjoern A. Zeeb 	int tlen, len;
42282cd038dSYoshinobu Inoue 	int error = 0;
423868aabb4SRichard Scheffenegger 	int vlan_pcp = -1;
4245da9f8faSJosef Karthauser 	struct in6_ifaddr *ia = NULL;
42582cd038dSYoshinobu Inoue 	u_long mtu;
426f95d4633SHajimu UMEMOTO 	int alwaysfrag, dontfrag;
427a1a6c01eSBjoern A. Zeeb 	u_int32_t optlen, plen = 0, unfragpartlen;
42882cd038dSYoshinobu Inoue 	struct ip6_exthdrs exthdrs;
429f0937b2cSAndrey V. Elsukov 	struct in6_addr src0, dst0;
430a1f7e5f8SHajimu UMEMOTO 	u_int32_t zone;
431a1a6c01eSBjoern A. Zeeb 	bool hdrsplit;
432e7b92e27SBjoern A. Zeeb 	int sw_csum, tso;
4339c57a5b6SHiroki Sato 	int needfiblookup;
4349c57a5b6SHiroki Sato 	uint32_t fibnum;
435f8fe3dc9SAndrey V. Elsukov 	struct m_tag *fwd_tag = NULL;
43679831849SKristof Provost 	uint32_t id;
437b9234fafSSam Leffler 
438b9555453SGleb Smirnoff 	NET_EPOCH_ASSERT();
4391e4f4e56SGleb Smirnoff 
440b174de32SAdrian Chadd 	if (inp != NULL) {
441ce9ac139SNavdeep Parhar 		INP_LOCK_ASSERT(inp);
44281d5d46bSBjoern A. Zeeb 		M_SETFIB(m, inp->inp_inc.inc_fibnum);
443c2529042SHans Petter Selasky 		if ((flags & IP_NODEFAULTFLOWID) == 0) {
4447c1daefeSBjoern A. Zeeb 			/* Unconditionally set flowid. */
445b174de32SAdrian Chadd 			m->m_pkthdr.flowid = inp->inp_flowid;
446c2529042SHans Petter Selasky 			M_HASHTYPE_SET(m, inp->inp_flowtype);
447b174de32SAdrian Chadd 		}
448868aabb4SRichard Scheffenegger 		if ((inp->inp_flags2 & INP_2PCP_SET) != 0)
449868aabb4SRichard Scheffenegger 			vlan_pcp = (inp->inp_flags2 & INP_2PCP_MASK) >>
450868aabb4SRichard Scheffenegger 			    INP_2PCP_SHIFT;
45150575ce1SAndrew Gallatin #ifdef NUMA
45250575ce1SAndrew Gallatin 		m->m_pkthdr.numa_domain = inp->inp_numa_domain;
45350575ce1SAndrew Gallatin #endif
454b174de32SAdrian Chadd 	}
45581d5d46bSBjoern A. Zeeb 
456fcf59617SAndrey V. Elsukov #if defined(IPSEC) || defined(IPSEC_SUPPORT)
457fcf59617SAndrey V. Elsukov 	/*
458fcf59617SAndrey V. Elsukov 	 * IPSec checking which handles several cases.
459fcf59617SAndrey V. Elsukov 	 * FAST IPSEC: We re-injected the packet.
460fcf59617SAndrey V. Elsukov 	 * XXX: need scope argument.
461fcf59617SAndrey V. Elsukov 	 */
462fcf59617SAndrey V. Elsukov 	if (IPSEC_ENABLED(ipv6)) {
463fcf59617SAndrey V. Elsukov 		if ((error = IPSEC_OUTPUT(ipv6, m, inp)) != 0) {
464fcf59617SAndrey V. Elsukov 			if (error == EINPROGRESS)
465fcf59617SAndrey V. Elsukov 				error = 0;
466fcf59617SAndrey V. Elsukov 			goto done;
467fcf59617SAndrey V. Elsukov 		}
468fcf59617SAndrey V. Elsukov 	}
469fcf59617SAndrey V. Elsukov #endif /* IPSEC */
470fcf59617SAndrey V. Elsukov 
471a1a6c01eSBjoern A. Zeeb 	/* Source address validation. */
472a1a6c01eSBjoern A. Zeeb 	ip6 = mtod(m, struct ip6_hdr *);
473a1a6c01eSBjoern A. Zeeb 	if (IN6_IS_ADDR_UNSPECIFIED(&ip6->ip6_src) &&
474a1a6c01eSBjoern A. Zeeb 	    (flags & IPV6_UNSPECSRC) == 0) {
475a1a6c01eSBjoern A. Zeeb 		error = EOPNOTSUPP;
476a1a6c01eSBjoern A. Zeeb 		IP6STAT_INC(ip6s_badscope);
477a1a6c01eSBjoern A. Zeeb 		goto bad;
478a1a6c01eSBjoern A. Zeeb 	}
479a1a6c01eSBjoern A. Zeeb 	if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_src)) {
480a1a6c01eSBjoern A. Zeeb 		error = EOPNOTSUPP;
481a1a6c01eSBjoern A. Zeeb 		IP6STAT_INC(ip6s_badscope);
482a1a6c01eSBjoern A. Zeeb 		goto bad;
483a1a6c01eSBjoern A. Zeeb 	}
484a1a6c01eSBjoern A. Zeeb 
485a1a6c01eSBjoern A. Zeeb 	/*
486a1a6c01eSBjoern A. Zeeb 	 * If we are given packet options to add extension headers prepare them.
487a1a6c01eSBjoern A. Zeeb 	 * Calculate the total length of the extension header chain.
488a1a6c01eSBjoern A. Zeeb 	 * Keep the length of the unfragmentable part for fragmentation.
489a1a6c01eSBjoern A. Zeeb 	 */
49082cd038dSYoshinobu Inoue 	bzero(&exthdrs, sizeof(exthdrs));
491a1a6c01eSBjoern A. Zeeb 	optlen = 0;
4923db60531SBjoern A. Zeeb 	unfragpartlen = sizeof(struct ip6_hdr);
49382cd038dSYoshinobu Inoue 	if (opt) {
4947c1daefeSBjoern A. Zeeb 		/* Hop-by-Hop options header. */
495a1a6c01eSBjoern A. Zeeb 		MAKE_EXTHDR(opt->ip6po_hbh, &exthdrs.ip6e_hbh, optlen);
496a1a6c01eSBjoern A. Zeeb 
4977c1daefeSBjoern A. Zeeb 		/* Destination options header (1st part). */
49829bc2c48SHajimu UMEMOTO 		if (opt->ip6po_rthdr) {
499a1a6c01eSBjoern A. Zeeb #ifndef RTHDR_SUPPORT_IMPLEMENTED
500a1a6c01eSBjoern A. Zeeb 			/*
501a1a6c01eSBjoern A. Zeeb 			 * If there is a routing header, discard the packet
502a1a6c01eSBjoern A. Zeeb 			 * right away here. RH0/1 are obsolete and we do not
503a1a6c01eSBjoern A. Zeeb 			 * currently support RH2/3/4.
504a1a6c01eSBjoern A. Zeeb 			 * People trying to use RH253/254 may want to disable
505a1a6c01eSBjoern A. Zeeb 			 * this check.
506a1a6c01eSBjoern A. Zeeb 			 * The moment we do support any routing header (again)
507a1a6c01eSBjoern A. Zeeb 			 * this block should check the routing type more
508a1a6c01eSBjoern A. Zeeb 			 * selectively.
509a1a6c01eSBjoern A. Zeeb 			 */
510a1a6c01eSBjoern A. Zeeb 			error = EINVAL;
511a1a6c01eSBjoern A. Zeeb 			goto bad;
512a1a6c01eSBjoern A. Zeeb #endif
513a1a6c01eSBjoern A. Zeeb 
51429bc2c48SHajimu UMEMOTO 			/*
5157c1daefeSBjoern A. Zeeb 			 * Destination options header (1st part).
5162cb64cb2SGeorge V. Neville-Neil 			 * This only makes sense with a routing header.
51729bc2c48SHajimu UMEMOTO 			 * See Section 9.2 of RFC 3542.
51829bc2c48SHajimu UMEMOTO 			 * Disabling this part just for MIP6 convenience is
51929bc2c48SHajimu UMEMOTO 			 * a bad idea.  We need to think carefully about a
52029bc2c48SHajimu UMEMOTO 			 * way to make the advanced API coexist with MIP6
52129bc2c48SHajimu UMEMOTO 			 * options, which might automatically be inserted in
52229bc2c48SHajimu UMEMOTO 			 * the kernel.
52329bc2c48SHajimu UMEMOTO 			 */
524a1a6c01eSBjoern A. Zeeb 			MAKE_EXTHDR(opt->ip6po_dest1, &exthdrs.ip6e_dest1,
525a1a6c01eSBjoern A. Zeeb 			    optlen);
52629bc2c48SHajimu UMEMOTO 		}
5277c1daefeSBjoern A. Zeeb 		/* Routing header. */
528a1a6c01eSBjoern A. Zeeb 		MAKE_EXTHDR(opt->ip6po_rthdr, &exthdrs.ip6e_rthdr, optlen);
52982cd038dSYoshinobu Inoue 
5303db60531SBjoern A. Zeeb 		unfragpartlen += optlen;
5312cb64cb2SGeorge V. Neville-Neil 
532a1a6c01eSBjoern A. Zeeb 		/*
533a1a6c01eSBjoern A. Zeeb 		 * NOTE: we don't add AH/ESP length here (done in
534a1a6c01eSBjoern A. Zeeb 		 * ip6_ipsec_output()).
535a1a6c01eSBjoern A. Zeeb 		 */
536a1a6c01eSBjoern A. Zeeb 
537a1a6c01eSBjoern A. Zeeb 		/* Destination options header (2nd part). */
538a1a6c01eSBjoern A. Zeeb 		MAKE_EXTHDR(opt->ip6po_dest2, &exthdrs.ip6e_dest2, optlen);
539a1a6c01eSBjoern A. Zeeb 	}
54082cd038dSYoshinobu Inoue 
54182cd038dSYoshinobu Inoue 	/*
542aaf2cfc0SVANHULLEBUS Yvan 	 * If there is at least one extension header,
54382cd038dSYoshinobu Inoue 	 * separate IP6 header from the payload.
54482cd038dSYoshinobu Inoue 	 */
545a1a6c01eSBjoern A. Zeeb 	hdrsplit = false;
546a1a6c01eSBjoern A. Zeeb 	if (optlen) {
54782cd038dSYoshinobu Inoue 		if ((error = ip6_splithdr(m, &exthdrs)) != 0) {
54882cd038dSYoshinobu Inoue 			m = NULL;
54982cd038dSYoshinobu Inoue 			goto freehdrs;
55082cd038dSYoshinobu Inoue 		}
55182cd038dSYoshinobu Inoue 		m = exthdrs.ip6e_ip6;
55282cd038dSYoshinobu Inoue 		ip6 = mtod(m, struct ip6_hdr *);
553a1a6c01eSBjoern A. Zeeb 		hdrsplit = true;
554a1a6c01eSBjoern A. Zeeb 	}
55582cd038dSYoshinobu Inoue 
5567c1daefeSBjoern A. Zeeb 	/* Adjust mbuf packet header length. */
55782cd038dSYoshinobu Inoue 	m->m_pkthdr.len += optlen;
55882cd038dSYoshinobu Inoue 	plen = m->m_pkthdr.len - sizeof(*ip6);
55982cd038dSYoshinobu Inoue 
56082cd038dSYoshinobu Inoue 	/* If this is a jumbo payload, insert a jumbo payload option. */
56182cd038dSYoshinobu Inoue 	if (plen > IPV6_MAXPACKET) {
56282cd038dSYoshinobu Inoue 		if (!hdrsplit) {
56382cd038dSYoshinobu Inoue 			if ((error = ip6_splithdr(m, &exthdrs)) != 0) {
56482cd038dSYoshinobu Inoue 				m = NULL;
56582cd038dSYoshinobu Inoue 				goto freehdrs;
56682cd038dSYoshinobu Inoue 			}
56782cd038dSYoshinobu Inoue 			m = exthdrs.ip6e_ip6;
56882cd038dSYoshinobu Inoue 			ip6 = mtod(m, struct ip6_hdr *);
569a1a6c01eSBjoern A. Zeeb 			hdrsplit = true;
570a1a6c01eSBjoern A. Zeeb 		}
57182cd038dSYoshinobu Inoue 		if ((error = ip6_insert_jumboopt(&exthdrs, plen)) != 0)
57282cd038dSYoshinobu Inoue 			goto freehdrs;
57382cd038dSYoshinobu Inoue 		ip6->ip6_plen = 0;
57482cd038dSYoshinobu Inoue 	} else
57582cd038dSYoshinobu Inoue 		ip6->ip6_plen = htons(plen);
576a1a6c01eSBjoern A. Zeeb 	nexthdrp = &ip6->ip6_nxt;
57782cd038dSYoshinobu Inoue 
578a1a6c01eSBjoern A. Zeeb 	if (optlen) {
57982cd038dSYoshinobu Inoue 		/*
58082cd038dSYoshinobu Inoue 		 * Concatenate headers and fill in next header fields.
58182cd038dSYoshinobu Inoue 		 * Here we have, on "m"
58282cd038dSYoshinobu Inoue 		 *	IPv6 payload
5837c1daefeSBjoern A. Zeeb 		 * and we insert headers accordingly.
5847c1daefeSBjoern A. Zeeb 		 * Finally, we should be getting:
5857c1daefeSBjoern A. Zeeb 		 *	IPv6 hbh dest1 rthdr ah* [esp* dest2 payload].
58682cd038dSYoshinobu Inoue 		 *
5877c1daefeSBjoern A. Zeeb 		 * During the header composing process "m" points to IPv6
5887c1daefeSBjoern A. Zeeb 		 * header.  "mprev" points to an extension header prior to esp.
58982cd038dSYoshinobu Inoue 		 */
5902cb64cb2SGeorge V. Neville-Neil 		mprev = m;
59182cd038dSYoshinobu Inoue 
59282cd038dSYoshinobu Inoue 		/*
5937c1daefeSBjoern A. Zeeb 		 * We treat dest2 specially.  This makes IPsec processing
5947c1daefeSBjoern A. Zeeb 		 * much easier.  The goal here is to make mprev point to the
59588ff5695SSUZUKI Shinsuke 		 * mbuf prior to dest2.
59682cd038dSYoshinobu Inoue 		 *
5977c1daefeSBjoern A. Zeeb 		 * Result: IPv6 dest2 payload.
59882cd038dSYoshinobu Inoue 		 * m and mprev will point to IPv6 header.
59982cd038dSYoshinobu Inoue 		 */
60082cd038dSYoshinobu Inoue 		if (exthdrs.ip6e_dest2) {
60182cd038dSYoshinobu Inoue 			if (!hdrsplit)
6027c1daefeSBjoern A. Zeeb 				panic("%s:%d: assumption failed: "
6037c1daefeSBjoern A. Zeeb 				    "hdr not split: hdrsplit %d exthdrs %p",
6047c1daefeSBjoern A. Zeeb 				    __func__, __LINE__, hdrsplit, &exthdrs);
60582cd038dSYoshinobu Inoue 			exthdrs.ip6e_dest2->m_next = m->m_next;
60682cd038dSYoshinobu Inoue 			m->m_next = exthdrs.ip6e_dest2;
60782cd038dSYoshinobu Inoue 			*mtod(exthdrs.ip6e_dest2, u_char *) = ip6->ip6_nxt;
60882cd038dSYoshinobu Inoue 			ip6->ip6_nxt = IPPROTO_DSTOPTS;
60982cd038dSYoshinobu Inoue 		}
61082cd038dSYoshinobu Inoue 
61182cd038dSYoshinobu Inoue 		/*
6127c1daefeSBjoern A. Zeeb 		 * Result: IPv6 hbh dest1 rthdr dest2 payload.
61382cd038dSYoshinobu Inoue 		 * m will point to IPv6 header.  mprev will point to the
61482cd038dSYoshinobu Inoue 		 * extension header prior to dest2 (rthdr in the above case).
61582cd038dSYoshinobu Inoue 		 */
6167efe5d92SHajimu UMEMOTO 		MAKE_CHAIN(exthdrs.ip6e_hbh, mprev, nexthdrp, IPPROTO_HOPOPTS);
6177efe5d92SHajimu UMEMOTO 		MAKE_CHAIN(exthdrs.ip6e_dest1, mprev, nexthdrp,
6187efe5d92SHajimu UMEMOTO 			   IPPROTO_DSTOPTS);
6197efe5d92SHajimu UMEMOTO 		MAKE_CHAIN(exthdrs.ip6e_rthdr, mprev, nexthdrp,
6207efe5d92SHajimu UMEMOTO 			   IPPROTO_ROUTING);
62182cd038dSYoshinobu Inoue 	}
62282cd038dSYoshinobu Inoue 
6239cb8d207SAndrey V. Elsukov 	IP6STAT_INC(ip6s_localout);
62482cd038dSYoshinobu Inoue 
6257c1daefeSBjoern A. Zeeb 	/* Route packet. */
62682cd038dSYoshinobu Inoue 	ro_pmtu = ro;
62782cd038dSYoshinobu Inoue 	if (opt && opt->ip6po_rthdr)
62882cd038dSYoshinobu Inoue 		ro = &opt->ip6po_route;
629000c42faSBjoern A. Zeeb 	if (ro != NULL)
63082cd038dSYoshinobu Inoue 		dst = (struct sockaddr_in6 *)&ro->ro_dst;
631000c42faSBjoern A. Zeeb 	else
632000c42faSBjoern A. Zeeb 		dst = &sin6;
6339c57a5b6SHiroki Sato 	fibnum = (inp != NULL) ? inp->inp_inc.inc_fibnum : M_GETFIB(m);
634000c42faSBjoern A. Zeeb 
6358195404bSBrooks Davis again:
63682cd038dSYoshinobu Inoue 	/*
6377c1daefeSBjoern A. Zeeb 	 * If specified, try to fill in the traffic class field.
6387c1daefeSBjoern A. Zeeb 	 * Do not override if a non-zero value is already set.
6397c1daefeSBjoern A. Zeeb 	 * We check the diffserv field and the ECN field separately.
640f95d4633SHajimu UMEMOTO 	 */
641f95d4633SHajimu UMEMOTO 	if (opt && opt->ip6po_tclass >= 0) {
642f95d4633SHajimu UMEMOTO 		int mask = 0;
643f95d4633SHajimu UMEMOTO 
644bb4a7d94SKristof Provost 		if (IPV6_DSCP(ip6) == 0)
645f95d4633SHajimu UMEMOTO 			mask |= 0xfc;
646bb4a7d94SKristof Provost 		if (IPV6_ECN(ip6) == 0)
647f95d4633SHajimu UMEMOTO 			mask |= 0x03;
648f95d4633SHajimu UMEMOTO 		if (mask != 0)
649f95d4633SHajimu UMEMOTO 			ip6->ip6_flow |= htonl((opt->ip6po_tclass & mask) << 20);
650f95d4633SHajimu UMEMOTO 	}
651f95d4633SHajimu UMEMOTO 
6527c1daefeSBjoern A. Zeeb 	/* Fill in or override the hop limit field, if necessary. */
653f95d4633SHajimu UMEMOTO 	if (opt && opt->ip6po_hlim != -1)
654f95d4633SHajimu UMEMOTO 		ip6->ip6_hlim = opt->ip6po_hlim & 0xff;
655f95d4633SHajimu UMEMOTO 	else if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) {
656f95d4633SHajimu UMEMOTO 		if (im6o != NULL)
657f95d4633SHajimu UMEMOTO 			ip6->ip6_hlim = im6o->im6o_multicast_hlim;
658f95d4633SHajimu UMEMOTO 		else
659603724d3SBjoern A. Zeeb 			ip6->ip6_hlim = V_ip6_defmcasthlim;
660f95d4633SHajimu UMEMOTO 	}
661000c42faSBjoern A. Zeeb 
662983066f0SAlexander V. Chernikov 	if (ro == NULL || ro->ro_nh == NULL) {
663000c42faSBjoern A. Zeeb 		bzero(dst, sizeof(*dst));
664000c42faSBjoern A. Zeeb 		dst->sin6_family = AF_INET6;
665000c42faSBjoern A. Zeeb 		dst->sin6_len = sizeof(*dst);
666000c42faSBjoern A. Zeeb 		dst->sin6_addr = ip6->ip6_dst;
667000c42faSBjoern A. Zeeb 	}
66884cc0778SGeorge V. Neville-Neil 	/*
669000c42faSBjoern A. Zeeb 	 * Validate route against routing table changes.
6707c1daefeSBjoern A. Zeeb 	 * Make sure that the address family is set in route.
67184cc0778SGeorge V. Neville-Neil 	 */
672983066f0SAlexander V. Chernikov 	nh = NULL;
673000c42faSBjoern A. Zeeb 	ifp = NULL;
674000c42faSBjoern A. Zeeb 	mtu = 0;
675000c42faSBjoern A. Zeeb 	if (ro != NULL) {
676983066f0SAlexander V. Chernikov 		if (ro->ro_nh != NULL && inp != NULL) {
677000c42faSBjoern A. Zeeb 			ro->ro_dst.sin6_family = AF_INET6; /* XXX KASSERT? */
678983066f0SAlexander V. Chernikov 			NH_VALIDATE((struct route *)ro, &inp->inp_rt_cookie,
679000c42faSBjoern A. Zeeb 			    fibnum);
68084cc0778SGeorge V. Neville-Neil 		}
681983066f0SAlexander V. Chernikov 		if (ro->ro_nh != NULL && fwd_tag == NULL &&
682983066f0SAlexander V. Chernikov 		    (!NH_IS_VALID(ro->ro_nh) ||
683000c42faSBjoern A. Zeeb 		    ro->ro_dst.sin6_family != AF_INET6 ||
684000c42faSBjoern A. Zeeb 		    !IN6_ARE_ADDR_EQUAL(&ro->ro_dst.sin6_addr, &ip6->ip6_dst)))
685000c42faSBjoern A. Zeeb 			RO_INVALIDATE_CACHE(ro);
686000c42faSBjoern A. Zeeb 
687983066f0SAlexander V. Chernikov 		if (ro->ro_nh != NULL && fwd_tag == NULL &&
68884cc0778SGeorge V. Neville-Neil 		    ro->ro_dst.sin6_family == AF_INET6 &&
68984cc0778SGeorge V. Neville-Neil 		    IN6_ARE_ADDR_EQUAL(&ro->ro_dst.sin6_addr, &ip6->ip6_dst)) {
69050fa27e7SAlexander V. Chernikov 			/* Nexthop is valid and contains valid ifp */
691983066f0SAlexander V. Chernikov 			nh = ro->ro_nh;
69216607317SAndrey V. Elsukov 		} else {
6930f5687f2SMike Karels 			if (ro->ro_lle)
6940f5687f2SMike Karels 				LLE_FREE(ro->ro_lle);	/* zeros ro_lle */
6950f5687f2SMike Karels 			ro->ro_lle = NULL;
696f8fe3dc9SAndrey V. Elsukov 			if (fwd_tag == NULL) {
697a1f7e5f8SHajimu UMEMOTO 				bzero(&dst_sa, sizeof(dst_sa));
698a1f7e5f8SHajimu UMEMOTO 				dst_sa.sin6_family = AF_INET6;
699a1f7e5f8SHajimu UMEMOTO 				dst_sa.sin6_len = sizeof(dst_sa);
700a1f7e5f8SHajimu UMEMOTO 				dst_sa.sin6_addr = ip6->ip6_dst;
701f8fe3dc9SAndrey V. Elsukov 			}
7028483fce6SBjoern A. Zeeb 			error = in6_selectroute(&dst_sa, opt, im6o, ro, &ifp,
703983066f0SAlexander V. Chernikov 			    &nh, fibnum, m->m_pkthdr.flowid);
70416607317SAndrey V. Elsukov 			if (error != 0) {
705000c42faSBjoern A. Zeeb 				IP6STAT_INC(ip6s_noroute);
706a1f7e5f8SHajimu UMEMOTO 				if (ifp != NULL)
70782cd038dSYoshinobu Inoue 					in6_ifstat_inc(ifp, ifs6_out_discard);
70882cd038dSYoshinobu Inoue 				goto bad;
70982cd038dSYoshinobu Inoue 			}
71050fa27e7SAlexander V. Chernikov 			/*
71150fa27e7SAlexander V. Chernikov 			 * At this point at least @ifp is not NULL
71250fa27e7SAlexander V. Chernikov 			 * Can be the case when dst is multicast, link-local or
71350fa27e7SAlexander V. Chernikov 			 * interface is explicitly specified by the caller.
71450fa27e7SAlexander V. Chernikov 			 */
71516607317SAndrey V. Elsukov 		}
716983066f0SAlexander V. Chernikov 		if (nh == NULL) {
717a1f7e5f8SHajimu UMEMOTO 			/*
718983066f0SAlexander V. Chernikov 			 * If in6_selectroute() does not return a nexthop
719a1f7e5f8SHajimu UMEMOTO 			 * dst may not have been updated.
720a1f7e5f8SHajimu UMEMOTO 			 */
721a1f7e5f8SHajimu UMEMOTO 			*dst = dst_sa;	/* XXX */
72250fa27e7SAlexander V. Chernikov 			origifp = ifp;
72350fa27e7SAlexander V. Chernikov 			mtu = ifp->if_mtu;
724000c42faSBjoern A. Zeeb 		} else {
72550fa27e7SAlexander V. Chernikov 			ifp = nh->nh_ifp;
72650fa27e7SAlexander V. Chernikov 			origifp = nh->nh_aifp;
727983066f0SAlexander V. Chernikov 			ia = (struct in6_ifaddr *)(nh->nh_ifa);
728983066f0SAlexander V. Chernikov 			counter_u64_add(nh->nh_pksent, 1);
729000c42faSBjoern A. Zeeb 		}
730000c42faSBjoern A. Zeeb 	} else {
7311483c1c5SAlexander V. Chernikov 		struct nhop_object *nh;
732000c42faSBjoern A. Zeeb 		struct in6_addr kdst;
733000c42faSBjoern A. Zeeb 		uint32_t scopeid;
734000c42faSBjoern A. Zeeb 
735000c42faSBjoern A. Zeeb 		if (fwd_tag == NULL) {
736000c42faSBjoern A. Zeeb 			bzero(&dst_sa, sizeof(dst_sa));
737000c42faSBjoern A. Zeeb 			dst_sa.sin6_family = AF_INET6;
738000c42faSBjoern A. Zeeb 			dst_sa.sin6_len = sizeof(dst_sa);
739000c42faSBjoern A. Zeeb 			dst_sa.sin6_addr = ip6->ip6_dst;
740000c42faSBjoern A. Zeeb 		}
741000c42faSBjoern A. Zeeb 
742000c42faSBjoern A. Zeeb 		if (IN6_IS_ADDR_MULTICAST(&dst_sa.sin6_addr) &&
743000c42faSBjoern A. Zeeb 		    im6o != NULL &&
744000c42faSBjoern A. Zeeb 		    (ifp = im6o->im6o_multicast_ifp) != NULL) {
745000c42faSBjoern A. Zeeb 			/* We do not need a route lookup. */
746000c42faSBjoern A. Zeeb 			*dst = dst_sa;	/* XXX */
74750fa27e7SAlexander V. Chernikov 			origifp = ifp;
748000c42faSBjoern A. Zeeb 			goto nonh6lookup;
749000c42faSBjoern A. Zeeb 		}
750000c42faSBjoern A. Zeeb 
751000c42faSBjoern A. Zeeb 		in6_splitscope(&dst_sa.sin6_addr, &kdst, &scopeid);
752000c42faSBjoern A. Zeeb 
753000c42faSBjoern A. Zeeb 		if (IN6_IS_ADDR_MC_LINKLOCAL(&dst_sa.sin6_addr) ||
754000c42faSBjoern A. Zeeb 		    IN6_IS_ADDR_MC_NODELOCAL(&dst_sa.sin6_addr)) {
755000c42faSBjoern A. Zeeb 			if (scopeid > 0) {
756000c42faSBjoern A. Zeeb 				ifp = in6_getlinkifnet(scopeid);
75719afc65aSMark Johnston 				if (ifp == NULL) {
75819afc65aSMark Johnston 					error = EHOSTUNREACH;
75919afc65aSMark Johnston 					goto bad;
76019afc65aSMark Johnston 				}
761000c42faSBjoern A. Zeeb 				*dst = dst_sa;	/* XXX */
76250fa27e7SAlexander V. Chernikov 				origifp = ifp;
763000c42faSBjoern A. Zeeb 				goto nonh6lookup;
764000c42faSBjoern A. Zeeb 			}
765000c42faSBjoern A. Zeeb 		}
766000c42faSBjoern A. Zeeb 
7670c325f53SAlexander V. Chernikov 		nh = fib6_lookup(fibnum, &kdst, scopeid, NHR_NONE,
7680c325f53SAlexander V. Chernikov 		    m->m_pkthdr.flowid);
7691483c1c5SAlexander V. Chernikov 		if (nh == NULL) {
770000c42faSBjoern A. Zeeb 			IP6STAT_INC(ip6s_noroute);
771000c42faSBjoern A. Zeeb 			/* No ifp in6_ifstat_inc(ifp, ifs6_out_discard); */
772000c42faSBjoern A. Zeeb 			error = EHOSTUNREACH;;
773000c42faSBjoern A. Zeeb 			goto bad;
774000c42faSBjoern A. Zeeb 		}
775000c42faSBjoern A. Zeeb 
7761483c1c5SAlexander V. Chernikov 		ifp = nh->nh_ifp;
77750fa27e7SAlexander V. Chernikov 		origifp = nh->nh_aifp;
7781483c1c5SAlexander V. Chernikov 		ia = ifatoia6(nh->nh_ifa);
7791483c1c5SAlexander V. Chernikov 		if (nh->nh_flags & NHF_GATEWAY)
7801483c1c5SAlexander V. Chernikov 			dst->sin6_addr = nh->gw6_sa.sin6_addr;
7817d98cc09SAndrey V. Elsukov 		else if (fwd_tag != NULL)
7827d98cc09SAndrey V. Elsukov 			dst->sin6_addr = dst_sa.sin6_addr;
783000c42faSBjoern A. Zeeb nonh6lookup:
784000c42faSBjoern A. Zeeb 		;
78582cd038dSYoshinobu Inoue 	}
78650fa27e7SAlexander V. Chernikov 	/*
78750fa27e7SAlexander V. Chernikov 	 * At this point ifp MUST be pointing to the valid transmit ifp.
78850fa27e7SAlexander V. Chernikov 	 * origifp MUST be valid and pointing to either the same ifp or,
78950fa27e7SAlexander V. Chernikov 	 * in case of loopback output, to the interface which ip6_src
79050fa27e7SAlexander V. Chernikov 	 * belongs to.
79150fa27e7SAlexander V. Chernikov 	 * Examples:
79250fa27e7SAlexander V. Chernikov 	 *  fe80::1%em0 -> fe80::2%em0 -> ifp=em0, origifp=em0
79350fa27e7SAlexander V. Chernikov 	 *  fe80::1%em0 -> fe80::1%em0 -> ifp=lo0, origifp=em0
79450fa27e7SAlexander V. Chernikov 	 *  ::1 -> ::1 -> ifp=lo0, origifp=lo0
79550fa27e7SAlexander V. Chernikov 	 *
79650fa27e7SAlexander V. Chernikov 	 * mtu can be 0 and will be refined later.
79750fa27e7SAlexander V. Chernikov 	 */
79850fa27e7SAlexander V. Chernikov 	KASSERT((ifp != NULL), ("output interface must not be NULL"));
79950fa27e7SAlexander V. Chernikov 	KASSERT((origifp != NULL), ("output address interface must not be NULL"));
80082cd038dSYoshinobu Inoue 
801a1f7e5f8SHajimu UMEMOTO 	if ((flags & IPV6_FORWARDING) == 0) {
802a1f7e5f8SHajimu UMEMOTO 		/* XXX: the FORWARDING flag can be set for mrouting. */
803a1f7e5f8SHajimu UMEMOTO 		in6_ifstat_inc(ifp, ifs6_out_request);
804a1f7e5f8SHajimu UMEMOTO 	}
805a1f7e5f8SHajimu UMEMOTO 
806ef0111fdSHans Petter Selasky 	/* Setup data structures for scope ID checks. */
807a1f7e5f8SHajimu UMEMOTO 	src0 = ip6->ip6_src;
808a1f7e5f8SHajimu UMEMOTO 	bzero(&src_sa, sizeof(src_sa));
809a1f7e5f8SHajimu UMEMOTO 	src_sa.sin6_family = AF_INET6;
810a1f7e5f8SHajimu UMEMOTO 	src_sa.sin6_len = sizeof(src_sa);
811a1f7e5f8SHajimu UMEMOTO 	src_sa.sin6_addr = ip6->ip6_src;
812a1f7e5f8SHajimu UMEMOTO 
813a1f7e5f8SHajimu UMEMOTO 	dst0 = ip6->ip6_dst;
8147c1daefeSBjoern A. Zeeb 	/* Re-initialize to be sure. */
815a1f7e5f8SHajimu UMEMOTO 	bzero(&dst_sa, sizeof(dst_sa));
816a1f7e5f8SHajimu UMEMOTO 	dst_sa.sin6_family = AF_INET6;
817a1f7e5f8SHajimu UMEMOTO 	dst_sa.sin6_len = sizeof(dst_sa);
818a1f7e5f8SHajimu UMEMOTO 	dst_sa.sin6_addr = ip6->ip6_dst;
819a1f7e5f8SHajimu UMEMOTO 
820ef0111fdSHans Petter Selasky 	/* Check for valid scope ID. */
82150fa27e7SAlexander V. Chernikov 	if (in6_setscope(&src0, origifp, &zone) == 0 &&
822ef0111fdSHans Petter Selasky 	    sa6_recoverscope(&src_sa) == 0 && zone == src_sa.sin6_scope_id &&
82350fa27e7SAlexander V. Chernikov 	    in6_setscope(&dst0, origifp, &zone) == 0 &&
824ef0111fdSHans Petter Selasky 	    sa6_recoverscope(&dst_sa) == 0 && zone == dst_sa.sin6_scope_id) {
825ef0111fdSHans Petter Selasky 		/*
826ef0111fdSHans Petter Selasky 		 * The outgoing interface is in the zone of the source
827ef0111fdSHans Petter Selasky 		 * and destination addresses.
828ef0111fdSHans Petter Selasky 		 *
829ef0111fdSHans Petter Selasky 		 */
83050fa27e7SAlexander V. Chernikov 	} else if ((origifp->if_flags & IFF_LOOPBACK) == 0 ||
831ef0111fdSHans Petter Selasky 	    sa6_recoverscope(&src_sa) != 0 ||
832ef0111fdSHans Petter Selasky 	    sa6_recoverscope(&dst_sa) != 0 ||
833ef0111fdSHans Petter Selasky 	    dst_sa.sin6_scope_id == 0 ||
834ef0111fdSHans Petter Selasky 	    (src_sa.sin6_scope_id != 0 &&
835ef0111fdSHans Petter Selasky 	    src_sa.sin6_scope_id != dst_sa.sin6_scope_id) ||
83650fa27e7SAlexander V. Chernikov 	    ifnet_byindex(dst_sa.sin6_scope_id) == NULL) {
837ef0111fdSHans Petter Selasky 		/*
838ef0111fdSHans Petter Selasky 		 * If the destination network interface is not a
839ef0111fdSHans Petter Selasky 		 * loopback interface, or the destination network
840ef0111fdSHans Petter Selasky 		 * address has no scope ID, or the source address has
841ef0111fdSHans Petter Selasky 		 * a scope ID set which is different from the
842ef0111fdSHans Petter Selasky 		 * destination address one, or there is no network
843ef0111fdSHans Petter Selasky 		 * interface representing this scope ID, the address
844ef0111fdSHans Petter Selasky 		 * pair is considered invalid.
845ef0111fdSHans Petter Selasky 		 */
8469cb8d207SAndrey V. Elsukov 		IP6STAT_INC(ip6s_badscope);
84750fa27e7SAlexander V. Chernikov 		in6_ifstat_inc(origifp, ifs6_out_discard);
848a1f7e5f8SHajimu UMEMOTO 		if (error == 0)
849a1f7e5f8SHajimu UMEMOTO 			error = EHOSTUNREACH; /* XXX */
850a1f7e5f8SHajimu UMEMOTO 		goto bad;
851ef0111fdSHans Petter Selasky 	}
852ef0111fdSHans Petter Selasky 	/* All scope ID checks are successful. */
853ef0111fdSHans Petter Selasky 
854983066f0SAlexander V. Chernikov 	if (nh && !IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) {
855983066f0SAlexander V. Chernikov 		if (opt && opt->ip6po_nextroute.ro_nh) {
856a1f7e5f8SHajimu UMEMOTO 			/*
857a1f7e5f8SHajimu UMEMOTO 			 * The nexthop is explicitly specified by the
858a1f7e5f8SHajimu UMEMOTO 			 * application.  We assume the next hop is an IPv6
859a1f7e5f8SHajimu UMEMOTO 			 * address.
860a1f7e5f8SHajimu UMEMOTO 			 */
861a1f7e5f8SHajimu UMEMOTO 			dst = (struct sockaddr_in6 *)opt->ip6po_nexthop;
862a1f7e5f8SHajimu UMEMOTO 		}
863983066f0SAlexander V. Chernikov 		else if ((nh->nh_flags & NHF_GATEWAY))
864983066f0SAlexander V. Chernikov 			dst = &nh->gw6_sa;
865a1f7e5f8SHajimu UMEMOTO 	}
866a1f7e5f8SHajimu UMEMOTO 
867a1f7e5f8SHajimu UMEMOTO 	if (!IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) {
8687c1daefeSBjoern A. Zeeb 		m->m_flags &= ~(M_BCAST | M_MCAST); /* Just in case. */
86982cd038dSYoshinobu Inoue 	} else {
87082cd038dSYoshinobu Inoue 		m->m_flags = (m->m_flags & ~M_BCAST) | M_MCAST;
87182cd038dSYoshinobu Inoue 		in6_ifstat_inc(ifp, ifs6_out_mcast);
8727c1daefeSBjoern A. Zeeb 
8737c1daefeSBjoern A. Zeeb 		/* Confirm that the outgoing interface supports multicast. */
874a1f7e5f8SHajimu UMEMOTO 		if (!(ifp->if_flags & IFF_MULTICAST)) {
8759cb8d207SAndrey V. Elsukov 			IP6STAT_INC(ip6s_noroute);
87682cd038dSYoshinobu Inoue 			in6_ifstat_inc(ifp, ifs6_out_discard);
87782cd038dSYoshinobu Inoue 			error = ENETUNREACH;
87882cd038dSYoshinobu Inoue 			goto bad;
87982cd038dSYoshinobu Inoue 		}
88033cde130SBruce M Simpson 		if ((im6o == NULL && in6_mcast_loop) ||
88133cde130SBruce M Simpson 		    (im6o && im6o->im6o_multicast_loop)) {
88282cd038dSYoshinobu Inoue 			/*
88333cde130SBruce M Simpson 			 * Loop back multicast datagram if not expressly
88433cde130SBruce M Simpson 			 * forbidden to do so, even if we have not joined
88533cde130SBruce M Simpson 			 * the address; protocols will filter it later,
88633cde130SBruce M Simpson 			 * thus deferring a hash lookup and lock acquisition
88733cde130SBruce M Simpson 			 * at the expense of an m_copym().
88882cd038dSYoshinobu Inoue 			 */
889331dff07SAlexander V. Chernikov 			ip6_mloopback(ifp, m);
89091ec0a1eSYoshinobu Inoue 		} else {
89191ec0a1eSYoshinobu Inoue 			/*
89291ec0a1eSYoshinobu Inoue 			 * If we are acting as a multicast router, perform
89391ec0a1eSYoshinobu Inoue 			 * multicast forwarding as if the packet had just
89491ec0a1eSYoshinobu Inoue 			 * arrived on the interface to which we are about
89591ec0a1eSYoshinobu Inoue 			 * to send.  The multicast forwarding function
89691ec0a1eSYoshinobu Inoue 			 * recursively calls this function, using the
89791ec0a1eSYoshinobu Inoue 			 * IPV6_FORWARDING flag to prevent infinite recursion.
89891ec0a1eSYoshinobu Inoue 			 *
89991ec0a1eSYoshinobu Inoue 			 * Multicasts that are looped back by ip6_mloopback(),
90091ec0a1eSYoshinobu Inoue 			 * above, will be forwarded by the ip6_input() routine,
90191ec0a1eSYoshinobu Inoue 			 * if necessary.
90291ec0a1eSYoshinobu Inoue 			 */
90333cde130SBruce M Simpson 			if (V_ip6_mrouter && (flags & IPV6_FORWARDING) == 0) {
904a1f7e5f8SHajimu UMEMOTO 				/*
905a1f7e5f8SHajimu UMEMOTO 				 * XXX: ip6_mforward expects that rcvif is NULL
906a1f7e5f8SHajimu UMEMOTO 				 * when it is called from the originating path.
9077b07d1beSGleb Smirnoff 				 * However, it may not always be the case.
908a1f7e5f8SHajimu UMEMOTO 				 */
909a1f7e5f8SHajimu UMEMOTO 				m->m_pkthdr.rcvif = NULL;
910686cdd19SJun-ichiro itojun Hagino 				if (ip6_mforward(ip6, ifp, m) != 0) {
91191ec0a1eSYoshinobu Inoue 					m_freem(m);
91291ec0a1eSYoshinobu Inoue 					goto done;
91391ec0a1eSYoshinobu Inoue 				}
91491ec0a1eSYoshinobu Inoue 			}
91582cd038dSYoshinobu Inoue 		}
91682cd038dSYoshinobu Inoue 		/*
91782cd038dSYoshinobu Inoue 		 * Multicasts with a hoplimit of zero may be looped back,
91882cd038dSYoshinobu Inoue 		 * above, but must not be transmitted on a network.
91982cd038dSYoshinobu Inoue 		 * Also, multicasts addressed to the loopback interface
92082cd038dSYoshinobu Inoue 		 * are not sent -- the above call to ip6_mloopback() will
92182cd038dSYoshinobu Inoue 		 * loop back a copy if this host actually belongs to the
92282cd038dSYoshinobu Inoue 		 * destination group on the loopback interface.
92382cd038dSYoshinobu Inoue 		 */
924f95d4633SHajimu UMEMOTO 		if (ip6->ip6_hlim == 0 || (ifp->if_flags & IFF_LOOPBACK) ||
925f95d4633SHajimu UMEMOTO 		    IN6_IS_ADDR_MC_INTFACELOCAL(&ip6->ip6_dst)) {
92682cd038dSYoshinobu Inoue 			m_freem(m);
92782cd038dSYoshinobu Inoue 			goto done;
92882cd038dSYoshinobu Inoue 		}
92982cd038dSYoshinobu Inoue 	}
93082cd038dSYoshinobu Inoue 
93182cd038dSYoshinobu Inoue 	/*
93282cd038dSYoshinobu Inoue 	 * Fill the outgoing interface to tell the upper layer
93382cd038dSYoshinobu Inoue 	 * to increment per-interface statistics.
93482cd038dSYoshinobu Inoue 	 */
93582cd038dSYoshinobu Inoue 	if (ifpp)
93682cd038dSYoshinobu Inoue 		*ifpp = ifp;
93782cd038dSYoshinobu Inoue 
93831b3783cSHajimu UMEMOTO 	/* Determine path MTU. */
939f0937b2cSAndrey V. Elsukov 	if ((error = ip6_getpmtu(ro_pmtu, ro != ro_pmtu, ifp, &ip6->ip6_dst,
940d4c22202SAndrew Gallatin 		    &mtu, &alwaysfrag, fibnum, *nexthdrp)) != 0)
94131b3783cSHajimu UMEMOTO 		goto bad;
942000c42faSBjoern A. Zeeb 	KASSERT(mtu > 0, ("%s:%d: mtu %ld, ro_pmtu %p ro %p ifp %p "
943000c42faSBjoern A. Zeeb 	    "alwaysfrag %d fibnum %u\n", __func__, __LINE__, mtu, ro_pmtu, ro,
944000c42faSBjoern A. Zeeb 	    ifp, alwaysfrag, fibnum));
94582cd038dSYoshinobu Inoue 
94633841545SHajimu UMEMOTO 	/*
9478b00e59dSHajimu UMEMOTO 	 * The caller of this function may specify to use the minimum MTU
9488b00e59dSHajimu UMEMOTO 	 * in some cases.
9498b00e59dSHajimu UMEMOTO 	 * An advanced API option (IPV6_USE_MIN_MTU) can also override MTU
9508b00e59dSHajimu UMEMOTO 	 * setting.  The logic is a bit complicated; by default, unicast
9518b00e59dSHajimu UMEMOTO 	 * packets will follow path MTU while multicast packets will be sent at
9528b00e59dSHajimu UMEMOTO 	 * the minimum MTU.  If IP6PO_MINMTU_ALL is specified, all packets
9538b00e59dSHajimu UMEMOTO 	 * including unicast ones will be sent at the minimum MTU.  Multicast
9548b00e59dSHajimu UMEMOTO 	 * packets will always be sent at the minimum MTU unless
9558b00e59dSHajimu UMEMOTO 	 * IP6PO_MINMTU_DISABLE is explicitly specified.
9568b00e59dSHajimu UMEMOTO 	 * See RFC 3542 for more details.
95733841545SHajimu UMEMOTO 	 */
9588b00e59dSHajimu UMEMOTO 	if (mtu > IPV6_MMTU) {
9598b00e59dSHajimu UMEMOTO 		if ((flags & IPV6_MINMTU))
96033841545SHajimu UMEMOTO 			mtu = IPV6_MMTU;
9618b00e59dSHajimu UMEMOTO 		else if (opt && opt->ip6po_minmtu == IP6PO_MINMTU_ALL)
9628b00e59dSHajimu UMEMOTO 			mtu = IPV6_MMTU;
9638b00e59dSHajimu UMEMOTO 		else if (IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst) &&
9648b00e59dSHajimu UMEMOTO 			 (opt == NULL ||
9658b00e59dSHajimu UMEMOTO 			  opt->ip6po_minmtu != IP6PO_MINMTU_DISABLE)) {
9668b00e59dSHajimu UMEMOTO 			mtu = IPV6_MMTU;
9678b00e59dSHajimu UMEMOTO 		}
9688b00e59dSHajimu UMEMOTO 	}
96933841545SHajimu UMEMOTO 
97033841545SHajimu UMEMOTO 	/*
9717c1daefeSBjoern A. Zeeb 	 * Clear embedded scope identifiers if necessary.
9727c1daefeSBjoern A. Zeeb 	 * in6_clearscope() will touch the addresses only when necessary.
97333841545SHajimu UMEMOTO 	 */
97433841545SHajimu UMEMOTO 	in6_clearscope(&ip6->ip6_src);
97533841545SHajimu UMEMOTO 	in6_clearscope(&ip6->ip6_dst);
97682cd038dSYoshinobu Inoue 
97782cd038dSYoshinobu Inoue 	/*
97882cd038dSYoshinobu Inoue 	 * If the outgoing packet contains a hop-by-hop options header,
97982cd038dSYoshinobu Inoue 	 * it must be examined and processed even by the source node.
98082cd038dSYoshinobu Inoue 	 * (RFC 2460, section 4.)
98182cd038dSYoshinobu Inoue 	 */
98282cd038dSYoshinobu Inoue 	if (exthdrs.ip6e_hbh) {
98333841545SHajimu UMEMOTO 		struct ip6_hbh *hbh = mtod(exthdrs.ip6e_hbh, struct ip6_hbh *);
984283f9f8aSHajimu UMEMOTO 		u_int32_t dummy; /* XXX unused */
985283f9f8aSHajimu UMEMOTO 		u_int32_t plen = 0; /* XXX: ip6_process will check the value */
98682cd038dSYoshinobu Inoue 
98733841545SHajimu UMEMOTO #ifdef DIAGNOSTIC
98833841545SHajimu UMEMOTO 		if ((hbh->ip6h_len + 1) << 3 > exthdrs.ip6e_hbh->m_len)
9896d79f3f6SRebecca Cran 			panic("ip6e_hbh is not contiguous");
99033841545SHajimu UMEMOTO #endif
99182cd038dSYoshinobu Inoue 		/*
99282cd038dSYoshinobu Inoue 		 *  XXX: if we have to send an ICMPv6 error to the sender,
99382cd038dSYoshinobu Inoue 		 *       we need the M_LOOP flag since icmp6_error() expects
99482cd038dSYoshinobu Inoue 		 *       the IPv6 and the hop-by-hop options header are
9956d79f3f6SRebecca Cran 		 *       contiguous unless the flag is set.
99682cd038dSYoshinobu Inoue 		 */
99782cd038dSYoshinobu Inoue 		m->m_flags |= M_LOOP;
99882cd038dSYoshinobu Inoue 		m->m_pkthdr.rcvif = ifp;
9997efe5d92SHajimu UMEMOTO 		if (ip6_process_hopopts(m, (u_int8_t *)(hbh + 1),
10007efe5d92SHajimu UMEMOTO 		    ((hbh->ip6h_len + 1) << 3) - sizeof(struct ip6_hbh),
1001283f9f8aSHajimu UMEMOTO 		    &dummy, &plen) < 0) {
10027c1daefeSBjoern A. Zeeb 			/* m was already freed at this point. */
100382cd038dSYoshinobu Inoue 			error = EINVAL;/* better error? */
100482cd038dSYoshinobu Inoue 			goto done;
100582cd038dSYoshinobu Inoue 		}
100682cd038dSYoshinobu Inoue 		m->m_flags &= ~M_LOOP; /* XXX */
100782cd038dSYoshinobu Inoue 		m->m_pkthdr.rcvif = NULL;
100882cd038dSYoshinobu Inoue 	}
100982cd038dSYoshinobu Inoue 
1010c21fd232SAndre Oppermann 	/* Jump over all PFIL processing if hooks are not active. */
1011b252313fSGleb Smirnoff 	if (!PFIL_HOOKED_OUT(V_inet6_pfil_head))
1012c21fd232SAndre Oppermann 		goto passout;
1013c21fd232SAndre Oppermann 
10148195404bSBrooks Davis 	odst = ip6->ip6_dst;
1015c21fd232SAndre Oppermann 	/* Run through list of hooks for output packets. */
1016dda6376bSMateusz Guzik 	switch (pfil_mbuf_out(V_inet6_pfil_head, &m, ifp, inp)) {
1017b252313fSGleb Smirnoff 	case PFIL_PASS:
1018c4ac87eaSDarren Reed 		ip6 = mtod(m, struct ip6_hdr *);
1019b252313fSGleb Smirnoff 		break;
1020b252313fSGleb Smirnoff 	case PFIL_DROPPED:
1021e00ee1a9SGleb Smirnoff 		error = EACCES;
1022b252313fSGleb Smirnoff 		/* FALLTHROUGH */
1023b252313fSGleb Smirnoff 	case PFIL_CONSUMED:
1024b252313fSGleb Smirnoff 		goto done;
1025b252313fSGleb Smirnoff 	}
10267efe5d92SHajimu UMEMOTO 
10279c57a5b6SHiroki Sato 	needfiblookup = 0;
10288195404bSBrooks Davis 	/* See if destination IP address was changed by packet filter. */
10298195404bSBrooks Davis 	if (!IN6_ARE_ADDR_EQUAL(&odst, &ip6->ip6_dst)) {
10308195404bSBrooks Davis 		m->m_flags |= M_SKIP_FIREWALL;
10318195404bSBrooks Davis 		/* If destination is now ourself drop to ip6_input(). */
10328a006adbSBjoern A. Zeeb 		if (in6_localip(&ip6->ip6_dst)) {
10338a006adbSBjoern A. Zeeb 			m->m_flags |= M_FASTFWD_OURS;
10348195404bSBrooks Davis 			if (m->m_pkthdr.rcvif == NULL)
1035603724d3SBjoern A. Zeeb 				m->m_pkthdr.rcvif = V_loif;
1036356ab07eSBjoern A. Zeeb 			if (m->m_pkthdr.csum_flags & CSUM_DELAY_DATA_IPV6) {
10378195404bSBrooks Davis 				m->m_pkthdr.csum_flags |=
1038356ab07eSBjoern A. Zeeb 				    CSUM_DATA_VALID_IPV6 | CSUM_PSEUDO_HDR;
10398195404bSBrooks Davis 				m->m_pkthdr.csum_data = 0xffff;
10408195404bSBrooks Davis 			}
104195033af9SMark Johnston #if defined(SCTP) || defined(SCTP_SUPPORT)
1042a6cff10fSMichael Tuexen 			if (m->m_pkthdr.csum_flags & CSUM_SCTP_IPV6)
10439b03990aSRandall Stewart 				m->m_pkthdr.csum_flags |= CSUM_SCTP_VALID;
10449b03990aSRandall Stewart #endif
10458195404bSBrooks Davis 			error = netisr_queue(NETISR_IPV6, m);
10468195404bSBrooks Davis 			goto done;
10474ee7e5a6SAndrey V. Elsukov 		} else {
1048000c42faSBjoern A. Zeeb 			if (ro != NULL)
1049ec86402eSBjoern A. Zeeb 				RO_INVALIDATE_CACHE(ro);
10509c57a5b6SHiroki Sato 			needfiblookup = 1; /* Redo the routing table lookup. */
10518195404bSBrooks Davis 		}
10524ee7e5a6SAndrey V. Elsukov 	}
10539c57a5b6SHiroki Sato 	/* See if fib was changed by packet filter. */
10549c57a5b6SHiroki Sato 	if (fibnum != M_GETFIB(m)) {
10559c57a5b6SHiroki Sato 		m->m_flags |= M_SKIP_FIREWALL;
10569c57a5b6SHiroki Sato 		fibnum = M_GETFIB(m);
1057000c42faSBjoern A. Zeeb 		if (ro != NULL)
1058ec86402eSBjoern A. Zeeb 			RO_INVALIDATE_CACHE(ro);
10599c57a5b6SHiroki Sato 		needfiblookup = 1;
10609c57a5b6SHiroki Sato 	}
10619c57a5b6SHiroki Sato 	if (needfiblookup)
10629c57a5b6SHiroki Sato 		goto again;
10638195404bSBrooks Davis 
10648a006adbSBjoern A. Zeeb 	/* See if local, if yes, send it to netisr. */
10658a006adbSBjoern A. Zeeb 	if (m->m_flags & M_FASTFWD_OURS) {
10668a006adbSBjoern A. Zeeb 		if (m->m_pkthdr.rcvif == NULL)
10678a006adbSBjoern A. Zeeb 			m->m_pkthdr.rcvif = V_loif;
1068356ab07eSBjoern A. Zeeb 		if (m->m_pkthdr.csum_flags & CSUM_DELAY_DATA_IPV6) {
10698a006adbSBjoern A. Zeeb 			m->m_pkthdr.csum_flags |=
1070356ab07eSBjoern A. Zeeb 			    CSUM_DATA_VALID_IPV6 | CSUM_PSEUDO_HDR;
10718a006adbSBjoern A. Zeeb 			m->m_pkthdr.csum_data = 0xffff;
10728a006adbSBjoern A. Zeeb 		}
107395033af9SMark Johnston #if defined(SCTP) || defined(SCTP_SUPPORT)
1074a6cff10fSMichael Tuexen 		if (m->m_pkthdr.csum_flags & CSUM_SCTP_IPV6)
10758a006adbSBjoern A. Zeeb 			m->m_pkthdr.csum_flags |= CSUM_SCTP_VALID;
10768a006adbSBjoern A. Zeeb #endif
10778a006adbSBjoern A. Zeeb 		error = netisr_queue(NETISR_IPV6, m);
10788a006adbSBjoern A. Zeeb 		goto done;
10798a006adbSBjoern A. Zeeb 	}
10808a006adbSBjoern A. Zeeb 	/* Or forward to some other address? */
1081ffdbf9daSAndrey V. Elsukov 	if ((m->m_flags & M_IP6_NEXTHOP) &&
1082ffdbf9daSAndrey V. Elsukov 	    (fwd_tag = m_tag_find(m, PACKET_TAG_IPFORWARD, NULL)) != NULL) {
1083000c42faSBjoern A. Zeeb 		if (ro != NULL)
10848a006adbSBjoern A. Zeeb 			dst = (struct sockaddr_in6 *)&ro->ro_dst;
1085000c42faSBjoern A. Zeeb 		else
1086000c42faSBjoern A. Zeeb 			dst = &sin6;
1087f8fe3dc9SAndrey V. Elsukov 		bcopy((fwd_tag+1), &dst_sa, sizeof(struct sockaddr_in6));
10888a006adbSBjoern A. Zeeb 		m->m_flags |= M_SKIP_FIREWALL;
1089ffdbf9daSAndrey V. Elsukov 		m->m_flags &= ~M_IP6_NEXTHOP;
10908a006adbSBjoern A. Zeeb 		m_tag_delete(m, fwd_tag);
10918a006adbSBjoern A. Zeeb 		goto again;
10928a006adbSBjoern A. Zeeb 	}
10938195404bSBrooks Davis 
1094c21fd232SAndre Oppermann passout:
1095868aabb4SRichard Scheffenegger 	if (vlan_pcp > -1)
1096868aabb4SRichard Scheffenegger 		EVL_APPLY_PRI(m, vlan_pcp);
109744775b16SMark Johnston 
109844775b16SMark Johnston 	/* Ensure the packet data is mapped if the interface requires it. */
109944775b16SMark Johnston 	if ((ifp->if_capenable & IFCAP_MEXTPG) == 0) {
110044775b16SMark Johnston 		m = mb_unmapped_to_ext(m);
110144775b16SMark Johnston 		if (m == NULL) {
110244775b16SMark Johnston 			IP6STAT_INC(ip6s_odropped);
110344775b16SMark Johnston 			return (ENOBUFS);
110444775b16SMark Johnston 		}
110544775b16SMark Johnston 	}
110644775b16SMark Johnston 
110782cd038dSYoshinobu Inoue 	/*
110882cd038dSYoshinobu Inoue 	 * Send the packet to the outgoing interface.
110982cd038dSYoshinobu Inoue 	 * If necessary, do IPv6 fragmentation before sending.
1110f95d4633SHajimu UMEMOTO 	 *
11117c1daefeSBjoern A. Zeeb 	 * The logic here is rather complex:
1112f95d4633SHajimu UMEMOTO 	 * 1: normal case (dontfrag == 0, alwaysfrag == 0)
1113f95d4633SHajimu UMEMOTO 	 * 1-a:	send as is if tlen <= path mtu
1114f95d4633SHajimu UMEMOTO 	 * 1-b:	fragment if tlen > path mtu
1115f95d4633SHajimu UMEMOTO 	 *
1116f95d4633SHajimu UMEMOTO 	 * 2: if user asks us not to fragment (dontfrag == 1)
1117f95d4633SHajimu UMEMOTO 	 * 2-a:	send as is if tlen <= interface mtu
1118f95d4633SHajimu UMEMOTO 	 * 2-b:	error if tlen > interface mtu
1119f95d4633SHajimu UMEMOTO 	 *
1120f95d4633SHajimu UMEMOTO 	 * 3: if we always need to attach fragment header (alwaysfrag == 1)
1121f95d4633SHajimu UMEMOTO 	 *	always fragment
1122f95d4633SHajimu UMEMOTO 	 *
1123f95d4633SHajimu UMEMOTO 	 * 4: if dontfrag == 1 && alwaysfrag == 1
11247c1daefeSBjoern A. Zeeb 	 *	error, as we cannot handle this conflicting request.
112582cd038dSYoshinobu Inoue 	 */
1126e7b92e27SBjoern A. Zeeb 	sw_csum = m->m_pkthdr.csum_flags;
1127e7b92e27SBjoern A. Zeeb 	if (!hdrsplit) {
1128b092fd6cSNavdeep Parhar 		tso = ((sw_csum & ifp->if_hwassist &
1129b092fd6cSNavdeep Parhar 		    (CSUM_TSO | CSUM_INNER_TSO)) != 0) ? 1 : 0;
1130e7b92e27SBjoern A. Zeeb 		sw_csum &= ~ifp->if_hwassist;
1131e7b92e27SBjoern A. Zeeb 	} else
1132e7b92e27SBjoern A. Zeeb 		tso = 0;
1133e7b92e27SBjoern A. Zeeb 	/*
1134e7b92e27SBjoern A. Zeeb 	 * If we added extension headers, we will not do TSO and calculate the
1135e7b92e27SBjoern A. Zeeb 	 * checksums ourselves for now.
1136e7b92e27SBjoern A. Zeeb 	 * XXX-BZ  Need a framework to know when the NIC can handle it, even
1137e7b92e27SBjoern A. Zeeb 	 * with ext. hdrs.
1138e7b92e27SBjoern A. Zeeb 	 */
113944775b16SMark Johnston 	ip6_output_delayed_csum(m, ifp, sw_csum, plen, optlen);
11403459050cSBjoern A. Zeeb 	/* XXX-BZ m->m_pkthdr.csum_flags &= ~ifp->if_hwassist; */
114182cd038dSYoshinobu Inoue 	tlen = m->m_pkthdr.len;
114282cd038dSYoshinobu Inoue 
1143e7b92e27SBjoern A. Zeeb 	if ((opt && (opt->ip6po_flags & IP6PO_DONTFRAG)) || tso)
1144f95d4633SHajimu UMEMOTO 		dontfrag = 1;
1145f95d4633SHajimu UMEMOTO 	else
1146f95d4633SHajimu UMEMOTO 		dontfrag = 0;
11477c1daefeSBjoern A. Zeeb 	if (dontfrag && alwaysfrag) {	/* Case 4. */
11487c1daefeSBjoern A. Zeeb 		/* Conflicting request - can't transmit. */
1149f95d4633SHajimu UMEMOTO 		error = EMSGSIZE;
1150f95d4633SHajimu UMEMOTO 		goto bad;
1151f95d4633SHajimu UMEMOTO 	}
11527c1daefeSBjoern A. Zeeb 	if (dontfrag && tlen > IN6_LINKMTU(ifp) && !tso) {	/* Case 2-b. */
1153f95d4633SHajimu UMEMOTO 		/*
1154f95d4633SHajimu UMEMOTO 		 * Even if the DONTFRAG option is specified, we cannot send the
1155f95d4633SHajimu UMEMOTO 		 * packet when the data length is larger than the MTU of the
1156f95d4633SHajimu UMEMOTO 		 * outgoing interface.
11578f1beb88SAndrey V. Elsukov 		 * Notify the error by sending IPV6_PATHMTU ancillary data if
11588f1beb88SAndrey V. Elsukov 		 * application wanted to know the MTU value. Also return an
11598f1beb88SAndrey V. Elsukov 		 * error code (this is not described in the API spec).
1160f95d4633SHajimu UMEMOTO 		 */
11618f1beb88SAndrey V. Elsukov 		if (inp != NULL)
11628f1beb88SAndrey V. Elsukov 			ip6_notify_pmtu(inp, &dst_sa, (u_int32_t)mtu);
1163f95d4633SHajimu UMEMOTO 		error = EMSGSIZE;
1164f95d4633SHajimu UMEMOTO 		goto bad;
1165f95d4633SHajimu UMEMOTO 	}
1166f95d4633SHajimu UMEMOTO 
11677c1daefeSBjoern A. Zeeb 	/* Transmit packet without fragmentation. */
11687c1daefeSBjoern A. Zeeb 	if (dontfrag || (!alwaysfrag && tlen <= mtu)) {	/* Cases 1-a and 2-a. */
1169f95d4633SHajimu UMEMOTO 		struct in6_ifaddr *ia6;
1170f95d4633SHajimu UMEMOTO 
1171f95d4633SHajimu UMEMOTO 		ip6 = mtod(m, struct ip6_hdr *);
1172f95d4633SHajimu UMEMOTO 		ia6 = in6_ifawithifp(ifp, &ip6->ip6_src);
1173f95d4633SHajimu UMEMOTO 		if (ia6) {
11745da9f8faSJosef Karthauser 			/* Record statistics for this interface address. */
11757caf4ab7SGleb Smirnoff 			counter_u64_add(ia6->ia_ifa.ifa_opackets, 1);
11767caf4ab7SGleb Smirnoff 			counter_u64_add(ia6->ia_ifa.ifa_obytes,
11777caf4ab7SGleb Smirnoff 			    m->m_pkthdr.len);
11785da9f8faSJosef Karthauser 		}
1179d7452d89SAndrew Gallatin 		error = ip6_output_send(inp, ifp, origifp, m, dst, ro,
1180d7452d89SAndrew Gallatin 		    (flags & IP_NO_SND_TAG_RL) ? false : true);
118182cd038dSYoshinobu Inoue 		goto done;
1182f95d4633SHajimu UMEMOTO 	}
1183f95d4633SHajimu UMEMOTO 
11847c1daefeSBjoern A. Zeeb 	/* Try to fragment the packet.  Cases 1-b and 3. */
1185f95d4633SHajimu UMEMOTO 	if (mtu < IPV6_MMTU) {
11867c1daefeSBjoern A. Zeeb 		/* Path MTU cannot be less than IPV6_MMTU. */
118782cd038dSYoshinobu Inoue 		error = EMSGSIZE;
118882cd038dSYoshinobu Inoue 		in6_ifstat_inc(ifp, ifs6_out_fragfail);
118982cd038dSYoshinobu Inoue 		goto bad;
11907efe5d92SHajimu UMEMOTO 	} else if (ip6->ip6_plen == 0) {
11917c1daefeSBjoern A. Zeeb 		/* Jumbo payload cannot be fragmented. */
119282cd038dSYoshinobu Inoue 		error = EMSGSIZE;
119382cd038dSYoshinobu Inoue 		in6_ifstat_inc(ifp, ifs6_out_fragfail);
119482cd038dSYoshinobu Inoue 		goto bad;
119582cd038dSYoshinobu Inoue 	} else {
119682cd038dSYoshinobu Inoue 		u_char nextproto;
11972cb64cb2SGeorge V. Neville-Neil 
119882cd038dSYoshinobu Inoue 		/*
119982cd038dSYoshinobu Inoue 		 * Too large for the destination or interface;
120082cd038dSYoshinobu Inoue 		 * fragment if possible.
120182cd038dSYoshinobu Inoue 		 * Must be able to put at least 8 bytes per fragment.
120282cd038dSYoshinobu Inoue 		 */
120382cd038dSYoshinobu Inoue 		if (mtu > IPV6_MAXPACKET)
120482cd038dSYoshinobu Inoue 			mtu = IPV6_MAXPACKET;
120533841545SHajimu UMEMOTO 
12063459050cSBjoern A. Zeeb 		len = (mtu - unfragpartlen - sizeof(struct ip6_frag)) & ~7;
120782cd038dSYoshinobu Inoue 		if (len < 8) {
120882cd038dSYoshinobu Inoue 			error = EMSGSIZE;
120982cd038dSYoshinobu Inoue 			in6_ifstat_inc(ifp, ifs6_out_fragfail);
121082cd038dSYoshinobu Inoue 			goto bad;
121182cd038dSYoshinobu Inoue 		}
121282cd038dSYoshinobu Inoue 
12136f8aee22SBill Paul 		/*
1214e7b92e27SBjoern A. Zeeb 		 * If the interface will not calculate checksums on
1215e7b92e27SBjoern A. Zeeb 		 * fragmented packets, then do it here.
1216e7b92e27SBjoern A. Zeeb 		 * XXX-BZ handle the hw offloading case.  Need flags.
1217e7b92e27SBjoern A. Zeeb 		 */
121844775b16SMark Johnston 		ip6_output_delayed_csum(m, ifp, m->m_pkthdr.csum_flags, plen,
121944775b16SMark Johnston 		    optlen);
12203459050cSBjoern A. Zeeb 
122182cd038dSYoshinobu Inoue 		/*
122282cd038dSYoshinobu Inoue 		 * Change the next header field of the last header in the
122382cd038dSYoshinobu Inoue 		 * unfragmentable part.
122482cd038dSYoshinobu Inoue 		 */
122582cd038dSYoshinobu Inoue 		if (exthdrs.ip6e_rthdr) {
122682cd038dSYoshinobu Inoue 			nextproto = *mtod(exthdrs.ip6e_rthdr, u_char *);
122782cd038dSYoshinobu Inoue 			*mtod(exthdrs.ip6e_rthdr, u_char *) = IPPROTO_FRAGMENT;
122882cd038dSYoshinobu Inoue 		} else if (exthdrs.ip6e_dest1) {
122982cd038dSYoshinobu Inoue 			nextproto = *mtod(exthdrs.ip6e_dest1, u_char *);
123082cd038dSYoshinobu Inoue 			*mtod(exthdrs.ip6e_dest1, u_char *) = IPPROTO_FRAGMENT;
123182cd038dSYoshinobu Inoue 		} else if (exthdrs.ip6e_hbh) {
123282cd038dSYoshinobu Inoue 			nextproto = *mtod(exthdrs.ip6e_hbh, u_char *);
123382cd038dSYoshinobu Inoue 			*mtod(exthdrs.ip6e_hbh, u_char *) = IPPROTO_FRAGMENT;
123482cd038dSYoshinobu Inoue 		} else {
12353459050cSBjoern A. Zeeb 			ip6 = mtod(m, struct ip6_hdr *);
123682cd038dSYoshinobu Inoue 			nextproto = ip6->ip6_nxt;
123782cd038dSYoshinobu Inoue 			ip6->ip6_nxt = IPPROTO_FRAGMENT;
123882cd038dSYoshinobu Inoue 		}
123982cd038dSYoshinobu Inoue 
124082cd038dSYoshinobu Inoue 		/*
124182cd038dSYoshinobu Inoue 		 * Loop through length of segment after first fragment,
124288ff5695SSUZUKI Shinsuke 		 * make new header and copy data of each part and link onto
124388ff5695SSUZUKI Shinsuke 		 * chain.
124482cd038dSYoshinobu Inoue 		 */
124582cd038dSYoshinobu Inoue 		m0 = m;
124679831849SKristof Provost 		id = htonl(ip6_randomid());
12473459050cSBjoern A. Zeeb 		error = ip6_fragment(ifp, m, unfragpartlen, nextproto,len, id);
12483459050cSBjoern A. Zeeb 		if (error != 0)
124982cd038dSYoshinobu Inoue 			goto sendorfree;
125082cd038dSYoshinobu Inoue 
125182cd038dSYoshinobu Inoue 		in6_ifstat_inc(ifp, ifs6_out_fragok);
125282cd038dSYoshinobu Inoue 	}
125382cd038dSYoshinobu Inoue 
12547c1daefeSBjoern A. Zeeb 	/* Remove leading garbage. */
125582cd038dSYoshinobu Inoue sendorfree:
125682cd038dSYoshinobu Inoue 	m = m0->m_nextpkt;
125782cd038dSYoshinobu Inoue 	m0->m_nextpkt = 0;
125882cd038dSYoshinobu Inoue 	m_freem(m0);
1259c187c034SJonathan T. Looney 	for (; m; m = m0) {
126082cd038dSYoshinobu Inoue 		m0 = m->m_nextpkt;
126182cd038dSYoshinobu Inoue 		m->m_nextpkt = 0;
126282cd038dSYoshinobu Inoue 		if (error == 0) {
1263fe937674SJosef Karthauser 			/* Record statistics for this interface address. */
1264fe937674SJosef Karthauser 			if (ia) {
12657caf4ab7SGleb Smirnoff 				counter_u64_add(ia->ia_ifa.ifa_opackets, 1);
12667caf4ab7SGleb Smirnoff 				counter_u64_add(ia->ia_ifa.ifa_obytes,
12677caf4ab7SGleb Smirnoff 				    m->m_pkthdr.len);
1268fe937674SJosef Karthauser 			}
1269868aabb4SRichard Scheffenegger 			if (vlan_pcp > -1)
1270868aabb4SRichard Scheffenegger 				EVL_APPLY_PRI(m, vlan_pcp);
1271d7452d89SAndrew Gallatin 			error = ip6_output_send(inp, ifp, origifp, m, dst, ro,
1272d7452d89SAndrew Gallatin 			    true);
127382cd038dSYoshinobu Inoue 		} else
127482cd038dSYoshinobu Inoue 			m_freem(m);
127582cd038dSYoshinobu Inoue 	}
127682cd038dSYoshinobu Inoue 
127782cd038dSYoshinobu Inoue 	if (error == 0)
12789cb8d207SAndrey V. Elsukov 		IP6STAT_INC(ip6s_fragmented);
127982cd038dSYoshinobu Inoue 
128082cd038dSYoshinobu Inoue done:
128182cd038dSYoshinobu Inoue 	return (error);
128282cd038dSYoshinobu Inoue 
128382cd038dSYoshinobu Inoue freehdrs:
12847c1daefeSBjoern A. Zeeb 	m_freem(exthdrs.ip6e_hbh);	/* m_freem() checks if mbuf is NULL. */
128582cd038dSYoshinobu Inoue 	m_freem(exthdrs.ip6e_dest1);
128682cd038dSYoshinobu Inoue 	m_freem(exthdrs.ip6e_rthdr);
128782cd038dSYoshinobu Inoue 	m_freem(exthdrs.ip6e_dest2);
12887efe5d92SHajimu UMEMOTO 	/* FALLTHROUGH */
128982cd038dSYoshinobu Inoue bad:
12902cb64cb2SGeorge V. Neville-Neil 	if (m)
129182cd038dSYoshinobu Inoue 		m_freem(m);
129282cd038dSYoshinobu Inoue 	goto done;
129382cd038dSYoshinobu Inoue }
129482cd038dSYoshinobu Inoue 
129582cd038dSYoshinobu Inoue static int
12961272577eSXin LI ip6_copyexthdr(struct mbuf **mp, caddr_t hdr, int hlen)
129782cd038dSYoshinobu Inoue {
129882cd038dSYoshinobu Inoue 	struct mbuf *m;
129982cd038dSYoshinobu Inoue 
130082cd038dSYoshinobu Inoue 	if (hlen > MCLBYTES)
130182cd038dSYoshinobu Inoue 		return (ENOBUFS); /* XXX */
130282cd038dSYoshinobu Inoue 
130310e5acc3SGleb Smirnoff 	if (hlen > MLEN)
130410e5acc3SGleb Smirnoff 		m = m_getcl(M_NOWAIT, MT_DATA, 0);
130510e5acc3SGleb Smirnoff 	else
130610e5acc3SGleb Smirnoff 		m = m_get(M_NOWAIT, MT_DATA);
130710e5acc3SGleb Smirnoff 	if (m == NULL)
130882cd038dSYoshinobu Inoue 		return (ENOBUFS);
130982cd038dSYoshinobu Inoue 	m->m_len = hlen;
131082cd038dSYoshinobu Inoue 	if (hdr)
131182cd038dSYoshinobu Inoue 		bcopy(hdr, mtod(m, caddr_t), hlen);
131282cd038dSYoshinobu Inoue 
131382cd038dSYoshinobu Inoue 	*mp = m;
131482cd038dSYoshinobu Inoue 	return (0);
131582cd038dSYoshinobu Inoue }
131682cd038dSYoshinobu Inoue 
131782cd038dSYoshinobu Inoue /*
131882cd038dSYoshinobu Inoue  * Insert jumbo payload option.
131982cd038dSYoshinobu Inoue  */
132082cd038dSYoshinobu Inoue static int
13211272577eSXin LI ip6_insert_jumboopt(struct ip6_exthdrs *exthdrs, u_int32_t plen)
132282cd038dSYoshinobu Inoue {
132382cd038dSYoshinobu Inoue 	struct mbuf *mopt;
132482cd038dSYoshinobu Inoue 	u_char *optbuf;
132533841545SHajimu UMEMOTO 	u_int32_t v;
132682cd038dSYoshinobu Inoue 
132782cd038dSYoshinobu Inoue #define JUMBOOPTLEN	8	/* length of jumbo payload option and padding */
132882cd038dSYoshinobu Inoue 
132982cd038dSYoshinobu Inoue 	/*
133082cd038dSYoshinobu Inoue 	 * If there is no hop-by-hop options header, allocate new one.
133182cd038dSYoshinobu Inoue 	 * If there is one but it doesn't have enough space to store the
133282cd038dSYoshinobu Inoue 	 * jumbo payload option, allocate a cluster to store the whole options.
133382cd038dSYoshinobu Inoue 	 * Otherwise, use it to store the options.
133482cd038dSYoshinobu Inoue 	 */
1335155d72c4SPedro F. Giffuni 	if (exthdrs->ip6e_hbh == NULL) {
133610e5acc3SGleb Smirnoff 		mopt = m_get(M_NOWAIT, MT_DATA);
133710e5acc3SGleb Smirnoff 		if (mopt == NULL)
133882cd038dSYoshinobu Inoue 			return (ENOBUFS);
133982cd038dSYoshinobu Inoue 		mopt->m_len = JUMBOOPTLEN;
134082cd038dSYoshinobu Inoue 		optbuf = mtod(mopt, u_char *);
134182cd038dSYoshinobu Inoue 		optbuf[1] = 0;	/* = ((JUMBOOPTLEN) >> 3) - 1 */
134282cd038dSYoshinobu Inoue 		exthdrs->ip6e_hbh = mopt;
134382cd038dSYoshinobu Inoue 	} else {
134482cd038dSYoshinobu Inoue 		struct ip6_hbh *hbh;
134582cd038dSYoshinobu Inoue 
134682cd038dSYoshinobu Inoue 		mopt = exthdrs->ip6e_hbh;
134782cd038dSYoshinobu Inoue 		if (M_TRAILINGSPACE(mopt) < JUMBOOPTLEN) {
134833841545SHajimu UMEMOTO 			/*
134933841545SHajimu UMEMOTO 			 * XXX assumption:
135033841545SHajimu UMEMOTO 			 * - exthdrs->ip6e_hbh is not referenced from places
135133841545SHajimu UMEMOTO 			 *   other than exthdrs.
135233841545SHajimu UMEMOTO 			 * - exthdrs->ip6e_hbh is not an mbuf chain.
135333841545SHajimu UMEMOTO 			 */
135482cd038dSYoshinobu Inoue 			int oldoptlen = mopt->m_len;
135533841545SHajimu UMEMOTO 			struct mbuf *n;
135682cd038dSYoshinobu Inoue 
135733841545SHajimu UMEMOTO 			/*
135833841545SHajimu UMEMOTO 			 * XXX: give up if the whole (new) hbh header does
135933841545SHajimu UMEMOTO 			 * not fit even in an mbuf cluster.
136033841545SHajimu UMEMOTO 			 */
136133841545SHajimu UMEMOTO 			if (oldoptlen + JUMBOOPTLEN > MCLBYTES)
136282cd038dSYoshinobu Inoue 				return (ENOBUFS);
136382cd038dSYoshinobu Inoue 
136433841545SHajimu UMEMOTO 			/*
136533841545SHajimu UMEMOTO 			 * As a consequence, we must always prepare a cluster
136633841545SHajimu UMEMOTO 			 * at this point.
136733841545SHajimu UMEMOTO 			 */
136810e5acc3SGleb Smirnoff 			n = m_getcl(M_NOWAIT, MT_DATA, 0);
136910e5acc3SGleb Smirnoff 			if (n == NULL)
137033841545SHajimu UMEMOTO 				return (ENOBUFS);
137133841545SHajimu UMEMOTO 			n->m_len = oldoptlen + JUMBOOPTLEN;
137233841545SHajimu UMEMOTO 			bcopy(mtod(mopt, caddr_t), mtod(n, caddr_t),
137333841545SHajimu UMEMOTO 			    oldoptlen);
137433841545SHajimu UMEMOTO 			optbuf = mtod(n, caddr_t) + oldoptlen;
137533841545SHajimu UMEMOTO 			m_freem(mopt);
137633841545SHajimu UMEMOTO 			mopt = exthdrs->ip6e_hbh = n;
137782cd038dSYoshinobu Inoue 		} else {
137882cd038dSYoshinobu Inoue 			optbuf = mtod(mopt, u_char *) + mopt->m_len;
137982cd038dSYoshinobu Inoue 			mopt->m_len += JUMBOOPTLEN;
138082cd038dSYoshinobu Inoue 		}
138182cd038dSYoshinobu Inoue 		optbuf[0] = IP6OPT_PADN;
138282cd038dSYoshinobu Inoue 		optbuf[1] = 1;
138382cd038dSYoshinobu Inoue 
138482cd038dSYoshinobu Inoue 		/*
138582cd038dSYoshinobu Inoue 		 * Adjust the header length according to the pad and
138682cd038dSYoshinobu Inoue 		 * the jumbo payload option.
138782cd038dSYoshinobu Inoue 		 */
138882cd038dSYoshinobu Inoue 		hbh = mtod(mopt, struct ip6_hbh *);
138982cd038dSYoshinobu Inoue 		hbh->ip6h_len += (JUMBOOPTLEN >> 3);
139082cd038dSYoshinobu Inoue 	}
139182cd038dSYoshinobu Inoue 
139282cd038dSYoshinobu Inoue 	/* fill in the option. */
139382cd038dSYoshinobu Inoue 	optbuf[2] = IP6OPT_JUMBO;
139482cd038dSYoshinobu Inoue 	optbuf[3] = 4;
139533841545SHajimu UMEMOTO 	v = (u_int32_t)htonl(plen + JUMBOOPTLEN);
139633841545SHajimu UMEMOTO 	bcopy(&v, &optbuf[4], sizeof(u_int32_t));
139782cd038dSYoshinobu Inoue 
139882cd038dSYoshinobu Inoue 	/* finally, adjust the packet header length */
139982cd038dSYoshinobu Inoue 	exthdrs->ip6e_ip6->m_pkthdr.len += JUMBOOPTLEN;
140082cd038dSYoshinobu Inoue 
140182cd038dSYoshinobu Inoue 	return (0);
140282cd038dSYoshinobu Inoue #undef JUMBOOPTLEN
140382cd038dSYoshinobu Inoue }
140482cd038dSYoshinobu Inoue 
140582cd038dSYoshinobu Inoue /*
140682cd038dSYoshinobu Inoue  * Insert fragment header and copy unfragmentable header portions.
140782cd038dSYoshinobu Inoue  */
140882cd038dSYoshinobu Inoue static int
14091272577eSXin LI ip6_insertfraghdr(struct mbuf *m0, struct mbuf *m, int hlen,
14101272577eSXin LI     struct ip6_frag **frghdrp)
141182cd038dSYoshinobu Inoue {
141282cd038dSYoshinobu Inoue 	struct mbuf *n, *mlast;
141382cd038dSYoshinobu Inoue 
141482cd038dSYoshinobu Inoue 	if (hlen > sizeof(struct ip6_hdr)) {
141582cd038dSYoshinobu Inoue 		n = m_copym(m0, sizeof(struct ip6_hdr),
1416eb1b1807SGleb Smirnoff 		    hlen - sizeof(struct ip6_hdr), M_NOWAIT);
1417155d72c4SPedro F. Giffuni 		if (n == NULL)
141882cd038dSYoshinobu Inoue 			return (ENOBUFS);
141982cd038dSYoshinobu Inoue 		m->m_next = n;
142082cd038dSYoshinobu Inoue 	} else
142182cd038dSYoshinobu Inoue 		n = m;
142282cd038dSYoshinobu Inoue 
142382cd038dSYoshinobu Inoue 	/* Search for the last mbuf of unfragmentable part. */
142482cd038dSYoshinobu Inoue 	for (mlast = n; mlast->m_next; mlast = mlast->m_next)
142582cd038dSYoshinobu Inoue 		;
142682cd038dSYoshinobu Inoue 
1427f0cace5dSRobert Watson 	if (M_WRITABLE(mlast) &&
1428686cdd19SJun-ichiro itojun Hagino 	    M_TRAILINGSPACE(mlast) >= sizeof(struct ip6_frag)) {
142982cd038dSYoshinobu Inoue 		/* use the trailing space of the last mbuf for the fragment hdr */
14307efe5d92SHajimu UMEMOTO 		*frghdrp = (struct ip6_frag *)(mtod(mlast, caddr_t) +
14317efe5d92SHajimu UMEMOTO 		    mlast->m_len);
143282cd038dSYoshinobu Inoue 		mlast->m_len += sizeof(struct ip6_frag);
143382cd038dSYoshinobu Inoue 		m->m_pkthdr.len += sizeof(struct ip6_frag);
143482cd038dSYoshinobu Inoue 	} else {
143582cd038dSYoshinobu Inoue 		/* allocate a new mbuf for the fragment header */
143682cd038dSYoshinobu Inoue 		struct mbuf *mfrg;
143782cd038dSYoshinobu Inoue 
143810e5acc3SGleb Smirnoff 		mfrg = m_get(M_NOWAIT, MT_DATA);
143910e5acc3SGleb Smirnoff 		if (mfrg == NULL)
144082cd038dSYoshinobu Inoue 			return (ENOBUFS);
144182cd038dSYoshinobu Inoue 		mfrg->m_len = sizeof(struct ip6_frag);
144282cd038dSYoshinobu Inoue 		*frghdrp = mtod(mfrg, struct ip6_frag *);
144382cd038dSYoshinobu Inoue 		mlast->m_next = mfrg;
144482cd038dSYoshinobu Inoue 	}
144582cd038dSYoshinobu Inoue 
144682cd038dSYoshinobu Inoue 	return (0);
144782cd038dSYoshinobu Inoue }
144882cd038dSYoshinobu Inoue 
14490d4df029SAlexander V. Chernikov /*
14500d4df029SAlexander V. Chernikov  * Calculates IPv6 path mtu for destination @dst.
14510d4df029SAlexander V. Chernikov  * Resulting MTU is stored in @mtup.
14520d4df029SAlexander V. Chernikov  *
14530d4df029SAlexander V. Chernikov  * Returns 0 on success.
14540d4df029SAlexander V. Chernikov  */
145531b3783cSHajimu UMEMOTO static int
1456f0937b2cSAndrey V. Elsukov ip6_getpmtu_ctl(u_int fibnum, const struct in6_addr *dst, u_long *mtup)
14570d4df029SAlexander V. Chernikov {
14581483c1c5SAlexander V. Chernikov 	struct epoch_tracker et;
14591483c1c5SAlexander V. Chernikov 	struct nhop_object *nh;
1460bacf6684SAlexander V. Chernikov 	struct in6_addr kdst;
1461bacf6684SAlexander V. Chernikov 	uint32_t scopeid;
1462bacf6684SAlexander V. Chernikov 	int error;
14630d4df029SAlexander V. Chernikov 
1464bacf6684SAlexander V. Chernikov 	in6_splitscope(dst, &kdst, &scopeid);
14650d4df029SAlexander V. Chernikov 
14661483c1c5SAlexander V. Chernikov 	NET_EPOCH_ENTER(et);
14671483c1c5SAlexander V. Chernikov 	nh = fib6_lookup(fibnum, &kdst, scopeid, NHR_NONE, 0);
14681483c1c5SAlexander V. Chernikov 	if (nh != NULL)
14691483c1c5SAlexander V. Chernikov 		error = ip6_calcmtu(nh->nh_ifp, dst, nh->nh_mtu, mtup, NULL, 0);
14701483c1c5SAlexander V. Chernikov 	else
14711483c1c5SAlexander V. Chernikov 		error = EHOSTUNREACH;
14721483c1c5SAlexander V. Chernikov 	NET_EPOCH_EXIT(et);
1473bacf6684SAlexander V. Chernikov 
1474bacf6684SAlexander V. Chernikov 	return (error);
14750d4df029SAlexander V. Chernikov }
14760d4df029SAlexander V. Chernikov 
14770d4df029SAlexander V. Chernikov /*
14780d4df029SAlexander V. Chernikov  * Calculates IPv6 path MTU for @dst based on transmit @ifp,
14790d4df029SAlexander V. Chernikov  * and cached data in @ro_pmtu.
14800d4df029SAlexander V. Chernikov  * MTU from (successful) route lookup is saved (along with dst)
14810d4df029SAlexander V. Chernikov  * inside @ro_pmtu to avoid subsequent route lookups after packet
14820d4df029SAlexander V. Chernikov  * filter processing.
14830d4df029SAlexander V. Chernikov  *
14840d4df029SAlexander V. Chernikov  * Stores mtu and always-frag value into @mtup and @alwaysfragp.
14850d4df029SAlexander V. Chernikov  * Returns 0 on success.
14860d4df029SAlexander V. Chernikov  */
14870d4df029SAlexander V. Chernikov static int
14880d4df029SAlexander V. Chernikov ip6_getpmtu(struct route_in6 *ro_pmtu, int do_lookup,
1489f0937b2cSAndrey V. Elsukov     struct ifnet *ifp, const struct in6_addr *dst, u_long *mtup,
1490d4c22202SAndrew Gallatin     int *alwaysfragp, u_int fibnum, u_int proto)
149131b3783cSHajimu UMEMOTO {
14921483c1c5SAlexander V. Chernikov 	struct nhop_object *nh;
1493bacf6684SAlexander V. Chernikov 	struct in6_addr kdst;
1494bacf6684SAlexander V. Chernikov 	uint32_t scopeid;
1495000c42faSBjoern A. Zeeb 	struct sockaddr_in6 *sa6_dst, sin6;
14960d4df029SAlexander V. Chernikov 	u_long mtu;
149731b3783cSHajimu UMEMOTO 
14981483c1c5SAlexander V. Chernikov 	NET_EPOCH_ASSERT();
14991483c1c5SAlexander V. Chernikov 
15000d4df029SAlexander V. Chernikov 	mtu = 0;
1501000c42faSBjoern A. Zeeb 	if (ro_pmtu == NULL || do_lookup) {
15020d4df029SAlexander V. Chernikov 		/*
15030d4df029SAlexander V. Chernikov 		 * Here ro_pmtu has final destination address, while
15040d4df029SAlexander V. Chernikov 		 * ro might represent immediate destination.
15050d4df029SAlexander V. Chernikov 		 * Use ro_pmtu destination since mtu might differ.
15060d4df029SAlexander V. Chernikov 		 */
1507000c42faSBjoern A. Zeeb 		if (ro_pmtu != NULL) {
15080d4df029SAlexander V. Chernikov 			sa6_dst = (struct sockaddr_in6 *)&ro_pmtu->ro_dst;
15090d4df029SAlexander V. Chernikov 			if (!IN6_ARE_ADDR_EQUAL(&sa6_dst->sin6_addr, dst))
15100d4df029SAlexander V. Chernikov 				ro_pmtu->ro_mtu = 0;
1511000c42faSBjoern A. Zeeb 		} else
1512000c42faSBjoern A. Zeeb 			sa6_dst = &sin6;
15130d4df029SAlexander V. Chernikov 
1514000c42faSBjoern A. Zeeb 		if (ro_pmtu == NULL || ro_pmtu->ro_mtu == 0) {
151531b3783cSHajimu UMEMOTO 			bzero(sa6_dst, sizeof(*sa6_dst));
151631b3783cSHajimu UMEMOTO 			sa6_dst->sin6_family = AF_INET6;
151731b3783cSHajimu UMEMOTO 			sa6_dst->sin6_len = sizeof(struct sockaddr_in6);
151831b3783cSHajimu UMEMOTO 			sa6_dst->sin6_addr = *dst;
151931b3783cSHajimu UMEMOTO 
1520bacf6684SAlexander V. Chernikov 			in6_splitscope(dst, &kdst, &scopeid);
15211483c1c5SAlexander V. Chernikov 			nh = fib6_lookup(fibnum, &kdst, scopeid, NHR_NONE, 0);
15221483c1c5SAlexander V. Chernikov 			if (nh != NULL) {
15231483c1c5SAlexander V. Chernikov 				mtu = nh->nh_mtu;
1524000c42faSBjoern A. Zeeb 				if (ro_pmtu != NULL)
1525000c42faSBjoern A. Zeeb 					ro_pmtu->ro_mtu = mtu;
15260d4df029SAlexander V. Chernikov 			}
1527000c42faSBjoern A. Zeeb 		} else
1528bacf6684SAlexander V. Chernikov 			mtu = ro_pmtu->ro_mtu;
15290d4df029SAlexander V. Chernikov 	}
15300d4df029SAlexander V. Chernikov 
1531983066f0SAlexander V. Chernikov 	if (ro_pmtu != NULL && ro_pmtu->ro_nh != NULL)
1532983066f0SAlexander V. Chernikov 		mtu = ro_pmtu->ro_nh->nh_mtu;
15330d4df029SAlexander V. Chernikov 
1534d4c22202SAndrew Gallatin 	return (ip6_calcmtu(ifp, dst, mtu, mtup, alwaysfragp, proto));
15350d4df029SAlexander V. Chernikov }
15360d4df029SAlexander V. Chernikov 
15370d4df029SAlexander V. Chernikov /*
15380d4df029SAlexander V. Chernikov  * Calculate MTU based on transmit @ifp, route mtu @rt_mtu and
15390d4df029SAlexander V. Chernikov  * hostcache data for @dst.
15400d4df029SAlexander V. Chernikov  * Stores mtu and always-frag value into @mtup and @alwaysfragp.
15410d4df029SAlexander V. Chernikov  *
15420d4df029SAlexander V. Chernikov  * Returns 0 on success.
15430d4df029SAlexander V. Chernikov  */
15440d4df029SAlexander V. Chernikov static int
15450d4df029SAlexander V. Chernikov ip6_calcmtu(struct ifnet *ifp, const struct in6_addr *dst, u_long rt_mtu,
1546d4c22202SAndrew Gallatin     u_long *mtup, int *alwaysfragp, u_int proto)
15470d4df029SAlexander V. Chernikov {
15480d4df029SAlexander V. Chernikov 	u_long mtu = 0;
15490d4df029SAlexander V. Chernikov 	int alwaysfrag = 0;
15500d4df029SAlexander V. Chernikov 	int error = 0;
15510d4df029SAlexander V. Chernikov 
15520d4df029SAlexander V. Chernikov 	if (rt_mtu > 0) {
155331b3783cSHajimu UMEMOTO 		u_int32_t ifmtu;
155497d8d152SAndre Oppermann 		struct in_conninfo inc;
155597d8d152SAndre Oppermann 
155697d8d152SAndre Oppermann 		bzero(&inc, sizeof(inc));
1557dcdb4371SBjoern A. Zeeb 		inc.inc_flags |= INC_ISIPV6;
155897d8d152SAndre Oppermann 		inc.inc6_faddr = *dst;
155931b3783cSHajimu UMEMOTO 
156031b3783cSHajimu UMEMOTO 		ifmtu = IN6_LINKMTU(ifp);
1561d4c22202SAndrew Gallatin 
1562d4c22202SAndrew Gallatin 		/* TCP is known to react to pmtu changes so skip hc */
1563d4c22202SAndrew Gallatin 		if (proto != IPPROTO_TCP)
156497d8d152SAndre Oppermann 			mtu = tcp_hc_getmtu(&inc);
1565d4c22202SAndrew Gallatin 
156697d8d152SAndre Oppermann 		if (mtu)
15670d4df029SAlexander V. Chernikov 			mtu = min(mtu, rt_mtu);
156897d8d152SAndre Oppermann 		else
15690d4df029SAlexander V. Chernikov 			mtu = rt_mtu;
157031b3783cSHajimu UMEMOTO 		if (mtu == 0)
157131b3783cSHajimu UMEMOTO 			mtu = ifmtu;
1572f95d4633SHajimu UMEMOTO 		else if (mtu < IPV6_MMTU) {
1573f95d4633SHajimu UMEMOTO 			/*
1574f95d4633SHajimu UMEMOTO 			 * RFC2460 section 5, last paragraph:
1575f95d4633SHajimu UMEMOTO 			 * if we record ICMPv6 too big message with
1576f95d4633SHajimu UMEMOTO 			 * mtu < IPV6_MMTU, transmit packets sized IPV6_MMTU
1577f95d4633SHajimu UMEMOTO 			 * or smaller, with framgent header attached.
1578f95d4633SHajimu UMEMOTO 			 * (fragment header is needed regardless from the
1579f95d4633SHajimu UMEMOTO 			 * packet size, for translators to identify packets)
1580f95d4633SHajimu UMEMOTO 			 */
1581f95d4633SHajimu UMEMOTO 			alwaysfrag = 1;
1582f95d4633SHajimu UMEMOTO 			mtu = IPV6_MMTU;
158331b3783cSHajimu UMEMOTO 		}
158431b3783cSHajimu UMEMOTO 	} else if (ifp) {
158531b3783cSHajimu UMEMOTO 		mtu = IN6_LINKMTU(ifp);
158631b3783cSHajimu UMEMOTO 	} else
158731b3783cSHajimu UMEMOTO 		error = EHOSTUNREACH; /* XXX */
158831b3783cSHajimu UMEMOTO 
158931b3783cSHajimu UMEMOTO 	*mtup = mtu;
1590f95d4633SHajimu UMEMOTO 	if (alwaysfragp)
1591f95d4633SHajimu UMEMOTO 		*alwaysfragp = alwaysfrag;
159231b3783cSHajimu UMEMOTO 	return (error);
159331b3783cSHajimu UMEMOTO }
159431b3783cSHajimu UMEMOTO 
159582cd038dSYoshinobu Inoue /*
159682cd038dSYoshinobu Inoue  * IP6 socket option processing.
159782cd038dSYoshinobu Inoue  */
159882cd038dSYoshinobu Inoue int
15991272577eSXin LI ip6_ctloutput(struct socket *so, struct sockopt *sopt)
160082cd038dSYoshinobu Inoue {
160179ba3952SBjoern A. Zeeb 	int optdatalen, uproto;
1602f95d4633SHajimu UMEMOTO 	void *optdata;
16030ecd976eSBjoern A. Zeeb 	struct inpcb *inp = sotoinpcb(so);
160482cd038dSYoshinobu Inoue 	int error, optval;
160582cd038dSYoshinobu Inoue 	int level, op, optname;
160682cd038dSYoshinobu Inoue 	int optlen;
1607b40ce416SJulian Elischer 	struct thread *td;
1608c7c0d948SAdrian Chadd #ifdef	RSS
1609c7c0d948SAdrian Chadd 	uint32_t rss_bucket;
1610c7c0d948SAdrian Chadd 	int retval;
1611c7c0d948SAdrian Chadd #endif
161282cd038dSYoshinobu Inoue 
1613aec9c8d5SGeorge V. Neville-Neil /*
1614aec9c8d5SGeorge V. Neville-Neil  * Don't use more than a quarter of mbuf clusters.  N.B.:
1615aec9c8d5SGeorge V. Neville-Neil  * nmbclusters is an int, but nmbclusters * MCLBYTES may overflow
1616aec9c8d5SGeorge V. Neville-Neil  * on LP64 architectures, so cast to u_long to avoid undefined
1617aec9c8d5SGeorge V. Neville-Neil  * behavior.  ILP32 architectures cannot have nmbclusters
1618aec9c8d5SGeorge V. Neville-Neil  * large enough to overflow for other reasons.
1619aec9c8d5SGeorge V. Neville-Neil  */
1620aec9c8d5SGeorge V. Neville-Neil #define IPV6_PKTOPTIONS_MBUF_LIMIT	((u_long)nmbclusters * MCLBYTES / 4)
1621aec9c8d5SGeorge V. Neville-Neil 
162282cd038dSYoshinobu Inoue 	level = sopt->sopt_level;
162382cd038dSYoshinobu Inoue 	op = sopt->sopt_dir;
162482cd038dSYoshinobu Inoue 	optname = sopt->sopt_name;
162582cd038dSYoshinobu Inoue 	optlen = sopt->sopt_valsize;
1626b40ce416SJulian Elischer 	td = sopt->sopt_td;
1627cc29ac7dSRobert Watson 	error = 0;
1628cc29ac7dSRobert Watson 	optval = 0;
1629f95d4633SHajimu UMEMOTO 	uproto = (int)so->so_proto->pr_protocol;
163082cd038dSYoshinobu Inoue 
1631fc06cd42SMikolaj Golub 	if (level != IPPROTO_IPV6) {
1632fc06cd42SMikolaj Golub 		error = EINVAL;
1633fc06cd42SMikolaj Golub 
1634fc06cd42SMikolaj Golub 		if (sopt->sopt_level == SOL_SOCKET &&
1635fc06cd42SMikolaj Golub 		    sopt->sopt_dir == SOPT_SET) {
1636fc06cd42SMikolaj Golub 			switch (sopt->sopt_name) {
1637fc06cd42SMikolaj Golub 			case SO_REUSEADDR:
16380ecd976eSBjoern A. Zeeb 				INP_WLOCK(inp);
1639efdf104bSMikolaj Golub 				if ((so->so_options & SO_REUSEADDR) != 0)
16400ecd976eSBjoern A. Zeeb 					inp->inp_flags2 |= INP_REUSEADDR;
1641fc06cd42SMikolaj Golub 				else
16420ecd976eSBjoern A. Zeeb 					inp->inp_flags2 &= ~INP_REUSEADDR;
16430ecd976eSBjoern A. Zeeb 				INP_WUNLOCK(inp);
1644fc06cd42SMikolaj Golub 				error = 0;
1645fc06cd42SMikolaj Golub 				break;
1646fc06cd42SMikolaj Golub 			case SO_REUSEPORT:
16470ecd976eSBjoern A. Zeeb 				INP_WLOCK(inp);
1648fc06cd42SMikolaj Golub 				if ((so->so_options & SO_REUSEPORT) != 0)
16490ecd976eSBjoern A. Zeeb 					inp->inp_flags2 |= INP_REUSEPORT;
1650fc06cd42SMikolaj Golub 				else
16510ecd976eSBjoern A. Zeeb 					inp->inp_flags2 &= ~INP_REUSEPORT;
16520ecd976eSBjoern A. Zeeb 				INP_WUNLOCK(inp);
1653fc06cd42SMikolaj Golub 				error = 0;
1654fc06cd42SMikolaj Golub 				break;
16551a43cff9SSean Bruno 			case SO_REUSEPORT_LB:
16560ecd976eSBjoern A. Zeeb 				INP_WLOCK(inp);
16571a43cff9SSean Bruno 				if ((so->so_options & SO_REUSEPORT_LB) != 0)
16580ecd976eSBjoern A. Zeeb 					inp->inp_flags2 |= INP_REUSEPORT_LB;
16591a43cff9SSean Bruno 				else
16600ecd976eSBjoern A. Zeeb 					inp->inp_flags2 &= ~INP_REUSEPORT_LB;
16610ecd976eSBjoern A. Zeeb 				INP_WUNLOCK(inp);
16621a43cff9SSean Bruno 				error = 0;
16631a43cff9SSean Bruno 				break;
1664ee799639SBjoern A. Zeeb 			case SO_SETFIB:
16650ecd976eSBjoern A. Zeeb 				INP_WLOCK(inp);
16660ecd976eSBjoern A. Zeeb 				inp->inp_inc.inc_fibnum = so->so_fibnum;
16670ecd976eSBjoern A. Zeeb 				INP_WUNLOCK(inp);
1668ee799639SBjoern A. Zeeb 				error = 0;
1669ee799639SBjoern A. Zeeb 				break;
1670f3e7afe2SHans Petter Selasky 			case SO_MAX_PACING_RATE:
1671f3e7afe2SHans Petter Selasky #ifdef RATELIMIT
16720ecd976eSBjoern A. Zeeb 				INP_WLOCK(inp);
16730ecd976eSBjoern A. Zeeb 				inp->inp_flags2 |= INP_RATE_LIMIT_CHANGED;
16740ecd976eSBjoern A. Zeeb 				INP_WUNLOCK(inp);
1675f3e7afe2SHans Petter Selasky 				error = 0;
1676f3e7afe2SHans Petter Selasky #else
1677f3e7afe2SHans Petter Selasky 				error = EOPNOTSUPP;
1678f3e7afe2SHans Petter Selasky #endif
1679f3e7afe2SHans Petter Selasky 				break;
1680fc06cd42SMikolaj Golub 			default:
1681fc06cd42SMikolaj Golub 				break;
1682fc06cd42SMikolaj Golub 			}
1683fc06cd42SMikolaj Golub 		}
1684fc06cd42SMikolaj Golub 	} else {		/* level == IPPROTO_IPV6 */
168582cd038dSYoshinobu Inoue 		switch (op) {
168682cd038dSYoshinobu Inoue 		case SOPT_SET:
168782cd038dSYoshinobu Inoue 			switch (optname) {
1688f95d4633SHajimu UMEMOTO 			case IPV6_2292PKTOPTIONS:
1689f95d4633SHajimu UMEMOTO #ifdef IPV6_PKTOPTIONS
169082cd038dSYoshinobu Inoue 			case IPV6_PKTOPTIONS:
1691f95d4633SHajimu UMEMOTO #endif
169282cd038dSYoshinobu Inoue 			{
169382cd038dSYoshinobu Inoue 				struct mbuf *m;
169482cd038dSYoshinobu Inoue 
1695aec9c8d5SGeorge V. Neville-Neil 				if (optlen > IPV6_PKTOPTIONS_MBUF_LIMIT) {
1696aec9c8d5SGeorge V. Neville-Neil 					printf("ip6_ctloutput: mbuf limit hit\n");
1697aec9c8d5SGeorge V. Neville-Neil 					error = ENOBUFS;
1698aec9c8d5SGeorge V. Neville-Neil 					break;
1699aec9c8d5SGeorge V. Neville-Neil 				}
1700aec9c8d5SGeorge V. Neville-Neil 
170182cd038dSYoshinobu Inoue 				error = soopt_getm(sopt, &m); /* XXX */
1702a89ec05eSPeter Wemm 				if (error != 0)
170382cd038dSYoshinobu Inoue 					break;
170482cd038dSYoshinobu Inoue 				error = soopt_mcopyin(sopt, m); /* XXX */
1705a89ec05eSPeter Wemm 				if (error != 0)
170682cd038dSYoshinobu Inoue 					break;
1707e02582d1SMark Johnston 				INP_WLOCK(inp);
1708e02582d1SMark Johnston 				error = ip6_pcbopts(&inp->in6p_outputopts, m,
1709e02582d1SMark Johnston 				    so, sopt);
1710e02582d1SMark Johnston 				INP_WUNLOCK(inp);
171133841545SHajimu UMEMOTO 				m_freem(m); /* XXX */
171282cd038dSYoshinobu Inoue 				break;
171382cd038dSYoshinobu Inoue 			}
171433841545SHajimu UMEMOTO 
171533841545SHajimu UMEMOTO 			/*
171633841545SHajimu UMEMOTO 			 * Use of some Hop-by-Hop options or some
171733841545SHajimu UMEMOTO 			 * Destination options, might require special
171833841545SHajimu UMEMOTO 			 * privilege.  That is, normal applications
171933841545SHajimu UMEMOTO 			 * (without special privilege) might be forbidden
172033841545SHajimu UMEMOTO 			 * from setting certain options in outgoing packets,
172133841545SHajimu UMEMOTO 			 * and might never see certain options in received
172233841545SHajimu UMEMOTO 			 * packets. [RFC 2292 Section 6]
172333841545SHajimu UMEMOTO 			 * KAME specific note:
172433841545SHajimu UMEMOTO 			 *  KAME prevents non-privileged users from sending or
172533841545SHajimu UMEMOTO 			 *  receiving ANY hbh/dst options in order to avoid
172633841545SHajimu UMEMOTO 			 *  overhead of parsing options in the kernel.
172733841545SHajimu UMEMOTO 			 */
1728f95d4633SHajimu UMEMOTO 			case IPV6_RECVHOPOPTS:
1729f95d4633SHajimu UMEMOTO 			case IPV6_RECVDSTOPTS:
1730f95d4633SHajimu UMEMOTO 			case IPV6_RECVRTHDRDSTOPTS:
173179ba3952SBjoern A. Zeeb 				if (td != NULL) {
173279ba3952SBjoern A. Zeeb 					error = priv_check(td,
173379ba3952SBjoern A. Zeeb 					    PRIV_NETINET_SETHDROPTS);
173479ba3952SBjoern A. Zeeb 					if (error)
1735f95d4633SHajimu UMEMOTO 						break;
1736f95d4633SHajimu UMEMOTO 				}
1737f95d4633SHajimu UMEMOTO 				/* FALLTHROUGH */
173882cd038dSYoshinobu Inoue 			case IPV6_UNICAST_HOPS:
1739f95d4633SHajimu UMEMOTO 			case IPV6_HOPLIMIT:
174033841545SHajimu UMEMOTO 
1741f95d4633SHajimu UMEMOTO 			case IPV6_RECVPKTINFO:
1742f95d4633SHajimu UMEMOTO 			case IPV6_RECVHOPLIMIT:
1743f95d4633SHajimu UMEMOTO 			case IPV6_RECVRTHDR:
1744f95d4633SHajimu UMEMOTO 			case IPV6_RECVPATHMTU:
1745f95d4633SHajimu UMEMOTO 			case IPV6_RECVTCLASS:
174668bb8d62SAdrian Chadd 			case IPV6_RECVFLOWID:
174768bb8d62SAdrian Chadd #ifdef	RSS
174868bb8d62SAdrian Chadd 			case IPV6_RECVRSSBUCKETID:
174968bb8d62SAdrian Chadd #endif
175033841545SHajimu UMEMOTO 			case IPV6_V6ONLY:
1751f95d4633SHajimu UMEMOTO 			case IPV6_AUTOFLOWLABEL:
1752dce33a45SErmal Luçi 			case IPV6_ORIGDSTADDR:
1753f44270e7SPawel Jakub Dawidek 			case IPV6_BINDANY:
1754c7c0d948SAdrian Chadd 			case IPV6_BINDMULTI:
1755c7c0d948SAdrian Chadd #ifdef	RSS
1756c7c0d948SAdrian Chadd 			case IPV6_RSS_LISTEN_BUCKET:
1757c7c0d948SAdrian Chadd #endif
1758868aabb4SRichard Scheffenegger 			case IPV6_VLAN_PCP:
1759f44270e7SPawel Jakub Dawidek 				if (optname == IPV6_BINDANY && td != NULL) {
1760f44270e7SPawel Jakub Dawidek 					error = priv_check(td,
1761f44270e7SPawel Jakub Dawidek 					    PRIV_NETINET_BINDANY);
1762f44270e7SPawel Jakub Dawidek 					if (error)
1763f44270e7SPawel Jakub Dawidek 						break;
1764f44270e7SPawel Jakub Dawidek 				}
1765f44270e7SPawel Jakub Dawidek 
176633841545SHajimu UMEMOTO 				if (optlen != sizeof(int)) {
176782cd038dSYoshinobu Inoue 					error = EINVAL;
176833841545SHajimu UMEMOTO 					break;
176933841545SHajimu UMEMOTO 				}
177082cd038dSYoshinobu Inoue 				error = sooptcopyin(sopt, &optval,
177182cd038dSYoshinobu Inoue 					sizeof optval, sizeof optval);
177282cd038dSYoshinobu Inoue 				if (error)
177382cd038dSYoshinobu Inoue 					break;
177482cd038dSYoshinobu Inoue 				switch (optname) {
177582cd038dSYoshinobu Inoue 				case IPV6_UNICAST_HOPS:
177682cd038dSYoshinobu Inoue 					if (optval < -1 || optval >= 256)
177782cd038dSYoshinobu Inoue 						error = EINVAL;
177882cd038dSYoshinobu Inoue 					else {
177982cd038dSYoshinobu Inoue 						/* -1 = kernel default */
17800ecd976eSBjoern A. Zeeb 						inp->in6p_hops = optval;
17810ecd976eSBjoern A. Zeeb 						if ((inp->inp_vflag &
178282cd038dSYoshinobu Inoue 						     INP_IPV4) != 0)
17830ecd976eSBjoern A. Zeeb 							inp->inp_ip_ttl = optval;
178482cd038dSYoshinobu Inoue 					}
178582cd038dSYoshinobu Inoue 					break;
/*
 * OPTSET(bit): between INP_WLOCK(inp) and INP_WUNLOCK(inp), set 'bit' in
 * inp->inp_flags when 'optval' is non-zero and clear it otherwise.
 * Expands to a single statement; 'inp' and 'optval' are taken from the
 * scope of the expansion site rather than passed as arguments.
 */
178682cd038dSYoshinobu Inoue #define OPTSET(bit) \
178733841545SHajimu UMEMOTO do { \
17880ecd976eSBjoern A. Zeeb 	INP_WLOCK(inp); \
178982cd038dSYoshinobu Inoue 	if (optval) \
17900ecd976eSBjoern A. Zeeb 		inp->inp_flags |= (bit); \
179182cd038dSYoshinobu Inoue 	else \
17920ecd976eSBjoern A. Zeeb 		inp->inp_flags &= ~(bit); \
17930ecd976eSBjoern A. Zeeb 	INP_WUNLOCK(inp); \
17947efe5d92SHajimu UMEMOTO } while (/*CONSTCOND*/ 0)
/*
 * OPTSET2292(bit): like OPTSET(), but additionally sets IN6P_RFC2292 in
 * inp->inp_flags unconditionally before setting (optval != 0) or clearing
 * (optval == 0) 'bit'.  All three flag updates happen inside one
 * INP_WLOCK(inp)/INP_WUNLOCK(inp) section.
 */
1795f95d4633SHajimu UMEMOTO #define OPTSET2292(bit) \
1796f95d4633SHajimu UMEMOTO do { \
17970ecd976eSBjoern A. Zeeb 	INP_WLOCK(inp); \
17980ecd976eSBjoern A. Zeeb 	inp->inp_flags |= IN6P_RFC2292; \
1799f95d4633SHajimu UMEMOTO 	if (optval) \
18000ecd976eSBjoern A. Zeeb 		inp->inp_flags |= (bit); \
1801f95d4633SHajimu UMEMOTO 	else \
18020ecd976eSBjoern A. Zeeb 		inp->inp_flags &= ~(bit); \
18030ecd976eSBjoern A. Zeeb 	INP_WUNLOCK(inp); \
1804f95d4633SHajimu UMEMOTO } while (/*CONSTCOND*/ 0)
/*
 * OPTBIT(bit): evaluates to 1 if any bit of 'bit' is set in
 * inp->inp_flags, else 0.  The macro itself takes no lock.
 */
18050ecd976eSBjoern A. Zeeb #define OPTBIT(bit) (inp->inp_flags & (bit) ? 1 : 0)
180682cd038dSYoshinobu Inoue 
/*
 * OPTSET2_N(bit, val): set 'bit' in inp->inp_flags2 when 'val' is non-zero,
 * clear it otherwise.  This variant does no locking of its own; it is meant
 * to be expanded inside an INP_WLOCK(inp)/INP_WUNLOCK(inp) section that the
 * caller already holds.  'inp' is taken from the expansion site.
 *
 * 'bit' is parenthesized so that a compound argument such as (A | B) is
 * complemented as a whole when clearing, instead of only its first operand.
 */
#define OPTSET2_N(bit, val) do {					\
	if (val)							\
		inp->inp_flags2 |= (bit);				\
	else								\
		inp->inp_flags2 &= ~(bit);				\
} while (0)
/*
 * OPTSET2(bit, val): locked wrapper around OPTSET2_N().  Takes
 * INP_WLOCK(inp), applies OPTSET2_N(bit, val) to inp->inp_flags2, then
 * drops the lock with INP_WUNLOCK(inp).
 */
181337d4fc1eSSean Bruno #define OPTSET2(bit, val) do {						\
18140ecd976eSBjoern A. Zeeb 	INP_WLOCK(inp);							\
181537d4fc1eSSean Bruno 	OPTSET2_N(bit, val);						\
18160ecd976eSBjoern A. Zeeb 	INP_WUNLOCK(inp);						\
1817c7c0d948SAdrian Chadd } while (0)
/*
 * OPTBIT2(bit): evaluates to 1 if any bit of 'bit' is set in
 * inp->inp_flags2, else 0.  The macro itself takes no lock.
 */
18180ecd976eSBjoern A. Zeeb #define OPTBIT2(bit) (inp->inp_flags2 & (bit) ? 1 : 0)
/*
 * OPTSET2292_EXCLUSIVE(bit): under INP_WLOCK(inp), refuse the update with
 * error = EINVAL if IN6P_RFC2292 is already set in inp->inp_flags (tested
 * via OPTBIT()); otherwise set 'bit' in inp->inp_flags when 'optval' is
 * non-zero and clear it when it is zero.  The lock is released on both
 * paths.  'inp', 'optval' and 'error' come from the expansion site.
 */
181937d4fc1eSSean Bruno #define OPTSET2292_EXCLUSIVE(bit)					\
182037d4fc1eSSean Bruno do {									\
18210ecd976eSBjoern A. Zeeb 	INP_WLOCK(inp);							\
182237d4fc1eSSean Bruno 	if (OPTBIT(IN6P_RFC2292)) {					\
182337d4fc1eSSean Bruno 		error = EINVAL;						\
182437d4fc1eSSean Bruno 	} else {							\
182537d4fc1eSSean Bruno 		if (optval)						\
18260ecd976eSBjoern A. Zeeb 			inp->inp_flags |= (bit);			\
182737d4fc1eSSean Bruno 		else							\
18280ecd976eSBjoern A. Zeeb 			inp->inp_flags &= ~(bit);			\
182937d4fc1eSSean Bruno 	}								\
18300ecd976eSBjoern A. Zeeb 	INP_WUNLOCK(inp);						\
183137d4fc1eSSean Bruno } while (/*CONSTCOND*/ 0)
1832c7c0d948SAdrian Chadd 
1833f95d4633SHajimu UMEMOTO 				case IPV6_RECVPKTINFO:
183437d4fc1eSSean Bruno 					OPTSET2292_EXCLUSIVE(IN6P_PKTINFO);
1835f95d4633SHajimu UMEMOTO 					break;
1836f95d4633SHajimu UMEMOTO 
1837f95d4633SHajimu UMEMOTO 				case IPV6_HOPLIMIT:
1838f95d4633SHajimu UMEMOTO 				{
1839f95d4633SHajimu UMEMOTO 					struct ip6_pktopts **optp;
1840f95d4633SHajimu UMEMOTO 
1841f95d4633SHajimu UMEMOTO 					/* cannot mix with RFC2292 */
1842f95d4633SHajimu UMEMOTO 					if (OPTBIT(IN6P_RFC2292)) {
1843f95d4633SHajimu UMEMOTO 						error = EINVAL;
1844f95d4633SHajimu UMEMOTO 						break;
1845f95d4633SHajimu UMEMOTO 					}
18460ecd976eSBjoern A. Zeeb 					INP_WLOCK(inp);
1847*53af6903SGleb Smirnoff 					if (inp->inp_flags & INP_DROPPED) {
18480ecd976eSBjoern A. Zeeb 						INP_WUNLOCK(inp);
184956713d16SMatt Macy 						return (ECONNRESET);
185056713d16SMatt Macy 					}
18510ecd976eSBjoern A. Zeeb 					optp = &inp->in6p_outputopts;
1852f95d4633SHajimu UMEMOTO 					error = ip6_pcbopt(IPV6_HOPLIMIT,
185379ba3952SBjoern A. Zeeb 					    (u_char *)&optval, sizeof(optval),
185479ba3952SBjoern A. Zeeb 					    optp, (td != NULL) ? td->td_ucred :
185579ba3952SBjoern A. Zeeb 					    NULL, uproto);
18560ecd976eSBjoern A. Zeeb 					INP_WUNLOCK(inp);
1857f95d4633SHajimu UMEMOTO 					break;
1858f95d4633SHajimu UMEMOTO 				}
1859f95d4633SHajimu UMEMOTO 
1860f95d4633SHajimu UMEMOTO 				case IPV6_RECVHOPLIMIT:
186137d4fc1eSSean Bruno 					OPTSET2292_EXCLUSIVE(IN6P_HOPLIMIT);
1862f95d4633SHajimu UMEMOTO 					break;
1863f95d4633SHajimu UMEMOTO 
1864f95d4633SHajimu UMEMOTO 				case IPV6_RECVHOPOPTS:
186537d4fc1eSSean Bruno 					OPTSET2292_EXCLUSIVE(IN6P_HOPOPTS);
1866f95d4633SHajimu UMEMOTO 					break;
1867f95d4633SHajimu UMEMOTO 
1868f95d4633SHajimu UMEMOTO 				case IPV6_RECVDSTOPTS:
186937d4fc1eSSean Bruno 					OPTSET2292_EXCLUSIVE(IN6P_DSTOPTS);
1870f95d4633SHajimu UMEMOTO 					break;
1871f95d4633SHajimu UMEMOTO 
1872f95d4633SHajimu UMEMOTO 				case IPV6_RECVRTHDRDSTOPTS:
187337d4fc1eSSean Bruno 					OPTSET2292_EXCLUSIVE(IN6P_RTHDRDSTOPTS);
1874f95d4633SHajimu UMEMOTO 					break;
1875f95d4633SHajimu UMEMOTO 
1876f95d4633SHajimu UMEMOTO 				case IPV6_RECVRTHDR:
187737d4fc1eSSean Bruno 					OPTSET2292_EXCLUSIVE(IN6P_RTHDR);
187882cd038dSYoshinobu Inoue 					break;
187982cd038dSYoshinobu Inoue 
1880f95d4633SHajimu UMEMOTO 				case IPV6_RECVPATHMTU:
1881f95d4633SHajimu UMEMOTO 					/*
1882f95d4633SHajimu UMEMOTO 					 * We ignore this option for TCP
1883f95d4633SHajimu UMEMOTO 					 * sockets.
188418b35df8SHajimu UMEMOTO 					 * (RFC3542 leaves this case
1885f95d4633SHajimu UMEMOTO 					 * unspecified.)
1886f95d4633SHajimu UMEMOTO 					 */
1887f95d4633SHajimu UMEMOTO 					if (uproto != IPPROTO_TCP)
1888f95d4633SHajimu UMEMOTO 						OPTSET(IN6P_MTU);
1889f95d4633SHajimu UMEMOTO 					break;
1890f95d4633SHajimu UMEMOTO 
189168bb8d62SAdrian Chadd 				case IPV6_RECVFLOWID:
189268bb8d62SAdrian Chadd 					OPTSET2(INP_RECVFLOWID, optval);
189368bb8d62SAdrian Chadd 					break;
189468bb8d62SAdrian Chadd 
189568bb8d62SAdrian Chadd #ifdef	RSS
189668bb8d62SAdrian Chadd 				case IPV6_RECVRSSBUCKETID:
189768bb8d62SAdrian Chadd 					OPTSET2(INP_RECVRSSBUCKETID, optval);
189868bb8d62SAdrian Chadd 					break;
189968bb8d62SAdrian Chadd #endif
190068bb8d62SAdrian Chadd 
190133841545SHajimu UMEMOTO 				case IPV6_V6ONLY:
1902cb49ec54SMark Johnston 					INP_WLOCK(inp);
19030ecd976eSBjoern A. Zeeb 					if (inp->inp_lport ||
19040ecd976eSBjoern A. Zeeb 					    !IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr)) {
1905cb49ec54SMark Johnston 						/*
1906cb49ec54SMark Johnston 						 * The socket is already bound.
1907cb49ec54SMark Johnston 						 */
1908cb49ec54SMark Johnston 						INP_WUNLOCK(inp);
19090554093bSHajimu UMEMOTO 						error = EINVAL;
19100554093bSHajimu UMEMOTO 						break;
19110554093bSHajimu UMEMOTO 					}
1912cb49ec54SMark Johnston 					if (optval) {
1913cb49ec54SMark Johnston 						inp->inp_flags |= IN6P_IPV6_V6ONLY;
19140ecd976eSBjoern A. Zeeb 						inp->inp_vflag &= ~INP_IPV4;
1915cb49ec54SMark Johnston 					} else {
1916cb49ec54SMark Johnston 						inp->inp_flags &= ~IN6P_IPV6_V6ONLY;
19170ecd976eSBjoern A. Zeeb 						inp->inp_vflag |= INP_IPV4;
1918cb49ec54SMark Johnston 					}
1919cb49ec54SMark Johnston 					INP_WUNLOCK(inp);
192082cd038dSYoshinobu Inoue 					break;
1921f95d4633SHajimu UMEMOTO 				case IPV6_RECVTCLASS:
1922f95d4633SHajimu UMEMOTO 					/* cannot mix with RFC2292 XXX */
192337d4fc1eSSean Bruno 					OPTSET2292_EXCLUSIVE(IN6P_TCLASS);
1924f95d4633SHajimu UMEMOTO 					break;
1925f95d4633SHajimu UMEMOTO 				case IPV6_AUTOFLOWLABEL:
1926f95d4633SHajimu UMEMOTO 					OPTSET(IN6P_AUTOFLOWLABEL);
1927f95d4633SHajimu UMEMOTO 					break;
1928f95d4633SHajimu UMEMOTO 
1929dce33a45SErmal Luçi 				case IPV6_ORIGDSTADDR:
1930dce33a45SErmal Luçi 					OPTSET2(INP_ORIGDSTADDR, optval);
1931dce33a45SErmal Luçi 					break;
1932f44270e7SPawel Jakub Dawidek 				case IPV6_BINDANY:
1933f44270e7SPawel Jakub Dawidek 					OPTSET(INP_BINDANY);
1934f44270e7SPawel Jakub Dawidek 					break;
1935c7c0d948SAdrian Chadd 
1936c7c0d948SAdrian Chadd 				case IPV6_BINDMULTI:
1937c7c0d948SAdrian Chadd 					OPTSET2(INP_BINDMULTI, optval);
1938c7c0d948SAdrian Chadd 					break;
1939c7c0d948SAdrian Chadd #ifdef	RSS
1940c7c0d948SAdrian Chadd 				case IPV6_RSS_LISTEN_BUCKET:
1941c7c0d948SAdrian Chadd 					if ((optval >= 0) &&
1942c7c0d948SAdrian Chadd 					    (optval < rss_getnumbuckets())) {
19430ecd976eSBjoern A. Zeeb 						INP_WLOCK(inp);
19440ecd976eSBjoern A. Zeeb 						inp->inp_rss_listen_bucket = optval;
194537d4fc1eSSean Bruno 						OPTSET2_N(INP_RSS_BUCKET_SET, 1);
19460ecd976eSBjoern A. Zeeb 						INP_WUNLOCK(inp);
1947c7c0d948SAdrian Chadd 					} else {
1948c7c0d948SAdrian Chadd 						error = EINVAL;
1949c7c0d948SAdrian Chadd 					}
1950c7c0d948SAdrian Chadd 					break;
1951c7c0d948SAdrian Chadd #endif
1952868aabb4SRichard Scheffenegger 				case IPV6_VLAN_PCP:
1953868aabb4SRichard Scheffenegger 					if ((optval >= -1) && (optval <=
1954868aabb4SRichard Scheffenegger 					    (INP_2PCP_MASK >> INP_2PCP_SHIFT))) {
1955868aabb4SRichard Scheffenegger 						if (optval == -1) {
1956868aabb4SRichard Scheffenegger 							INP_WLOCK(inp);
1957868aabb4SRichard Scheffenegger 							inp->inp_flags2 &=
1958868aabb4SRichard Scheffenegger 							    ~(INP_2PCP_SET |
1959868aabb4SRichard Scheffenegger 							    INP_2PCP_MASK);
1960868aabb4SRichard Scheffenegger 							INP_WUNLOCK(inp);
1961868aabb4SRichard Scheffenegger 						} else {
1962868aabb4SRichard Scheffenegger 							INP_WLOCK(inp);
1963868aabb4SRichard Scheffenegger 							inp->inp_flags2 |=
1964868aabb4SRichard Scheffenegger 							    INP_2PCP_SET;
1965868aabb4SRichard Scheffenegger 							inp->inp_flags2 &=
1966868aabb4SRichard Scheffenegger 							    ~INP_2PCP_MASK;
1967868aabb4SRichard Scheffenegger 							inp->inp_flags2 |=
1968868aabb4SRichard Scheffenegger 							    optval <<
1969868aabb4SRichard Scheffenegger 							    INP_2PCP_SHIFT;
1970868aabb4SRichard Scheffenegger 							INP_WUNLOCK(inp);
1971868aabb4SRichard Scheffenegger 						}
1972868aabb4SRichard Scheffenegger 					} else
1973868aabb4SRichard Scheffenegger 						error = EINVAL;
1974868aabb4SRichard Scheffenegger 					break;
197582cd038dSYoshinobu Inoue 				}
197633841545SHajimu UMEMOTO 				break;
197733841545SHajimu UMEMOTO 
1978f95d4633SHajimu UMEMOTO 			case IPV6_TCLASS:
1979f95d4633SHajimu UMEMOTO 			case IPV6_DONTFRAG:
1980f95d4633SHajimu UMEMOTO 			case IPV6_USE_MIN_MTU:
1981f95d4633SHajimu UMEMOTO 			case IPV6_PREFER_TEMPADDR:
1982f95d4633SHajimu UMEMOTO 				if (optlen != sizeof(optval)) {
1983f95d4633SHajimu UMEMOTO 					error = EINVAL;
1984f95d4633SHajimu UMEMOTO 					break;
1985f95d4633SHajimu UMEMOTO 				}
1986f95d4633SHajimu UMEMOTO 				error = sooptcopyin(sopt, &optval,
1987f95d4633SHajimu UMEMOTO 					sizeof optval, sizeof optval);
1988f95d4633SHajimu UMEMOTO 				if (error)
1989f95d4633SHajimu UMEMOTO 					break;
1990f95d4633SHajimu UMEMOTO 				{
1991f95d4633SHajimu UMEMOTO 					struct ip6_pktopts **optp;
19920ecd976eSBjoern A. Zeeb 					INP_WLOCK(inp);
1993*53af6903SGleb Smirnoff 					if (inp->inp_flags & INP_DROPPED) {
19940ecd976eSBjoern A. Zeeb 						INP_WUNLOCK(inp);
199556713d16SMatt Macy 						return (ECONNRESET);
199656713d16SMatt Macy 					}
19970ecd976eSBjoern A. Zeeb 					optp = &inp->in6p_outputopts;
1998f95d4633SHajimu UMEMOTO 					error = ip6_pcbopt(optname,
199979ba3952SBjoern A. Zeeb 					    (u_char *)&optval, sizeof(optval),
200079ba3952SBjoern A. Zeeb 					    optp, (td != NULL) ? td->td_ucred :
200179ba3952SBjoern A. Zeeb 					    NULL, uproto);
20020ecd976eSBjoern A. Zeeb 					INP_WUNLOCK(inp);
2003f95d4633SHajimu UMEMOTO 					break;
2004f95d4633SHajimu UMEMOTO 				}
2005f95d4633SHajimu UMEMOTO 
2006f95d4633SHajimu UMEMOTO 			case IPV6_2292PKTINFO:
2007f95d4633SHajimu UMEMOTO 			case IPV6_2292HOPLIMIT:
2008f95d4633SHajimu UMEMOTO 			case IPV6_2292HOPOPTS:
2009f95d4633SHajimu UMEMOTO 			case IPV6_2292DSTOPTS:
2010f95d4633SHajimu UMEMOTO 			case IPV6_2292RTHDR:
201133841545SHajimu UMEMOTO 				/* RFC 2292 */
201233841545SHajimu UMEMOTO 				if (optlen != sizeof(int)) {
201333841545SHajimu UMEMOTO 					error = EINVAL;
201433841545SHajimu UMEMOTO 					break;
201533841545SHajimu UMEMOTO 				}
201633841545SHajimu UMEMOTO 				error = sooptcopyin(sopt, &optval,
201733841545SHajimu UMEMOTO 					sizeof optval, sizeof optval);
201833841545SHajimu UMEMOTO 				if (error)
201933841545SHajimu UMEMOTO 					break;
202033841545SHajimu UMEMOTO 				switch (optname) {
2021f95d4633SHajimu UMEMOTO 				case IPV6_2292PKTINFO:
2022f95d4633SHajimu UMEMOTO 					OPTSET2292(IN6P_PKTINFO);
202333841545SHajimu UMEMOTO 					break;
2024f95d4633SHajimu UMEMOTO 				case IPV6_2292HOPLIMIT:
2025f95d4633SHajimu UMEMOTO 					OPTSET2292(IN6P_HOPLIMIT);
202633841545SHajimu UMEMOTO 					break;
2027f95d4633SHajimu UMEMOTO 				case IPV6_2292HOPOPTS:
202833841545SHajimu UMEMOTO 					/*
202933841545SHajimu UMEMOTO 					 * Check super-user privilege.
203033841545SHajimu UMEMOTO 					 * See comments for IPV6_RECVHOPOPTS.
203133841545SHajimu UMEMOTO 					 */
203279ba3952SBjoern A. Zeeb 					if (td != NULL) {
203379ba3952SBjoern A. Zeeb 						error = priv_check(td,
203479ba3952SBjoern A. Zeeb 						    PRIV_NETINET_SETHDROPTS);
203579ba3952SBjoern A. Zeeb 						if (error)
203679ba3952SBjoern A. Zeeb 							return (error);
203779ba3952SBjoern A. Zeeb 					}
2038f95d4633SHajimu UMEMOTO 					OPTSET2292(IN6P_HOPOPTS);
203933841545SHajimu UMEMOTO 					break;
2040f95d4633SHajimu UMEMOTO 				case IPV6_2292DSTOPTS:
204179ba3952SBjoern A. Zeeb 					if (td != NULL) {
204279ba3952SBjoern A. Zeeb 						error = priv_check(td,
204379ba3952SBjoern A. Zeeb 						    PRIV_NETINET_SETHDROPTS);
204479ba3952SBjoern A. Zeeb 						if (error)
204579ba3952SBjoern A. Zeeb 							return (error);
204679ba3952SBjoern A. Zeeb 					}
2047f95d4633SHajimu UMEMOTO 					OPTSET2292(IN6P_DSTOPTS|IN6P_RTHDRDSTOPTS); /* XXX */
204833841545SHajimu UMEMOTO 					break;
2049f95d4633SHajimu UMEMOTO 				case IPV6_2292RTHDR:
2050f95d4633SHajimu UMEMOTO 					OPTSET2292(IN6P_RTHDR);
205133841545SHajimu UMEMOTO 					break;
205282cd038dSYoshinobu Inoue 				}
205382cd038dSYoshinobu Inoue 				break;
2054f95d4633SHajimu UMEMOTO 			case IPV6_PKTINFO:
2055f95d4633SHajimu UMEMOTO 			case IPV6_HOPOPTS:
2056f95d4633SHajimu UMEMOTO 			case IPV6_RTHDR:
2057f95d4633SHajimu UMEMOTO 			case IPV6_DSTOPTS:
2058f95d4633SHajimu UMEMOTO 			case IPV6_RTHDRDSTOPTS:
2059f95d4633SHajimu UMEMOTO 			case IPV6_NEXTHOP:
2060f95d4633SHajimu UMEMOTO 			{
206118b35df8SHajimu UMEMOTO 				/* new advanced API (RFC3542) */
2062f95d4633SHajimu UMEMOTO 				u_char *optbuf;
2063e770771aSHajimu UMEMOTO 				u_char optbuf_storage[MCLBYTES];
2064f95d4633SHajimu UMEMOTO 				int optlen;
2065f95d4633SHajimu UMEMOTO 				struct ip6_pktopts **optp;
2066f95d4633SHajimu UMEMOTO 
206772bfa0bfSSean Bruno 				/* cannot mix with RFC2292 */
206872bfa0bfSSean Bruno 				if (OPTBIT(IN6P_RFC2292)) {
206972bfa0bfSSean Bruno 					error = EINVAL;
207072bfa0bfSSean Bruno 					break;
207172bfa0bfSSean Bruno 				}
207272bfa0bfSSean Bruno 
2073e770771aSHajimu UMEMOTO 				/*
2074e770771aSHajimu UMEMOTO 				 * We only ensure valsize is not too large
2075e770771aSHajimu UMEMOTO 				 * here.  Further validation will be done
2076e770771aSHajimu UMEMOTO 				 * later.
2077e770771aSHajimu UMEMOTO 				 */
2078e770771aSHajimu UMEMOTO 				error = sooptcopyin(sopt, optbuf_storage,
2079e770771aSHajimu UMEMOTO 				    sizeof(optbuf_storage), 0);
2080a5d1aae3SHajimu UMEMOTO 				if (error)
2081a5d1aae3SHajimu UMEMOTO 					break;
2082f95d4633SHajimu UMEMOTO 				optlen = sopt->sopt_valsize;
2083e770771aSHajimu UMEMOTO 				optbuf = optbuf_storage;
20840ecd976eSBjoern A. Zeeb 				INP_WLOCK(inp);
2085*53af6903SGleb Smirnoff 				if (inp->inp_flags & INP_DROPPED) {
20860ecd976eSBjoern A. Zeeb 					INP_WUNLOCK(inp);
208756713d16SMatt Macy 					return (ECONNRESET);
208856713d16SMatt Macy 				}
20890ecd976eSBjoern A. Zeeb 				optp = &inp->in6p_outputopts;
209079ba3952SBjoern A. Zeeb 				error = ip6_pcbopt(optname, optbuf, optlen,
209179ba3952SBjoern A. Zeeb 				    optp, (td != NULL) ? td->td_ucred : NULL,
209279ba3952SBjoern A. Zeeb 				    uproto);
20930ecd976eSBjoern A. Zeeb 				INP_WUNLOCK(inp);
2094f95d4633SHajimu UMEMOTO 				break;
2095f95d4633SHajimu UMEMOTO 			}
209682cd038dSYoshinobu Inoue #undef OPTSET
209782cd038dSYoshinobu Inoue 
209882cd038dSYoshinobu Inoue 			case IPV6_MULTICAST_IF:
209982cd038dSYoshinobu Inoue 			case IPV6_MULTICAST_HOPS:
210082cd038dSYoshinobu Inoue 			case IPV6_MULTICAST_LOOP:
210182cd038dSYoshinobu Inoue 			case IPV6_JOIN_GROUP:
210282cd038dSYoshinobu Inoue 			case IPV6_LEAVE_GROUP:
210333cde130SBruce M Simpson 			case IPV6_MSFILTER:
210433cde130SBruce M Simpson 			case MCAST_BLOCK_SOURCE:
210533cde130SBruce M Simpson 			case MCAST_UNBLOCK_SOURCE:
210633cde130SBruce M Simpson 			case MCAST_JOIN_GROUP:
210733cde130SBruce M Simpson 			case MCAST_LEAVE_GROUP:
210833cde130SBruce M Simpson 			case MCAST_JOIN_SOURCE_GROUP:
210933cde130SBruce M Simpson 			case MCAST_LEAVE_SOURCE_GROUP:
21100ecd976eSBjoern A. Zeeb 				error = ip6_setmoptions(inp, sopt);
211182cd038dSYoshinobu Inoue 				break;
211282cd038dSYoshinobu Inoue 
211382cd038dSYoshinobu Inoue 			case IPV6_PORTRANGE:
2114686cdd19SJun-ichiro itojun Hagino 				error = sooptcopyin(sopt, &optval,
2115686cdd19SJun-ichiro itojun Hagino 				    sizeof optval, sizeof optval);
211682cd038dSYoshinobu Inoue 				if (error)
211782cd038dSYoshinobu Inoue 					break;
211882cd038dSYoshinobu Inoue 
21190ecd976eSBjoern A. Zeeb 				INP_WLOCK(inp);
212082cd038dSYoshinobu Inoue 				switch (optval) {
212182cd038dSYoshinobu Inoue 				case IPV6_PORTRANGE_DEFAULT:
21220ecd976eSBjoern A. Zeeb 					inp->inp_flags &= ~(INP_LOWPORT);
21230ecd976eSBjoern A. Zeeb 					inp->inp_flags &= ~(INP_HIGHPORT);
212482cd038dSYoshinobu Inoue 					break;
212582cd038dSYoshinobu Inoue 
212682cd038dSYoshinobu Inoue 				case IPV6_PORTRANGE_HIGH:
21270ecd976eSBjoern A. Zeeb 					inp->inp_flags &= ~(INP_LOWPORT);
21280ecd976eSBjoern A. Zeeb 					inp->inp_flags |= INP_HIGHPORT;
212982cd038dSYoshinobu Inoue 					break;
213082cd038dSYoshinobu Inoue 
213182cd038dSYoshinobu Inoue 				case IPV6_PORTRANGE_LOW:
21320ecd976eSBjoern A. Zeeb 					inp->inp_flags &= ~(INP_HIGHPORT);
21330ecd976eSBjoern A. Zeeb 					inp->inp_flags |= INP_LOWPORT;
213482cd038dSYoshinobu Inoue 					break;
213582cd038dSYoshinobu Inoue 
213682cd038dSYoshinobu Inoue 				default:
213782cd038dSYoshinobu Inoue 					error = EINVAL;
213882cd038dSYoshinobu Inoue 					break;
213982cd038dSYoshinobu Inoue 				}
21400ecd976eSBjoern A. Zeeb 				INP_WUNLOCK(inp);
214182cd038dSYoshinobu Inoue 				break;
214282cd038dSYoshinobu Inoue 
2143fcf59617SAndrey V. Elsukov #if defined(IPSEC) || defined(IPSEC_SUPPORT)
214482cd038dSYoshinobu Inoue 			case IPV6_IPSEC_POLICY:
2145fcf59617SAndrey V. Elsukov 				if (IPSEC_ENABLED(ipv6)) {
21460ecd976eSBjoern A. Zeeb 					error = IPSEC_PCBCTL(ipv6, inp, sopt);
214782cd038dSYoshinobu Inoue 					break;
2148c26fe973SBjoern A. Zeeb 				}
2149fcf59617SAndrey V. Elsukov 				/* FALLTHROUGH */
2150b2630c29SGeorge V. Neville-Neil #endif /* IPSEC */
215182cd038dSYoshinobu Inoue 
215282cd038dSYoshinobu Inoue 			default:
215382cd038dSYoshinobu Inoue 				error = ENOPROTOOPT;
215482cd038dSYoshinobu Inoue 				break;
215582cd038dSYoshinobu Inoue 			}
215682cd038dSYoshinobu Inoue 			break;
215782cd038dSYoshinobu Inoue 
215882cd038dSYoshinobu Inoue 		case SOPT_GET:
215982cd038dSYoshinobu Inoue 			switch (optname) {
2160f95d4633SHajimu UMEMOTO 			case IPV6_2292PKTOPTIONS:
2161f95d4633SHajimu UMEMOTO #ifdef IPV6_PKTOPTIONS
216282cd038dSYoshinobu Inoue 			case IPV6_PKTOPTIONS:
2163f95d4633SHajimu UMEMOTO #endif
2164f95d4633SHajimu UMEMOTO 				/*
2165f95d4633SHajimu UMEMOTO 				 * RFC3542 (effectively) deprecated the
2166f95d4633SHajimu UMEMOTO 				 * semantics of the 2292-style pktoptions.
2167f95d4633SHajimu UMEMOTO 				 * Since it was not reliable in nature (i.e.,
2168f95d4633SHajimu UMEMOTO 				 * applications had to expect the lack of some
2169f95d4633SHajimu UMEMOTO 				 * information after all), it would make sense
2170f95d4633SHajimu UMEMOTO 				 * to simplify this part by always returning
2171f95d4633SHajimu UMEMOTO 				 * empty data.
2172f95d4633SHajimu UMEMOTO 				 */
217382cd038dSYoshinobu Inoue 				sopt->sopt_valsize = 0;
217482cd038dSYoshinobu Inoue 				break;
217582cd038dSYoshinobu Inoue 
2176f95d4633SHajimu UMEMOTO 			case IPV6_RECVHOPOPTS:
2177f95d4633SHajimu UMEMOTO 			case IPV6_RECVDSTOPTS:
2178f95d4633SHajimu UMEMOTO 			case IPV6_RECVRTHDRDSTOPTS:
217982cd038dSYoshinobu Inoue 			case IPV6_UNICAST_HOPS:
2180f95d4633SHajimu UMEMOTO 			case IPV6_RECVPKTINFO:
2181f95d4633SHajimu UMEMOTO 			case IPV6_RECVHOPLIMIT:
2182f95d4633SHajimu UMEMOTO 			case IPV6_RECVRTHDR:
2183f95d4633SHajimu UMEMOTO 			case IPV6_RECVPATHMTU:
218433841545SHajimu UMEMOTO 
218533841545SHajimu UMEMOTO 			case IPV6_V6ONLY:
2186fa310a7eSYoshinobu Inoue 			case IPV6_PORTRANGE:
2187f95d4633SHajimu UMEMOTO 			case IPV6_RECVTCLASS:
2188f95d4633SHajimu UMEMOTO 			case IPV6_AUTOFLOWLABEL:
21895f6bf451SAttilio Rao 			case IPV6_BINDANY:
2190c7c0d948SAdrian Chadd 			case IPV6_FLOWID:
2191c7c0d948SAdrian Chadd 			case IPV6_FLOWTYPE:
219268bb8d62SAdrian Chadd 			case IPV6_RECVFLOWID:
2193c7c0d948SAdrian Chadd #ifdef	RSS
2194c7c0d948SAdrian Chadd 			case IPV6_RSSBUCKETID:
219568bb8d62SAdrian Chadd 			case IPV6_RECVRSSBUCKETID:
2196c7c0d948SAdrian Chadd #endif
2197912568c8SJonathan T. Looney 			case IPV6_BINDMULTI:
2198868aabb4SRichard Scheffenegger 			case IPV6_VLAN_PCP:
219982cd038dSYoshinobu Inoue 				switch (optname) {
2200f95d4633SHajimu UMEMOTO 				case IPV6_RECVHOPOPTS:
2201f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_HOPOPTS);
2202f95d4633SHajimu UMEMOTO 					break;
2203f95d4633SHajimu UMEMOTO 
2204f95d4633SHajimu UMEMOTO 				case IPV6_RECVDSTOPTS:
2205f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_DSTOPTS);
2206f95d4633SHajimu UMEMOTO 					break;
2207f95d4633SHajimu UMEMOTO 
2208f95d4633SHajimu UMEMOTO 				case IPV6_RECVRTHDRDSTOPTS:
2209f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_RTHDRDSTOPTS);
2210f95d4633SHajimu UMEMOTO 					break;
2211f95d4633SHajimu UMEMOTO 
221282cd038dSYoshinobu Inoue 				case IPV6_UNICAST_HOPS:
22130ecd976eSBjoern A. Zeeb 					optval = inp->in6p_hops;
221482cd038dSYoshinobu Inoue 					break;
221582cd038dSYoshinobu Inoue 
2216f95d4633SHajimu UMEMOTO 				case IPV6_RECVPKTINFO:
2217f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_PKTINFO);
2218f95d4633SHajimu UMEMOTO 					break;
2219f95d4633SHajimu UMEMOTO 
2220f95d4633SHajimu UMEMOTO 				case IPV6_RECVHOPLIMIT:
2221f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_HOPLIMIT);
2222f95d4633SHajimu UMEMOTO 					break;
2223f95d4633SHajimu UMEMOTO 
2224f95d4633SHajimu UMEMOTO 				case IPV6_RECVRTHDR:
2225f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_RTHDR);
2226f95d4633SHajimu UMEMOTO 					break;
2227f95d4633SHajimu UMEMOTO 
2228f95d4633SHajimu UMEMOTO 				case IPV6_RECVPATHMTU:
2229f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_MTU);
223082cd038dSYoshinobu Inoue 					break;
223182cd038dSYoshinobu Inoue 
223233841545SHajimu UMEMOTO 				case IPV6_V6ONLY:
2233854d3b19SHajimu UMEMOTO 					optval = OPTBIT(IN6P_IPV6_V6ONLY);
223482cd038dSYoshinobu Inoue 					break;
223582cd038dSYoshinobu Inoue 
223682cd038dSYoshinobu Inoue 				case IPV6_PORTRANGE:
223782cd038dSYoshinobu Inoue 				    {
223882cd038dSYoshinobu Inoue 					int flags;
22390ecd976eSBjoern A. Zeeb 					flags = inp->inp_flags;
224097590249SBjoern A. Zeeb 					if (flags & INP_HIGHPORT)
224182cd038dSYoshinobu Inoue 						optval = IPV6_PORTRANGE_HIGH;
224297590249SBjoern A. Zeeb 					else if (flags & INP_LOWPORT)
224382cd038dSYoshinobu Inoue 						optval = IPV6_PORTRANGE_LOW;
224482cd038dSYoshinobu Inoue 					else
224582cd038dSYoshinobu Inoue 						optval = 0;
224682cd038dSYoshinobu Inoue 					break;
224782cd038dSYoshinobu Inoue 				    }
2248f95d4633SHajimu UMEMOTO 				case IPV6_RECVTCLASS:
2249f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_TCLASS);
2250f95d4633SHajimu UMEMOTO 					break;
2251f95d4633SHajimu UMEMOTO 
2252f95d4633SHajimu UMEMOTO 				case IPV6_AUTOFLOWLABEL:
2253f95d4633SHajimu UMEMOTO 					optval = OPTBIT(IN6P_AUTOFLOWLABEL);
2254f95d4633SHajimu UMEMOTO 					break;
2255f44270e7SPawel Jakub Dawidek 
2256dce33a45SErmal Luçi 				case IPV6_ORIGDSTADDR:
2257dce33a45SErmal Luçi 					optval = OPTBIT2(INP_ORIGDSTADDR);
2258dce33a45SErmal Luçi 					break;
2259dce33a45SErmal Luçi 
2260f44270e7SPawel Jakub Dawidek 				case IPV6_BINDANY:
2261f44270e7SPawel Jakub Dawidek 					optval = OPTBIT(INP_BINDANY);
2262f44270e7SPawel Jakub Dawidek 					break;
2263c7c0d948SAdrian Chadd 
2264c7c0d948SAdrian Chadd 				case IPV6_FLOWID:
22650ecd976eSBjoern A. Zeeb 					optval = inp->inp_flowid;
2266c7c0d948SAdrian Chadd 					break;
2267c7c0d948SAdrian Chadd 
2268c7c0d948SAdrian Chadd 				case IPV6_FLOWTYPE:
22690ecd976eSBjoern A. Zeeb 					optval = inp->inp_flowtype;
2270c7c0d948SAdrian Chadd 					break;
227168bb8d62SAdrian Chadd 
227268bb8d62SAdrian Chadd 				case IPV6_RECVFLOWID:
227368bb8d62SAdrian Chadd 					optval = OPTBIT2(INP_RECVFLOWID);
227468bb8d62SAdrian Chadd 					break;
2275c7c0d948SAdrian Chadd #ifdef	RSS
2276c7c0d948SAdrian Chadd 				case IPV6_RSSBUCKETID:
2277c7c0d948SAdrian Chadd 					retval =
22780ecd976eSBjoern A. Zeeb 					    rss_hash2bucket(inp->inp_flowid,
22790ecd976eSBjoern A. Zeeb 					    inp->inp_flowtype,
2280c7c0d948SAdrian Chadd 					    &rss_bucket);
2281c7c0d948SAdrian Chadd 					if (retval == 0)
2282c7c0d948SAdrian Chadd 						optval = rss_bucket;
2283c7c0d948SAdrian Chadd 					else
2284c7c0d948SAdrian Chadd 						error = EINVAL;
2285c7c0d948SAdrian Chadd 					break;
228668bb8d62SAdrian Chadd 
228768bb8d62SAdrian Chadd 				case IPV6_RECVRSSBUCKETID:
228868bb8d62SAdrian Chadd 					optval = OPTBIT2(INP_RECVRSSBUCKETID);
228968bb8d62SAdrian Chadd 					break;
2290c7c0d948SAdrian Chadd #endif
2291c7c0d948SAdrian Chadd 
2292c7c0d948SAdrian Chadd 				case IPV6_BINDMULTI:
2293c7c0d948SAdrian Chadd 					optval = OPTBIT2(INP_BINDMULTI);
2294c7c0d948SAdrian Chadd 					break;
2295868aabb4SRichard Scheffenegger 
2296868aabb4SRichard Scheffenegger 				case IPV6_VLAN_PCP:
2297868aabb4SRichard Scheffenegger 					if (OPTBIT2(INP_2PCP_SET)) {
2298868aabb4SRichard Scheffenegger 						optval = (inp->inp_flags2 &
2299868aabb4SRichard Scheffenegger 							    INP_2PCP_MASK) >>
2300868aabb4SRichard Scheffenegger 							    INP_2PCP_SHIFT;
2301868aabb4SRichard Scheffenegger 					} else {
2302868aabb4SRichard Scheffenegger 						optval = -1;
230382cd038dSYoshinobu Inoue 					}
2304868aabb4SRichard Scheffenegger 					break;
2305868aabb4SRichard Scheffenegger 				}
2306868aabb4SRichard Scheffenegger 
2307f95d4633SHajimu UMEMOTO 				if (error)
2308f95d4633SHajimu UMEMOTO 					break;
230982cd038dSYoshinobu Inoue 				error = sooptcopyout(sopt, &optval,
231082cd038dSYoshinobu Inoue 					sizeof optval);
231182cd038dSYoshinobu Inoue 				break;
231282cd038dSYoshinobu Inoue 
2313f95d4633SHajimu UMEMOTO 			case IPV6_PATHMTU:
2314f95d4633SHajimu UMEMOTO 			{
2315f95d4633SHajimu UMEMOTO 				u_long pmtu = 0;
2316f95d4633SHajimu UMEMOTO 				struct ip6_mtuinfo mtuinfo;
23175cbeca44SSean Bruno 				struct in6_addr addr;
2318f95d4633SHajimu UMEMOTO 
2319f95d4633SHajimu UMEMOTO 				if (!(so->so_state & SS_ISCONNECTED))
2320f95d4633SHajimu UMEMOTO 					return (ENOTCONN);
2321f95d4633SHajimu UMEMOTO 				/*
2322f95d4633SHajimu UMEMOTO 				 * XXX: we do not consider the case of source
2323f95d4633SHajimu UMEMOTO 				 * routing, or optional information to specify
2324f95d4633SHajimu UMEMOTO 				 * the outgoing interface.
23250ecd976eSBjoern A. Zeeb 				 * Copy faddr out of inp to avoid holding lock
23265cbeca44SSean Bruno 				 * on inp during route lookup.
2327f95d4633SHajimu UMEMOTO 				 */
23280ecd976eSBjoern A. Zeeb 				INP_RLOCK(inp);
23290ecd976eSBjoern A. Zeeb 				bcopy(&inp->in6p_faddr, &addr, sizeof(addr));
23300ecd976eSBjoern A. Zeeb 				INP_RUNLOCK(inp);
23310d4df029SAlexander V. Chernikov 				error = ip6_getpmtu_ctl(so->so_fibnum,
23325cbeca44SSean Bruno 				    &addr, &pmtu);
2333f95d4633SHajimu UMEMOTO 				if (error)
2334f95d4633SHajimu UMEMOTO 					break;
2335f95d4633SHajimu UMEMOTO 				if (pmtu > IPV6_MAXPACKET)
2336f95d4633SHajimu UMEMOTO 					pmtu = IPV6_MAXPACKET;
2337f95d4633SHajimu UMEMOTO 
2338f95d4633SHajimu UMEMOTO 				bzero(&mtuinfo, sizeof(mtuinfo));
2339f95d4633SHajimu UMEMOTO 				mtuinfo.ip6m_mtu = (u_int32_t)pmtu;
2340f95d4633SHajimu UMEMOTO 				optdata = (void *)&mtuinfo;
2341f95d4633SHajimu UMEMOTO 				optdatalen = sizeof(mtuinfo);
2342f95d4633SHajimu UMEMOTO 				error = sooptcopyout(sopt, optdata,
2343f95d4633SHajimu UMEMOTO 				    optdatalen);
2344f95d4633SHajimu UMEMOTO 				break;
2345f95d4633SHajimu UMEMOTO 			}
2346f95d4633SHajimu UMEMOTO 
2347f95d4633SHajimu UMEMOTO 			case IPV6_2292PKTINFO:
2348f95d4633SHajimu UMEMOTO 			case IPV6_2292HOPLIMIT:
2349f95d4633SHajimu UMEMOTO 			case IPV6_2292HOPOPTS:
2350f95d4633SHajimu UMEMOTO 			case IPV6_2292RTHDR:
2351f95d4633SHajimu UMEMOTO 			case IPV6_2292DSTOPTS:
235233841545SHajimu UMEMOTO 				switch (optname) {
2353f95d4633SHajimu UMEMOTO 				case IPV6_2292PKTINFO:
235433841545SHajimu UMEMOTO 					optval = OPTBIT(IN6P_PKTINFO);
235533841545SHajimu UMEMOTO 					break;
2356f95d4633SHajimu UMEMOTO 				case IPV6_2292HOPLIMIT:
235733841545SHajimu UMEMOTO 					optval = OPTBIT(IN6P_HOPLIMIT);
235833841545SHajimu UMEMOTO 					break;
2359f95d4633SHajimu UMEMOTO 				case IPV6_2292HOPOPTS:
236033841545SHajimu UMEMOTO 					optval = OPTBIT(IN6P_HOPOPTS);
236133841545SHajimu UMEMOTO 					break;
2362f95d4633SHajimu UMEMOTO 				case IPV6_2292RTHDR:
236333841545SHajimu UMEMOTO 					optval = OPTBIT(IN6P_RTHDR);
236433841545SHajimu UMEMOTO 					break;
2365f95d4633SHajimu UMEMOTO 				case IPV6_2292DSTOPTS:
236633841545SHajimu UMEMOTO 					optval = OPTBIT(IN6P_DSTOPTS|IN6P_RTHDRDSTOPTS);
236733841545SHajimu UMEMOTO 					break;
236833841545SHajimu UMEMOTO 				}
236933841545SHajimu UMEMOTO 				error = sooptcopyout(sopt, &optval,
237033841545SHajimu UMEMOTO 				    sizeof optval);
237133841545SHajimu UMEMOTO 				break;
2372f95d4633SHajimu UMEMOTO 			case IPV6_PKTINFO:
2373f95d4633SHajimu UMEMOTO 			case IPV6_HOPOPTS:
2374f95d4633SHajimu UMEMOTO 			case IPV6_RTHDR:
2375f95d4633SHajimu UMEMOTO 			case IPV6_DSTOPTS:
2376f95d4633SHajimu UMEMOTO 			case IPV6_RTHDRDSTOPTS:
2377f95d4633SHajimu UMEMOTO 			case IPV6_NEXTHOP:
2378f95d4633SHajimu UMEMOTO 			case IPV6_TCLASS:
2379f95d4633SHajimu UMEMOTO 			case IPV6_DONTFRAG:
2380f95d4633SHajimu UMEMOTO 			case IPV6_USE_MIN_MTU:
2381f95d4633SHajimu UMEMOTO 			case IPV6_PREFER_TEMPADDR:
23820ecd976eSBjoern A. Zeeb 				error = ip6_getpcbopt(inp, optname, sopt);
2383f95d4633SHajimu UMEMOTO 				break;
238433841545SHajimu UMEMOTO 
238582cd038dSYoshinobu Inoue 			case IPV6_MULTICAST_IF:
238682cd038dSYoshinobu Inoue 			case IPV6_MULTICAST_HOPS:
238782cd038dSYoshinobu Inoue 			case IPV6_MULTICAST_LOOP:
238833cde130SBruce M Simpson 			case IPV6_MSFILTER:
23890ecd976eSBjoern A. Zeeb 				error = ip6_getmoptions(inp, sopt);
239082cd038dSYoshinobu Inoue 				break;
239182cd038dSYoshinobu Inoue 
2392fcf59617SAndrey V. Elsukov #if defined(IPSEC) || defined(IPSEC_SUPPORT)
239382cd038dSYoshinobu Inoue 			case IPV6_IPSEC_POLICY:
2394fcf59617SAndrey V. Elsukov 				if (IPSEC_ENABLED(ipv6)) {
23950ecd976eSBjoern A. Zeeb 					error = IPSEC_PCBCTL(ipv6, inp, sopt);
239682cd038dSYoshinobu Inoue 					break;
239782cd038dSYoshinobu Inoue 				}
2398fcf59617SAndrey V. Elsukov 				/* FALLTHROUGH */
2399b2630c29SGeorge V. Neville-Neil #endif /* IPSEC */
240082cd038dSYoshinobu Inoue 			default:
240182cd038dSYoshinobu Inoue 				error = ENOPROTOOPT;
240282cd038dSYoshinobu Inoue 				break;
240382cd038dSYoshinobu Inoue 			}
240482cd038dSYoshinobu Inoue 			break;
240582cd038dSYoshinobu Inoue 		}
240682cd038dSYoshinobu Inoue 	}
240782cd038dSYoshinobu Inoue 	return (error);
240882cd038dSYoshinobu Inoue }
240982cd038dSYoshinobu Inoue 
241002b9a206SHajimu UMEMOTO int
24111272577eSXin LI ip6_raw_ctloutput(struct socket *so, struct sockopt *sopt)
241202b9a206SHajimu UMEMOTO {
241302b9a206SHajimu UMEMOTO 	int error = 0, optval, optlen;
241402b9a206SHajimu UMEMOTO 	const int icmp6off = offsetof(struct icmp6_hdr, icmp6_cksum);
24150ecd976eSBjoern A. Zeeb 	struct inpcb *inp = sotoinpcb(so);
241602b9a206SHajimu UMEMOTO 	int level, op, optname;
241702b9a206SHajimu UMEMOTO 
241802b9a206SHajimu UMEMOTO 	level = sopt->sopt_level;
241902b9a206SHajimu UMEMOTO 	op = sopt->sopt_dir;
242002b9a206SHajimu UMEMOTO 	optname = sopt->sopt_name;
242102b9a206SHajimu UMEMOTO 	optlen = sopt->sopt_valsize;
242202b9a206SHajimu UMEMOTO 
242302b9a206SHajimu UMEMOTO 	if (level != IPPROTO_IPV6) {
242402b9a206SHajimu UMEMOTO 		return (EINVAL);
242502b9a206SHajimu UMEMOTO 	}
242602b9a206SHajimu UMEMOTO 
242702b9a206SHajimu UMEMOTO 	switch (optname) {
242802b9a206SHajimu UMEMOTO 	case IPV6_CHECKSUM:
242902b9a206SHajimu UMEMOTO 		/*
243002b9a206SHajimu UMEMOTO 		 * For ICMPv6 sockets, no modification allowed for checksum
243102b9a206SHajimu UMEMOTO 		 * offset, permit "no change" values to help existing apps.
243202b9a206SHajimu UMEMOTO 		 *
243318b35df8SHajimu UMEMOTO 		 * RFC3542 says: "An attempt to set IPV6_CHECKSUM
243402b9a206SHajimu UMEMOTO 		 * for an ICMPv6 socket will fail."
243518b35df8SHajimu UMEMOTO 		 * The current behavior does not meet RFC3542.
243602b9a206SHajimu UMEMOTO 		 */
243702b9a206SHajimu UMEMOTO 		switch (op) {
243802b9a206SHajimu UMEMOTO 		case SOPT_SET:
243902b9a206SHajimu UMEMOTO 			if (optlen != sizeof(int)) {
244002b9a206SHajimu UMEMOTO 				error = EINVAL;
244102b9a206SHajimu UMEMOTO 				break;
244202b9a206SHajimu UMEMOTO 			}
244302b9a206SHajimu UMEMOTO 			error = sooptcopyin(sopt, &optval, sizeof(optval),
244402b9a206SHajimu UMEMOTO 					    sizeof(optval));
244502b9a206SHajimu UMEMOTO 			if (error)
244602b9a206SHajimu UMEMOTO 				break;
24472f041b74SMichael Tuexen 			if (optval < -1 || (optval % 2) != 0) {
24482f041b74SMichael Tuexen 				/*
24492f041b74SMichael Tuexen 				 * The API assumes non-negative even offset
24502f041b74SMichael Tuexen 				 * values or -1 as a special value.
24512f041b74SMichael Tuexen 				 */
245202b9a206SHajimu UMEMOTO 				error = EINVAL;
245374ed2e8aSGleb Smirnoff 			} else if (inp->inp_ip_p == IPPROTO_ICMPV6) {
245402b9a206SHajimu UMEMOTO 				if (optval != icmp6off)
245502b9a206SHajimu UMEMOTO 					error = EINVAL;
245602b9a206SHajimu UMEMOTO 			} else
24570ecd976eSBjoern A. Zeeb 				inp->in6p_cksum = optval;
245802b9a206SHajimu UMEMOTO 			break;
245902b9a206SHajimu UMEMOTO 
246002b9a206SHajimu UMEMOTO 		case SOPT_GET:
246174ed2e8aSGleb Smirnoff 			if (inp->inp_ip_p == IPPROTO_ICMPV6)
246202b9a206SHajimu UMEMOTO 				optval = icmp6off;
246302b9a206SHajimu UMEMOTO 			else
24640ecd976eSBjoern A. Zeeb 				optval = inp->in6p_cksum;
246502b9a206SHajimu UMEMOTO 
246602b9a206SHajimu UMEMOTO 			error = sooptcopyout(sopt, &optval, sizeof(optval));
246702b9a206SHajimu UMEMOTO 			break;
246802b9a206SHajimu UMEMOTO 
246902b9a206SHajimu UMEMOTO 		default:
247002b9a206SHajimu UMEMOTO 			error = EINVAL;
247102b9a206SHajimu UMEMOTO 			break;
247202b9a206SHajimu UMEMOTO 		}
247302b9a206SHajimu UMEMOTO 		break;
247402b9a206SHajimu UMEMOTO 
247502b9a206SHajimu UMEMOTO 	default:
247602b9a206SHajimu UMEMOTO 		error = ENOPROTOOPT;
247702b9a206SHajimu UMEMOTO 		break;
247802b9a206SHajimu UMEMOTO 	}
247902b9a206SHajimu UMEMOTO 
248002b9a206SHajimu UMEMOTO 	return (error);
248102b9a206SHajimu UMEMOTO }
248202b9a206SHajimu UMEMOTO 
248382cd038dSYoshinobu Inoue /*
248433841545SHajimu UMEMOTO  * Set up IP6 options in pcb for insertion in output packets or
248533841545SHajimu UMEMOTO  * specifying behavior of outgoing packets.
248682cd038dSYoshinobu Inoue  */
248782cd038dSYoshinobu Inoue static int
24881272577eSXin LI ip6_pcbopts(struct ip6_pktopts **pktopt, struct mbuf *m,
24891272577eSXin LI     struct socket *so, struct sockopt *sopt)
249082cd038dSYoshinobu Inoue {
249133841545SHajimu UMEMOTO 	struct ip6_pktopts *opt = *pktopt;
249282cd038dSYoshinobu Inoue 	int error = 0;
2493b40ce416SJulian Elischer 	struct thread *td = sopt->sopt_td;
24942290dfb4SRyan Stone 	struct epoch_tracker et;
249582cd038dSYoshinobu Inoue 
249682cd038dSYoshinobu Inoue 	/* turn off any old options. */
249782cd038dSYoshinobu Inoue 	if (opt) {
249833841545SHajimu UMEMOTO #ifdef DIAGNOSTIC
249933841545SHajimu UMEMOTO 		if (opt->ip6po_pktinfo || opt->ip6po_nexthop ||
250033841545SHajimu UMEMOTO 		    opt->ip6po_hbh || opt->ip6po_dest1 || opt->ip6po_dest2 ||
250133841545SHajimu UMEMOTO 		    opt->ip6po_rhinfo.ip6po_rhi_rthdr)
250233841545SHajimu UMEMOTO 			printf("ip6_pcbopts: all specified options are cleared.\n");
250333841545SHajimu UMEMOTO #endif
2504f95d4633SHajimu UMEMOTO 		ip6_clearpktopts(opt, -1);
2505e02582d1SMark Johnston 	} else {
2506e02582d1SMark Johnston 		opt = malloc(sizeof(*opt), M_IP6OPT, M_NOWAIT);
2507e02582d1SMark Johnston 		if (opt == NULL)
2508e02582d1SMark Johnston 			return (ENOMEM);
2509e02582d1SMark Johnston 	}
251033841545SHajimu UMEMOTO 	*pktopt = NULL;
251182cd038dSYoshinobu Inoue 
251282cd038dSYoshinobu Inoue 	if (!m || m->m_len == 0) {
251382cd038dSYoshinobu Inoue 		/*
251435f6695bSHajimu UMEMOTO 		 * Only turning off any previous options, regardless of
251535f6695bSHajimu UMEMOTO 		 * whether the opt is just created or given.
251682cd038dSYoshinobu Inoue 		 */
251782cd038dSYoshinobu Inoue 		free(opt, M_IP6OPT);
251882cd038dSYoshinobu Inoue 		return (0);
251982cd038dSYoshinobu Inoue 	}
252082cd038dSYoshinobu Inoue 
252182cd038dSYoshinobu Inoue 	/*  set options specified by user. */
25222290dfb4SRyan Stone 	NET_EPOCH_ENTER(et);
252379ba3952SBjoern A. Zeeb 	if ((error = ip6_setpktopts(m, opt, NULL, (td != NULL) ?
252479ba3952SBjoern A. Zeeb 	    td->td_ucred : NULL, so->so_proto->pr_protocol)) != 0) {
2525f95d4633SHajimu UMEMOTO 		ip6_clearpktopts(opt, -1); /* XXX: discard all options */
252635f6695bSHajimu UMEMOTO 		free(opt, M_IP6OPT);
25272290dfb4SRyan Stone 		NET_EPOCH_EXIT(et);
252882cd038dSYoshinobu Inoue 		return (error);
252982cd038dSYoshinobu Inoue 	}
25302290dfb4SRyan Stone 	NET_EPOCH_EXIT(et);
253182cd038dSYoshinobu Inoue 	*pktopt = opt;
253282cd038dSYoshinobu Inoue 	return (0);
253382cd038dSYoshinobu Inoue }
253482cd038dSYoshinobu Inoue 
253582cd038dSYoshinobu Inoue /*
253633841545SHajimu UMEMOTO  * initialize ip6_pktopts.  beware that there are non-zero default values in
253733841545SHajimu UMEMOTO  * the struct.
253833841545SHajimu UMEMOTO  */
253933841545SHajimu UMEMOTO void
25401272577eSXin LI ip6_initpktopts(struct ip6_pktopts *opt)
254133841545SHajimu UMEMOTO {
254233841545SHajimu UMEMOTO 
254333841545SHajimu UMEMOTO 	bzero(opt, sizeof(*opt));
254433841545SHajimu UMEMOTO 	opt->ip6po_hlim = -1;	/* -1 means default hop limit */
2545f95d4633SHajimu UMEMOTO 	opt->ip6po_tclass = -1;	/* -1 means default traffic class */
2546f95d4633SHajimu UMEMOTO 	opt->ip6po_minmtu = IP6PO_MINMTU_MCASTONLY;
2547f95d4633SHajimu UMEMOTO 	opt->ip6po_prefer_tempaddr = IP6PO_TEMPADDR_SYSTEM;
2548f95d4633SHajimu UMEMOTO }
2549f95d4633SHajimu UMEMOTO 
2550f95d4633SHajimu UMEMOTO static int
25511272577eSXin LI ip6_pcbopt(int optname, u_char *buf, int len, struct ip6_pktopts **pktopt,
255279ba3952SBjoern A. Zeeb     struct ucred *cred, int uproto)
2553f95d4633SHajimu UMEMOTO {
25549f5432d5SKristof Provost 	struct epoch_tracker et;
2555f95d4633SHajimu UMEMOTO 	struct ip6_pktopts *opt;
25569f5432d5SKristof Provost 	int ret;
2557f95d4633SHajimu UMEMOTO 
2558f95d4633SHajimu UMEMOTO 	if (*pktopt == NULL) {
2559f95d4633SHajimu UMEMOTO 		*pktopt = malloc(sizeof(struct ip6_pktopts), M_IP6OPT,
256056713d16SMatt Macy 		    M_NOWAIT);
256156713d16SMatt Macy 		if (*pktopt == NULL)
256256713d16SMatt Macy 			return (ENOBUFS);
2563d5e3406dSHajimu UMEMOTO 		ip6_initpktopts(*pktopt);
2564f95d4633SHajimu UMEMOTO 	}
2565f95d4633SHajimu UMEMOTO 	opt = *pktopt;
2566f95d4633SHajimu UMEMOTO 
25679f5432d5SKristof Provost 	NET_EPOCH_ENTER(et);
25689f5432d5SKristof Provost 	ret = ip6_setpktopt(optname, buf, len, opt, cred, 1, 0, uproto);
25699f5432d5SKristof Provost 	NET_EPOCH_EXIT(et);
25709f5432d5SKristof Provost 
25719f5432d5SKristof Provost 	return (ret);
2572f95d4633SHajimu UMEMOTO }
2573f95d4633SHajimu UMEMOTO 
257406b479a6SSean Bruno #define GET_PKTOPT_VAR(field, lenexpr) do {					\
257506b479a6SSean Bruno 	if (pktopt && pktopt->field) {						\
25760ecd976eSBjoern A. Zeeb 		INP_RUNLOCK(inp);						\
257706b479a6SSean Bruno 		optdata = malloc(sopt->sopt_valsize, M_TEMP, M_WAITOK);		\
257806b479a6SSean Bruno 		malloc_optdata = true;						\
25790ecd976eSBjoern A. Zeeb 		INP_RLOCK(inp);							\
2580*53af6903SGleb Smirnoff 		if (inp->inp_flags & INP_DROPPED) {				\
25810ecd976eSBjoern A. Zeeb 			INP_RUNLOCK(inp);					\
258206b479a6SSean Bruno 			free(optdata, M_TEMP);					\
258306b479a6SSean Bruno 			return (ECONNRESET);					\
258406b479a6SSean Bruno 		}								\
25850ecd976eSBjoern A. Zeeb 		pktopt = inp->in6p_outputopts;					\
258606b479a6SSean Bruno 		if (pktopt && pktopt->field) {					\
258706b479a6SSean Bruno 			optdatalen = min(lenexpr, sopt->sopt_valsize);		\
2588a8d54fc9SMichael Tuexen 			bcopy(pktopt->field, optdata, optdatalen);		\
258906b479a6SSean Bruno 		} else {							\
259006b479a6SSean Bruno 			free(optdata, M_TEMP);					\
259106b479a6SSean Bruno 			optdata = NULL;						\
259206b479a6SSean Bruno 			malloc_optdata = false;					\
259306b479a6SSean Bruno 		}								\
259406b479a6SSean Bruno 	}									\
259506b479a6SSean Bruno } while(0)
259606b479a6SSean Bruno 
259706b479a6SSean Bruno #define GET_PKTOPT_EXT_HDR(field) GET_PKTOPT_VAR(field,				\
259806b479a6SSean Bruno 	(((struct ip6_ext *)pktopt->field)->ip6e_len + 1) << 3)
259906b479a6SSean Bruno 
260006b479a6SSean Bruno #define GET_PKTOPT_SOCKADDR(field) GET_PKTOPT_VAR(field,			\
260106b479a6SSean Bruno 	pktopt->field->sa_len)
260206b479a6SSean Bruno 
2603f95d4633SHajimu UMEMOTO static int
26040ecd976eSBjoern A. Zeeb ip6_getpcbopt(struct inpcb *inp, int optname, struct sockopt *sopt)
2605f95d4633SHajimu UMEMOTO {
2606f95d4633SHajimu UMEMOTO 	void *optdata = NULL;
260706b479a6SSean Bruno 	bool malloc_optdata = false;
2608f95d4633SHajimu UMEMOTO 	int optdatalen = 0;
2609f95d4633SHajimu UMEMOTO 	int error = 0;
2610f95d4633SHajimu UMEMOTO 	struct in6_pktinfo null_pktinfo;
2611f95d4633SHajimu UMEMOTO 	int deftclass = 0, on;
2612f95d4633SHajimu UMEMOTO 	int defminmtu = IP6PO_MINMTU_MCASTONLY;
2613f95d4633SHajimu UMEMOTO 	int defpreftemp = IP6PO_TEMPADDR_SYSTEM;
261406b479a6SSean Bruno 	struct ip6_pktopts *pktopt;
261506b479a6SSean Bruno 
26160ecd976eSBjoern A. Zeeb 	INP_RLOCK(inp);
26170ecd976eSBjoern A. Zeeb 	pktopt = inp->in6p_outputopts;
2618f95d4633SHajimu UMEMOTO 
2619f95d4633SHajimu UMEMOTO 	switch (optname) {
2620f95d4633SHajimu UMEMOTO 	case IPV6_PKTINFO:
2621cb207f93SAndrey V. Elsukov 		optdata = (void *)&null_pktinfo;
2622cb207f93SAndrey V. Elsukov 		if (pktopt && pktopt->ip6po_pktinfo) {
2623cb207f93SAndrey V. Elsukov 			bcopy(pktopt->ip6po_pktinfo, &null_pktinfo,
2624cb207f93SAndrey V. Elsukov 			    sizeof(null_pktinfo));
2625cb207f93SAndrey V. Elsukov 			in6_clearscope(&null_pktinfo.ipi6_addr);
2626cb207f93SAndrey V. Elsukov 		} else {
2627f95d4633SHajimu UMEMOTO 			/* XXX: we don't have to do this every time... */
2628f95d4633SHajimu UMEMOTO 			bzero(&null_pktinfo, sizeof(null_pktinfo));
2629f95d4633SHajimu UMEMOTO 		}
2630f95d4633SHajimu UMEMOTO 		optdatalen = sizeof(struct in6_pktinfo);
2631f95d4633SHajimu UMEMOTO 		break;
2632f95d4633SHajimu UMEMOTO 	case IPV6_TCLASS:
2633f95d4633SHajimu UMEMOTO 		if (pktopt && pktopt->ip6po_tclass >= 0)
263406b479a6SSean Bruno 			deftclass = pktopt->ip6po_tclass;
2635f95d4633SHajimu UMEMOTO 		optdata = (void *)&deftclass;
2636f95d4633SHajimu UMEMOTO 		optdatalen = sizeof(int);
2637f95d4633SHajimu UMEMOTO 		break;
2638f95d4633SHajimu UMEMOTO 	case IPV6_HOPOPTS:
263906b479a6SSean Bruno 		GET_PKTOPT_EXT_HDR(ip6po_hbh);
2640f95d4633SHajimu UMEMOTO 		break;
2641f95d4633SHajimu UMEMOTO 	case IPV6_RTHDR:
264206b479a6SSean Bruno 		GET_PKTOPT_EXT_HDR(ip6po_rthdr);
2643f95d4633SHajimu UMEMOTO 		break;
2644f95d4633SHajimu UMEMOTO 	case IPV6_RTHDRDSTOPTS:
264506b479a6SSean Bruno 		GET_PKTOPT_EXT_HDR(ip6po_dest1);
2646f95d4633SHajimu UMEMOTO 		break;
2647f95d4633SHajimu UMEMOTO 	case IPV6_DSTOPTS:
264806b479a6SSean Bruno 		GET_PKTOPT_EXT_HDR(ip6po_dest2);
2649f95d4633SHajimu UMEMOTO 		break;
2650f95d4633SHajimu UMEMOTO 	case IPV6_NEXTHOP:
265106b479a6SSean Bruno 		GET_PKTOPT_SOCKADDR(ip6po_nexthop);
2652f95d4633SHajimu UMEMOTO 		break;
2653f95d4633SHajimu UMEMOTO 	case IPV6_USE_MIN_MTU:
2654f95d4633SHajimu UMEMOTO 		if (pktopt)
265506b479a6SSean Bruno 			defminmtu = pktopt->ip6po_minmtu;
2656f95d4633SHajimu UMEMOTO 		optdata = (void *)&defminmtu;
2657f95d4633SHajimu UMEMOTO 		optdatalen = sizeof(int);
2658f95d4633SHajimu UMEMOTO 		break;
2659f95d4633SHajimu UMEMOTO 	case IPV6_DONTFRAG:
2660f95d4633SHajimu UMEMOTO 		if (pktopt && ((pktopt->ip6po_flags) & IP6PO_DONTFRAG))
2661f95d4633SHajimu UMEMOTO 			on = 1;
2662f95d4633SHajimu UMEMOTO 		else
2663f95d4633SHajimu UMEMOTO 			on = 0;
2664f95d4633SHajimu UMEMOTO 		optdata = (void *)&on;
2665f95d4633SHajimu UMEMOTO 		optdatalen = sizeof(on);
2666f95d4633SHajimu UMEMOTO 		break;
2667f95d4633SHajimu UMEMOTO 	case IPV6_PREFER_TEMPADDR:
2668f95d4633SHajimu UMEMOTO 		if (pktopt)
266906b479a6SSean Bruno 			defpreftemp = pktopt->ip6po_prefer_tempaddr;
2670f95d4633SHajimu UMEMOTO 		optdata = (void *)&defpreftemp;
2671f95d4633SHajimu UMEMOTO 		optdatalen = sizeof(int);
2672f95d4633SHajimu UMEMOTO 		break;
2673f95d4633SHajimu UMEMOTO 	default:		/* should not happen */
2674f95d4633SHajimu UMEMOTO #ifdef DIAGNOSTIC
2675f95d4633SHajimu UMEMOTO 		panic("ip6_getpcbopt: unexpected option\n");
2676f95d4633SHajimu UMEMOTO #endif
26770ecd976eSBjoern A. Zeeb 		INP_RUNLOCK(inp);
2678f95d4633SHajimu UMEMOTO 		return (ENOPROTOOPT);
2679f95d4633SHajimu UMEMOTO 	}
26800ecd976eSBjoern A. Zeeb 	INP_RUNLOCK(inp);
2681f95d4633SHajimu UMEMOTO 
2682f95d4633SHajimu UMEMOTO 	error = sooptcopyout(sopt, optdata, optdatalen);
268306b479a6SSean Bruno 	if (malloc_optdata)
268406b479a6SSean Bruno 		free(optdata, M_TEMP);
2685f95d4633SHajimu UMEMOTO 
2686f95d4633SHajimu UMEMOTO 	return (error);
268733841545SHajimu UMEMOTO }
268833841545SHajimu UMEMOTO 
268933841545SHajimu UMEMOTO void
26901272577eSXin LI ip6_clearpktopts(struct ip6_pktopts *pktopt, int optname)
269133841545SHajimu UMEMOTO {
2692289b28bdSHajimu UMEMOTO 	if (pktopt == NULL)
2693289b28bdSHajimu UMEMOTO 		return;
2694289b28bdSHajimu UMEMOTO 
2695f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_PKTINFO) {
2696885adbfaSHajimu UMEMOTO 		if (pktopt->ip6po_pktinfo)
269733841545SHajimu UMEMOTO 			free(pktopt->ip6po_pktinfo, M_IP6OPT);
269833841545SHajimu UMEMOTO 		pktopt->ip6po_pktinfo = NULL;
269933841545SHajimu UMEMOTO 	}
2700f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_HOPLIMIT)
270133841545SHajimu UMEMOTO 		pktopt->ip6po_hlim = -1;
2702f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_TCLASS)
2703f95d4633SHajimu UMEMOTO 		pktopt->ip6po_tclass = -1;
2704f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_NEXTHOP) {
2705983066f0SAlexander V. Chernikov 		if (pktopt->ip6po_nextroute.ro_nh) {
2706983066f0SAlexander V. Chernikov 			NH_FREE(pktopt->ip6po_nextroute.ro_nh);
2707983066f0SAlexander V. Chernikov 			pktopt->ip6po_nextroute.ro_nh = NULL;
2708f95d4633SHajimu UMEMOTO 		}
2709885adbfaSHajimu UMEMOTO 		if (pktopt->ip6po_nexthop)
271033841545SHajimu UMEMOTO 			free(pktopt->ip6po_nexthop, M_IP6OPT);
271133841545SHajimu UMEMOTO 		pktopt->ip6po_nexthop = NULL;
271233841545SHajimu UMEMOTO 	}
2713f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_HOPOPTS) {
2714885adbfaSHajimu UMEMOTO 		if (pktopt->ip6po_hbh)
271533841545SHajimu UMEMOTO 			free(pktopt->ip6po_hbh, M_IP6OPT);
271633841545SHajimu UMEMOTO 		pktopt->ip6po_hbh = NULL;
271733841545SHajimu UMEMOTO 	}
2718f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_RTHDRDSTOPTS) {
2719885adbfaSHajimu UMEMOTO 		if (pktopt->ip6po_dest1)
272033841545SHajimu UMEMOTO 			free(pktopt->ip6po_dest1, M_IP6OPT);
272133841545SHajimu UMEMOTO 		pktopt->ip6po_dest1 = NULL;
272233841545SHajimu UMEMOTO 	}
2723f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_RTHDR) {
2724885adbfaSHajimu UMEMOTO 		if (pktopt->ip6po_rhinfo.ip6po_rhi_rthdr)
272533841545SHajimu UMEMOTO 			free(pktopt->ip6po_rhinfo.ip6po_rhi_rthdr, M_IP6OPT);
272633841545SHajimu UMEMOTO 		pktopt->ip6po_rhinfo.ip6po_rhi_rthdr = NULL;
2727983066f0SAlexander V. Chernikov 		if (pktopt->ip6po_route.ro_nh) {
2728983066f0SAlexander V. Chernikov 			NH_FREE(pktopt->ip6po_route.ro_nh);
2729983066f0SAlexander V. Chernikov 			pktopt->ip6po_route.ro_nh = NULL;
273033841545SHajimu UMEMOTO 		}
273133841545SHajimu UMEMOTO 	}
2732f95d4633SHajimu UMEMOTO 	if (optname == -1 || optname == IPV6_DSTOPTS) {
2733885adbfaSHajimu UMEMOTO 		if (pktopt->ip6po_dest2)
273433841545SHajimu UMEMOTO 			free(pktopt->ip6po_dest2, M_IP6OPT);
273533841545SHajimu UMEMOTO 		pktopt->ip6po_dest2 = NULL;
273633841545SHajimu UMEMOTO 	}
273733841545SHajimu UMEMOTO }
273833841545SHajimu UMEMOTO 
273933841545SHajimu UMEMOTO #define PKTOPT_EXTHDRCPY(type) \
274033841545SHajimu UMEMOTO do {\
274133841545SHajimu UMEMOTO 	if (src->type) {\
27427efe5d92SHajimu UMEMOTO 		int hlen = (((struct ip6_ext *)src->type)->ip6e_len + 1) << 3;\
274333841545SHajimu UMEMOTO 		dst->type = malloc(hlen, M_IP6OPT, canwait);\
27448b07e00eSJonathan T. Looney 		if (dst->type == NULL)\
274533841545SHajimu UMEMOTO 			goto bad;\
274633841545SHajimu UMEMOTO 		bcopy(src->type, dst->type, hlen);\
274733841545SHajimu UMEMOTO 	}\
27487efe5d92SHajimu UMEMOTO } while (/*CONSTCOND*/ 0)
274933841545SHajimu UMEMOTO 
2750885adbfaSHajimu UMEMOTO static int
27511272577eSXin LI copypktopts(struct ip6_pktopts *dst, struct ip6_pktopts *src, int canwait)
275233841545SHajimu UMEMOTO {
2753885adbfaSHajimu UMEMOTO 	if (dst == NULL || src == NULL)  {
275433841545SHajimu UMEMOTO 		printf("ip6_clearpktopts: invalid argument\n");
2755885adbfaSHajimu UMEMOTO 		return (EINVAL);
275633841545SHajimu UMEMOTO 	}
275733841545SHajimu UMEMOTO 
275833841545SHajimu UMEMOTO 	dst->ip6po_hlim = src->ip6po_hlim;
2759f95d4633SHajimu UMEMOTO 	dst->ip6po_tclass = src->ip6po_tclass;
2760f95d4633SHajimu UMEMOTO 	dst->ip6po_flags = src->ip6po_flags;
27616090ab8bSHiroki Sato 	dst->ip6po_minmtu = src->ip6po_minmtu;
27626090ab8bSHiroki Sato 	dst->ip6po_prefer_tempaddr = src->ip6po_prefer_tempaddr;
276333841545SHajimu UMEMOTO 	if (src->ip6po_pktinfo) {
276433841545SHajimu UMEMOTO 		dst->ip6po_pktinfo = malloc(sizeof(*dst->ip6po_pktinfo),
276533841545SHajimu UMEMOTO 		    M_IP6OPT, canwait);
27662cb64cb2SGeorge V. Neville-Neil 		if (dst->ip6po_pktinfo == NULL)
276733841545SHajimu UMEMOTO 			goto bad;
276833841545SHajimu UMEMOTO 		*dst->ip6po_pktinfo = *src->ip6po_pktinfo;
276933841545SHajimu UMEMOTO 	}
277033841545SHajimu UMEMOTO 	if (src->ip6po_nexthop) {
277133841545SHajimu UMEMOTO 		dst->ip6po_nexthop = malloc(src->ip6po_nexthop->sa_len,
277233841545SHajimu UMEMOTO 		    M_IP6OPT, canwait);
2773403cbcf5SGeorge V. Neville-Neil 		if (dst->ip6po_nexthop == NULL)
277433841545SHajimu UMEMOTO 			goto bad;
277533841545SHajimu UMEMOTO 		bcopy(src->ip6po_nexthop, dst->ip6po_nexthop,
277633841545SHajimu UMEMOTO 		    src->ip6po_nexthop->sa_len);
277733841545SHajimu UMEMOTO 	}
277833841545SHajimu UMEMOTO 	PKTOPT_EXTHDRCPY(ip6po_hbh);
277933841545SHajimu UMEMOTO 	PKTOPT_EXTHDRCPY(ip6po_dest1);
278033841545SHajimu UMEMOTO 	PKTOPT_EXTHDRCPY(ip6po_dest2);
278133841545SHajimu UMEMOTO 	PKTOPT_EXTHDRCPY(ip6po_rthdr); /* not copy the cached route */
2782885adbfaSHajimu UMEMOTO 	return (0);
278333841545SHajimu UMEMOTO 
278433841545SHajimu UMEMOTO   bad:
2785016fb9d9SMike Makonnen 	ip6_clearpktopts(dst, -1);
2786885adbfaSHajimu UMEMOTO 	return (ENOBUFS);
2787885adbfaSHajimu UMEMOTO }
2788885adbfaSHajimu UMEMOTO #undef PKTOPT_EXTHDRCPY
2789885adbfaSHajimu UMEMOTO 
2790885adbfaSHajimu UMEMOTO struct ip6_pktopts *
27911272577eSXin LI ip6_copypktopts(struct ip6_pktopts *src, int canwait)
2792885adbfaSHajimu UMEMOTO {
2793885adbfaSHajimu UMEMOTO 	int error;
2794885adbfaSHajimu UMEMOTO 	struct ip6_pktopts *dst;
2795885adbfaSHajimu UMEMOTO 
2796885adbfaSHajimu UMEMOTO 	dst = malloc(sizeof(*dst), M_IP6OPT, canwait);
27972cb64cb2SGeorge V. Neville-Neil 	if (dst == NULL)
2798885adbfaSHajimu UMEMOTO 		return (NULL);
2799885adbfaSHajimu UMEMOTO 	ip6_initpktopts(dst);
2800885adbfaSHajimu UMEMOTO 
2801885adbfaSHajimu UMEMOTO 	if ((error = copypktopts(dst, src, canwait)) != 0) {
280235f6695bSHajimu UMEMOTO 		free(dst, M_IP6OPT);
280333841545SHajimu UMEMOTO 		return (NULL);
280433841545SHajimu UMEMOTO 	}
2805885adbfaSHajimu UMEMOTO 
2806885adbfaSHajimu UMEMOTO 	return (dst);
2807885adbfaSHajimu UMEMOTO }
280833841545SHajimu UMEMOTO 
280933841545SHajimu UMEMOTO void
28101272577eSXin LI ip6_freepcbopts(struct ip6_pktopts *pktopt)
281133841545SHajimu UMEMOTO {
281233841545SHajimu UMEMOTO 	if (pktopt == NULL)
281333841545SHajimu UMEMOTO 		return;
281433841545SHajimu UMEMOTO 
2815f95d4633SHajimu UMEMOTO 	ip6_clearpktopts(pktopt, -1);
281633841545SHajimu UMEMOTO 
281733841545SHajimu UMEMOTO 	free(pktopt, M_IP6OPT);
281833841545SHajimu UMEMOTO }
281933841545SHajimu UMEMOTO 
282033841545SHajimu UMEMOTO /*
282182cd038dSYoshinobu Inoue  * Set IPv6 outgoing packet options based on advanced API.
282282cd038dSYoshinobu Inoue  */
282382cd038dSYoshinobu Inoue int
28241272577eSXin LI ip6_setpktopts(struct mbuf *control, struct ip6_pktopts *opt,
282579ba3952SBjoern A. Zeeb     struct ip6_pktopts *stickyopt, struct ucred *cred, int uproto)
282682cd038dSYoshinobu Inoue {
2827155d72c4SPedro F. Giffuni 	struct cmsghdr *cm = NULL;
282882cd038dSYoshinobu Inoue 
28298507acb1SHajimu UMEMOTO 	if (control == NULL || opt == NULL)
283082cd038dSYoshinobu Inoue 		return (EINVAL);
283182cd038dSYoshinobu Inoue 
28322290dfb4SRyan Stone 	/*
2833d74b7baeSGleb Smirnoff 	 * ip6_setpktopt can call ifnet_byindex(), so it's imperative that we
2834d74b7baeSGleb Smirnoff 	 * are in the network epoch here.
28352290dfb4SRyan Stone 	 */
28362290dfb4SRyan Stone 	NET_EPOCH_ASSERT();
28372290dfb4SRyan Stone 
2838885adbfaSHajimu UMEMOTO 	ip6_initpktopts(opt);
2839f95d4633SHajimu UMEMOTO 	if (stickyopt) {
2840885adbfaSHajimu UMEMOTO 		int error;
2841885adbfaSHajimu UMEMOTO 
2842f95d4633SHajimu UMEMOTO 		/*
2843f95d4633SHajimu UMEMOTO 		 * If stickyopt is provided, make a local copy of the options
2844f95d4633SHajimu UMEMOTO 		 * for this particular packet, then override them by ancillary
2845f95d4633SHajimu UMEMOTO 		 * objects.
2846885adbfaSHajimu UMEMOTO 		 * XXX: copypktopts() does not copy the cached route to a next
2847885adbfaSHajimu UMEMOTO 		 * hop (if any).  This is not very good in terms of efficiency,
2848885adbfaSHajimu UMEMOTO 		 * but we can allow this since this option should be rarely
2849885adbfaSHajimu UMEMOTO 		 * used.
2850f95d4633SHajimu UMEMOTO 		 */
2851885adbfaSHajimu UMEMOTO 		if ((error = copypktopts(opt, stickyopt, M_NOWAIT)) != 0)
2852885adbfaSHajimu UMEMOTO 			return (error);
2853f95d4633SHajimu UMEMOTO 	}
285482cd038dSYoshinobu Inoue 
285582cd038dSYoshinobu Inoue 	/*
285682cd038dSYoshinobu Inoue 	 * XXX: Currently, we assume all the optional information is stored
285782cd038dSYoshinobu Inoue 	 * in a single mbuf.
285882cd038dSYoshinobu Inoue 	 */
285982cd038dSYoshinobu Inoue 	if (control->m_next)
286082cd038dSYoshinobu Inoue 		return (EINVAL);
286182cd038dSYoshinobu Inoue 
28626f4da201SBjoern A. Zeeb 	for (; control->m_len > 0; control->m_data += CMSG_ALIGN(cm->cmsg_len),
286333841545SHajimu UMEMOTO 	    control->m_len -= CMSG_ALIGN(cm->cmsg_len)) {
2864f95d4633SHajimu UMEMOTO 		int error;
2865f95d4633SHajimu UMEMOTO 
2866f95d4633SHajimu UMEMOTO 		if (control->m_len < CMSG_LEN(0))
2867f95d4633SHajimu UMEMOTO 			return (EINVAL);
2868f95d4633SHajimu UMEMOTO 
286982cd038dSYoshinobu Inoue 		cm = mtod(control, struct cmsghdr *);
287082cd038dSYoshinobu Inoue 		if (cm->cmsg_len == 0 || cm->cmsg_len > control->m_len)
287182cd038dSYoshinobu Inoue 			return (EINVAL);
287282cd038dSYoshinobu Inoue 		if (cm->cmsg_level != IPPROTO_IPV6)
287382cd038dSYoshinobu Inoue 			continue;
287482cd038dSYoshinobu Inoue 
2875d5e3406dSHajimu UMEMOTO 		error = ip6_setpktopt(cm->cmsg_type, CMSG_DATA(cm),
287679ba3952SBjoern A. Zeeb 		    cm->cmsg_len - CMSG_LEN(0), opt, cred, 0, 1, uproto);
2877f95d4633SHajimu UMEMOTO 		if (error)
2878f95d4633SHajimu UMEMOTO 			return (error);
2879f95d4633SHajimu UMEMOTO 	}
288082cd038dSYoshinobu Inoue 
2881f95d4633SHajimu UMEMOTO 	return (0);
2882f95d4633SHajimu UMEMOTO }
2883f95d4633SHajimu UMEMOTO 
2884f95d4633SHajimu UMEMOTO /*
2885f95d4633SHajimu UMEMOTO  * Set a particular packet option, as a sticky option or an ancillary data
2886f95d4633SHajimu UMEMOTO  * item.  "len" can be 0 only when it's a sticky option.
2887f95d4633SHajimu UMEMOTO  * We have 4 cases of combination of "sticky" and "cmsg":
2888f95d4633SHajimu UMEMOTO  * "sticky=0, cmsg=0": impossible
288918b35df8SHajimu UMEMOTO  * "sticky=0, cmsg=1": RFC2292 or RFC3542 ancillary data
289018b35df8SHajimu UMEMOTO  * "sticky=1, cmsg=0": RFC3542 socket option
2891f95d4633SHajimu UMEMOTO  * "sticky=1, cmsg=1": RFC2292 socket option
2892f95d4633SHajimu UMEMOTO  */
2893f95d4633SHajimu UMEMOTO static int
28941272577eSXin LI ip6_setpktopt(int optname, u_char *buf, int len, struct ip6_pktopts *opt,
289579ba3952SBjoern A. Zeeb     struct ucred *cred, int sticky, int cmsg, int uproto)
2896f95d4633SHajimu UMEMOTO {
2897f95d4633SHajimu UMEMOTO 	int minmtupolicy, preftemp;
289879ba3952SBjoern A. Zeeb 	int error;
2899f95d4633SHajimu UMEMOTO 
29009f5432d5SKristof Provost 	NET_EPOCH_ASSERT();
29019f5432d5SKristof Provost 
2902f95d4633SHajimu UMEMOTO 	if (!sticky && !cmsg) {
2903f95d4633SHajimu UMEMOTO #ifdef DIAGNOSTIC
2904d5e3406dSHajimu UMEMOTO 		printf("ip6_setpktopt: impossible case\n");
2905f95d4633SHajimu UMEMOTO #endif
2906f95d4633SHajimu UMEMOTO 		return (EINVAL);
2907f95d4633SHajimu UMEMOTO 	}
2908f95d4633SHajimu UMEMOTO 
2909f95d4633SHajimu UMEMOTO 	/*
2910f95d4633SHajimu UMEMOTO 	 * IPV6_2292xxx is for backward compatibility to RFC2292, and should
291118b35df8SHajimu UMEMOTO 	 * not be specified in the context of RFC3542.  Conversely,
291218b35df8SHajimu UMEMOTO 	 * RFC3542 types should not be specified in the context of RFC2292.
2913f95d4633SHajimu UMEMOTO 	 */
2914f95d4633SHajimu UMEMOTO 	if (!cmsg) {
2915f95d4633SHajimu UMEMOTO 		switch (optname) {
2916f95d4633SHajimu UMEMOTO 		case IPV6_2292PKTINFO:
2917f95d4633SHajimu UMEMOTO 		case IPV6_2292HOPLIMIT:
2918f95d4633SHajimu UMEMOTO 		case IPV6_2292NEXTHOP:
2919f95d4633SHajimu UMEMOTO 		case IPV6_2292HOPOPTS:
2920f95d4633SHajimu UMEMOTO 		case IPV6_2292DSTOPTS:
2921f95d4633SHajimu UMEMOTO 		case IPV6_2292RTHDR:
2922f95d4633SHajimu UMEMOTO 		case IPV6_2292PKTOPTIONS:
2923f95d4633SHajimu UMEMOTO 			return (ENOPROTOOPT);
2924f95d4633SHajimu UMEMOTO 		}
2925f95d4633SHajimu UMEMOTO 	}
2926f95d4633SHajimu UMEMOTO 	if (sticky && cmsg) {
2927f95d4633SHajimu UMEMOTO 		switch (optname) {
2928f95d4633SHajimu UMEMOTO 		case IPV6_PKTINFO:
2929f95d4633SHajimu UMEMOTO 		case IPV6_HOPLIMIT:
2930f95d4633SHajimu UMEMOTO 		case IPV6_NEXTHOP:
2931f95d4633SHajimu UMEMOTO 		case IPV6_HOPOPTS:
2932f95d4633SHajimu UMEMOTO 		case IPV6_DSTOPTS:
2933f95d4633SHajimu UMEMOTO 		case IPV6_RTHDRDSTOPTS:
2934f95d4633SHajimu UMEMOTO 		case IPV6_RTHDR:
2935f95d4633SHajimu UMEMOTO 		case IPV6_USE_MIN_MTU:
2936f95d4633SHajimu UMEMOTO 		case IPV6_DONTFRAG:
2937f95d4633SHajimu UMEMOTO 		case IPV6_TCLASS:
293818b35df8SHajimu UMEMOTO 		case IPV6_PREFER_TEMPADDR: /* XXX: not an RFC3542 option */
2939f95d4633SHajimu UMEMOTO 			return (ENOPROTOOPT);
2940f95d4633SHajimu UMEMOTO 		}
2941f95d4633SHajimu UMEMOTO 	}
2942f95d4633SHajimu UMEMOTO 
2943f95d4633SHajimu UMEMOTO 	switch (optname) {
2944f95d4633SHajimu UMEMOTO 	case IPV6_2292PKTINFO:
2945f95d4633SHajimu UMEMOTO 	case IPV6_PKTINFO:
2946f95d4633SHajimu UMEMOTO 	{
2947f95d4633SHajimu UMEMOTO 		struct ifnet *ifp = NULL;
2948f95d4633SHajimu UMEMOTO 		struct in6_pktinfo *pktinfo;
2949f95d4633SHajimu UMEMOTO 
2950f95d4633SHajimu UMEMOTO 		if (len != sizeof(struct in6_pktinfo))
2951f95d4633SHajimu UMEMOTO 			return (EINVAL);
2952f95d4633SHajimu UMEMOTO 
2953f95d4633SHajimu UMEMOTO 		pktinfo = (struct in6_pktinfo *)buf;
2954f95d4633SHajimu UMEMOTO 
2955f95d4633SHajimu UMEMOTO 		/*
2956f95d4633SHajimu UMEMOTO 		 * An application can clear any sticky IPV6_PKTINFO option by
2957f95d4633SHajimu UMEMOTO 		 * doing a "regular" setsockopt with ipi6_addr being
2958f95d4633SHajimu UMEMOTO 		 * in6addr_any and ipi6_ifindex being zero.
2959f95d4633SHajimu UMEMOTO 		 * [RFC 3542, Section 6]
2960f95d4633SHajimu UMEMOTO 		 */
2961f95d4633SHajimu UMEMOTO 		if (optname == IPV6_PKTINFO && opt->ip6po_pktinfo &&
2962f95d4633SHajimu UMEMOTO 		    pktinfo->ipi6_ifindex == 0 &&
2963f95d4633SHajimu UMEMOTO 		    IN6_IS_ADDR_UNSPECIFIED(&pktinfo->ipi6_addr)) {
2964f95d4633SHajimu UMEMOTO 			ip6_clearpktopts(opt, optname);
2965f95d4633SHajimu UMEMOTO 			break;
2966f95d4633SHajimu UMEMOTO 		}
2967f95d4633SHajimu UMEMOTO 
2968f95d4633SHajimu UMEMOTO 		if (uproto == IPPROTO_TCP && optname == IPV6_PKTINFO &&
2969f95d4633SHajimu UMEMOTO 		    sticky && !IN6_IS_ADDR_UNSPECIFIED(&pktinfo->ipi6_addr)) {
2970f95d4633SHajimu UMEMOTO 			return (EINVAL);
2971f95d4633SHajimu UMEMOTO 		}
29729196891fSAndrey V. Elsukov 		if (IN6_IS_ADDR_MULTICAST(&pktinfo->ipi6_addr))
29739196891fSAndrey V. Elsukov 			return (EINVAL);
2974f95d4633SHajimu UMEMOTO 		/* validate the interface index if specified. */
2975f95d4633SHajimu UMEMOTO 		if (pktinfo->ipi6_ifindex) {
2976f95d4633SHajimu UMEMOTO 			ifp = ifnet_byindex(pktinfo->ipi6_ifindex);
2977f95d4633SHajimu UMEMOTO 			if (ifp == NULL)
297882cd038dSYoshinobu Inoue 				return (ENXIO);
297982cd038dSYoshinobu Inoue 		}
2980be393491SDimitry Andric 		if (ifp != NULL && (ifp->if_afdata[AF_INET6] == NULL ||
2981be393491SDimitry Andric 		    (ND_IFINFO(ifp)->flags & ND6_IFF_IFDISABLED) != 0))
29829196891fSAndrey V. Elsukov 			return (ENETDOWN);
298382cd038dSYoshinobu Inoue 
29849196891fSAndrey V. Elsukov 		if (ifp != NULL &&
29859196891fSAndrey V. Elsukov 		    !IN6_IS_ADDR_UNSPECIFIED(&pktinfo->ipi6_addr)) {
29869196891fSAndrey V. Elsukov 			struct in6_ifaddr *ia;
29879196891fSAndrey V. Elsukov 
2988cb207f93SAndrey V. Elsukov 			in6_setscope(&pktinfo->ipi6_addr, ifp, NULL);
29899196891fSAndrey V. Elsukov 			ia = in6ifa_ifpwithaddr(ifp, &pktinfo->ipi6_addr);
29909196891fSAndrey V. Elsukov 			if (ia == NULL)
29919196891fSAndrey V. Elsukov 				return (EADDRNOTAVAIL);
29929196891fSAndrey V. Elsukov 			ifa_free(&ia->ia_ifa);
29939196891fSAndrey V. Elsukov 		}
299433841545SHajimu UMEMOTO 		/*
2995f95d4633SHajimu UMEMOTO 		 * We store the address anyway, and let in6_selectsrc()
2996f95d4633SHajimu UMEMOTO 		 * validate the specified address.  This is because ipi6_addr
2997f95d4633SHajimu UMEMOTO 		 * may not have enough information about its scope zone, and
2998f95d4633SHajimu UMEMOTO 		 * we may need additional information (such as outgoing
2999f95d4633SHajimu UMEMOTO 		 * interface or the scope zone of a destination address) to
3000f95d4633SHajimu UMEMOTO 		 * disambiguate the scope.
3001f95d4633SHajimu UMEMOTO 		 * XXX: the delay of the validation may confuse the
3002f95d4633SHajimu UMEMOTO 		 * application when it is used as a sticky option.
300333841545SHajimu UMEMOTO 		 */
3004f95d4633SHajimu UMEMOTO 		if (opt->ip6po_pktinfo == NULL) {
3005f95d4633SHajimu UMEMOTO 			opt->ip6po_pktinfo = malloc(sizeof(*pktinfo),
3006885adbfaSHajimu UMEMOTO 			    M_IP6OPT, M_NOWAIT);
3007885adbfaSHajimu UMEMOTO 			if (opt->ip6po_pktinfo == NULL)
3008885adbfaSHajimu UMEMOTO 				return (ENOBUFS);
300982cd038dSYoshinobu Inoue 		}
3010f95d4633SHajimu UMEMOTO 		bcopy(pktinfo, opt->ip6po_pktinfo, sizeof(*pktinfo));
301182cd038dSYoshinobu Inoue 		break;
3012f95d4633SHajimu UMEMOTO 	}
301382cd038dSYoshinobu Inoue 
3014f95d4633SHajimu UMEMOTO 	case IPV6_2292HOPLIMIT:
301582cd038dSYoshinobu Inoue 	case IPV6_HOPLIMIT:
3016f95d4633SHajimu UMEMOTO 	{
3017f95d4633SHajimu UMEMOTO 		int *hlimp;
3018f95d4633SHajimu UMEMOTO 
3019f95d4633SHajimu UMEMOTO 		/*
3020f95d4633SHajimu UMEMOTO 		 * RFC 3542 deprecated the usage of sticky IPV6_HOPLIMIT
3021f95d4633SHajimu UMEMOTO 		 * to simplify the ordering among hoplimit options.
3022f95d4633SHajimu UMEMOTO 		 */
3023f95d4633SHajimu UMEMOTO 		if (optname == IPV6_HOPLIMIT && sticky)
3024f95d4633SHajimu UMEMOTO 			return (ENOPROTOOPT);
3025f95d4633SHajimu UMEMOTO 
3026f95d4633SHajimu UMEMOTO 		if (len != sizeof(int))
3027f95d4633SHajimu UMEMOTO 			return (EINVAL);
3028f95d4633SHajimu UMEMOTO 		hlimp = (int *)buf;
3029f95d4633SHajimu UMEMOTO 		if (*hlimp < -1 || *hlimp > 255)
303082cd038dSYoshinobu Inoue 			return (EINVAL);
303182cd038dSYoshinobu Inoue 
3032f95d4633SHajimu UMEMOTO 		opt->ip6po_hlim = *hlimp;
303382cd038dSYoshinobu Inoue 		break;
3034f95d4633SHajimu UMEMOTO 	}
303582cd038dSYoshinobu Inoue 
3036f95d4633SHajimu UMEMOTO 	case IPV6_TCLASS:
3037f95d4633SHajimu UMEMOTO 	{
3038f95d4633SHajimu UMEMOTO 		int tclass;
3039f95d4633SHajimu UMEMOTO 
3040f95d4633SHajimu UMEMOTO 		if (len != sizeof(int))
3041f95d4633SHajimu UMEMOTO 			return (EINVAL);
3042f95d4633SHajimu UMEMOTO 		tclass = *(int *)buf;
3043f95d4633SHajimu UMEMOTO 		if (tclass < -1 || tclass > 255)
3044f95d4633SHajimu UMEMOTO 			return (EINVAL);
3045f95d4633SHajimu UMEMOTO 
3046f95d4633SHajimu UMEMOTO 		opt->ip6po_tclass = tclass;
3047f95d4633SHajimu UMEMOTO 		break;
3048f95d4633SHajimu UMEMOTO 	}
3049f95d4633SHajimu UMEMOTO 
3050f95d4633SHajimu UMEMOTO 	case IPV6_2292NEXTHOP:
305182cd038dSYoshinobu Inoue 	case IPV6_NEXTHOP:
305279ba3952SBjoern A. Zeeb 		if (cred != NULL) {
3053cc426dd3SMateusz Guzik 			error = priv_check_cred(cred, PRIV_NETINET_SETHDROPTS);
305479ba3952SBjoern A. Zeeb 			if (error)
305579ba3952SBjoern A. Zeeb 				return (error);
305679ba3952SBjoern A. Zeeb 		}
305733841545SHajimu UMEMOTO 
3058f95d4633SHajimu UMEMOTO 		if (len == 0) {	/* just remove the option */
3059f95d4633SHajimu UMEMOTO 			ip6_clearpktopts(opt, IPV6_NEXTHOP);
3060f95d4633SHajimu UMEMOTO 			break;
3061f95d4633SHajimu UMEMOTO 		}
3062f95d4633SHajimu UMEMOTO 
306333841545SHajimu UMEMOTO 		/* check if cmsg_len is large enough for sa_len */
3064f95d4633SHajimu UMEMOTO 		if (len < sizeof(struct sockaddr) || len < *buf)
306582cd038dSYoshinobu Inoue 			return (EINVAL);
306682cd038dSYoshinobu Inoue 
3067f95d4633SHajimu UMEMOTO 		switch (((struct sockaddr *)buf)->sa_family) {
3068f95d4633SHajimu UMEMOTO 		case AF_INET6:
3069f95d4633SHajimu UMEMOTO 		{
3070f95d4633SHajimu UMEMOTO 			struct sockaddr_in6 *sa6 = (struct sockaddr_in6 *)buf;
3071f95d4633SHajimu UMEMOTO 			int error;
3072f95d4633SHajimu UMEMOTO 
3073f95d4633SHajimu UMEMOTO 			if (sa6->sin6_len != sizeof(struct sockaddr_in6))
3074f95d4633SHajimu UMEMOTO 				return (EINVAL);
3075f95d4633SHajimu UMEMOTO 
3076f95d4633SHajimu UMEMOTO 			if (IN6_IS_ADDR_UNSPECIFIED(&sa6->sin6_addr) ||
3077f95d4633SHajimu UMEMOTO 			    IN6_IS_ADDR_MULTICAST(&sa6->sin6_addr)) {
3078f95d4633SHajimu UMEMOTO 				return (EINVAL);
3079f95d4633SHajimu UMEMOTO 			}
3080603724d3SBjoern A. Zeeb 			if ((error = sa6_embedscope(sa6, V_ip6_use_defzone))
3081f95d4633SHajimu UMEMOTO 			    != 0) {
3082f95d4633SHajimu UMEMOTO 				return (error);
3083f95d4633SHajimu UMEMOTO 			}
3084f95d4633SHajimu UMEMOTO 			break;
3085f95d4633SHajimu UMEMOTO 		}
3086f95d4633SHajimu UMEMOTO 		case AF_LINK:	/* should eventually be supported */
3087f95d4633SHajimu UMEMOTO 		default:
3088f95d4633SHajimu UMEMOTO 			return (EAFNOSUPPORT);
3089f95d4633SHajimu UMEMOTO 		}
3090f95d4633SHajimu UMEMOTO 
3091f95d4633SHajimu UMEMOTO 		/* turn off the previous option, then set the new option. */
3092f95d4633SHajimu UMEMOTO 		ip6_clearpktopts(opt, IPV6_NEXTHOP);
3093743eee66SSUZUKI Shinsuke 		opt->ip6po_nexthop = malloc(*buf, M_IP6OPT, M_NOWAIT);
3094743eee66SSUZUKI Shinsuke 		if (opt->ip6po_nexthop == NULL)
3095743eee66SSUZUKI Shinsuke 			return (ENOBUFS);
3096f95d4633SHajimu UMEMOTO 		bcopy(buf, opt->ip6po_nexthop, *buf);
309782cd038dSYoshinobu Inoue 		break;
309882cd038dSYoshinobu Inoue 
3099f95d4633SHajimu UMEMOTO 	case IPV6_2292HOPOPTS:
310082cd038dSYoshinobu Inoue 	case IPV6_HOPOPTS:
310133841545SHajimu UMEMOTO 	{
310233841545SHajimu UMEMOTO 		struct ip6_hbh *hbh;
310333841545SHajimu UMEMOTO 		int hbhlen;
310433841545SHajimu UMEMOTO 
3105f95d4633SHajimu UMEMOTO 		/*
3106f95d4633SHajimu UMEMOTO 		 * XXX: We don't allow a non-privileged user to set ANY HbH
3107f95d4633SHajimu UMEMOTO 		 * options, since per-option restriction has too much
3108f95d4633SHajimu UMEMOTO 		 * overhead.
3109f95d4633SHajimu UMEMOTO 		 */
311079ba3952SBjoern A. Zeeb 		if (cred != NULL) {
3111cc426dd3SMateusz Guzik 			error = priv_check_cred(cred, PRIV_NETINET_SETHDROPTS);
311279ba3952SBjoern A. Zeeb 			if (error)
311379ba3952SBjoern A. Zeeb 				return (error);
311479ba3952SBjoern A. Zeeb 		}
3115f95d4633SHajimu UMEMOTO 
3116f95d4633SHajimu UMEMOTO 		if (len == 0) {
3117f95d4633SHajimu UMEMOTO 			ip6_clearpktopts(opt, IPV6_HOPOPTS);
3118f95d4633SHajimu UMEMOTO 			break;	/* just remove the option */
3119f95d4633SHajimu UMEMOTO 		}
3120f95d4633SHajimu UMEMOTO 
3121f95d4633SHajimu UMEMOTO 		/* message length validation */
3122f95d4633SHajimu UMEMOTO 		if (len < sizeof(struct ip6_hbh))
312382cd038dSYoshinobu Inoue 			return (EINVAL);
3124f95d4633SHajimu UMEMOTO 		hbh = (struct ip6_hbh *)buf;
312533841545SHajimu UMEMOTO 		hbhlen = (hbh->ip6h_len + 1) << 3;
3126f95d4633SHajimu UMEMOTO 		if (len != hbhlen)
312782cd038dSYoshinobu Inoue 			return (EINVAL);
312833841545SHajimu UMEMOTO 
3129f95d4633SHajimu UMEMOTO 		/* turn off the previous option, then set the new option. */
3130f95d4633SHajimu UMEMOTO 		ip6_clearpktopts(opt, IPV6_HOPOPTS);
3131743eee66SSUZUKI Shinsuke 		opt->ip6po_hbh = malloc(hbhlen, M_IP6OPT, M_NOWAIT);
3132743eee66SSUZUKI Shinsuke 		if (opt->ip6po_hbh == NULL)
3133743eee66SSUZUKI Shinsuke 			return (ENOBUFS);
313433841545SHajimu UMEMOTO 		bcopy(hbh, opt->ip6po_hbh, hbhlen);
3135f95d4633SHajimu UMEMOTO 
313682cd038dSYoshinobu Inoue 		break;
313733841545SHajimu UMEMOTO 	}
313882cd038dSYoshinobu Inoue 
3139f95d4633SHajimu UMEMOTO 	case IPV6_2292DSTOPTS:
314082cd038dSYoshinobu Inoue 	case IPV6_DSTOPTS:
3141f95d4633SHajimu UMEMOTO 	case IPV6_RTHDRDSTOPTS:
314233841545SHajimu UMEMOTO 	{
3143f95d4633SHajimu UMEMOTO 		struct ip6_dest *dest, **newdest = NULL;
314433841545SHajimu UMEMOTO 		int destlen;
314533841545SHajimu UMEMOTO 
314679ba3952SBjoern A. Zeeb 		if (cred != NULL) { /* XXX: see the comment for IPV6_HOPOPTS */
3147cc426dd3SMateusz Guzik 			error = priv_check_cred(cred, PRIV_NETINET_SETHDROPTS);
314879ba3952SBjoern A. Zeeb 			if (error)
314979ba3952SBjoern A. Zeeb 				return (error);
315079ba3952SBjoern A. Zeeb 		}
3151f95d4633SHajimu UMEMOTO 
3152f95d4633SHajimu UMEMOTO 		if (len == 0) {
3153f95d4633SHajimu UMEMOTO 			ip6_clearpktopts(opt, optname);
3154f95d4633SHajimu UMEMOTO 			break;	/* just remove the option */
3155f95d4633SHajimu UMEMOTO 		}
3156f95d4633SHajimu UMEMOTO 
3157f95d4633SHajimu UMEMOTO 		/* message length validation */
3158f95d4633SHajimu UMEMOTO 		if (len < sizeof(struct ip6_dest))
315982cd038dSYoshinobu Inoue 			return (EINVAL);
3160f95d4633SHajimu UMEMOTO 		dest = (struct ip6_dest *)buf;
316133841545SHajimu UMEMOTO 		destlen = (dest->ip6d_len + 1) << 3;
3162f95d4633SHajimu UMEMOTO 		if (len != destlen)
316333841545SHajimu UMEMOTO 			return (EINVAL);
316482cd038dSYoshinobu Inoue 
316582cd038dSYoshinobu Inoue 		/*
3166f95d4633SHajimu UMEMOTO 		 * Determine the position that the destination options header
3167f95d4633SHajimu UMEMOTO 		 * should be inserted; before or after the routing header.
3168f95d4633SHajimu UMEMOTO 		 */
3169f95d4633SHajimu UMEMOTO 		switch (optname) {
3170f95d4633SHajimu UMEMOTO 		case IPV6_2292DSTOPTS:
3171f95d4633SHajimu UMEMOTO 			/*
3172f95d4633SHajimu UMEMOTO 			 * The old advanced API is ambiguous on this point.
3173f95d4633SHajimu UMEMOTO 			 * Our approach is to determine the position based
3174f95d4633SHajimu UMEMOTO 			 * according to the existence of a routing header.
3175f95d4633SHajimu UMEMOTO 			 * Note, however, that this depends on the order of the
3176f95d4633SHajimu UMEMOTO 			 * extension headers in the ancillary data; the 1st
3177f95d4633SHajimu UMEMOTO 			 * part of the destination options header must appear
3178f95d4633SHajimu UMEMOTO 			 * before the routing header in the ancillary data,
3179f95d4633SHajimu UMEMOTO 			 * too.
318018b35df8SHajimu UMEMOTO 			 * RFC3542 solved the ambiguity by introducing
3181f95d4633SHajimu UMEMOTO 			 * separate ancillary data or option types.
318282cd038dSYoshinobu Inoue 			 */
318333841545SHajimu UMEMOTO 			if (opt->ip6po_rthdr == NULL)
318433841545SHajimu UMEMOTO 				newdest = &opt->ip6po_dest1;
318533841545SHajimu UMEMOTO 			else
318633841545SHajimu UMEMOTO 				newdest = &opt->ip6po_dest2;
3187f95d4633SHajimu UMEMOTO 			break;
3188f95d4633SHajimu UMEMOTO 		case IPV6_RTHDRDSTOPTS:
3189f95d4633SHajimu UMEMOTO 			newdest = &opt->ip6po_dest1;
3190f95d4633SHajimu UMEMOTO 			break;
3191f95d4633SHajimu UMEMOTO 		case IPV6_DSTOPTS:
3192f95d4633SHajimu UMEMOTO 			newdest = &opt->ip6po_dest2;
3193f95d4633SHajimu UMEMOTO 			break;
3194f95d4633SHajimu UMEMOTO 		}
319533841545SHajimu UMEMOTO 
3196f95d4633SHajimu UMEMOTO 		/* turn off the previous option, then set the new option. */
3197f95d4633SHajimu UMEMOTO 		ip6_clearpktopts(opt, optname);
3198743eee66SSUZUKI Shinsuke 		*newdest = malloc(destlen, M_IP6OPT, M_NOWAIT);
3199fc4c8258SRobert Watson 		if (*newdest == NULL)
3200743eee66SSUZUKI Shinsuke 			return (ENOBUFS);
320133841545SHajimu UMEMOTO 		bcopy(dest, *newdest, destlen);
320233841545SHajimu UMEMOTO 
320382cd038dSYoshinobu Inoue 		break;
320433841545SHajimu UMEMOTO 	}
320582cd038dSYoshinobu Inoue 
3206f95d4633SHajimu UMEMOTO 	case IPV6_2292RTHDR:
320782cd038dSYoshinobu Inoue 	case IPV6_RTHDR:
320833841545SHajimu UMEMOTO 	{
320933841545SHajimu UMEMOTO 		struct ip6_rthdr *rth;
321033841545SHajimu UMEMOTO 		int rthlen;
321133841545SHajimu UMEMOTO 
3212f95d4633SHajimu UMEMOTO 		if (len == 0) {
3213f95d4633SHajimu UMEMOTO 			ip6_clearpktopts(opt, IPV6_RTHDR);
3214f95d4633SHajimu UMEMOTO 			break;	/* just remove the option */
3215f95d4633SHajimu UMEMOTO 		}
3216f95d4633SHajimu UMEMOTO 
3217f95d4633SHajimu UMEMOTO 		/* message length validation */
3218f95d4633SHajimu UMEMOTO 		if (len < sizeof(struct ip6_rthdr))
321982cd038dSYoshinobu Inoue 			return (EINVAL);
3220f95d4633SHajimu UMEMOTO 		rth = (struct ip6_rthdr *)buf;
322133841545SHajimu UMEMOTO 		rthlen = (rth->ip6r_len + 1) << 3;
3222f95d4633SHajimu UMEMOTO 		if (len != rthlen)
322382cd038dSYoshinobu Inoue 			return (EINVAL);
322433841545SHajimu UMEMOTO 
322533841545SHajimu UMEMOTO 		switch (rth->ip6r_type) {
322682cd038dSYoshinobu Inoue 		case IPV6_RTHDR_TYPE_0:
3227f95d4633SHajimu UMEMOTO 			if (rth->ip6r_len == 0)	/* must contain one addr */
322833841545SHajimu UMEMOTO 				return (EINVAL);
3229f95d4633SHajimu UMEMOTO 			if (rth->ip6r_len % 2) /* length must be even */
323033841545SHajimu UMEMOTO 				return (EINVAL);
323133841545SHajimu UMEMOTO 			if (rth->ip6r_len / 2 != rth->ip6r_segleft)
323282cd038dSYoshinobu Inoue 				return (EINVAL);
323382cd038dSYoshinobu Inoue 			break;
323482cd038dSYoshinobu Inoue 		default:
323533841545SHajimu UMEMOTO 			return (EINVAL);	/* not supported */
323682cd038dSYoshinobu Inoue 		}
323733841545SHajimu UMEMOTO 
3238f95d4633SHajimu UMEMOTO 		/* turn off the previous option */
3239f95d4633SHajimu UMEMOTO 		ip6_clearpktopts(opt, IPV6_RTHDR);
3240743eee66SSUZUKI Shinsuke 		opt->ip6po_rthdr = malloc(rthlen, M_IP6OPT, M_NOWAIT);
3241743eee66SSUZUKI Shinsuke 		if (opt->ip6po_rthdr == NULL)
3242743eee66SSUZUKI Shinsuke 			return (ENOBUFS);
324333841545SHajimu UMEMOTO 		bcopy(rth, opt->ip6po_rthdr, rthlen);
324433841545SHajimu UMEMOTO 
324582cd038dSYoshinobu Inoue 		break;
324633841545SHajimu UMEMOTO 	}
324782cd038dSYoshinobu Inoue 
3248f95d4633SHajimu UMEMOTO 	case IPV6_USE_MIN_MTU:
3249f95d4633SHajimu UMEMOTO 		if (len != sizeof(int))
3250f95d4633SHajimu UMEMOTO 			return (EINVAL);
3251f95d4633SHajimu UMEMOTO 		minmtupolicy = *(int *)buf;
3252f95d4633SHajimu UMEMOTO 		if (minmtupolicy != IP6PO_MINMTU_MCASTONLY &&
3253f95d4633SHajimu UMEMOTO 		    minmtupolicy != IP6PO_MINMTU_DISABLE &&
3254f95d4633SHajimu UMEMOTO 		    minmtupolicy != IP6PO_MINMTU_ALL) {
3255f95d4633SHajimu UMEMOTO 			return (EINVAL);
3256f95d4633SHajimu UMEMOTO 		}
3257f95d4633SHajimu UMEMOTO 		opt->ip6po_minmtu = minmtupolicy;
3258f95d4633SHajimu UMEMOTO 		break;
3259f95d4633SHajimu UMEMOTO 
3260f95d4633SHajimu UMEMOTO 	case IPV6_DONTFRAG:
3261f95d4633SHajimu UMEMOTO 		if (len != sizeof(int))
3262f95d4633SHajimu UMEMOTO 			return (EINVAL);
3263f95d4633SHajimu UMEMOTO 
3264f95d4633SHajimu UMEMOTO 		if (uproto == IPPROTO_TCP || *(int *)buf == 0) {
3265f95d4633SHajimu UMEMOTO 			/*
3266f95d4633SHajimu UMEMOTO 			 * we ignore this option for TCP sockets.
326718b35df8SHajimu UMEMOTO 			 * (RFC3542 leaves this case unspecified.)
3268f95d4633SHajimu UMEMOTO 			 */
3269f95d4633SHajimu UMEMOTO 			opt->ip6po_flags &= ~IP6PO_DONTFRAG;
3270f95d4633SHajimu UMEMOTO 		} else
3271f95d4633SHajimu UMEMOTO 			opt->ip6po_flags |= IP6PO_DONTFRAG;
3272f95d4633SHajimu UMEMOTO 		break;
3273f95d4633SHajimu UMEMOTO 
3274f95d4633SHajimu UMEMOTO 	case IPV6_PREFER_TEMPADDR:
3275f95d4633SHajimu UMEMOTO 		if (len != sizeof(int))
3276f95d4633SHajimu UMEMOTO 			return (EINVAL);
3277f95d4633SHajimu UMEMOTO 		preftemp = *(int *)buf;
3278f95d4633SHajimu UMEMOTO 		if (preftemp != IP6PO_TEMPADDR_SYSTEM &&
3279f95d4633SHajimu UMEMOTO 		    preftemp != IP6PO_TEMPADDR_NOTPREFER &&
3280f95d4633SHajimu UMEMOTO 		    preftemp != IP6PO_TEMPADDR_PREFER) {
3281f95d4633SHajimu UMEMOTO 			return (EINVAL);
3282f95d4633SHajimu UMEMOTO 		}
3283f95d4633SHajimu UMEMOTO 		opt->ip6po_prefer_tempaddr = preftemp;
3284f95d4633SHajimu UMEMOTO 		break;
3285f95d4633SHajimu UMEMOTO 
328682cd038dSYoshinobu Inoue 	default:
328782cd038dSYoshinobu Inoue 		return (ENOPROTOOPT);
3288f95d4633SHajimu UMEMOTO 	} /* end of switch */
328982cd038dSYoshinobu Inoue 
329082cd038dSYoshinobu Inoue 	return (0);
329182cd038dSYoshinobu Inoue }
329282cd038dSYoshinobu Inoue 
329382cd038dSYoshinobu Inoue /*
329482cd038dSYoshinobu Inoue  * Routine called from ip6_output() to loop back a copy of an IP6 multicast
329582cd038dSYoshinobu Inoue  * packet to the input queue of a specified interface.  Note that this
329682cd038dSYoshinobu Inoue  * calls the output routine of the loopback "driver", but with an interface
329782cd038dSYoshinobu Inoue  * pointer that might NOT be &loif -- easier than replicating that code here.
329882cd038dSYoshinobu Inoue  */
329982cd038dSYoshinobu Inoue void
330056a5f52eSGleb Smirnoff ip6_mloopback(struct ifnet *ifp, struct mbuf *m)
330182cd038dSYoshinobu Inoue {
330282cd038dSYoshinobu Inoue 	struct mbuf *copym;
3303686cdd19SJun-ichiro itojun Hagino 	struct ip6_hdr *ip6;
330482cd038dSYoshinobu Inoue 
3305c3bef61eSKevin Lo 	copym = m_copym(m, 0, M_COPYALL, M_NOWAIT);
3306686cdd19SJun-ichiro itojun Hagino 	if (copym == NULL)
3307686cdd19SJun-ichiro itojun Hagino 		return;
3308686cdd19SJun-ichiro itojun Hagino 
3309686cdd19SJun-ichiro itojun Hagino 	/*
3310686cdd19SJun-ichiro itojun Hagino 	 * Make sure to deep-copy IPv6 header portion in case the data
3311686cdd19SJun-ichiro itojun Hagino 	 * is in an mbuf cluster, so that we can safely override the IPv6
3312686cdd19SJun-ichiro itojun Hagino 	 * header portion later.
3313686cdd19SJun-ichiro itojun Hagino 	 */
3314f0cace5dSRobert Watson 	if (!M_WRITABLE(copym) ||
3315686cdd19SJun-ichiro itojun Hagino 	    copym->m_len < sizeof(struct ip6_hdr)) {
3316686cdd19SJun-ichiro itojun Hagino 		copym = m_pullup(copym, sizeof(struct ip6_hdr));
3317686cdd19SJun-ichiro itojun Hagino 		if (copym == NULL)
3318686cdd19SJun-ichiro itojun Hagino 			return;
331982cd038dSYoshinobu Inoue 	}
3320686cdd19SJun-ichiro itojun Hagino 	ip6 = mtod(copym, struct ip6_hdr *);
332133841545SHajimu UMEMOTO 	/*
332233841545SHajimu UMEMOTO 	 * clear embedded scope identifiers if necessary.
332333841545SHajimu UMEMOTO 	 * in6_clearscope will touch the addresses only when necessary.
332433841545SHajimu UMEMOTO 	 */
332533841545SHajimu UMEMOTO 	in6_clearscope(&ip6->ip6_src);
332633841545SHajimu UMEMOTO 	in6_clearscope(&ip6->ip6_dst);
3327654bdb5aSAndrey V. Elsukov 	if (copym->m_pkthdr.csum_flags & CSUM_DELAY_DATA_IPV6) {
3328654bdb5aSAndrey V. Elsukov 		copym->m_pkthdr.csum_flags |= CSUM_DATA_VALID_IPV6 |
3329654bdb5aSAndrey V. Elsukov 		    CSUM_PSEUDO_HDR;
3330654bdb5aSAndrey V. Elsukov 		copym->m_pkthdr.csum_data = 0xffff;
3331654bdb5aSAndrey V. Elsukov 	}
3332331dff07SAlexander V. Chernikov 	if_simloop(ifp, copym, AF_INET6, 0);
333382cd038dSYoshinobu Inoue }
333482cd038dSYoshinobu Inoue 
333582cd038dSYoshinobu Inoue /*
333682cd038dSYoshinobu Inoue  * Chop IPv6 header off from the payload.
333782cd038dSYoshinobu Inoue  */
333882cd038dSYoshinobu Inoue static int
33391272577eSXin LI ip6_splithdr(struct mbuf *m, struct ip6_exthdrs *exthdrs)
334082cd038dSYoshinobu Inoue {
334182cd038dSYoshinobu Inoue 	struct mbuf *mh;
334282cd038dSYoshinobu Inoue 	struct ip6_hdr *ip6;
334382cd038dSYoshinobu Inoue 
334482cd038dSYoshinobu Inoue 	ip6 = mtod(m, struct ip6_hdr *);
334582cd038dSYoshinobu Inoue 	if (m->m_len > sizeof(*ip6)) {
33467b07d1beSGleb Smirnoff 		mh = m_gethdr(M_NOWAIT, MT_DATA);
33477b07d1beSGleb Smirnoff 		if (mh == NULL) {
334882cd038dSYoshinobu Inoue 			m_freem(m);
334982cd038dSYoshinobu Inoue 			return ENOBUFS;
335082cd038dSYoshinobu Inoue 		}
335110e5acc3SGleb Smirnoff 		m_move_pkthdr(mh, m);
3352ed6a66caSRobert Watson 		M_ALIGN(mh, sizeof(*ip6));
335382cd038dSYoshinobu Inoue 		m->m_len -= sizeof(*ip6);
335482cd038dSYoshinobu Inoue 		m->m_data += sizeof(*ip6);
335582cd038dSYoshinobu Inoue 		mh->m_next = m;
335682cd038dSYoshinobu Inoue 		m = mh;
335782cd038dSYoshinobu Inoue 		m->m_len = sizeof(*ip6);
335882cd038dSYoshinobu Inoue 		bcopy((caddr_t)ip6, mtod(m, caddr_t), sizeof(*ip6));
335982cd038dSYoshinobu Inoue 	}
336082cd038dSYoshinobu Inoue 	exthdrs->ip6e_ip6 = m;
336182cd038dSYoshinobu Inoue 	return 0;
336282cd038dSYoshinobu Inoue }
336382cd038dSYoshinobu Inoue 
336482cd038dSYoshinobu Inoue /*
336582cd038dSYoshinobu Inoue  * Compute IPv6 extension header length.
336682cd038dSYoshinobu Inoue  */
336782cd038dSYoshinobu Inoue int
33680ecd976eSBjoern A. Zeeb ip6_optlen(struct inpcb *inp)
336982cd038dSYoshinobu Inoue {
337082cd038dSYoshinobu Inoue 	int len;
337182cd038dSYoshinobu Inoue 
33720ecd976eSBjoern A. Zeeb 	if (!inp->in6p_outputopts)
337382cd038dSYoshinobu Inoue 		return 0;
337482cd038dSYoshinobu Inoue 
337582cd038dSYoshinobu Inoue 	len = 0;
337682cd038dSYoshinobu Inoue #define elen(x) \
337782cd038dSYoshinobu Inoue     (((struct ip6_ext *)(x)) ? (((struct ip6_ext *)(x))->ip6e_len + 1) << 3 : 0)
337882cd038dSYoshinobu Inoue 
33790ecd976eSBjoern A. Zeeb 	len += elen(inp->in6p_outputopts->ip6po_hbh);
33800ecd976eSBjoern A. Zeeb 	if (inp->in6p_outputopts->ip6po_rthdr)
338133841545SHajimu UMEMOTO 		/* dest1 is valid with rthdr only */
33820ecd976eSBjoern A. Zeeb 		len += elen(inp->in6p_outputopts->ip6po_dest1);
33830ecd976eSBjoern A. Zeeb 	len += elen(inp->in6p_outputopts->ip6po_rthdr);
33840ecd976eSBjoern A. Zeeb 	len += elen(inp->in6p_outputopts->ip6po_dest2);
338582cd038dSYoshinobu Inoue 	return len;
338682cd038dSYoshinobu Inoue #undef elen
338782cd038dSYoshinobu Inoue }
3388