xref: /freebsd/sys/netinet/in_gif.c (revision 009d82ee0fefdc797f55d25a50d3b6ebe61d56e4)
1c398230bSWarner Losh /*-
251369649SPedro F. Giffuni  * SPDX-License-Identifier: BSD-3-Clause
351369649SPedro F. Giffuni  *
4cfa1ca9dSYoshinobu Inoue  * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project.
5b941bc1dSAndrey V. Elsukov  * Copyright (c) 2018 Andrey V. Elsukov <ae@FreeBSD.org>
6cfa1ca9dSYoshinobu Inoue  * All rights reserved.
7cfa1ca9dSYoshinobu Inoue  *
8cfa1ca9dSYoshinobu Inoue  * Redistribution and use in source and binary forms, with or without
9cfa1ca9dSYoshinobu Inoue  * modification, are permitted provided that the following conditions
10cfa1ca9dSYoshinobu Inoue  * are met:
11cfa1ca9dSYoshinobu Inoue  * 1. Redistributions of source code must retain the above copyright
12cfa1ca9dSYoshinobu Inoue  *    notice, this list of conditions and the following disclaimer.
13cfa1ca9dSYoshinobu Inoue  * 2. Redistributions in binary form must reproduce the above copyright
14cfa1ca9dSYoshinobu Inoue  *    notice, this list of conditions and the following disclaimer in the
15cfa1ca9dSYoshinobu Inoue  *    documentation and/or other materials provided with the distribution.
16cfa1ca9dSYoshinobu Inoue  * 3. Neither the name of the project nor the names of its contributors
17cfa1ca9dSYoshinobu Inoue  *    may be used to endorse or promote products derived from this software
18cfa1ca9dSYoshinobu Inoue  *    without specific prior written permission.
19cfa1ca9dSYoshinobu Inoue  *
20cfa1ca9dSYoshinobu Inoue  * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND
21cfa1ca9dSYoshinobu Inoue  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22cfa1ca9dSYoshinobu Inoue  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
23cfa1ca9dSYoshinobu Inoue  * ARE DISCLAIMED.  IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE
24cfa1ca9dSYoshinobu Inoue  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25cfa1ca9dSYoshinobu Inoue  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
26cfa1ca9dSYoshinobu Inoue  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27cfa1ca9dSYoshinobu Inoue  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
28cfa1ca9dSYoshinobu Inoue  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
29cfa1ca9dSYoshinobu Inoue  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
30cfa1ca9dSYoshinobu Inoue  * SUCH DAMAGE.
310b9f5f8aSAndrey V. Elsukov  *
320b9f5f8aSAndrey V. Elsukov  *	$KAME: in_gif.c,v 1.54 2001/05/14 14:02:16 itojun Exp $
33cfa1ca9dSYoshinobu Inoue  */
34cfa1ca9dSYoshinobu Inoue 
354b421e2dSMike Silbersack #include <sys/cdefs.h>
364b421e2dSMike Silbersack __FBSDID("$FreeBSD$");
374b421e2dSMike Silbersack 
38686cdd19SJun-ichiro itojun Hagino #include "opt_inet.h"
39cfa1ca9dSYoshinobu Inoue #include "opt_inet6.h"
40cfa1ca9dSYoshinobu Inoue 
41cfa1ca9dSYoshinobu Inoue #include <sys/param.h>
42cfa1ca9dSYoshinobu Inoue #include <sys/systm.h>
43b941bc1dSAndrey V. Elsukov #include <sys/jail.h>
44cfa1ca9dSYoshinobu Inoue #include <sys/socket.h>
45cfa1ca9dSYoshinobu Inoue #include <sys/sockio.h>
46cfa1ca9dSYoshinobu Inoue #include <sys/mbuf.h>
47cfa1ca9dSYoshinobu Inoue #include <sys/errno.h>
48cfa1ca9dSYoshinobu Inoue #include <sys/kernel.h>
49cfa1ca9dSYoshinobu Inoue #include <sys/sysctl.h>
50686cdd19SJun-ichiro itojun Hagino #include <sys/malloc.h>
516573d758SMatt Macy #include <sys/proc.h>
52cfa1ca9dSYoshinobu Inoue 
53b941bc1dSAndrey V. Elsukov #include <net/ethernet.h>
54cfa1ca9dSYoshinobu Inoue #include <net/if.h>
5576039bc8SGleb Smirnoff #include <net/if_var.h>
56cfa1ca9dSYoshinobu Inoue #include <net/route.h>
57530c0060SRobert Watson #include <net/vnet.h>
58cfa1ca9dSYoshinobu Inoue 
59cfa1ca9dSYoshinobu Inoue #include <netinet/in.h>
60cfa1ca9dSYoshinobu Inoue #include <netinet/in_systm.h>
61cfa1ca9dSYoshinobu Inoue #include <netinet/ip.h>
626a800098SYoshinobu Inoue #include <netinet/ip_var.h>
63686cdd19SJun-ichiro itojun Hagino #include <netinet/in_var.h>
64686cdd19SJun-ichiro itojun Hagino #include <netinet/ip_encap.h>
656a800098SYoshinobu Inoue #include <netinet/ip_ecn.h>
6665ff3638SAlexander V. Chernikov #include <netinet/in_fib.h>
67686cdd19SJun-ichiro itojun Hagino 
686a800098SYoshinobu Inoue #ifdef INET6
69686cdd19SJun-ichiro itojun Hagino #include <netinet/ip6.h>
706a800098SYoshinobu Inoue #endif
71cfa1ca9dSYoshinobu Inoue 
72cfa1ca9dSYoshinobu Inoue #include <net/if_gif.h>
73cfa1ca9dSYoshinobu Inoue 
74132c4490SAndrey V. Elsukov #define GIF_TTL		30
755f901c92SAndrew Turner VNET_DEFINE_STATIC(int, ip_gif_ttl) = GIF_TTL;
7682cea7e6SBjoern A. Zeeb #define	V_ip_gif_ttl		VNET(ip_gif_ttl)
776df8a710SGleb Smirnoff SYSCTL_INT(_net_inet_ip, IPCTL_GIF_TTL, gifttl, CTLFLAG_VNET | CTLFLAG_RW,
786d8fdfa9SAndrey V. Elsukov     &VNET_NAME(ip_gif_ttl), 0, "Default TTL value for encapsulated packets");
79cfa1ca9dSYoshinobu Inoue 
80b941bc1dSAndrey V. Elsukov /*
81b941bc1dSAndrey V. Elsukov  * We keep interfaces in a hash table using src+dst as key.
82b941bc1dSAndrey V. Elsukov  * Interfaces with GIF_IGNORE_SOURCE flag are linked into plain list.
83b941bc1dSAndrey V. Elsukov  */
845f901c92SAndrew Turner VNET_DEFINE_STATIC(struct gif_list *, ipv4_hashtbl) = NULL;
85*009d82eeSAndrey V. Elsukov VNET_DEFINE_STATIC(struct gif_list *, ipv4_srchashtbl) = NULL;
865f901c92SAndrew Turner VNET_DEFINE_STATIC(struct gif_list, ipv4_list) = CK_LIST_HEAD_INITIALIZER();
87b941bc1dSAndrey V. Elsukov #define	V_ipv4_hashtbl		VNET(ipv4_hashtbl)
88*009d82eeSAndrey V. Elsukov #define	V_ipv4_srchashtbl	VNET(ipv4_srchashtbl)
89b941bc1dSAndrey V. Elsukov #define	V_ipv4_list		VNET(ipv4_list)
90b941bc1dSAndrey V. Elsukov 
91b941bc1dSAndrey V. Elsukov #define	GIF_HASH(src, dst)	(V_ipv4_hashtbl[\
92b941bc1dSAndrey V. Elsukov     in_gif_hashval((src), (dst)) & (GIF_HASH_SIZE - 1)])
93*009d82eeSAndrey V. Elsukov #define	GIF_SRCHASH(src)	(V_ipv4_srchashtbl[\
94*009d82eeSAndrey V. Elsukov     fnv_32_buf(&(src), sizeof(src), FNV1_32_INIT) & (GIF_HASH_SIZE - 1)])
95b941bc1dSAndrey V. Elsukov #define	GIF_HASH_SC(sc)		GIF_HASH((sc)->gif_iphdr->ip_src.s_addr,\
96b941bc1dSAndrey V. Elsukov     (sc)->gif_iphdr->ip_dst.s_addr)
97b941bc1dSAndrey V. Elsukov static uint32_t
98b941bc1dSAndrey V. Elsukov in_gif_hashval(in_addr_t src, in_addr_t dst)
99b941bc1dSAndrey V. Elsukov {
100b941bc1dSAndrey V. Elsukov 	uint32_t ret;
101b941bc1dSAndrey V. Elsukov 
102b941bc1dSAndrey V. Elsukov 	ret = fnv_32_buf(&src, sizeof(src), FNV1_32_INIT);
103b941bc1dSAndrey V. Elsukov 	return (fnv_32_buf(&dst, sizeof(dst), ret));
104b941bc1dSAndrey V. Elsukov }
105b941bc1dSAndrey V. Elsukov 
106b941bc1dSAndrey V. Elsukov static int
107b941bc1dSAndrey V. Elsukov in_gif_checkdup(const struct gif_softc *sc, in_addr_t src, in_addr_t dst)
108b941bc1dSAndrey V. Elsukov {
109b941bc1dSAndrey V. Elsukov 	struct gif_softc *tmp;
110b941bc1dSAndrey V. Elsukov 
111b941bc1dSAndrey V. Elsukov 	if (sc->gif_family == AF_INET &&
112b941bc1dSAndrey V. Elsukov 	    sc->gif_iphdr->ip_src.s_addr == src &&
113b941bc1dSAndrey V. Elsukov 	    sc->gif_iphdr->ip_dst.s_addr == dst)
114b941bc1dSAndrey V. Elsukov 		return (EEXIST);
115b941bc1dSAndrey V. Elsukov 
116b941bc1dSAndrey V. Elsukov 	CK_LIST_FOREACH(tmp, &GIF_HASH(src, dst), chain) {
117b941bc1dSAndrey V. Elsukov 		if (tmp == sc)
118b941bc1dSAndrey V. Elsukov 			continue;
119b941bc1dSAndrey V. Elsukov 		if (tmp->gif_iphdr->ip_src.s_addr == src &&
120b941bc1dSAndrey V. Elsukov 		    tmp->gif_iphdr->ip_dst.s_addr == dst)
121b941bc1dSAndrey V. Elsukov 			return (EADDRNOTAVAIL);
122b941bc1dSAndrey V. Elsukov 	}
123b941bc1dSAndrey V. Elsukov 	return (0);
124b941bc1dSAndrey V. Elsukov }
125b941bc1dSAndrey V. Elsukov 
126*009d82eeSAndrey V. Elsukov /*
127*009d82eeSAndrey V. Elsukov  * Check that ingress address belongs to local host.
128*009d82eeSAndrey V. Elsukov  */
129*009d82eeSAndrey V. Elsukov static void
130*009d82eeSAndrey V. Elsukov in_gif_set_running(struct gif_softc *sc)
131*009d82eeSAndrey V. Elsukov {
132*009d82eeSAndrey V. Elsukov 
133*009d82eeSAndrey V. Elsukov 	if (in_localip(sc->gif_iphdr->ip_src))
134*009d82eeSAndrey V. Elsukov 		GIF2IFP(sc)->if_drv_flags |= IFF_DRV_RUNNING;
135*009d82eeSAndrey V. Elsukov 	else
136*009d82eeSAndrey V. Elsukov 		GIF2IFP(sc)->if_drv_flags &= ~IFF_DRV_RUNNING;
137*009d82eeSAndrey V. Elsukov }
138*009d82eeSAndrey V. Elsukov 
139*009d82eeSAndrey V. Elsukov /*
140*009d82eeSAndrey V. Elsukov  * ifaddr_event handler.
141*009d82eeSAndrey V. Elsukov  * Clear IFF_DRV_RUNNING flag when ingress address disappears to prevent
142*009d82eeSAndrey V. Elsukov  * source address spoofing.
143*009d82eeSAndrey V. Elsukov  */
144*009d82eeSAndrey V. Elsukov static void
145*009d82eeSAndrey V. Elsukov in_gif_srcaddr(void *arg __unused, const struct sockaddr *sa,
146*009d82eeSAndrey V. Elsukov     int event __unused)
147*009d82eeSAndrey V. Elsukov {
148*009d82eeSAndrey V. Elsukov 	const struct sockaddr_in *sin;
149*009d82eeSAndrey V. Elsukov 	struct gif_softc *sc;
150*009d82eeSAndrey V. Elsukov 
151*009d82eeSAndrey V. Elsukov 	if (V_ipv4_srchashtbl == NULL)
152*009d82eeSAndrey V. Elsukov 		return;
153*009d82eeSAndrey V. Elsukov 
154*009d82eeSAndrey V. Elsukov 	MPASS(in_epoch(net_epoch_preempt));
155*009d82eeSAndrey V. Elsukov 	sin = (const struct sockaddr_in *)sa;
156*009d82eeSAndrey V. Elsukov 	CK_LIST_FOREACH(sc, &GIF_SRCHASH(sin->sin_addr.s_addr), srchash) {
157*009d82eeSAndrey V. Elsukov 		if (sc->gif_iphdr->ip_src.s_addr != sin->sin_addr.s_addr)
158*009d82eeSAndrey V. Elsukov 			continue;
159*009d82eeSAndrey V. Elsukov 		in_gif_set_running(sc);
160*009d82eeSAndrey V. Elsukov 	}
161*009d82eeSAndrey V. Elsukov }
162*009d82eeSAndrey V. Elsukov 
163b941bc1dSAndrey V. Elsukov static void
164b941bc1dSAndrey V. Elsukov in_gif_attach(struct gif_softc *sc)
165b941bc1dSAndrey V. Elsukov {
166b941bc1dSAndrey V. Elsukov 
167b941bc1dSAndrey V. Elsukov 	if (sc->gif_options & GIF_IGNORE_SOURCE)
168b941bc1dSAndrey V. Elsukov 		CK_LIST_INSERT_HEAD(&V_ipv4_list, sc, chain);
169b941bc1dSAndrey V. Elsukov 	else
170b941bc1dSAndrey V. Elsukov 		CK_LIST_INSERT_HEAD(&GIF_HASH_SC(sc), sc, chain);
171*009d82eeSAndrey V. Elsukov 
172*009d82eeSAndrey V. Elsukov 	CK_LIST_INSERT_HEAD(&GIF_SRCHASH(sc->gif_iphdr->ip_src.s_addr),
173*009d82eeSAndrey V. Elsukov 	    sc, srchash);
174b941bc1dSAndrey V. Elsukov }
175b941bc1dSAndrey V. Elsukov 
176b941bc1dSAndrey V. Elsukov int
177b941bc1dSAndrey V. Elsukov in_gif_setopts(struct gif_softc *sc, u_int options)
178b941bc1dSAndrey V. Elsukov {
179b941bc1dSAndrey V. Elsukov 
180b941bc1dSAndrey V. Elsukov 	/* NOTE: we are protected with gif_ioctl_sx lock */
181b941bc1dSAndrey V. Elsukov 	MPASS(sc->gif_family == AF_INET);
182b941bc1dSAndrey V. Elsukov 	MPASS(sc->gif_options != options);
183b941bc1dSAndrey V. Elsukov 
184b941bc1dSAndrey V. Elsukov 	if ((options & GIF_IGNORE_SOURCE) !=
185b941bc1dSAndrey V. Elsukov 	    (sc->gif_options & GIF_IGNORE_SOURCE)) {
186*009d82eeSAndrey V. Elsukov 		CK_LIST_REMOVE(sc, srchash);
187b941bc1dSAndrey V. Elsukov 		CK_LIST_REMOVE(sc, chain);
188b941bc1dSAndrey V. Elsukov 		sc->gif_options = options;
189b941bc1dSAndrey V. Elsukov 		in_gif_attach(sc);
190b941bc1dSAndrey V. Elsukov 	}
191b941bc1dSAndrey V. Elsukov 	return (0);
192b941bc1dSAndrey V. Elsukov }
193b941bc1dSAndrey V. Elsukov 
194b941bc1dSAndrey V. Elsukov int
195b941bc1dSAndrey V. Elsukov in_gif_ioctl(struct gif_softc *sc, u_long cmd, caddr_t data)
196b941bc1dSAndrey V. Elsukov {
197b941bc1dSAndrey V. Elsukov 	struct ifreq *ifr = (struct ifreq *)data;
198b941bc1dSAndrey V. Elsukov 	struct sockaddr_in *dst, *src;
199b941bc1dSAndrey V. Elsukov 	struct ip *ip;
200b941bc1dSAndrey V. Elsukov 	int error;
201b941bc1dSAndrey V. Elsukov 
202b941bc1dSAndrey V. Elsukov 	/* NOTE: we are protected with gif_ioctl_sx lock */
203b941bc1dSAndrey V. Elsukov 	error = EINVAL;
204b941bc1dSAndrey V. Elsukov 	switch (cmd) {
205b941bc1dSAndrey V. Elsukov 	case SIOCSIFPHYADDR:
206b941bc1dSAndrey V. Elsukov 		src = &((struct in_aliasreq *)data)->ifra_addr;
207b941bc1dSAndrey V. Elsukov 		dst = &((struct in_aliasreq *)data)->ifra_dstaddr;
208b941bc1dSAndrey V. Elsukov 
209b941bc1dSAndrey V. Elsukov 		/* sanity checks */
210b941bc1dSAndrey V. Elsukov 		if (src->sin_family != dst->sin_family ||
211b941bc1dSAndrey V. Elsukov 		    src->sin_family != AF_INET ||
212b941bc1dSAndrey V. Elsukov 		    src->sin_len != dst->sin_len ||
213b941bc1dSAndrey V. Elsukov 		    src->sin_len != sizeof(*src))
214b941bc1dSAndrey V. Elsukov 			break;
215b941bc1dSAndrey V. Elsukov 		if (src->sin_addr.s_addr == INADDR_ANY ||
216b941bc1dSAndrey V. Elsukov 		    dst->sin_addr.s_addr == INADDR_ANY) {
217b941bc1dSAndrey V. Elsukov 			error = EADDRNOTAVAIL;
218b941bc1dSAndrey V. Elsukov 			break;
219b941bc1dSAndrey V. Elsukov 		}
220*009d82eeSAndrey V. Elsukov 		if (V_ipv4_hashtbl == NULL) {
221b941bc1dSAndrey V. Elsukov 			V_ipv4_hashtbl = gif_hashinit();
222*009d82eeSAndrey V. Elsukov 			V_ipv4_srchashtbl = gif_hashinit();
223*009d82eeSAndrey V. Elsukov 		}
224b941bc1dSAndrey V. Elsukov 		error = in_gif_checkdup(sc, src->sin_addr.s_addr,
225b941bc1dSAndrey V. Elsukov 		    dst->sin_addr.s_addr);
226b941bc1dSAndrey V. Elsukov 		if (error == EADDRNOTAVAIL)
227b941bc1dSAndrey V. Elsukov 			break;
228b941bc1dSAndrey V. Elsukov 		if (error == EEXIST) {
229b941bc1dSAndrey V. Elsukov 			/* Addresses are the same. Just return. */
230b941bc1dSAndrey V. Elsukov 			error = 0;
231b941bc1dSAndrey V. Elsukov 			break;
232b941bc1dSAndrey V. Elsukov 		}
233b941bc1dSAndrey V. Elsukov 		ip = malloc(sizeof(*ip), M_GIF, M_WAITOK | M_ZERO);
234b941bc1dSAndrey V. Elsukov 		ip->ip_src.s_addr = src->sin_addr.s_addr;
235b941bc1dSAndrey V. Elsukov 		ip->ip_dst.s_addr = dst->sin_addr.s_addr;
236b941bc1dSAndrey V. Elsukov 		if (sc->gif_family != 0) {
237b941bc1dSAndrey V. Elsukov 			/* Detach existing tunnel first */
238*009d82eeSAndrey V. Elsukov 			CK_LIST_REMOVE(sc, srchash);
239b941bc1dSAndrey V. Elsukov 			CK_LIST_REMOVE(sc, chain);
240b941bc1dSAndrey V. Elsukov 			GIF_WAIT();
241b941bc1dSAndrey V. Elsukov 			free(sc->gif_hdr, M_GIF);
242b941bc1dSAndrey V. Elsukov 			/* XXX: should we notify about link state change? */
243b941bc1dSAndrey V. Elsukov 		}
244b941bc1dSAndrey V. Elsukov 		sc->gif_family = AF_INET;
245b941bc1dSAndrey V. Elsukov 		sc->gif_iphdr = ip;
246b941bc1dSAndrey V. Elsukov 		in_gif_attach(sc);
247*009d82eeSAndrey V. Elsukov 		in_gif_set_running(sc);
248b941bc1dSAndrey V. Elsukov 		break;
249b941bc1dSAndrey V. Elsukov 	case SIOCGIFPSRCADDR:
250b941bc1dSAndrey V. Elsukov 	case SIOCGIFPDSTADDR:
251b941bc1dSAndrey V. Elsukov 		if (sc->gif_family != AF_INET) {
252b941bc1dSAndrey V. Elsukov 			error = EADDRNOTAVAIL;
253b941bc1dSAndrey V. Elsukov 			break;
254b941bc1dSAndrey V. Elsukov 		}
255b941bc1dSAndrey V. Elsukov 		src = (struct sockaddr_in *)&ifr->ifr_addr;
256b941bc1dSAndrey V. Elsukov 		memset(src, 0, sizeof(*src));
257b941bc1dSAndrey V. Elsukov 		src->sin_family = AF_INET;
258b941bc1dSAndrey V. Elsukov 		src->sin_len = sizeof(*src);
259b941bc1dSAndrey V. Elsukov 		src->sin_addr = (cmd == SIOCGIFPSRCADDR) ?
260b941bc1dSAndrey V. Elsukov 		    sc->gif_iphdr->ip_src: sc->gif_iphdr->ip_dst;
261b941bc1dSAndrey V. Elsukov 		error = prison_if(curthread->td_ucred, (struct sockaddr *)src);
262b941bc1dSAndrey V. Elsukov 		if (error != 0)
263b941bc1dSAndrey V. Elsukov 			memset(src, 0, sizeof(*src));
264b941bc1dSAndrey V. Elsukov 		break;
265b941bc1dSAndrey V. Elsukov 	}
266b941bc1dSAndrey V. Elsukov 	return (error);
267b941bc1dSAndrey V. Elsukov }
268b941bc1dSAndrey V. Elsukov 
269cfa1ca9dSYoshinobu Inoue int
2700b9f5f8aSAndrey V. Elsukov in_gif_output(struct ifnet *ifp, struct mbuf *m, int proto, uint8_t ecn)
271cfa1ca9dSYoshinobu Inoue {
272fc74a9f9SBrooks Davis 	struct gif_softc *sc = ifp->if_softc;
273cfa1ca9dSYoshinobu Inoue 	struct ip *ip;
2740b9f5f8aSAndrey V. Elsukov 	int len;
275cfa1ca9dSYoshinobu Inoue 
276cfa1ca9dSYoshinobu Inoue 	/* prepend new IP header */
2776573d758SMatt Macy 	MPASS(in_epoch(net_epoch_preempt));
278c89c8a10SMarius Strobl 	len = sizeof(struct ip);
279c89c8a10SMarius Strobl #ifndef __NO_STRICT_ALIGNMENT
2800b9f5f8aSAndrey V. Elsukov 	if (proto == IPPROTO_ETHERIP)
281c89c8a10SMarius Strobl 		len += ETHERIP_ALIGN;
282c89c8a10SMarius Strobl #endif
283eb1b1807SGleb Smirnoff 	M_PREPEND(m, len, M_NOWAIT);
2840b9f5f8aSAndrey V. Elsukov 	if (m == NULL)
2850b9f5f8aSAndrey V. Elsukov 		return (ENOBUFS);
286c89c8a10SMarius Strobl #ifndef __NO_STRICT_ALIGNMENT
2870b9f5f8aSAndrey V. Elsukov 	if (proto == IPPROTO_ETHERIP) {
288c89c8a10SMarius Strobl 		len = mtod(m, vm_offset_t) & 3;
289c89c8a10SMarius Strobl 		KASSERT(len == 0 || len == ETHERIP_ALIGN,
290c89c8a10SMarius Strobl 		    ("in_gif_output: unexpected misalignment"));
291c89c8a10SMarius Strobl 		m->m_data += len;
292c89c8a10SMarius Strobl 		m->m_len -= ETHERIP_ALIGN;
293c89c8a10SMarius Strobl 	}
294c89c8a10SMarius Strobl #endif
2950b9f5f8aSAndrey V. Elsukov 	ip = mtod(m, struct ip *);
296686cdd19SJun-ichiro itojun Hagino 
297b941bc1dSAndrey V. Elsukov 	MPASS(sc->gif_family == AF_INET);
298b941bc1dSAndrey V. Elsukov 	bcopy(sc->gif_iphdr, ip, sizeof(struct ip));
2990b9f5f8aSAndrey V. Elsukov 	ip->ip_p = proto;
3000b9f5f8aSAndrey V. Elsukov 	/* version will be set in ip_output() */
3010b9f5f8aSAndrey V. Elsukov 	ip->ip_ttl = V_ip_gif_ttl;
3020b9f5f8aSAndrey V. Elsukov 	ip->ip_len = htons(m->m_pkthdr.len);
3030b9f5f8aSAndrey V. Elsukov 	ip->ip_tos = ecn;
304cfa1ca9dSYoshinobu Inoue 
3050b9f5f8aSAndrey V. Elsukov 	return (ip_output(m, NULL, NULL, 0, NULL, NULL));
306cfa1ca9dSYoshinobu Inoue }
307cfa1ca9dSYoshinobu Inoue 
308132c4490SAndrey V. Elsukov static int
3096d8fdfa9SAndrey V. Elsukov in_gif_input(struct mbuf *m, int off, int proto, void *arg)
310cfa1ca9dSYoshinobu Inoue {
3116d8fdfa9SAndrey V. Elsukov 	struct gif_softc *sc = arg;
3120b9f5f8aSAndrey V. Elsukov 	struct ifnet *gifp;
313cfa1ca9dSYoshinobu Inoue 	struct ip *ip;
3140b9f5f8aSAndrey V. Elsukov 	uint8_t ecn;
315cfa1ca9dSYoshinobu Inoue 
3166573d758SMatt Macy 	MPASS(in_epoch(net_epoch_preempt));
31767df9f38SBjoern A. Zeeb 	if (sc == NULL) {
31867df9f38SBjoern A. Zeeb 		m_freem(m);
319315e3e38SRobert Watson 		KMOD_IPSTAT_INC(ips_nogif);
3208f5a8818SKevin Lo 		return (IPPROTO_DONE);
32167df9f38SBjoern A. Zeeb 	}
32267df9f38SBjoern A. Zeeb 	gifp = GIF2IFP(sc);
3230b9f5f8aSAndrey V. Elsukov 	if ((gifp->if_flags & IFF_UP) != 0) {
324cfa1ca9dSYoshinobu Inoue 		ip = mtod(m, struct ip *);
3250b9f5f8aSAndrey V. Elsukov 		ecn = ip->ip_tos;
3266d8fdfa9SAndrey V. Elsukov 		m_adj(m, off);
3270b9f5f8aSAndrey V. Elsukov 		gif_input(m, gifp, proto, ecn);
3280b9f5f8aSAndrey V. Elsukov 	} else {
32959dfcba4SHajimu UMEMOTO 		m_freem(m);
330315e3e38SRobert Watson 		KMOD_IPSTAT_INC(ips_nogif);
331cfa1ca9dSYoshinobu Inoue 	}
3328f5a8818SKevin Lo 	return (IPPROTO_DONE);
333cfa1ca9dSYoshinobu Inoue }
334686cdd19SJun-ichiro itojun Hagino 
335b941bc1dSAndrey V. Elsukov static int
336b941bc1dSAndrey V. Elsukov in_gif_lookup(const struct mbuf *m, int off, int proto, void **arg)
3379426aedfSHajimu UMEMOTO {
33810a0e0bfSAndrey V. Elsukov 	const struct ip *ip;
33910a0e0bfSAndrey V. Elsukov 	struct gif_softc *sc;
340c1b4f79dSAndrey V. Elsukov 	int ret;
341686cdd19SJun-ichiro itojun Hagino 
3426e081509SAndrey V. Elsukov 	if (V_ipv4_hashtbl == NULL)
3436e081509SAndrey V. Elsukov 		return (0);
3446e081509SAndrey V. Elsukov 
3456573d758SMatt Macy 	MPASS(in_epoch(net_epoch_preempt));
34610a0e0bfSAndrey V. Elsukov 	ip = mtod(m, const struct ip *);
347b941bc1dSAndrey V. Elsukov 	/*
348b941bc1dSAndrey V. Elsukov 	 * NOTE: it is safe to iterate without any locking here, because softc
349b941bc1dSAndrey V. Elsukov 	 * can be reclaimed only when we are not within net_epoch_preempt
350b941bc1dSAndrey V. Elsukov 	 * section, but ip_encap lookup+input are executed in epoch section.
351b941bc1dSAndrey V. Elsukov 	 */
352b941bc1dSAndrey V. Elsukov 	ret = 0;
353b941bc1dSAndrey V. Elsukov 	CK_LIST_FOREACH(sc, &GIF_HASH(ip->ip_dst.s_addr,
354b941bc1dSAndrey V. Elsukov 	    ip->ip_src.s_addr), chain) {
355b941bc1dSAndrey V. Elsukov 		/*
356b941bc1dSAndrey V. Elsukov 		 * This is an inbound packet, its ip_dst is source address
357b941bc1dSAndrey V. Elsukov 		 * in softc.
358b941bc1dSAndrey V. Elsukov 		 */
359b941bc1dSAndrey V. Elsukov 		if (sc->gif_iphdr->ip_src.s_addr == ip->ip_dst.s_addr &&
360b941bc1dSAndrey V. Elsukov 		    sc->gif_iphdr->ip_dst.s_addr == ip->ip_src.s_addr) {
361b941bc1dSAndrey V. Elsukov 			ret = ENCAP_DRV_LOOKUP;
362b941bc1dSAndrey V. Elsukov 			goto done;
363b941bc1dSAndrey V. Elsukov 		}
364b941bc1dSAndrey V. Elsukov 	}
365b941bc1dSAndrey V. Elsukov 	/*
366b941bc1dSAndrey V. Elsukov 	 * No exact match.
367b941bc1dSAndrey V. Elsukov 	 * Check the list of interfaces with GIF_IGNORE_SOURCE flag.
368b941bc1dSAndrey V. Elsukov 	 */
369b941bc1dSAndrey V. Elsukov 	CK_LIST_FOREACH(sc, &V_ipv4_list, chain) {
370b941bc1dSAndrey V. Elsukov 		if (sc->gif_iphdr->ip_src.s_addr == ip->ip_dst.s_addr) {
3716d8fdfa9SAndrey V. Elsukov 			ret = 32 + 8; /* src + proto */
372b941bc1dSAndrey V. Elsukov 			goto done;
373b941bc1dSAndrey V. Elsukov 		}
374b941bc1dSAndrey V. Elsukov 	}
375c1b4f79dSAndrey V. Elsukov 	return (0);
376b941bc1dSAndrey V. Elsukov done:
377b941bc1dSAndrey V. Elsukov 	if ((GIF2IFP(sc)->if_flags & IFF_UP) == 0)
378b941bc1dSAndrey V. Elsukov 		return (0);
379686cdd19SJun-ichiro itojun Hagino 	/* ingress filters on outer source */
38010a0e0bfSAndrey V. Elsukov 	if ((GIF2IFP(sc)->if_flags & IFF_LINK2) == 0) {
38165ff3638SAlexander V. Chernikov 		struct nhop4_basic nh4;
38265ff3638SAlexander V. Chernikov 		struct in_addr dst;
383686cdd19SJun-ichiro itojun Hagino 
38465ff3638SAlexander V. Chernikov 		dst = ip->ip_src;
38565ff3638SAlexander V. Chernikov 		if (fib4_lookup_nh_basic(sc->gif_fibnum, dst, 0, 0, &nh4) != 0)
3860b9f5f8aSAndrey V. Elsukov 			return (0);
38765ff3638SAlexander V. Chernikov 		if (nh4.nh_ifp != m->m_pkthdr.rcvif)
38865ff3638SAlexander V. Chernikov 			return (0);
389686cdd19SJun-ichiro itojun Hagino 	}
390b941bc1dSAndrey V. Elsukov 	*arg = sc;
391c1b4f79dSAndrey V. Elsukov 	return (ret);
392686cdd19SJun-ichiro itojun Hagino }
3939426aedfSHajimu UMEMOTO 
394*009d82eeSAndrey V. Elsukov static const struct srcaddrtab *ipv4_srcaddrtab;
395b941bc1dSAndrey V. Elsukov static struct {
396b941bc1dSAndrey V. Elsukov 	const struct encap_config encap;
397b941bc1dSAndrey V. Elsukov 	const struct encaptab *cookie;
398b941bc1dSAndrey V. Elsukov } ipv4_encap_cfg[] = {
399b941bc1dSAndrey V. Elsukov 	{
400b941bc1dSAndrey V. Elsukov 		.encap = {
401b941bc1dSAndrey V. Elsukov 			.proto = IPPROTO_IPV4,
402b941bc1dSAndrey V. Elsukov 			.min_length = 2 * sizeof(struct ip),
403b941bc1dSAndrey V. Elsukov 			.exact_match = ENCAP_DRV_LOOKUP,
404b941bc1dSAndrey V. Elsukov 			.lookup = in_gif_lookup,
4056d8fdfa9SAndrey V. Elsukov 			.input = in_gif_input
406b941bc1dSAndrey V. Elsukov 		},
407b941bc1dSAndrey V. Elsukov 	},
408b941bc1dSAndrey V. Elsukov #ifdef INET6
409b941bc1dSAndrey V. Elsukov 	{
410b941bc1dSAndrey V. Elsukov 		.encap = {
411b941bc1dSAndrey V. Elsukov 			.proto = IPPROTO_IPV6,
412b941bc1dSAndrey V. Elsukov 			.min_length = sizeof(struct ip) +
413b941bc1dSAndrey V. Elsukov 			    sizeof(struct ip6_hdr),
414b941bc1dSAndrey V. Elsukov 			.exact_match = ENCAP_DRV_LOOKUP,
415b941bc1dSAndrey V. Elsukov 			.lookup = in_gif_lookup,
416b941bc1dSAndrey V. Elsukov 			.input = in_gif_input
417b941bc1dSAndrey V. Elsukov 		},
418b941bc1dSAndrey V. Elsukov 	},
419b941bc1dSAndrey V. Elsukov #endif
420b941bc1dSAndrey V. Elsukov 	{
421b941bc1dSAndrey V. Elsukov 		.encap = {
422b941bc1dSAndrey V. Elsukov 			.proto = IPPROTO_ETHERIP,
423b941bc1dSAndrey V. Elsukov 			.min_length = sizeof(struct ip) +
424b941bc1dSAndrey V. Elsukov 			    sizeof(struct etherip_header) +
425b941bc1dSAndrey V. Elsukov 			    sizeof(struct ether_header),
426b941bc1dSAndrey V. Elsukov 			.exact_match = ENCAP_DRV_LOOKUP,
427b941bc1dSAndrey V. Elsukov 			.lookup = in_gif_lookup,
428b941bc1dSAndrey V. Elsukov 			.input = in_gif_input
429b941bc1dSAndrey V. Elsukov 		},
430b941bc1dSAndrey V. Elsukov 	}
4316d8fdfa9SAndrey V. Elsukov };
4326d8fdfa9SAndrey V. Elsukov 
433b941bc1dSAndrey V. Elsukov void
434b941bc1dSAndrey V. Elsukov in_gif_init(void)
4359426aedfSHajimu UMEMOTO {
436b941bc1dSAndrey V. Elsukov 	int i;
4370b9f5f8aSAndrey V. Elsukov 
438b941bc1dSAndrey V. Elsukov 	if (!IS_DEFAULT_VNET(curvnet))
439b941bc1dSAndrey V. Elsukov 		return;
440*009d82eeSAndrey V. Elsukov 
441*009d82eeSAndrey V. Elsukov 	ipv4_srcaddrtab = ip_encap_register_srcaddr(in_gif_srcaddr,
442*009d82eeSAndrey V. Elsukov 	    NULL, M_WAITOK);
443b941bc1dSAndrey V. Elsukov 	for (i = 0; i < nitems(ipv4_encap_cfg); i++)
444b941bc1dSAndrey V. Elsukov 		ipv4_encap_cfg[i].cookie = ip_encap_attach(
445b941bc1dSAndrey V. Elsukov 		    &ipv4_encap_cfg[i].encap, NULL, M_WAITOK);
4469426aedfSHajimu UMEMOTO }
447b941bc1dSAndrey V. Elsukov 
448b941bc1dSAndrey V. Elsukov void
449b941bc1dSAndrey V. Elsukov in_gif_uninit(void)
450b941bc1dSAndrey V. Elsukov {
451b941bc1dSAndrey V. Elsukov 	int i;
452b941bc1dSAndrey V. Elsukov 
453b941bc1dSAndrey V. Elsukov 	if (IS_DEFAULT_VNET(curvnet)) {
454b941bc1dSAndrey V. Elsukov 		for (i = 0; i < nitems(ipv4_encap_cfg); i++)
455b941bc1dSAndrey V. Elsukov 			ip_encap_detach(ipv4_encap_cfg[i].cookie);
456*009d82eeSAndrey V. Elsukov 		ip_encap_unregister_srcaddr(ipv4_srcaddrtab);
457b941bc1dSAndrey V. Elsukov 	}
458*009d82eeSAndrey V. Elsukov 	if (V_ipv4_hashtbl != NULL) {
459b941bc1dSAndrey V. Elsukov 		gif_hashdestroy(V_ipv4_hashtbl);
460*009d82eeSAndrey V. Elsukov 		gif_hashdestroy(V_ipv4_srchashtbl);
461*009d82eeSAndrey V. Elsukov 	}
462b941bc1dSAndrey V. Elsukov }
463b941bc1dSAndrey V. Elsukov 
464