1f325335cSAndrey V. Elsukov /*- 22addcba7SAndrey V. Elsukov * Copyright (c) 2014, 2018 Andrey V. Elsukov <ae@FreeBSD.org> 3f325335cSAndrey V. Elsukov * All rights reserved. 4f325335cSAndrey V. Elsukov * 5f325335cSAndrey V. Elsukov * Redistribution and use in source and binary forms, with or without 6f325335cSAndrey V. Elsukov * modification, are permitted provided that the following conditions 7f325335cSAndrey V. Elsukov * are met: 8f325335cSAndrey V. Elsukov * 9f325335cSAndrey V. Elsukov * 1. Redistributions of source code must retain the above copyright 10f325335cSAndrey V. Elsukov * notice, this list of conditions and the following disclaimer. 11f325335cSAndrey V. Elsukov * 2. Redistributions in binary form must reproduce the above copyright 12f325335cSAndrey V. Elsukov * notice, this list of conditions and the following disclaimer in the 13f325335cSAndrey V. Elsukov * documentation and/or other materials provided with the distribution. 14f325335cSAndrey V. Elsukov * 15f325335cSAndrey V. Elsukov * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 16f325335cSAndrey V. Elsukov * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 17f325335cSAndrey V. Elsukov * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 18f325335cSAndrey V. Elsukov * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 19f325335cSAndrey V. Elsukov * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 20f325335cSAndrey V. Elsukov * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 21f325335cSAndrey V. Elsukov * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 22f325335cSAndrey V. Elsukov * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 23f325335cSAndrey V. Elsukov * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 24f325335cSAndrey V. Elsukov * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 25f325335cSAndrey V. Elsukov */ 26f325335cSAndrey V. Elsukov 27f325335cSAndrey V. Elsukov #include <sys/cdefs.h> 28f325335cSAndrey V. Elsukov __FBSDID("$FreeBSD$"); 29f325335cSAndrey V. Elsukov 30f325335cSAndrey V. Elsukov #include <sys/param.h> 312addcba7SAndrey V. Elsukov #include <sys/systm.h> 32f325335cSAndrey V. Elsukov #include <sys/jail.h> 33f325335cSAndrey V. Elsukov #include <sys/kernel.h> 34f325335cSAndrey V. Elsukov #include <sys/lock.h> 35f325335cSAndrey V. Elsukov #include <sys/malloc.h> 36f325335cSAndrey V. Elsukov #include <sys/module.h> 37f325335cSAndrey V. Elsukov #include <sys/mbuf.h> 38f325335cSAndrey V. Elsukov #include <sys/priv.h> 39f325335cSAndrey V. Elsukov #include <sys/proc.h> 40f325335cSAndrey V. Elsukov #include <sys/socket.h> 41f325335cSAndrey V. Elsukov #include <sys/sockio.h> 42f325335cSAndrey V. Elsukov #include <sys/sx.h> 43f325335cSAndrey V. Elsukov #include <sys/sysctl.h> 44f325335cSAndrey V. Elsukov #include <sys/syslog.h> 45f325335cSAndrey V. Elsukov 46f325335cSAndrey V. Elsukov #include <net/bpf.h> 47f325335cSAndrey V. Elsukov #include <net/ethernet.h> 48f325335cSAndrey V. Elsukov #include <net/if.h> 49f325335cSAndrey V. Elsukov #include <net/if_var.h> 50f325335cSAndrey V. Elsukov #include <net/if_clone.h> 51f325335cSAndrey V. Elsukov #include <net/if_types.h> 52f325335cSAndrey V. Elsukov #include <net/netisr.h> 53f325335cSAndrey V. Elsukov #include <net/vnet.h> 54eccfe69aSAndrey V. Elsukov #include <net/route.h> 55f325335cSAndrey V. Elsukov 56f325335cSAndrey V. Elsukov #include <netinet/in.h> 57f325335cSAndrey V. Elsukov #include <netinet/in_systm.h> 58f325335cSAndrey V. Elsukov #include <netinet/in_var.h> 59f325335cSAndrey V. Elsukov #include <netinet/ip.h> 60f325335cSAndrey V. Elsukov #include <netinet/ip_var.h> 61f325335cSAndrey V. Elsukov #include <netinet/ip_encap.h> 62f325335cSAndrey V. Elsukov 63f325335cSAndrey V. Elsukov #include <machine/in_cksum.h> 64f325335cSAndrey V. Elsukov #include <security/mac/mac_framework.h> 65f325335cSAndrey V. Elsukov 66c00bf730SAndrey V. Elsukov #define MEMTU (1500 - sizeof(struct mobhdr)) 67f325335cSAndrey V. Elsukov static const char mename[] = "me"; 68f325335cSAndrey V. Elsukov static MALLOC_DEFINE(M_IFME, mename, "Minimal Encapsulation for IP"); 69f325335cSAndrey V. Elsukov /* Minimal forwarding header RFC 2004 */ 70f325335cSAndrey V. Elsukov struct mobhdr { 71f325335cSAndrey V. Elsukov uint8_t mob_proto; /* protocol */ 72f325335cSAndrey V. Elsukov uint8_t mob_flags; /* flags */ 73f325335cSAndrey V. Elsukov #define MOB_FLAGS_SP 0x80 /* source present */ 74f325335cSAndrey V. Elsukov uint16_t mob_csum; /* header checksum */ 75f325335cSAndrey V. Elsukov struct in_addr mob_dst; /* original destination address */ 76f325335cSAndrey V. Elsukov struct in_addr mob_src; /* original source addr (optional) */ 77f325335cSAndrey V. Elsukov } __packed; 78f325335cSAndrey V. Elsukov 79f325335cSAndrey V. Elsukov struct me_softc { 80f325335cSAndrey V. Elsukov struct ifnet *me_ifp; 81f325335cSAndrey V. Elsukov u_int me_fibnum; 82f325335cSAndrey V. Elsukov struct in_addr me_src; 83f325335cSAndrey V. Elsukov struct in_addr me_dst; 842addcba7SAndrey V. Elsukov 852addcba7SAndrey V. Elsukov CK_LIST_ENTRY(me_softc) chain; 86f325335cSAndrey V. Elsukov }; 872addcba7SAndrey V. Elsukov CK_LIST_HEAD(me_list, me_softc); 88f325335cSAndrey V. Elsukov #define ME2IFP(sc) ((sc)->me_ifp) 89f325335cSAndrey V. Elsukov #define ME_READY(sc) ((sc)->me_src.s_addr != 0) 906573d758SMatt Macy #define ME_RLOCK() struct epoch_tracker me_et; epoch_enter_preempt(net_epoch_preempt, &me_et) 916573d758SMatt Macy #define ME_RUNLOCK() epoch_exit_preempt(net_epoch_preempt, &me_et) 922addcba7SAndrey V. Elsukov #define ME_WAIT() epoch_wait_preempt(net_epoch_preempt) 93f325335cSAndrey V. Elsukov 942addcba7SAndrey V. Elsukov #ifndef ME_HASH_SIZE 952addcba7SAndrey V. Elsukov #define ME_HASH_SIZE (1 << 4) 962addcba7SAndrey V. Elsukov #endif 972addcba7SAndrey V. Elsukov static VNET_DEFINE(struct me_list *, me_hashtbl) = NULL; 982addcba7SAndrey V. Elsukov #define V_me_hashtbl VNET(me_hashtbl) 992addcba7SAndrey V. Elsukov #define ME_HASH(src, dst) (V_me_hashtbl[\ 1002addcba7SAndrey V. Elsukov me_hashval((src), (dst)) & (ME_HASH_SIZE - 1)]) 101f325335cSAndrey V. Elsukov 102f325335cSAndrey V. Elsukov static struct sx me_ioctl_sx; 103f325335cSAndrey V. Elsukov SX_SYSINIT(me_ioctl_sx, &me_ioctl_sx, "me_ioctl"); 104f325335cSAndrey V. Elsukov 105f325335cSAndrey V. Elsukov static int me_clone_create(struct if_clone *, int, caddr_t); 106f325335cSAndrey V. Elsukov static void me_clone_destroy(struct ifnet *); 107f325335cSAndrey V. Elsukov static VNET_DEFINE(struct if_clone *, me_cloner); 108f325335cSAndrey V. Elsukov #define V_me_cloner VNET(me_cloner) 109f325335cSAndrey V. Elsukov 110f325335cSAndrey V. Elsukov static void me_qflush(struct ifnet *); 111f325335cSAndrey V. Elsukov static int me_transmit(struct ifnet *, struct mbuf *); 112f325335cSAndrey V. Elsukov static int me_ioctl(struct ifnet *, u_long, caddr_t); 113f325335cSAndrey V. Elsukov static int me_output(struct ifnet *, struct mbuf *, 114f325335cSAndrey V. Elsukov const struct sockaddr *, struct route *); 1156d8fdfa9SAndrey V. Elsukov static int me_input(struct mbuf *, int, int, void *); 116f325335cSAndrey V. Elsukov 1172addcba7SAndrey V. Elsukov static int me_set_tunnel(struct me_softc *, in_addr_t, in_addr_t); 1182addcba7SAndrey V. Elsukov static void me_delete_tunnel(struct me_softc *); 119f325335cSAndrey V. Elsukov 120f325335cSAndrey V. Elsukov SYSCTL_DECL(_net_link); 121f325335cSAndrey V. Elsukov static SYSCTL_NODE(_net_link, IFT_TUNNEL, me, CTLFLAG_RW, 0, 122f325335cSAndrey V. Elsukov "Minimal Encapsulation for IP (RFC 2004)"); 123f325335cSAndrey V. Elsukov #ifndef MAX_ME_NEST 124f325335cSAndrey V. Elsukov #define MAX_ME_NEST 1 125f325335cSAndrey V. Elsukov #endif 126f325335cSAndrey V. Elsukov 127f325335cSAndrey V. Elsukov static VNET_DEFINE(int, max_me_nesting) = MAX_ME_NEST; 128f325335cSAndrey V. Elsukov #define V_max_me_nesting VNET(max_me_nesting) 129f325335cSAndrey V. Elsukov SYSCTL_INT(_net_link_me, OID_AUTO, max_nesting, CTLFLAG_RW | CTLFLAG_VNET, 130f325335cSAndrey V. Elsukov &VNET_NAME(max_me_nesting), 0, "Max nested tunnels"); 131f325335cSAndrey V. Elsukov 1322addcba7SAndrey V. Elsukov static uint32_t 1332addcba7SAndrey V. Elsukov me_hashval(in_addr_t src, in_addr_t dst) 1342addcba7SAndrey V. Elsukov { 1352addcba7SAndrey V. Elsukov uint32_t ret; 1362addcba7SAndrey V. Elsukov 1372addcba7SAndrey V. Elsukov ret = fnv_32_buf(&src, sizeof(src), FNV1_32_INIT); 1382addcba7SAndrey V. Elsukov return (fnv_32_buf(&dst, sizeof(dst), ret)); 1392addcba7SAndrey V. Elsukov } 1402addcba7SAndrey V. Elsukov 1412addcba7SAndrey V. Elsukov static struct me_list * 1422addcba7SAndrey V. Elsukov me_hashinit(void) 1432addcba7SAndrey V. Elsukov { 1442addcba7SAndrey V. Elsukov struct me_list *hash; 1452addcba7SAndrey V. Elsukov int i; 1462addcba7SAndrey V. Elsukov 1472addcba7SAndrey V. Elsukov hash = malloc(sizeof(struct me_list) * ME_HASH_SIZE, 1482addcba7SAndrey V. Elsukov M_IFME, M_WAITOK); 1492addcba7SAndrey V. Elsukov for (i = 0; i < ME_HASH_SIZE; i++) 1502addcba7SAndrey V. Elsukov CK_LIST_INIT(&hash[i]); 1512addcba7SAndrey V. Elsukov 1522addcba7SAndrey V. Elsukov return (hash); 1532addcba7SAndrey V. Elsukov } 1542addcba7SAndrey V. Elsukov 155f325335cSAndrey V. Elsukov static void 156f325335cSAndrey V. Elsukov vnet_me_init(const void *unused __unused) 157f325335cSAndrey V. Elsukov { 158f325335cSAndrey V. Elsukov V_me_cloner = if_clone_simple(mename, me_clone_create, 159f325335cSAndrey V. Elsukov me_clone_destroy, 0); 160f325335cSAndrey V. Elsukov } 161f325335cSAndrey V. Elsukov VNET_SYSINIT(vnet_me_init, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_ANY, 162f325335cSAndrey V. Elsukov vnet_me_init, NULL); 163f325335cSAndrey V. Elsukov 164f325335cSAndrey V. Elsukov static void 165f325335cSAndrey V. Elsukov vnet_me_uninit(const void *unused __unused) 166f325335cSAndrey V. Elsukov { 167f325335cSAndrey V. Elsukov 1682addcba7SAndrey V. Elsukov if (V_me_hashtbl != NULL) 1692addcba7SAndrey V. Elsukov free(V_me_hashtbl, M_IFME); 170f325335cSAndrey V. Elsukov if_clone_detach(V_me_cloner); 171f325335cSAndrey V. Elsukov } 172f325335cSAndrey V. Elsukov VNET_SYSUNINIT(vnet_me_uninit, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_ANY, 173f325335cSAndrey V. Elsukov vnet_me_uninit, NULL); 174f325335cSAndrey V. Elsukov 175f325335cSAndrey V. Elsukov static int 176f325335cSAndrey V. Elsukov me_clone_create(struct if_clone *ifc, int unit, caddr_t params) 177f325335cSAndrey V. Elsukov { 178f325335cSAndrey V. Elsukov struct me_softc *sc; 179f325335cSAndrey V. Elsukov 180f325335cSAndrey V. Elsukov sc = malloc(sizeof(struct me_softc), M_IFME, M_WAITOK | M_ZERO); 181f325335cSAndrey V. Elsukov sc->me_fibnum = curthread->td_proc->p_fibnum; 182f325335cSAndrey V. Elsukov ME2IFP(sc) = if_alloc(IFT_TUNNEL); 183f325335cSAndrey V. Elsukov ME2IFP(sc)->if_softc = sc; 184f325335cSAndrey V. Elsukov if_initname(ME2IFP(sc), mename, unit); 185f325335cSAndrey V. Elsukov 186c00bf730SAndrey V. Elsukov ME2IFP(sc)->if_mtu = MEMTU;; 187f325335cSAndrey V. Elsukov ME2IFP(sc)->if_flags = IFF_POINTOPOINT|IFF_MULTICAST; 188f325335cSAndrey V. Elsukov ME2IFP(sc)->if_output = me_output; 189f325335cSAndrey V. Elsukov ME2IFP(sc)->if_ioctl = me_ioctl; 190f325335cSAndrey V. Elsukov ME2IFP(sc)->if_transmit = me_transmit; 191f325335cSAndrey V. Elsukov ME2IFP(sc)->if_qflush = me_qflush; 192f1aaad0cSHiroki Sato ME2IFP(sc)->if_capabilities |= IFCAP_LINKSTATE; 193f1aaad0cSHiroki Sato ME2IFP(sc)->if_capenable |= IFCAP_LINKSTATE; 194f325335cSAndrey V. Elsukov if_attach(ME2IFP(sc)); 195f325335cSAndrey V. Elsukov bpfattach(ME2IFP(sc), DLT_NULL, sizeof(u_int32_t)); 196f325335cSAndrey V. Elsukov return (0); 197f325335cSAndrey V. Elsukov } 198f325335cSAndrey V. Elsukov 199f325335cSAndrey V. Elsukov static void 200f325335cSAndrey V. Elsukov me_clone_destroy(struct ifnet *ifp) 201f325335cSAndrey V. Elsukov { 202f325335cSAndrey V. Elsukov struct me_softc *sc; 203f325335cSAndrey V. Elsukov 204f325335cSAndrey V. Elsukov sx_xlock(&me_ioctl_sx); 205f325335cSAndrey V. Elsukov sc = ifp->if_softc; 2062addcba7SAndrey V. Elsukov me_delete_tunnel(sc); 207f325335cSAndrey V. Elsukov bpfdetach(ifp); 208f325335cSAndrey V. Elsukov if_detach(ifp); 209f325335cSAndrey V. Elsukov ifp->if_softc = NULL; 210f325335cSAndrey V. Elsukov sx_xunlock(&me_ioctl_sx); 211f325335cSAndrey V. Elsukov 2122addcba7SAndrey V. Elsukov ME_WAIT(); 213f325335cSAndrey V. Elsukov if_free(ifp); 214f325335cSAndrey V. Elsukov free(sc, M_IFME); 215f325335cSAndrey V. Elsukov } 216f325335cSAndrey V. Elsukov 217f325335cSAndrey V. Elsukov static int 218f325335cSAndrey V. Elsukov me_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data) 219f325335cSAndrey V. Elsukov { 220f325335cSAndrey V. Elsukov struct ifreq *ifr = (struct ifreq *)data; 221f325335cSAndrey V. Elsukov struct sockaddr_in *src, *dst; 222f325335cSAndrey V. Elsukov struct me_softc *sc; 223f325335cSAndrey V. Elsukov int error; 224f325335cSAndrey V. Elsukov 225f325335cSAndrey V. Elsukov switch (cmd) { 226f325335cSAndrey V. Elsukov case SIOCSIFMTU: 227f325335cSAndrey V. Elsukov if (ifr->ifr_mtu < 576) 228f325335cSAndrey V. Elsukov return (EINVAL); 229c00bf730SAndrey V. Elsukov ifp->if_mtu = ifr->ifr_mtu; 230f325335cSAndrey V. Elsukov return (0); 231f325335cSAndrey V. Elsukov case SIOCSIFADDR: 232f325335cSAndrey V. Elsukov ifp->if_flags |= IFF_UP; 233f325335cSAndrey V. Elsukov case SIOCSIFFLAGS: 234f325335cSAndrey V. Elsukov case SIOCADDMULTI: 235f325335cSAndrey V. Elsukov case SIOCDELMULTI: 236f325335cSAndrey V. Elsukov return (0); 237f325335cSAndrey V. Elsukov } 238f325335cSAndrey V. Elsukov sx_xlock(&me_ioctl_sx); 239f325335cSAndrey V. Elsukov sc = ifp->if_softc; 240f325335cSAndrey V. Elsukov if (sc == NULL) { 241f325335cSAndrey V. Elsukov error = ENXIO; 242f325335cSAndrey V. Elsukov goto end; 243f325335cSAndrey V. Elsukov } 244f325335cSAndrey V. Elsukov error = 0; 245f325335cSAndrey V. Elsukov switch (cmd) { 246f325335cSAndrey V. Elsukov case SIOCSIFPHYADDR: 2472addcba7SAndrey V. Elsukov src = &((struct in_aliasreq *)data)->ifra_addr; 2482addcba7SAndrey V. Elsukov dst = &((struct in_aliasreq *)data)->ifra_dstaddr; 249f325335cSAndrey V. Elsukov if (src->sin_family != dst->sin_family || 250f325335cSAndrey V. Elsukov src->sin_family != AF_INET || 251f325335cSAndrey V. Elsukov src->sin_len != dst->sin_len || 252f325335cSAndrey V. Elsukov src->sin_len != sizeof(struct sockaddr_in)) { 253f325335cSAndrey V. Elsukov error = EINVAL; 254f325335cSAndrey V. Elsukov break; 255f325335cSAndrey V. Elsukov } 256f325335cSAndrey V. Elsukov if (src->sin_addr.s_addr == INADDR_ANY || 257f325335cSAndrey V. Elsukov dst->sin_addr.s_addr == INADDR_ANY) { 258f325335cSAndrey V. Elsukov error = EADDRNOTAVAIL; 259f325335cSAndrey V. Elsukov break; 260f325335cSAndrey V. Elsukov } 2612addcba7SAndrey V. Elsukov error = me_set_tunnel(sc, src->sin_addr.s_addr, 2622addcba7SAndrey V. Elsukov dst->sin_addr.s_addr); 263f325335cSAndrey V. Elsukov break; 264f325335cSAndrey V. Elsukov case SIOCDIFPHYADDR: 2652addcba7SAndrey V. Elsukov me_delete_tunnel(sc); 266f325335cSAndrey V. Elsukov break; 267f325335cSAndrey V. Elsukov case SIOCGIFPSRCADDR: 268f325335cSAndrey V. Elsukov case SIOCGIFPDSTADDR: 269f325335cSAndrey V. Elsukov if (!ME_READY(sc)) { 270f325335cSAndrey V. Elsukov error = EADDRNOTAVAIL; 271f325335cSAndrey V. Elsukov break; 272f325335cSAndrey V. Elsukov } 273f325335cSAndrey V. Elsukov src = (struct sockaddr_in *)&ifr->ifr_addr; 274f325335cSAndrey V. Elsukov memset(src, 0, sizeof(*src)); 275f325335cSAndrey V. Elsukov src->sin_family = AF_INET; 276f325335cSAndrey V. Elsukov src->sin_len = sizeof(*src); 277f325335cSAndrey V. Elsukov switch (cmd) { 278f325335cSAndrey V. Elsukov case SIOCGIFPSRCADDR: 279f325335cSAndrey V. Elsukov src->sin_addr = sc->me_src; 280f325335cSAndrey V. Elsukov break; 281f325335cSAndrey V. Elsukov case SIOCGIFPDSTADDR: 282f325335cSAndrey V. Elsukov src->sin_addr = sc->me_dst; 283f325335cSAndrey V. Elsukov break; 284f325335cSAndrey V. Elsukov } 285f325335cSAndrey V. Elsukov error = prison_if(curthread->td_ucred, sintosa(src)); 286f325335cSAndrey V. Elsukov if (error != 0) 287f325335cSAndrey V. Elsukov memset(src, 0, sizeof(*src)); 288f325335cSAndrey V. Elsukov break; 289eccfe69aSAndrey V. Elsukov case SIOCGTUNFIB: 290eccfe69aSAndrey V. Elsukov ifr->ifr_fib = sc->me_fibnum; 291eccfe69aSAndrey V. Elsukov break; 292eccfe69aSAndrey V. Elsukov case SIOCSTUNFIB: 293eccfe69aSAndrey V. Elsukov if ((error = priv_check(curthread, PRIV_NET_GRE)) != 0) 294eccfe69aSAndrey V. Elsukov break; 295eccfe69aSAndrey V. Elsukov if (ifr->ifr_fib >= rt_numfibs) 296eccfe69aSAndrey V. Elsukov error = EINVAL; 297eccfe69aSAndrey V. Elsukov else 298eccfe69aSAndrey V. Elsukov sc->me_fibnum = ifr->ifr_fib; 299eccfe69aSAndrey V. Elsukov break; 300f325335cSAndrey V. Elsukov default: 301f325335cSAndrey V. Elsukov error = EINVAL; 302f325335cSAndrey V. Elsukov break; 303f325335cSAndrey V. Elsukov } 304f325335cSAndrey V. Elsukov end: 305f325335cSAndrey V. Elsukov sx_xunlock(&me_ioctl_sx); 306f325335cSAndrey V. Elsukov return (error); 307f325335cSAndrey V. Elsukov } 308f325335cSAndrey V. Elsukov 309f325335cSAndrey V. Elsukov static int 3102addcba7SAndrey V. Elsukov me_lookup(const struct mbuf *m, int off, int proto, void **arg) 311f325335cSAndrey V. Elsukov { 3122addcba7SAndrey V. Elsukov const struct ip *ip; 313f325335cSAndrey V. Elsukov struct me_softc *sc; 314f325335cSAndrey V. Elsukov 3156e081509SAndrey V. Elsukov if (V_me_hashtbl == NULL) 3166e081509SAndrey V. Elsukov return (0); 3176e081509SAndrey V. Elsukov 3186573d758SMatt Macy MPASS(in_epoch(net_epoch_preempt)); 3192addcba7SAndrey V. Elsukov ip = mtod(m, const struct ip *); 3202addcba7SAndrey V. Elsukov CK_LIST_FOREACH(sc, &ME_HASH(ip->ip_dst.s_addr, 3212addcba7SAndrey V. Elsukov ip->ip_src.s_addr), chain) { 3222addcba7SAndrey V. Elsukov if (sc->me_src.s_addr == ip->ip_dst.s_addr && 3232addcba7SAndrey V. Elsukov sc->me_dst.s_addr == ip->ip_src.s_addr) { 324f325335cSAndrey V. Elsukov if ((ME2IFP(sc)->if_flags & IFF_UP) == 0) 325f325335cSAndrey V. Elsukov return (0); 3262addcba7SAndrey V. Elsukov *arg = sc; 3272addcba7SAndrey V. Elsukov return (ENCAP_DRV_LOOKUP); 328f325335cSAndrey V. Elsukov } 3292addcba7SAndrey V. Elsukov } 3302addcba7SAndrey V. Elsukov return (0); 331f325335cSAndrey V. Elsukov } 332f325335cSAndrey V. Elsukov 333f325335cSAndrey V. Elsukov static int 3342addcba7SAndrey V. Elsukov me_set_tunnel(struct me_softc *sc, in_addr_t src, in_addr_t dst) 335f325335cSAndrey V. Elsukov { 3362addcba7SAndrey V. Elsukov struct me_softc *tmp; 337f325335cSAndrey V. Elsukov 338f325335cSAndrey V. Elsukov sx_assert(&me_ioctl_sx, SA_XLOCKED); 3392addcba7SAndrey V. Elsukov 3402addcba7SAndrey V. Elsukov if (V_me_hashtbl == NULL) 3412addcba7SAndrey V. Elsukov V_me_hashtbl = me_hashinit(); 3422addcba7SAndrey V. Elsukov 3432addcba7SAndrey V. Elsukov if (sc->me_src.s_addr == src && sc->me_dst.s_addr == dst) 3442addcba7SAndrey V. Elsukov return (0); 3452addcba7SAndrey V. Elsukov 3462addcba7SAndrey V. Elsukov CK_LIST_FOREACH(tmp, &ME_HASH(src, dst), chain) { 3472addcba7SAndrey V. Elsukov if (tmp == sc) 348f325335cSAndrey V. Elsukov continue; 3492addcba7SAndrey V. Elsukov if (tmp->me_src.s_addr == src && 3502addcba7SAndrey V. Elsukov tmp->me_dst.s_addr == dst) 351f325335cSAndrey V. Elsukov return (EADDRNOTAVAIL); 352f325335cSAndrey V. Elsukov } 353f325335cSAndrey V. Elsukov 3542addcba7SAndrey V. Elsukov me_delete_tunnel(sc); 3552addcba7SAndrey V. Elsukov sc->me_dst.s_addr = dst; 3562addcba7SAndrey V. Elsukov sc->me_src.s_addr = src; 3572addcba7SAndrey V. Elsukov CK_LIST_INSERT_HEAD(&ME_HASH(src, dst), sc, chain); 358f325335cSAndrey V. Elsukov 3592addcba7SAndrey V. Elsukov ME2IFP(sc)->if_drv_flags |= IFF_DRV_RUNNING; 3602addcba7SAndrey V. Elsukov if_link_state_change(ME2IFP(sc), LINK_STATE_UP); 361f325335cSAndrey V. Elsukov return (0); 362f325335cSAndrey V. Elsukov } 363f325335cSAndrey V. Elsukov 364f325335cSAndrey V. Elsukov static void 3652addcba7SAndrey V. Elsukov me_delete_tunnel(struct me_softc *sc) 366f325335cSAndrey V. Elsukov { 367f325335cSAndrey V. Elsukov 368f325335cSAndrey V. Elsukov sx_assert(&me_ioctl_sx, SA_XLOCKED); 3692addcba7SAndrey V. Elsukov if (ME_READY(sc)) { 3702addcba7SAndrey V. Elsukov CK_LIST_REMOVE(sc, chain); 3712addcba7SAndrey V. Elsukov ME_WAIT(); 3722addcba7SAndrey V. Elsukov 373f325335cSAndrey V. Elsukov sc->me_src.s_addr = 0; 374f325335cSAndrey V. Elsukov sc->me_dst.s_addr = 0; 3752addcba7SAndrey V. Elsukov ME2IFP(sc)->if_drv_flags &= ~IFF_DRV_RUNNING; 3762addcba7SAndrey V. Elsukov if_link_state_change(ME2IFP(sc), LINK_STATE_DOWN); 3772addcba7SAndrey V. Elsukov } 378f325335cSAndrey V. Elsukov } 379f325335cSAndrey V. Elsukov 380f325335cSAndrey V. Elsukov static uint16_t 381f325335cSAndrey V. Elsukov me_in_cksum(uint16_t *p, int nwords) 382f325335cSAndrey V. Elsukov { 383f325335cSAndrey V. Elsukov uint32_t sum = 0; 384f325335cSAndrey V. Elsukov 385f325335cSAndrey V. Elsukov while (nwords-- > 0) 386f325335cSAndrey V. Elsukov sum += *p++; 387f325335cSAndrey V. Elsukov sum = (sum >> 16) + (sum & 0xffff); 388f325335cSAndrey V. Elsukov sum += (sum >> 16); 389f325335cSAndrey V. Elsukov return (~sum); 390f325335cSAndrey V. Elsukov } 391f325335cSAndrey V. Elsukov 3926d8fdfa9SAndrey V. Elsukov static int 3936d8fdfa9SAndrey V. Elsukov me_input(struct mbuf *m, int off, int proto, void *arg) 394f325335cSAndrey V. Elsukov { 3956d8fdfa9SAndrey V. Elsukov struct me_softc *sc = arg; 396f325335cSAndrey V. Elsukov struct mobhdr *mh; 397f325335cSAndrey V. Elsukov struct ifnet *ifp; 398f325335cSAndrey V. Elsukov struct ip *ip; 399f325335cSAndrey V. Elsukov int hlen; 400f325335cSAndrey V. Elsukov 401f325335cSAndrey V. Elsukov ifp = ME2IFP(sc); 402f325335cSAndrey V. Elsukov /* checks for short packets */ 403f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr); 404f325335cSAndrey V. Elsukov if (m->m_pkthdr.len < sizeof(struct ip) + hlen) 405f325335cSAndrey V. Elsukov hlen -= sizeof(struct in_addr); 406f325335cSAndrey V. Elsukov if (m->m_len < sizeof(struct ip) + hlen) 407f325335cSAndrey V. Elsukov m = m_pullup(m, sizeof(struct ip) + hlen); 408f325335cSAndrey V. Elsukov if (m == NULL) 409f325335cSAndrey V. Elsukov goto drop; 410f325335cSAndrey V. Elsukov mh = (struct mobhdr *)mtodo(m, sizeof(struct ip)); 411f325335cSAndrey V. Elsukov /* check for wrong flags */ 412f325335cSAndrey V. Elsukov if (mh->mob_flags & (~MOB_FLAGS_SP)) { 413f325335cSAndrey V. Elsukov m_freem(m); 414f325335cSAndrey V. Elsukov goto drop; 415f325335cSAndrey V. Elsukov } 416f325335cSAndrey V. Elsukov if (mh->mob_flags) { 417f325335cSAndrey V. Elsukov if (hlen != sizeof(struct mobhdr)) { 418f325335cSAndrey V. Elsukov m_freem(m); 419f325335cSAndrey V. Elsukov goto drop; 420f325335cSAndrey V. Elsukov } 421f325335cSAndrey V. Elsukov } else 422f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr) - sizeof(struct in_addr); 423f325335cSAndrey V. Elsukov /* check mobile header checksum */ 424f325335cSAndrey V. Elsukov if (me_in_cksum((uint16_t *)mh, hlen / sizeof(uint16_t)) != 0) { 425f325335cSAndrey V. Elsukov m_freem(m); 426f325335cSAndrey V. Elsukov goto drop; 427f325335cSAndrey V. Elsukov } 428f325335cSAndrey V. Elsukov #ifdef MAC 429f325335cSAndrey V. Elsukov mac_ifnet_create_mbuf(ifp, m); 430f325335cSAndrey V. Elsukov #endif 431f325335cSAndrey V. Elsukov ip = mtod(m, struct ip *); 432f325335cSAndrey V. Elsukov ip->ip_dst = mh->mob_dst; 433f325335cSAndrey V. Elsukov ip->ip_p = mh->mob_proto; 434f325335cSAndrey V. Elsukov ip->ip_sum = 0; 435f325335cSAndrey V. Elsukov ip->ip_len = htons(m->m_pkthdr.len - hlen); 436f325335cSAndrey V. Elsukov if (mh->mob_flags) 437f325335cSAndrey V. Elsukov ip->ip_src = mh->mob_src; 438f325335cSAndrey V. Elsukov memmove(mtodo(m, hlen), ip, sizeof(struct ip)); 439f325335cSAndrey V. Elsukov m_adj(m, hlen); 440f325335cSAndrey V. Elsukov m_clrprotoflags(m); 441f325335cSAndrey V. Elsukov m->m_pkthdr.rcvif = ifp; 442f325335cSAndrey V. Elsukov m->m_pkthdr.csum_flags |= (CSUM_IP_CHECKED | CSUM_IP_VALID); 443eccfe69aSAndrey V. Elsukov M_SETFIB(m, ifp->if_fib); 444f325335cSAndrey V. Elsukov hlen = AF_INET; 445f325335cSAndrey V. Elsukov BPF_MTAP2(ifp, &hlen, sizeof(hlen), m); 446f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_IPACKETS, 1); 447f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_IBYTES, m->m_pkthdr.len); 448f325335cSAndrey V. Elsukov if ((ifp->if_flags & IFF_MONITOR) != 0) 449f325335cSAndrey V. Elsukov m_freem(m); 450f325335cSAndrey V. Elsukov else 451f325335cSAndrey V. Elsukov netisr_dispatch(NETISR_IP, m); 452f325335cSAndrey V. Elsukov return (IPPROTO_DONE); 453f325335cSAndrey V. Elsukov drop: 454f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_IERRORS, 1); 455f325335cSAndrey V. Elsukov return (IPPROTO_DONE); 456f325335cSAndrey V. Elsukov } 457f325335cSAndrey V. Elsukov 458f325335cSAndrey V. Elsukov static int 459f325335cSAndrey V. Elsukov me_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *dst, 4602addcba7SAndrey V. Elsukov struct route *ro __unused) 461f325335cSAndrey V. Elsukov { 462f325335cSAndrey V. Elsukov uint32_t af; 4632addcba7SAndrey V. Elsukov 4642addcba7SAndrey V. Elsukov if (dst->sa_family == AF_UNSPEC) 4652addcba7SAndrey V. Elsukov bcopy(dst->sa_data, &af, sizeof(af)); 4662addcba7SAndrey V. Elsukov else 4672addcba7SAndrey V. Elsukov af = dst->sa_family; 4682addcba7SAndrey V. Elsukov m->m_pkthdr.csum_data = af; 4692addcba7SAndrey V. Elsukov return (ifp->if_transmit(ifp, m)); 4702addcba7SAndrey V. Elsukov } 4712addcba7SAndrey V. Elsukov 472*98a8fdf6SAndrey V. Elsukov #define MTAG_ME 1414491977 4732addcba7SAndrey V. Elsukov static int 4742addcba7SAndrey V. Elsukov me_transmit(struct ifnet *ifp, struct mbuf *m) 4752addcba7SAndrey V. Elsukov { 4762addcba7SAndrey V. Elsukov struct mobhdr mh; 4772addcba7SAndrey V. Elsukov struct me_softc *sc; 4782addcba7SAndrey V. Elsukov struct ip *ip; 4792addcba7SAndrey V. Elsukov uint32_t af; 4802addcba7SAndrey V. Elsukov int error, hlen, plen; 481f325335cSAndrey V. Elsukov 482f325335cSAndrey V. Elsukov #ifdef MAC 483f325335cSAndrey V. Elsukov error = mac_ifnet_check_transmit(ifp, m); 484f325335cSAndrey V. Elsukov if (error != 0) 485f325335cSAndrey V. Elsukov goto drop; 486f325335cSAndrey V. Elsukov #endif 487f325335cSAndrey V. Elsukov error = ENETDOWN; 4882addcba7SAndrey V. Elsukov ME_RLOCK(); 4892addcba7SAndrey V. Elsukov sc = ifp->if_softc; 4902addcba7SAndrey V. Elsukov if (sc == NULL || !ME_READY(sc) || 4912addcba7SAndrey V. Elsukov (ifp->if_flags & IFF_MONITOR) != 0 || 4922addcba7SAndrey V. Elsukov (ifp->if_flags & IFF_UP) == 0 || 493*98a8fdf6SAndrey V. Elsukov (error = if_tunnel_check_nesting(ifp, m, MTAG_ME, 494*98a8fdf6SAndrey V. Elsukov V_max_me_nesting)) != 0) { 4952addcba7SAndrey V. Elsukov m_freem(m); 496f325335cSAndrey V. Elsukov goto drop; 497f325335cSAndrey V. Elsukov } 4982addcba7SAndrey V. Elsukov af = m->m_pkthdr.csum_data; 499f325335cSAndrey V. Elsukov if (af != AF_INET) { 500f325335cSAndrey V. Elsukov error = EAFNOSUPPORT; 501f325335cSAndrey V. Elsukov m_freem(m); 502f325335cSAndrey V. Elsukov goto drop; 503f325335cSAndrey V. Elsukov } 504f325335cSAndrey V. Elsukov if (m->m_len < sizeof(struct ip)) 505f325335cSAndrey V. Elsukov m = m_pullup(m, sizeof(struct ip)); 506f325335cSAndrey V. Elsukov if (m == NULL) { 507f325335cSAndrey V. Elsukov error = ENOBUFS; 508f325335cSAndrey V. Elsukov goto drop; 509f325335cSAndrey V. Elsukov } 510f325335cSAndrey V. Elsukov ip = mtod(m, struct ip *); 511f325335cSAndrey V. Elsukov /* Fragmented datagramms shouldn't be encapsulated */ 512f325335cSAndrey V. Elsukov if (ip->ip_off & htons(IP_MF | IP_OFFMASK)) { 513f325335cSAndrey V. Elsukov error = EINVAL; 514f325335cSAndrey V. Elsukov m_freem(m); 515f325335cSAndrey V. Elsukov goto drop; 516f325335cSAndrey V. Elsukov } 517f325335cSAndrey V. Elsukov mh.mob_proto = ip->ip_p; 518f325335cSAndrey V. Elsukov mh.mob_src = ip->ip_src; 519f325335cSAndrey V. Elsukov mh.mob_dst = ip->ip_dst; 520f325335cSAndrey V. Elsukov if (in_hosteq(sc->me_src, ip->ip_src)) { 521f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr) - sizeof(struct in_addr); 522f325335cSAndrey V. Elsukov mh.mob_flags = 0; 523f325335cSAndrey V. Elsukov } else { 524f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr); 525f325335cSAndrey V. Elsukov mh.mob_flags = MOB_FLAGS_SP; 526f325335cSAndrey V. Elsukov } 5279597ff83SAndrey V. Elsukov BPF_MTAP2(ifp, &af, sizeof(af), m); 528f325335cSAndrey V. Elsukov plen = m->m_pkthdr.len; 529f325335cSAndrey V. Elsukov ip->ip_src = sc->me_src; 530f325335cSAndrey V. Elsukov ip->ip_dst = sc->me_dst; 5312addcba7SAndrey V. Elsukov m->m_flags &= ~(M_BCAST|M_MCAST); 532f325335cSAndrey V. Elsukov M_SETFIB(m, sc->me_fibnum); 533f325335cSAndrey V. Elsukov M_PREPEND(m, hlen, M_NOWAIT); 534f325335cSAndrey V. Elsukov if (m == NULL) { 535f325335cSAndrey V. Elsukov error = ENOBUFS; 536f325335cSAndrey V. Elsukov goto drop; 537f325335cSAndrey V. Elsukov } 538f325335cSAndrey V. Elsukov if (m->m_len < sizeof(struct ip) + hlen) 539f325335cSAndrey V. Elsukov m = m_pullup(m, sizeof(struct ip) + hlen); 540f325335cSAndrey V. Elsukov if (m == NULL) { 541f325335cSAndrey V. Elsukov error = ENOBUFS; 542f325335cSAndrey V. Elsukov goto drop; 543f325335cSAndrey V. Elsukov } 544f325335cSAndrey V. Elsukov memmove(mtod(m, void *), mtodo(m, hlen), sizeof(struct ip)); 545f325335cSAndrey V. Elsukov ip = mtod(m, struct ip *); 546f325335cSAndrey V. Elsukov ip->ip_len = htons(m->m_pkthdr.len); 547f325335cSAndrey V. Elsukov ip->ip_p = IPPROTO_MOBILE; 548f325335cSAndrey V. Elsukov ip->ip_sum = 0; 549f325335cSAndrey V. Elsukov mh.mob_csum = 0; 550f325335cSAndrey V. Elsukov mh.mob_csum = me_in_cksum((uint16_t *)&mh, hlen / sizeof(uint16_t)); 551f325335cSAndrey V. Elsukov bcopy(&mh, mtodo(m, sizeof(struct ip)), hlen); 552f325335cSAndrey V. Elsukov error = ip_output(m, NULL, NULL, IP_FORWARDING, NULL, NULL); 553f325335cSAndrey V. Elsukov drop: 554f325335cSAndrey V. Elsukov if (error) 555f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_OERRORS, 1); 556f325335cSAndrey V. Elsukov else { 557f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_OPACKETS, 1); 558f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_OBYTES, plen); 559f325335cSAndrey V. Elsukov } 5602addcba7SAndrey V. Elsukov ME_RUNLOCK(); 561f325335cSAndrey V. Elsukov return (error); 562f325335cSAndrey V. Elsukov } 563f325335cSAndrey V. Elsukov 564f325335cSAndrey V. Elsukov static void 565f325335cSAndrey V. Elsukov me_qflush(struct ifnet *ifp __unused) 566f325335cSAndrey V. Elsukov { 567f325335cSAndrey V. Elsukov 568f325335cSAndrey V. Elsukov } 569f325335cSAndrey V. Elsukov 5702addcba7SAndrey V. Elsukov static const struct encaptab *ecookie = NULL; 5712addcba7SAndrey V. Elsukov static const struct encap_config me_encap_cfg = { 5722addcba7SAndrey V. Elsukov .proto = IPPROTO_MOBILE, 5732addcba7SAndrey V. Elsukov .min_length = sizeof(struct ip) + sizeof(struct mobhdr) - 5742addcba7SAndrey V. Elsukov sizeof(in_addr_t), 5752addcba7SAndrey V. Elsukov .exact_match = ENCAP_DRV_LOOKUP, 5762addcba7SAndrey V. Elsukov .lookup = me_lookup, 5772addcba7SAndrey V. Elsukov .input = me_input 5782addcba7SAndrey V. Elsukov }; 5792addcba7SAndrey V. Elsukov 580f325335cSAndrey V. Elsukov static int 581f325335cSAndrey V. Elsukov memodevent(module_t mod, int type, void *data) 582f325335cSAndrey V. Elsukov { 583f325335cSAndrey V. Elsukov 584f325335cSAndrey V. Elsukov switch (type) { 585f325335cSAndrey V. Elsukov case MOD_LOAD: 5862addcba7SAndrey V. Elsukov ecookie = ip_encap_attach(&me_encap_cfg, NULL, M_WAITOK); 5872addcba7SAndrey V. Elsukov break; 588f325335cSAndrey V. Elsukov case MOD_UNLOAD: 5892addcba7SAndrey V. Elsukov ip_encap_detach(ecookie); 590f325335cSAndrey V. Elsukov break; 591f325335cSAndrey V. Elsukov default: 592f325335cSAndrey V. Elsukov return (EOPNOTSUPP); 593f325335cSAndrey V. Elsukov } 594f325335cSAndrey V. Elsukov return (0); 595f325335cSAndrey V. Elsukov } 596f325335cSAndrey V. Elsukov 597f325335cSAndrey V. Elsukov static moduledata_t me_mod = { 598f325335cSAndrey V. Elsukov "if_me", 599f325335cSAndrey V. Elsukov memodevent, 600f325335cSAndrey V. Elsukov 0 601f325335cSAndrey V. Elsukov }; 602f325335cSAndrey V. Elsukov 603f325335cSAndrey V. Elsukov DECLARE_MODULE(if_me, me_mod, SI_SUB_PSEUDO, SI_ORDER_ANY); 604f325335cSAndrey V. Elsukov MODULE_VERSION(if_me, 1); 605