1f325335cSAndrey V. Elsukov /*- 22addcba7SAndrey V. Elsukov * Copyright (c) 2014, 2018 Andrey V. Elsukov <ae@FreeBSD.org> 3f325335cSAndrey V. Elsukov * All rights reserved. 4f325335cSAndrey V. Elsukov * 5f325335cSAndrey V. Elsukov * Redistribution and use in source and binary forms, with or without 6f325335cSAndrey V. Elsukov * modification, are permitted provided that the following conditions 7f325335cSAndrey V. Elsukov * are met: 8f325335cSAndrey V. Elsukov * 9f325335cSAndrey V. Elsukov * 1. Redistributions of source code must retain the above copyright 10f325335cSAndrey V. Elsukov * notice, this list of conditions and the following disclaimer. 11f325335cSAndrey V. Elsukov * 2. Redistributions in binary form must reproduce the above copyright 12f325335cSAndrey V. Elsukov * notice, this list of conditions and the following disclaimer in the 13f325335cSAndrey V. Elsukov * documentation and/or other materials provided with the distribution. 14f325335cSAndrey V. Elsukov * 15f325335cSAndrey V. Elsukov * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 16f325335cSAndrey V. Elsukov * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 17f325335cSAndrey V. Elsukov * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 18f325335cSAndrey V. Elsukov * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 19f325335cSAndrey V. Elsukov * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT 20f325335cSAndrey V. Elsukov * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 21f325335cSAndrey V. Elsukov * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 22f325335cSAndrey V. Elsukov * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 23f325335cSAndrey V. Elsukov * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF 24f325335cSAndrey V. Elsukov * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 25f325335cSAndrey V. Elsukov */ 26f325335cSAndrey V. Elsukov 27f325335cSAndrey V. Elsukov #include <sys/cdefs.h> 28f325335cSAndrey V. Elsukov __FBSDID("$FreeBSD$"); 29f325335cSAndrey V. Elsukov 30f325335cSAndrey V. Elsukov #include <sys/param.h> 312addcba7SAndrey V. Elsukov #include <sys/systm.h> 32f325335cSAndrey V. Elsukov #include <sys/jail.h> 33f325335cSAndrey V. Elsukov #include <sys/kernel.h> 34f325335cSAndrey V. Elsukov #include <sys/lock.h> 35f325335cSAndrey V. Elsukov #include <sys/malloc.h> 36f325335cSAndrey V. Elsukov #include <sys/module.h> 37f325335cSAndrey V. Elsukov #include <sys/mbuf.h> 38f325335cSAndrey V. Elsukov #include <sys/priv.h> 39f325335cSAndrey V. Elsukov #include <sys/proc.h> 40f325335cSAndrey V. Elsukov #include <sys/socket.h> 41f325335cSAndrey V. Elsukov #include <sys/sockio.h> 42f325335cSAndrey V. Elsukov #include <sys/sx.h> 43f325335cSAndrey V. Elsukov #include <sys/sysctl.h> 44f325335cSAndrey V. Elsukov #include <sys/syslog.h> 45f325335cSAndrey V. Elsukov 46f325335cSAndrey V. Elsukov #include <net/bpf.h> 47f325335cSAndrey V. Elsukov #include <net/ethernet.h> 48f325335cSAndrey V. Elsukov #include <net/if.h> 49f325335cSAndrey V. Elsukov #include <net/if_var.h> 50f325335cSAndrey V. Elsukov #include <net/if_clone.h> 51f325335cSAndrey V. Elsukov #include <net/if_types.h> 52f325335cSAndrey V. Elsukov #include <net/netisr.h> 53f325335cSAndrey V. Elsukov #include <net/vnet.h> 54eccfe69aSAndrey V. Elsukov #include <net/route.h> 55f325335cSAndrey V. Elsukov 56f325335cSAndrey V. Elsukov #include <netinet/in.h> 57f325335cSAndrey V. Elsukov #include <netinet/in_systm.h> 58f325335cSAndrey V. Elsukov #include <netinet/in_var.h> 59f325335cSAndrey V. Elsukov #include <netinet/ip.h> 60f325335cSAndrey V. Elsukov #include <netinet/ip_var.h> 61f325335cSAndrey V. Elsukov #include <netinet/ip_encap.h> 62f325335cSAndrey V. Elsukov 63f325335cSAndrey V. Elsukov #include <machine/in_cksum.h> 64f325335cSAndrey V. Elsukov #include <security/mac/mac_framework.h> 65f325335cSAndrey V. Elsukov 66c00bf730SAndrey V. Elsukov #define MEMTU (1500 - sizeof(struct mobhdr)) 67f325335cSAndrey V. Elsukov static const char mename[] = "me"; 68f325335cSAndrey V. Elsukov static MALLOC_DEFINE(M_IFME, mename, "Minimal Encapsulation for IP"); 69f325335cSAndrey V. Elsukov /* Minimal forwarding header RFC 2004 */ 70f325335cSAndrey V. Elsukov struct mobhdr { 71f325335cSAndrey V. Elsukov uint8_t mob_proto; /* protocol */ 72f325335cSAndrey V. Elsukov uint8_t mob_flags; /* flags */ 73f325335cSAndrey V. Elsukov #define MOB_FLAGS_SP 0x80 /* source present */ 74f325335cSAndrey V. Elsukov uint16_t mob_csum; /* header checksum */ 75f325335cSAndrey V. Elsukov struct in_addr mob_dst; /* original destination address */ 76f325335cSAndrey V. Elsukov struct in_addr mob_src; /* original source addr (optional) */ 77f325335cSAndrey V. Elsukov } __packed; 78f325335cSAndrey V. Elsukov 79f325335cSAndrey V. Elsukov struct me_softc { 80f325335cSAndrey V. Elsukov struct ifnet *me_ifp; 81f325335cSAndrey V. Elsukov u_int me_fibnum; 82f325335cSAndrey V. Elsukov struct in_addr me_src; 83f325335cSAndrey V. Elsukov struct in_addr me_dst; 842addcba7SAndrey V. Elsukov 852addcba7SAndrey V. Elsukov CK_LIST_ENTRY(me_softc) chain; 86f325335cSAndrey V. Elsukov }; 872addcba7SAndrey V. Elsukov CK_LIST_HEAD(me_list, me_softc); 88f325335cSAndrey V. Elsukov #define ME2IFP(sc) ((sc)->me_ifp) 89f325335cSAndrey V. Elsukov #define ME_READY(sc) ((sc)->me_src.s_addr != 0) 902addcba7SAndrey V. Elsukov #define ME_RLOCK() epoch_enter_preempt(net_epoch_preempt) 912addcba7SAndrey V. Elsukov #define ME_RUNLOCK() epoch_exit_preempt(net_epoch_preempt) 922addcba7SAndrey V. Elsukov #define ME_WAIT() epoch_wait_preempt(net_epoch_preempt) 93f325335cSAndrey V. Elsukov 942addcba7SAndrey V. Elsukov #ifndef ME_HASH_SIZE 952addcba7SAndrey V. Elsukov #define ME_HASH_SIZE (1 << 4) 962addcba7SAndrey V. Elsukov #endif 972addcba7SAndrey V. Elsukov static VNET_DEFINE(struct me_list *, me_hashtbl) = NULL; 982addcba7SAndrey V. Elsukov #define V_me_hashtbl VNET(me_hashtbl) 992addcba7SAndrey V. Elsukov #define ME_HASH(src, dst) (V_me_hashtbl[\ 1002addcba7SAndrey V. Elsukov me_hashval((src), (dst)) & (ME_HASH_SIZE - 1)]) 101f325335cSAndrey V. Elsukov 102f325335cSAndrey V. Elsukov static struct sx me_ioctl_sx; 103f325335cSAndrey V. Elsukov SX_SYSINIT(me_ioctl_sx, &me_ioctl_sx, "me_ioctl"); 104f325335cSAndrey V. Elsukov 105f325335cSAndrey V. Elsukov static int me_clone_create(struct if_clone *, int, caddr_t); 106f325335cSAndrey V. Elsukov static void me_clone_destroy(struct ifnet *); 107f325335cSAndrey V. Elsukov static VNET_DEFINE(struct if_clone *, me_cloner); 108f325335cSAndrey V. Elsukov #define V_me_cloner VNET(me_cloner) 109f325335cSAndrey V. Elsukov 110f325335cSAndrey V. Elsukov static void me_qflush(struct ifnet *); 111f325335cSAndrey V. Elsukov static int me_transmit(struct ifnet *, struct mbuf *); 112f325335cSAndrey V. Elsukov static int me_ioctl(struct ifnet *, u_long, caddr_t); 113f325335cSAndrey V. Elsukov static int me_output(struct ifnet *, struct mbuf *, 114f325335cSAndrey V. Elsukov const struct sockaddr *, struct route *); 1156d8fdfa9SAndrey V. Elsukov static int me_input(struct mbuf *, int, int, void *); 116f325335cSAndrey V. Elsukov 1172addcba7SAndrey V. Elsukov static int me_set_tunnel(struct me_softc *, in_addr_t, in_addr_t); 1182addcba7SAndrey V. Elsukov static void me_delete_tunnel(struct me_softc *); 119f325335cSAndrey V. Elsukov 120f325335cSAndrey V. Elsukov SYSCTL_DECL(_net_link); 121f325335cSAndrey V. Elsukov static SYSCTL_NODE(_net_link, IFT_TUNNEL, me, CTLFLAG_RW, 0, 122f325335cSAndrey V. Elsukov "Minimal Encapsulation for IP (RFC 2004)"); 123f325335cSAndrey V. Elsukov #ifndef MAX_ME_NEST 124f325335cSAndrey V. Elsukov #define MAX_ME_NEST 1 125f325335cSAndrey V. Elsukov #endif 126f325335cSAndrey V. Elsukov 127f325335cSAndrey V. Elsukov static VNET_DEFINE(int, max_me_nesting) = MAX_ME_NEST; 128f325335cSAndrey V. Elsukov #define V_max_me_nesting VNET(max_me_nesting) 129f325335cSAndrey V. Elsukov SYSCTL_INT(_net_link_me, OID_AUTO, max_nesting, CTLFLAG_RW | CTLFLAG_VNET, 130f325335cSAndrey V. Elsukov &VNET_NAME(max_me_nesting), 0, "Max nested tunnels"); 131f325335cSAndrey V. Elsukov 1322addcba7SAndrey V. Elsukov static uint32_t 1332addcba7SAndrey V. Elsukov me_hashval(in_addr_t src, in_addr_t dst) 1342addcba7SAndrey V. Elsukov { 1352addcba7SAndrey V. Elsukov uint32_t ret; 1362addcba7SAndrey V. Elsukov 1372addcba7SAndrey V. Elsukov ret = fnv_32_buf(&src, sizeof(src), FNV1_32_INIT); 1382addcba7SAndrey V. Elsukov return (fnv_32_buf(&dst, sizeof(dst), ret)); 1392addcba7SAndrey V. Elsukov } 1402addcba7SAndrey V. Elsukov 1412addcba7SAndrey V. Elsukov static struct me_list * 1422addcba7SAndrey V. Elsukov me_hashinit(void) 1432addcba7SAndrey V. Elsukov { 1442addcba7SAndrey V. Elsukov struct me_list *hash; 1452addcba7SAndrey V. Elsukov int i; 1462addcba7SAndrey V. Elsukov 1472addcba7SAndrey V. Elsukov hash = malloc(sizeof(struct me_list) * ME_HASH_SIZE, 1482addcba7SAndrey V. Elsukov M_IFME, M_WAITOK); 1492addcba7SAndrey V. Elsukov for (i = 0; i < ME_HASH_SIZE; i++) 1502addcba7SAndrey V. Elsukov CK_LIST_INIT(&hash[i]); 1512addcba7SAndrey V. Elsukov 1522addcba7SAndrey V. Elsukov return (hash); 1532addcba7SAndrey V. Elsukov } 1542addcba7SAndrey V. Elsukov 155f325335cSAndrey V. Elsukov static void 156f325335cSAndrey V. Elsukov vnet_me_init(const void *unused __unused) 157f325335cSAndrey V. Elsukov { 158f325335cSAndrey V. Elsukov V_me_cloner = if_clone_simple(mename, me_clone_create, 159f325335cSAndrey V. Elsukov me_clone_destroy, 0); 160f325335cSAndrey V. Elsukov } 161f325335cSAndrey V. Elsukov VNET_SYSINIT(vnet_me_init, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_ANY, 162f325335cSAndrey V. Elsukov vnet_me_init, NULL); 163f325335cSAndrey V. Elsukov 164f325335cSAndrey V. Elsukov static void 165f325335cSAndrey V. Elsukov vnet_me_uninit(const void *unused __unused) 166f325335cSAndrey V. Elsukov { 167f325335cSAndrey V. Elsukov 1682addcba7SAndrey V. Elsukov if (V_me_hashtbl != NULL) 1692addcba7SAndrey V. Elsukov free(V_me_hashtbl, M_IFME); 170f325335cSAndrey V. Elsukov if_clone_detach(V_me_cloner); 171f325335cSAndrey V. Elsukov } 172f325335cSAndrey V. Elsukov VNET_SYSUNINIT(vnet_me_uninit, SI_SUB_PROTO_IFATTACHDOMAIN, SI_ORDER_ANY, 173f325335cSAndrey V. Elsukov vnet_me_uninit, NULL); 174f325335cSAndrey V. Elsukov 175f325335cSAndrey V. Elsukov static int 176f325335cSAndrey V. Elsukov me_clone_create(struct if_clone *ifc, int unit, caddr_t params) 177f325335cSAndrey V. Elsukov { 178f325335cSAndrey V. Elsukov struct me_softc *sc; 179f325335cSAndrey V. Elsukov 180f325335cSAndrey V. Elsukov sc = malloc(sizeof(struct me_softc), M_IFME, M_WAITOK | M_ZERO); 181f325335cSAndrey V. Elsukov sc->me_fibnum = curthread->td_proc->p_fibnum; 182f325335cSAndrey V. Elsukov ME2IFP(sc) = if_alloc(IFT_TUNNEL); 183f325335cSAndrey V. Elsukov ME2IFP(sc)->if_softc = sc; 184f325335cSAndrey V. Elsukov if_initname(ME2IFP(sc), mename, unit); 185f325335cSAndrey V. Elsukov 186c00bf730SAndrey V. Elsukov ME2IFP(sc)->if_mtu = MEMTU;; 187f325335cSAndrey V. Elsukov ME2IFP(sc)->if_flags = IFF_POINTOPOINT|IFF_MULTICAST; 188f325335cSAndrey V. Elsukov ME2IFP(sc)->if_output = me_output; 189f325335cSAndrey V. Elsukov ME2IFP(sc)->if_ioctl = me_ioctl; 190f325335cSAndrey V. Elsukov ME2IFP(sc)->if_transmit = me_transmit; 191f325335cSAndrey V. Elsukov ME2IFP(sc)->if_qflush = me_qflush; 192f1aaad0cSHiroki Sato ME2IFP(sc)->if_capabilities |= IFCAP_LINKSTATE; 193f1aaad0cSHiroki Sato ME2IFP(sc)->if_capenable |= IFCAP_LINKSTATE; 194f325335cSAndrey V. Elsukov if_attach(ME2IFP(sc)); 195f325335cSAndrey V. Elsukov bpfattach(ME2IFP(sc), DLT_NULL, sizeof(u_int32_t)); 196f325335cSAndrey V. Elsukov return (0); 197f325335cSAndrey V. Elsukov } 198f325335cSAndrey V. Elsukov 199f325335cSAndrey V. Elsukov static void 200f325335cSAndrey V. Elsukov me_clone_destroy(struct ifnet *ifp) 201f325335cSAndrey V. Elsukov { 202f325335cSAndrey V. Elsukov struct me_softc *sc; 203f325335cSAndrey V. Elsukov 204f325335cSAndrey V. Elsukov sx_xlock(&me_ioctl_sx); 205f325335cSAndrey V. Elsukov sc = ifp->if_softc; 2062addcba7SAndrey V. Elsukov me_delete_tunnel(sc); 207f325335cSAndrey V. Elsukov bpfdetach(ifp); 208f325335cSAndrey V. Elsukov if_detach(ifp); 209f325335cSAndrey V. Elsukov ifp->if_softc = NULL; 210f325335cSAndrey V. Elsukov sx_xunlock(&me_ioctl_sx); 211f325335cSAndrey V. Elsukov 2122addcba7SAndrey V. Elsukov ME_WAIT(); 213f325335cSAndrey V. Elsukov if_free(ifp); 214f325335cSAndrey V. Elsukov free(sc, M_IFME); 215f325335cSAndrey V. Elsukov } 216f325335cSAndrey V. Elsukov 217f325335cSAndrey V. Elsukov static int 218f325335cSAndrey V. Elsukov me_ioctl(struct ifnet *ifp, u_long cmd, caddr_t data) 219f325335cSAndrey V. Elsukov { 220f325335cSAndrey V. Elsukov struct ifreq *ifr = (struct ifreq *)data; 221f325335cSAndrey V. Elsukov struct sockaddr_in *src, *dst; 222f325335cSAndrey V. Elsukov struct me_softc *sc; 223f325335cSAndrey V. Elsukov int error; 224f325335cSAndrey V. Elsukov 225f325335cSAndrey V. Elsukov switch (cmd) { 226f325335cSAndrey V. Elsukov case SIOCSIFMTU: 227f325335cSAndrey V. Elsukov if (ifr->ifr_mtu < 576) 228f325335cSAndrey V. Elsukov return (EINVAL); 229c00bf730SAndrey V. Elsukov ifp->if_mtu = ifr->ifr_mtu; 230f325335cSAndrey V. Elsukov return (0); 231f325335cSAndrey V. Elsukov case SIOCSIFADDR: 232f325335cSAndrey V. Elsukov ifp->if_flags |= IFF_UP; 233f325335cSAndrey V. Elsukov case SIOCSIFFLAGS: 234f325335cSAndrey V. Elsukov case SIOCADDMULTI: 235f325335cSAndrey V. Elsukov case SIOCDELMULTI: 236f325335cSAndrey V. Elsukov return (0); 237f325335cSAndrey V. Elsukov } 238f325335cSAndrey V. Elsukov sx_xlock(&me_ioctl_sx); 239f325335cSAndrey V. Elsukov sc = ifp->if_softc; 240f325335cSAndrey V. Elsukov if (sc == NULL) { 241f325335cSAndrey V. Elsukov error = ENXIO; 242f325335cSAndrey V. Elsukov goto end; 243f325335cSAndrey V. Elsukov } 244f325335cSAndrey V. Elsukov error = 0; 245f325335cSAndrey V. Elsukov switch (cmd) { 246f325335cSAndrey V. Elsukov case SIOCSIFPHYADDR: 2472addcba7SAndrey V. Elsukov src = &((struct in_aliasreq *)data)->ifra_addr; 2482addcba7SAndrey V. Elsukov dst = &((struct in_aliasreq *)data)->ifra_dstaddr; 249f325335cSAndrey V. Elsukov if (src->sin_family != dst->sin_family || 250f325335cSAndrey V. Elsukov src->sin_family != AF_INET || 251f325335cSAndrey V. Elsukov src->sin_len != dst->sin_len || 252f325335cSAndrey V. Elsukov src->sin_len != sizeof(struct sockaddr_in)) { 253f325335cSAndrey V. Elsukov error = EINVAL; 254f325335cSAndrey V. Elsukov break; 255f325335cSAndrey V. Elsukov } 256f325335cSAndrey V. Elsukov if (src->sin_addr.s_addr == INADDR_ANY || 257f325335cSAndrey V. Elsukov dst->sin_addr.s_addr == INADDR_ANY) { 258f325335cSAndrey V. Elsukov error = EADDRNOTAVAIL; 259f325335cSAndrey V. Elsukov break; 260f325335cSAndrey V. Elsukov } 2612addcba7SAndrey V. Elsukov error = me_set_tunnel(sc, src->sin_addr.s_addr, 2622addcba7SAndrey V. Elsukov dst->sin_addr.s_addr); 263f325335cSAndrey V. Elsukov break; 264f325335cSAndrey V. Elsukov case SIOCDIFPHYADDR: 2652addcba7SAndrey V. Elsukov me_delete_tunnel(sc); 266f325335cSAndrey V. Elsukov break; 267f325335cSAndrey V. Elsukov case SIOCGIFPSRCADDR: 268f325335cSAndrey V. Elsukov case SIOCGIFPDSTADDR: 269f325335cSAndrey V. Elsukov if (!ME_READY(sc)) { 270f325335cSAndrey V. Elsukov error = EADDRNOTAVAIL; 271f325335cSAndrey V. Elsukov break; 272f325335cSAndrey V. Elsukov } 273f325335cSAndrey V. Elsukov src = (struct sockaddr_in *)&ifr->ifr_addr; 274f325335cSAndrey V. Elsukov memset(src, 0, sizeof(*src)); 275f325335cSAndrey V. Elsukov src->sin_family = AF_INET; 276f325335cSAndrey V. Elsukov src->sin_len = sizeof(*src); 277f325335cSAndrey V. Elsukov switch (cmd) { 278f325335cSAndrey V. Elsukov case SIOCGIFPSRCADDR: 279f325335cSAndrey V. Elsukov src->sin_addr = sc->me_src; 280f325335cSAndrey V. Elsukov break; 281f325335cSAndrey V. Elsukov case SIOCGIFPDSTADDR: 282f325335cSAndrey V. Elsukov src->sin_addr = sc->me_dst; 283f325335cSAndrey V. Elsukov break; 284f325335cSAndrey V. Elsukov } 285f325335cSAndrey V. Elsukov error = prison_if(curthread->td_ucred, sintosa(src)); 286f325335cSAndrey V. Elsukov if (error != 0) 287f325335cSAndrey V. Elsukov memset(src, 0, sizeof(*src)); 288f325335cSAndrey V. Elsukov break; 289eccfe69aSAndrey V. Elsukov case SIOCGTUNFIB: 290eccfe69aSAndrey V. Elsukov ifr->ifr_fib = sc->me_fibnum; 291eccfe69aSAndrey V. Elsukov break; 292eccfe69aSAndrey V. Elsukov case SIOCSTUNFIB: 293eccfe69aSAndrey V. Elsukov if ((error = priv_check(curthread, PRIV_NET_GRE)) != 0) 294eccfe69aSAndrey V. Elsukov break; 295eccfe69aSAndrey V. Elsukov if (ifr->ifr_fib >= rt_numfibs) 296eccfe69aSAndrey V. Elsukov error = EINVAL; 297eccfe69aSAndrey V. Elsukov else 298eccfe69aSAndrey V. Elsukov sc->me_fibnum = ifr->ifr_fib; 299eccfe69aSAndrey V. Elsukov break; 300f325335cSAndrey V. Elsukov default: 301f325335cSAndrey V. Elsukov error = EINVAL; 302f325335cSAndrey V. Elsukov break; 303f325335cSAndrey V. Elsukov } 304f325335cSAndrey V. Elsukov end: 305f325335cSAndrey V. Elsukov sx_xunlock(&me_ioctl_sx); 306f325335cSAndrey V. Elsukov return (error); 307f325335cSAndrey V. Elsukov } 308f325335cSAndrey V. Elsukov 309f325335cSAndrey V. Elsukov static int 3102addcba7SAndrey V. Elsukov me_lookup(const struct mbuf *m, int off, int proto, void **arg) 311f325335cSAndrey V. Elsukov { 3122addcba7SAndrey V. Elsukov const struct ip *ip; 313f325335cSAndrey V. Elsukov struct me_softc *sc; 314f325335cSAndrey V. Elsukov 315*6e081509SAndrey V. Elsukov if (V_me_hashtbl == NULL) 316*6e081509SAndrey V. Elsukov return (0); 317*6e081509SAndrey V. Elsukov 3182addcba7SAndrey V. Elsukov MPASS(in_epoch()); 3192addcba7SAndrey V. Elsukov ip = mtod(m, const struct ip *); 3202addcba7SAndrey V. Elsukov CK_LIST_FOREACH(sc, &ME_HASH(ip->ip_dst.s_addr, 3212addcba7SAndrey V. Elsukov ip->ip_src.s_addr), chain) { 3222addcba7SAndrey V. Elsukov if (sc->me_src.s_addr == ip->ip_dst.s_addr && 3232addcba7SAndrey V. Elsukov sc->me_dst.s_addr == ip->ip_src.s_addr) { 324f325335cSAndrey V. Elsukov if ((ME2IFP(sc)->if_flags & IFF_UP) == 0) 325f325335cSAndrey V. Elsukov return (0); 3262addcba7SAndrey V. Elsukov *arg = sc; 3272addcba7SAndrey V. Elsukov return (ENCAP_DRV_LOOKUP); 328f325335cSAndrey V. Elsukov } 3292addcba7SAndrey V. Elsukov } 3302addcba7SAndrey V. Elsukov return (0); 331f325335cSAndrey V. Elsukov } 332f325335cSAndrey V. Elsukov 333f325335cSAndrey V. Elsukov static int 3342addcba7SAndrey V. Elsukov me_set_tunnel(struct me_softc *sc, in_addr_t src, in_addr_t dst) 335f325335cSAndrey V. Elsukov { 3362addcba7SAndrey V. Elsukov struct me_softc *tmp; 337f325335cSAndrey V. Elsukov 338f325335cSAndrey V. Elsukov sx_assert(&me_ioctl_sx, SA_XLOCKED); 3392addcba7SAndrey V. Elsukov 3402addcba7SAndrey V. Elsukov if (V_me_hashtbl == NULL) 3412addcba7SAndrey V. Elsukov V_me_hashtbl = me_hashinit(); 3422addcba7SAndrey V. Elsukov 3432addcba7SAndrey V. Elsukov if (sc->me_src.s_addr == src && sc->me_dst.s_addr == dst) 3442addcba7SAndrey V. Elsukov return (0); 3452addcba7SAndrey V. Elsukov 3462addcba7SAndrey V. Elsukov CK_LIST_FOREACH(tmp, &ME_HASH(src, dst), chain) { 3472addcba7SAndrey V. Elsukov if (tmp == sc) 348f325335cSAndrey V. Elsukov continue; 3492addcba7SAndrey V. Elsukov if (tmp->me_src.s_addr == src && 3502addcba7SAndrey V. Elsukov tmp->me_dst.s_addr == dst) 351f325335cSAndrey V. Elsukov return (EADDRNOTAVAIL); 352f325335cSAndrey V. Elsukov } 353f325335cSAndrey V. Elsukov 3542addcba7SAndrey V. Elsukov me_delete_tunnel(sc); 3552addcba7SAndrey V. Elsukov sc->me_dst.s_addr = dst; 3562addcba7SAndrey V. Elsukov sc->me_src.s_addr = src; 3572addcba7SAndrey V. Elsukov CK_LIST_INSERT_HEAD(&ME_HASH(src, dst), sc, chain); 358f325335cSAndrey V. Elsukov 3592addcba7SAndrey V. Elsukov ME2IFP(sc)->if_drv_flags |= IFF_DRV_RUNNING; 3602addcba7SAndrey V. Elsukov if_link_state_change(ME2IFP(sc), LINK_STATE_UP); 361f325335cSAndrey V. Elsukov return (0); 362f325335cSAndrey V. Elsukov } 363f325335cSAndrey V. Elsukov 364f325335cSAndrey V. Elsukov static void 3652addcba7SAndrey V. Elsukov me_delete_tunnel(struct me_softc *sc) 366f325335cSAndrey V. Elsukov { 367f325335cSAndrey V. Elsukov 368f325335cSAndrey V. Elsukov sx_assert(&me_ioctl_sx, SA_XLOCKED); 3692addcba7SAndrey V. Elsukov if (ME_READY(sc)) { 3702addcba7SAndrey V. Elsukov CK_LIST_REMOVE(sc, chain); 3712addcba7SAndrey V. Elsukov ME_WAIT(); 3722addcba7SAndrey V. Elsukov 373f325335cSAndrey V. Elsukov sc->me_src.s_addr = 0; 374f325335cSAndrey V. Elsukov sc->me_dst.s_addr = 0; 3752addcba7SAndrey V. Elsukov ME2IFP(sc)->if_drv_flags &= ~IFF_DRV_RUNNING; 3762addcba7SAndrey V. Elsukov if_link_state_change(ME2IFP(sc), LINK_STATE_DOWN); 3772addcba7SAndrey V. Elsukov } 378f325335cSAndrey V. Elsukov } 379f325335cSAndrey V. Elsukov 380f325335cSAndrey V. Elsukov static uint16_t 381f325335cSAndrey V. Elsukov me_in_cksum(uint16_t *p, int nwords) 382f325335cSAndrey V. Elsukov { 383f325335cSAndrey V. Elsukov uint32_t sum = 0; 384f325335cSAndrey V. Elsukov 385f325335cSAndrey V. Elsukov while (nwords-- > 0) 386f325335cSAndrey V. Elsukov sum += *p++; 387f325335cSAndrey V. Elsukov sum = (sum >> 16) + (sum & 0xffff); 388f325335cSAndrey V. Elsukov sum += (sum >> 16); 389f325335cSAndrey V. Elsukov return (~sum); 390f325335cSAndrey V. Elsukov } 391f325335cSAndrey V. Elsukov 3926d8fdfa9SAndrey V. Elsukov static int 3936d8fdfa9SAndrey V. Elsukov me_input(struct mbuf *m, int off, int proto, void *arg) 394f325335cSAndrey V. Elsukov { 3956d8fdfa9SAndrey V. Elsukov struct me_softc *sc = arg; 396f325335cSAndrey V. Elsukov struct mobhdr *mh; 397f325335cSAndrey V. Elsukov struct ifnet *ifp; 398f325335cSAndrey V. Elsukov struct ip *ip; 399f325335cSAndrey V. Elsukov int hlen; 400f325335cSAndrey V. Elsukov 401f325335cSAndrey V. Elsukov ifp = ME2IFP(sc); 402f325335cSAndrey V. Elsukov /* checks for short packets */ 403f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr); 404f325335cSAndrey V. Elsukov if (m->m_pkthdr.len < sizeof(struct ip) + hlen) 405f325335cSAndrey V. Elsukov hlen -= sizeof(struct in_addr); 406f325335cSAndrey V. Elsukov if (m->m_len < sizeof(struct ip) + hlen) 407f325335cSAndrey V. Elsukov m = m_pullup(m, sizeof(struct ip) + hlen); 408f325335cSAndrey V. Elsukov if (m == NULL) 409f325335cSAndrey V. Elsukov goto drop; 410f325335cSAndrey V. Elsukov mh = (struct mobhdr *)mtodo(m, sizeof(struct ip)); 411f325335cSAndrey V. Elsukov /* check for wrong flags */ 412f325335cSAndrey V. Elsukov if (mh->mob_flags & (~MOB_FLAGS_SP)) { 413f325335cSAndrey V. Elsukov m_freem(m); 414f325335cSAndrey V. Elsukov goto drop; 415f325335cSAndrey V. Elsukov } 416f325335cSAndrey V. Elsukov if (mh->mob_flags) { 417f325335cSAndrey V. Elsukov if (hlen != sizeof(struct mobhdr)) { 418f325335cSAndrey V. Elsukov m_freem(m); 419f325335cSAndrey V. Elsukov goto drop; 420f325335cSAndrey V. Elsukov } 421f325335cSAndrey V. Elsukov } else 422f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr) - sizeof(struct in_addr); 423f325335cSAndrey V. Elsukov /* check mobile header checksum */ 424f325335cSAndrey V. Elsukov if (me_in_cksum((uint16_t *)mh, hlen / sizeof(uint16_t)) != 0) { 425f325335cSAndrey V. Elsukov m_freem(m); 426f325335cSAndrey V. Elsukov goto drop; 427f325335cSAndrey V. Elsukov } 428f325335cSAndrey V. Elsukov #ifdef MAC 429f325335cSAndrey V. Elsukov mac_ifnet_create_mbuf(ifp, m); 430f325335cSAndrey V. Elsukov #endif 431f325335cSAndrey V. Elsukov ip = mtod(m, struct ip *); 432f325335cSAndrey V. Elsukov ip->ip_dst = mh->mob_dst; 433f325335cSAndrey V. Elsukov ip->ip_p = mh->mob_proto; 434f325335cSAndrey V. Elsukov ip->ip_sum = 0; 435f325335cSAndrey V. Elsukov ip->ip_len = htons(m->m_pkthdr.len - hlen); 436f325335cSAndrey V. Elsukov if (mh->mob_flags) 437f325335cSAndrey V. Elsukov ip->ip_src = mh->mob_src; 438f325335cSAndrey V. Elsukov memmove(mtodo(m, hlen), ip, sizeof(struct ip)); 439f325335cSAndrey V. Elsukov m_adj(m, hlen); 440f325335cSAndrey V. Elsukov m_clrprotoflags(m); 441f325335cSAndrey V. Elsukov m->m_pkthdr.rcvif = ifp; 442f325335cSAndrey V. Elsukov m->m_pkthdr.csum_flags |= (CSUM_IP_CHECKED | CSUM_IP_VALID); 443eccfe69aSAndrey V. Elsukov M_SETFIB(m, ifp->if_fib); 444f325335cSAndrey V. Elsukov hlen = AF_INET; 445f325335cSAndrey V. Elsukov BPF_MTAP2(ifp, &hlen, sizeof(hlen), m); 446f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_IPACKETS, 1); 447f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_IBYTES, m->m_pkthdr.len); 448f325335cSAndrey V. Elsukov if ((ifp->if_flags & IFF_MONITOR) != 0) 449f325335cSAndrey V. Elsukov m_freem(m); 450f325335cSAndrey V. Elsukov else 451f325335cSAndrey V. Elsukov netisr_dispatch(NETISR_IP, m); 452f325335cSAndrey V. Elsukov return (IPPROTO_DONE); 453f325335cSAndrey V. Elsukov drop: 454f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_IERRORS, 1); 455f325335cSAndrey V. Elsukov return (IPPROTO_DONE); 456f325335cSAndrey V. Elsukov } 457f325335cSAndrey V. Elsukov 458f325335cSAndrey V. Elsukov #define MTAG_ME 1414491977 459f325335cSAndrey V. Elsukov static int 460f325335cSAndrey V. Elsukov me_check_nesting(struct ifnet *ifp, struct mbuf *m) 461f325335cSAndrey V. Elsukov { 462f325335cSAndrey V. Elsukov struct m_tag *mtag; 463f325335cSAndrey V. Elsukov int count; 464f325335cSAndrey V. Elsukov 465f325335cSAndrey V. Elsukov count = 1; 466f325335cSAndrey V. Elsukov mtag = NULL; 467b347bc3bSAndrey V. Elsukov while ((mtag = m_tag_locate(m, MTAG_ME, 0, mtag)) != NULL) { 468f325335cSAndrey V. Elsukov if (*(struct ifnet **)(mtag + 1) == ifp) { 469f325335cSAndrey V. Elsukov log(LOG_NOTICE, "%s: loop detected\n", ifp->if_xname); 470f325335cSAndrey V. Elsukov return (EIO); 471f325335cSAndrey V. Elsukov } 472f325335cSAndrey V. Elsukov count++; 473f325335cSAndrey V. Elsukov } 474f325335cSAndrey V. Elsukov if (count > V_max_me_nesting) { 475f325335cSAndrey V. Elsukov log(LOG_NOTICE, 476f325335cSAndrey V. Elsukov "%s: if_output recursively called too many times(%d)\n", 477f325335cSAndrey V. Elsukov ifp->if_xname, count); 478f325335cSAndrey V. Elsukov return (EIO); 479f325335cSAndrey V. Elsukov } 480f325335cSAndrey V. Elsukov mtag = m_tag_alloc(MTAG_ME, 0, sizeof(struct ifnet *), M_NOWAIT); 481f325335cSAndrey V. Elsukov if (mtag == NULL) 482f325335cSAndrey V. Elsukov return (ENOMEM); 483f325335cSAndrey V. Elsukov *(struct ifnet **)(mtag + 1) = ifp; 484f325335cSAndrey V. Elsukov m_tag_prepend(m, mtag); 485f325335cSAndrey V. Elsukov return (0); 486f325335cSAndrey V. Elsukov } 487f325335cSAndrey V. Elsukov 488f325335cSAndrey V. Elsukov static int 489f325335cSAndrey V. Elsukov me_output(struct ifnet *ifp, struct mbuf *m, const struct sockaddr *dst, 4902addcba7SAndrey V. Elsukov struct route *ro __unused) 491f325335cSAndrey V. Elsukov { 492f325335cSAndrey V. Elsukov uint32_t af; 4932addcba7SAndrey V. Elsukov 4942addcba7SAndrey V. Elsukov if (dst->sa_family == AF_UNSPEC) 4952addcba7SAndrey V. Elsukov bcopy(dst->sa_data, &af, sizeof(af)); 4962addcba7SAndrey V. Elsukov else 4972addcba7SAndrey V. Elsukov af = dst->sa_family; 4982addcba7SAndrey V. Elsukov m->m_pkthdr.csum_data = af; 4992addcba7SAndrey V. Elsukov return (ifp->if_transmit(ifp, m)); 5002addcba7SAndrey V. Elsukov } 5012addcba7SAndrey V. Elsukov 5022addcba7SAndrey V. Elsukov static int 5032addcba7SAndrey V. Elsukov me_transmit(struct ifnet *ifp, struct mbuf *m) 5042addcba7SAndrey V. Elsukov { 5052addcba7SAndrey V. Elsukov struct mobhdr mh; 5062addcba7SAndrey V. Elsukov struct me_softc *sc; 5072addcba7SAndrey V. Elsukov struct ip *ip; 5082addcba7SAndrey V. Elsukov uint32_t af; 5092addcba7SAndrey V. Elsukov int error, hlen, plen; 510f325335cSAndrey V. Elsukov 511f325335cSAndrey V. Elsukov #ifdef MAC 512f325335cSAndrey V. Elsukov error = mac_ifnet_check_transmit(ifp, m); 513f325335cSAndrey V. Elsukov if (error != 0) 514f325335cSAndrey V. Elsukov goto drop; 515f325335cSAndrey V. Elsukov #endif 516f325335cSAndrey V. Elsukov error = ENETDOWN; 5172addcba7SAndrey V. Elsukov ME_RLOCK(); 5182addcba7SAndrey V. Elsukov sc = ifp->if_softc; 5192addcba7SAndrey V. Elsukov if (sc == NULL || !ME_READY(sc) || 5202addcba7SAndrey V. Elsukov (ifp->if_flags & IFF_MONITOR) != 0 || 5212addcba7SAndrey V. Elsukov (ifp->if_flags & IFF_UP) == 0 || 5222addcba7SAndrey V. Elsukov (error = me_check_nesting(ifp, m) != 0)) { 5232addcba7SAndrey V. Elsukov m_freem(m); 524f325335cSAndrey V. Elsukov goto drop; 525f325335cSAndrey V. Elsukov } 5262addcba7SAndrey V. Elsukov af = m->m_pkthdr.csum_data; 527f325335cSAndrey V. Elsukov if (af != AF_INET) { 528f325335cSAndrey V. Elsukov error = EAFNOSUPPORT; 529f325335cSAndrey V. Elsukov m_freem(m); 530f325335cSAndrey V. Elsukov goto drop; 531f325335cSAndrey V. Elsukov } 532f325335cSAndrey V. Elsukov if (m->m_len < sizeof(struct ip)) 533f325335cSAndrey V. Elsukov m = m_pullup(m, sizeof(struct ip)); 534f325335cSAndrey V. Elsukov if (m == NULL) { 535f325335cSAndrey V. Elsukov error = ENOBUFS; 536f325335cSAndrey V. Elsukov goto drop; 537f325335cSAndrey V. Elsukov } 538f325335cSAndrey V. Elsukov ip = mtod(m, struct ip *); 539f325335cSAndrey V. Elsukov /* Fragmented datagramms shouldn't be encapsulated */ 540f325335cSAndrey V. Elsukov if (ip->ip_off & htons(IP_MF | IP_OFFMASK)) { 541f325335cSAndrey V. Elsukov error = EINVAL; 542f325335cSAndrey V. Elsukov m_freem(m); 543f325335cSAndrey V. Elsukov goto drop; 544f325335cSAndrey V. Elsukov } 545f325335cSAndrey V. Elsukov mh.mob_proto = ip->ip_p; 546f325335cSAndrey V. Elsukov mh.mob_src = ip->ip_src; 547f325335cSAndrey V. Elsukov mh.mob_dst = ip->ip_dst; 548f325335cSAndrey V. Elsukov if (in_hosteq(sc->me_src, ip->ip_src)) { 549f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr) - sizeof(struct in_addr); 550f325335cSAndrey V. Elsukov mh.mob_flags = 0; 551f325335cSAndrey V. Elsukov } else { 552f325335cSAndrey V. Elsukov hlen = sizeof(struct mobhdr); 553f325335cSAndrey V. Elsukov mh.mob_flags = MOB_FLAGS_SP; 554f325335cSAndrey V. Elsukov } 5559597ff83SAndrey V. Elsukov BPF_MTAP2(ifp, &af, sizeof(af), m); 556f325335cSAndrey V. Elsukov plen = m->m_pkthdr.len; 557f325335cSAndrey V. Elsukov ip->ip_src = sc->me_src; 558f325335cSAndrey V. Elsukov ip->ip_dst = sc->me_dst; 5592addcba7SAndrey V. Elsukov m->m_flags &= ~(M_BCAST|M_MCAST); 560f325335cSAndrey V. Elsukov M_SETFIB(m, sc->me_fibnum); 561f325335cSAndrey V. Elsukov M_PREPEND(m, hlen, M_NOWAIT); 562f325335cSAndrey V. Elsukov if (m == NULL) { 563f325335cSAndrey V. Elsukov error = ENOBUFS; 564f325335cSAndrey V. Elsukov goto drop; 565f325335cSAndrey V. Elsukov } 566f325335cSAndrey V. Elsukov if (m->m_len < sizeof(struct ip) + hlen) 567f325335cSAndrey V. Elsukov m = m_pullup(m, sizeof(struct ip) + hlen); 568f325335cSAndrey V. Elsukov if (m == NULL) { 569f325335cSAndrey V. Elsukov error = ENOBUFS; 570f325335cSAndrey V. Elsukov goto drop; 571f325335cSAndrey V. Elsukov } 572f325335cSAndrey V. Elsukov memmove(mtod(m, void *), mtodo(m, hlen), sizeof(struct ip)); 573f325335cSAndrey V. Elsukov ip = mtod(m, struct ip *); 574f325335cSAndrey V. Elsukov ip->ip_len = htons(m->m_pkthdr.len); 575f325335cSAndrey V. Elsukov ip->ip_p = IPPROTO_MOBILE; 576f325335cSAndrey V. Elsukov ip->ip_sum = 0; 577f325335cSAndrey V. Elsukov mh.mob_csum = 0; 578f325335cSAndrey V. Elsukov mh.mob_csum = me_in_cksum((uint16_t *)&mh, hlen / sizeof(uint16_t)); 579f325335cSAndrey V. Elsukov bcopy(&mh, mtodo(m, sizeof(struct ip)), hlen); 580f325335cSAndrey V. Elsukov error = ip_output(m, NULL, NULL, IP_FORWARDING, NULL, NULL); 581f325335cSAndrey V. Elsukov drop: 582f325335cSAndrey V. Elsukov if (error) 583f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_OERRORS, 1); 584f325335cSAndrey V. Elsukov else { 585f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_OPACKETS, 1); 586f325335cSAndrey V. Elsukov if_inc_counter(ifp, IFCOUNTER_OBYTES, plen); 587f325335cSAndrey V. Elsukov } 5882addcba7SAndrey V. Elsukov ME_RUNLOCK(); 589f325335cSAndrey V. Elsukov return (error); 590f325335cSAndrey V. Elsukov } 591f325335cSAndrey V. Elsukov 592f325335cSAndrey V. Elsukov static void 593f325335cSAndrey V. Elsukov me_qflush(struct ifnet *ifp __unused) 594f325335cSAndrey V. Elsukov { 595f325335cSAndrey V. Elsukov 596f325335cSAndrey V. Elsukov } 597f325335cSAndrey V. Elsukov 5982addcba7SAndrey V. Elsukov static const struct encaptab *ecookie = NULL; 5992addcba7SAndrey V. Elsukov static const struct encap_config me_encap_cfg = { 6002addcba7SAndrey V. Elsukov .proto = IPPROTO_MOBILE, 6012addcba7SAndrey V. Elsukov .min_length = sizeof(struct ip) + sizeof(struct mobhdr) - 6022addcba7SAndrey V. Elsukov sizeof(in_addr_t), 6032addcba7SAndrey V. Elsukov .exact_match = ENCAP_DRV_LOOKUP, 6042addcba7SAndrey V. Elsukov .lookup = me_lookup, 6052addcba7SAndrey V. Elsukov .input = me_input 6062addcba7SAndrey V. Elsukov }; 6072addcba7SAndrey V. Elsukov 608f325335cSAndrey V. Elsukov static int 609f325335cSAndrey V. Elsukov memodevent(module_t mod, int type, void *data) 610f325335cSAndrey V. Elsukov { 611f325335cSAndrey V. Elsukov 612f325335cSAndrey V. Elsukov switch (type) { 613f325335cSAndrey V. Elsukov case MOD_LOAD: 6142addcba7SAndrey V. Elsukov ecookie = ip_encap_attach(&me_encap_cfg, NULL, M_WAITOK); 6152addcba7SAndrey V. Elsukov break; 616f325335cSAndrey V. Elsukov case MOD_UNLOAD: 6172addcba7SAndrey V. Elsukov ip_encap_detach(ecookie); 618f325335cSAndrey V. Elsukov break; 619f325335cSAndrey V. Elsukov default: 620f325335cSAndrey V. Elsukov return (EOPNOTSUPP); 621f325335cSAndrey V. Elsukov } 622f325335cSAndrey V. Elsukov return (0); 623f325335cSAndrey V. Elsukov } 624f325335cSAndrey V. Elsukov 625f325335cSAndrey V. Elsukov static moduledata_t me_mod = { 626f325335cSAndrey V. Elsukov "if_me", 627f325335cSAndrey V. Elsukov memodevent, 628f325335cSAndrey V. Elsukov 0 629f325335cSAndrey V. Elsukov }; 630f325335cSAndrey V. Elsukov 631f325335cSAndrey V. Elsukov DECLARE_MODULE(if_me, me_mod, SI_SUB_PSEUDO, SI_ORDER_ANY); 632f325335cSAndrey V. Elsukov MODULE_VERSION(if_me, 1); 633