19d40cf60SHans Petter Selasky /*- 29d40cf60SHans Petter Selasky * Copyright (c) 2020 Mellanox Technologies. All rights reserved. 39d40cf60SHans Petter Selasky * 49d40cf60SHans Petter Selasky * Redistribution and use in source and binary forms, with or without 59d40cf60SHans Petter Selasky * modification, are permitted provided that the following conditions 69d40cf60SHans Petter Selasky * are met: 79d40cf60SHans Petter Selasky * 1. Redistributions of source code must retain the above copyright 89d40cf60SHans Petter Selasky * notice, this list of conditions and the following disclaimer. 99d40cf60SHans Petter Selasky * 2. Redistributions in binary form must reproduce the above copyright 109d40cf60SHans Petter Selasky * notice, this list of conditions and the following disclaimer in the 119d40cf60SHans Petter Selasky * documentation and/or other materials provided with the distribution. 129d40cf60SHans Petter Selasky * 139d40cf60SHans Petter Selasky * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS `AS IS' AND 149d40cf60SHans Petter Selasky * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 159d40cf60SHans Petter Selasky * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 169d40cf60SHans Petter Selasky * ARE DISCLAIMED. IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE 179d40cf60SHans Petter Selasky * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 189d40cf60SHans Petter Selasky * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 199d40cf60SHans Petter Selasky * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 209d40cf60SHans Petter Selasky * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 219d40cf60SHans Petter Selasky * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 229d40cf60SHans Petter Selasky * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 239d40cf60SHans Petter Selasky * SUCH DAMAGE. 249d40cf60SHans Petter Selasky */ 259d40cf60SHans Petter Selasky 269d40cf60SHans Petter Selasky #include "opt_inet.h" 279d40cf60SHans Petter Selasky #include "opt_inet6.h" 289d40cf60SHans Petter Selasky 299d40cf60SHans Petter Selasky #include <sys/cdefs.h> 309d40cf60SHans Petter Selasky __FBSDID("$FreeBSD$"); 319d40cf60SHans Petter Selasky 32ce329aa2SHans Petter Selasky #include <sys/param.h> 331d3a22e7SHans Petter Selasky #include <sys/systm.h> 3401630a49SHans Petter Selasky #include <sys/devctl.h> 359d40cf60SHans Petter Selasky #include <sys/eventhandler.h> 3601630a49SHans Petter Selasky #include <sys/kernel.h> 3701630a49SHans Petter Selasky #include <sys/mbuf.h> 3801630a49SHans Petter Selasky #include <sys/module.h> 399d40cf60SHans Petter Selasky #include <sys/socket.h> 409d40cf60SHans Petter Selasky #include <sys/sysctl.h> 419d40cf60SHans Petter Selasky 4201630a49SHans Petter Selasky #include <net/bpf.h> 439d40cf60SHans Petter Selasky #include <net/ethernet.h> 449d40cf60SHans Petter Selasky #include <net/infiniband.h> 4501630a49SHans Petter Selasky #include <net/if.h> 4601630a49SHans Petter Selasky #include <net/if_var.h> 479d40cf60SHans Petter Selasky #include <net/if_dl.h> 489d40cf60SHans Petter Selasky #include <net/if_media.h> 49a92c4bb6SHans Petter Selasky #include <net/if_lagg.h> 5001630a49SHans Petter Selasky #include <net/if_llatbl.h> 5101630a49SHans Petter Selasky #include <net/if_types.h> 5201630a49SHans Petter Selasky #include <net/netisr.h> 5301630a49SHans Petter Selasky #include <net/route.h> 549d40cf60SHans Petter Selasky #include <netinet/if_ether.h> 5501630a49SHans Petter Selasky #include <netinet/in.h> 569d40cf60SHans Petter Selasky #include <netinet/ip6.h> 579d40cf60SHans Petter Selasky #include <netinet6/in6_var.h> 589d40cf60SHans Petter Selasky #include <netinet6/nd6.h> 599d40cf60SHans Petter Selasky 609d40cf60SHans Petter Selasky #include <security/mac/mac_framework.h> 619d40cf60SHans Petter Selasky 62a92c4bb6SHans Petter Selasky /* if_lagg(4) support */ 63a92c4bb6SHans Petter Selasky struct mbuf *(*lagg_input_infiniband_p)(struct ifnet *, struct mbuf *); 64a92c4bb6SHans Petter Selasky 659d40cf60SHans Petter Selasky #ifdef INET 669d40cf60SHans Petter Selasky static inline void 671355e2dcSHans Petter Selasky infiniband_ipv4_multicast_map(uint32_t addr, 681355e2dcSHans Petter Selasky const uint8_t *broadcast, uint8_t *buf) 699d40cf60SHans Petter Selasky { 709d40cf60SHans Petter Selasky uint8_t scope; 719d40cf60SHans Petter Selasky 729d40cf60SHans Petter Selasky addr = ntohl(addr); 739d40cf60SHans Petter Selasky scope = broadcast[5] & 0xF; 749d40cf60SHans Petter Selasky 759d40cf60SHans Petter Selasky buf[0] = 0; 769d40cf60SHans Petter Selasky buf[1] = 0xff; 779d40cf60SHans Petter Selasky buf[2] = 0xff; 789d40cf60SHans Petter Selasky buf[3] = 0xff; 799d40cf60SHans Petter Selasky buf[4] = 0xff; 809d40cf60SHans Petter Selasky buf[5] = 0x10 | scope; 819d40cf60SHans Petter Selasky buf[6] = 0x40; 829d40cf60SHans Petter Selasky buf[7] = 0x1b; 839d40cf60SHans Petter Selasky buf[8] = broadcast[8]; 849d40cf60SHans Petter Selasky buf[9] = broadcast[9]; 859d40cf60SHans Petter Selasky buf[10] = 0; 869d40cf60SHans Petter Selasky buf[11] = 0; 879d40cf60SHans Petter Selasky buf[12] = 0; 889d40cf60SHans Petter Selasky buf[13] = 0; 899d40cf60SHans Petter Selasky buf[14] = 0; 909d40cf60SHans Petter Selasky buf[15] = 0; 919d40cf60SHans Petter Selasky buf[16] = (addr >> 24) & 0xff; 929d40cf60SHans Petter Selasky buf[17] = (addr >> 16) & 0xff; 939d40cf60SHans Petter Selasky buf[18] = (addr >> 8) & 0xff; 949d40cf60SHans Petter Selasky buf[19] = addr & 0xff; 959d40cf60SHans Petter Selasky } 969d40cf60SHans Petter Selasky #endif 979d40cf60SHans Petter Selasky 989d40cf60SHans Petter Selasky #ifdef INET6 999d40cf60SHans Petter Selasky static inline void 1001355e2dcSHans Petter Selasky infiniband_ipv6_multicast_map(const struct in6_addr *addr, 1011355e2dcSHans Petter Selasky const uint8_t *broadcast, uint8_t *buf) 1029d40cf60SHans Petter Selasky { 1039d40cf60SHans Petter Selasky uint8_t scope; 1049d40cf60SHans Petter Selasky 1059d40cf60SHans Petter Selasky scope = broadcast[5] & 0xF; 1069d40cf60SHans Petter Selasky 1079d40cf60SHans Petter Selasky buf[0] = 0; 1089d40cf60SHans Petter Selasky buf[1] = 0xff; 1099d40cf60SHans Petter Selasky buf[2] = 0xff; 1109d40cf60SHans Petter Selasky buf[3] = 0xff; 1119d40cf60SHans Petter Selasky buf[4] = 0xff; 1129d40cf60SHans Petter Selasky buf[5] = 0x10 | scope; 1139d40cf60SHans Petter Selasky buf[6] = 0x60; 1149d40cf60SHans Petter Selasky buf[7] = 0x1b; 1159d40cf60SHans Petter Selasky buf[8] = broadcast[8]; 1169d40cf60SHans Petter Selasky buf[9] = broadcast[9]; 1179d40cf60SHans Petter Selasky memcpy(&buf[10], &addr->s6_addr[6], 10); 1189d40cf60SHans Petter Selasky } 1199d40cf60SHans Petter Selasky #endif 1209d40cf60SHans Petter Selasky 1219d40cf60SHans Petter Selasky /* 1229d40cf60SHans Petter Selasky * This is for clients that have an infiniband_header in the mbuf. 1239d40cf60SHans Petter Selasky */ 1249d40cf60SHans Petter Selasky void 1259d40cf60SHans Petter Selasky infiniband_bpf_mtap(struct ifnet *ifp, struct mbuf *mb) 1269d40cf60SHans Petter Selasky { 1279d40cf60SHans Petter Selasky struct infiniband_header *ibh; 1289d40cf60SHans Petter Selasky struct ether_header eh; 1299d40cf60SHans Petter Selasky 1309d40cf60SHans Petter Selasky if (mb->m_len < sizeof(*ibh)) 1319d40cf60SHans Petter Selasky return; 1329d40cf60SHans Petter Selasky 1339d40cf60SHans Petter Selasky ibh = mtod(mb, struct infiniband_header *); 1349d40cf60SHans Petter Selasky eh.ether_type = ibh->ib_protocol; 1359d40cf60SHans Petter Selasky memset(eh.ether_shost, 0, ETHER_ADDR_LEN); 1369d40cf60SHans Petter Selasky memcpy(eh.ether_dhost, ibh->ib_hwaddr + 4, ETHER_ADDR_LEN); 1379d40cf60SHans Petter Selasky mb->m_data += sizeof(*ibh); 1389d40cf60SHans Petter Selasky mb->m_len -= sizeof(*ibh); 1399d40cf60SHans Petter Selasky mb->m_pkthdr.len -= sizeof(*ibh); 1409d40cf60SHans Petter Selasky bpf_mtap2(ifp->if_bpf, &eh, sizeof(eh), mb); 1419d40cf60SHans Petter Selasky mb->m_data -= sizeof(*ibh); 1429d40cf60SHans Petter Selasky mb->m_len += sizeof(*ibh); 1439d40cf60SHans Petter Selasky mb->m_pkthdr.len += sizeof(*ibh); 1449d40cf60SHans Petter Selasky } 1459d40cf60SHans Petter Selasky 146*ec52ff6dSHans Petter Selasky static void 147*ec52ff6dSHans Petter Selasky update_mbuf_csumflags(struct mbuf *src, struct mbuf *dst) 148*ec52ff6dSHans Petter Selasky { 149*ec52ff6dSHans Petter Selasky int csum_flags = 0; 150*ec52ff6dSHans Petter Selasky 151*ec52ff6dSHans Petter Selasky if (src->m_pkthdr.csum_flags & CSUM_IP) 152*ec52ff6dSHans Petter Selasky csum_flags |= (CSUM_IP_CHECKED|CSUM_IP_VALID); 153*ec52ff6dSHans Petter Selasky if (src->m_pkthdr.csum_flags & CSUM_DELAY_DATA) 154*ec52ff6dSHans Petter Selasky csum_flags |= (CSUM_DATA_VALID|CSUM_PSEUDO_HDR); 155*ec52ff6dSHans Petter Selasky if (src->m_pkthdr.csum_flags & CSUM_SCTP) 156*ec52ff6dSHans Petter Selasky csum_flags |= CSUM_SCTP_VALID; 157*ec52ff6dSHans Petter Selasky dst->m_pkthdr.csum_flags |= csum_flags; 158*ec52ff6dSHans Petter Selasky if (csum_flags & CSUM_DATA_VALID) 159*ec52ff6dSHans Petter Selasky dst->m_pkthdr.csum_data = 0xffff; 160*ec52ff6dSHans Petter Selasky } 161*ec52ff6dSHans Petter Selasky 162*ec52ff6dSHans Petter Selasky /* 163*ec52ff6dSHans Petter Selasky * Handle link-layer encapsulation requests. 164*ec52ff6dSHans Petter Selasky */ 165*ec52ff6dSHans Petter Selasky static int 166*ec52ff6dSHans Petter Selasky infiniband_requestencap(struct ifnet *ifp, struct if_encap_req *req) 167*ec52ff6dSHans Petter Selasky { 168*ec52ff6dSHans Petter Selasky struct infiniband_header *ih; 169*ec52ff6dSHans Petter Selasky struct arphdr *ah; 170*ec52ff6dSHans Petter Selasky uint16_t etype; 171*ec52ff6dSHans Petter Selasky const uint8_t *lladdr; 172*ec52ff6dSHans Petter Selasky 173*ec52ff6dSHans Petter Selasky if (req->rtype != IFENCAP_LL) 174*ec52ff6dSHans Petter Selasky return (EOPNOTSUPP); 175*ec52ff6dSHans Petter Selasky 176*ec52ff6dSHans Petter Selasky if (req->bufsize < INFINIBAND_HDR_LEN) 177*ec52ff6dSHans Petter Selasky return (ENOMEM); 178*ec52ff6dSHans Petter Selasky 179*ec52ff6dSHans Petter Selasky ih = (struct infiniband_header *)req->buf; 180*ec52ff6dSHans Petter Selasky lladdr = req->lladdr; 181*ec52ff6dSHans Petter Selasky req->lladdr_off = 0; 182*ec52ff6dSHans Petter Selasky 183*ec52ff6dSHans Petter Selasky switch (req->family) { 184*ec52ff6dSHans Petter Selasky case AF_INET: 185*ec52ff6dSHans Petter Selasky etype = htons(ETHERTYPE_IP); 186*ec52ff6dSHans Petter Selasky break; 187*ec52ff6dSHans Petter Selasky case AF_INET6: 188*ec52ff6dSHans Petter Selasky etype = htons(ETHERTYPE_IPV6); 189*ec52ff6dSHans Petter Selasky break; 190*ec52ff6dSHans Petter Selasky case AF_ARP: 191*ec52ff6dSHans Petter Selasky ah = (struct arphdr *)req->hdata; 192*ec52ff6dSHans Petter Selasky ah->ar_hrd = htons(ARPHRD_INFINIBAND); 193*ec52ff6dSHans Petter Selasky 194*ec52ff6dSHans Petter Selasky switch (ntohs(ah->ar_op)) { 195*ec52ff6dSHans Petter Selasky case ARPOP_REVREQUEST: 196*ec52ff6dSHans Petter Selasky case ARPOP_REVREPLY: 197*ec52ff6dSHans Petter Selasky etype = htons(ETHERTYPE_REVARP); 198*ec52ff6dSHans Petter Selasky break; 199*ec52ff6dSHans Petter Selasky case ARPOP_REQUEST: 200*ec52ff6dSHans Petter Selasky case ARPOP_REPLY: 201*ec52ff6dSHans Petter Selasky default: 202*ec52ff6dSHans Petter Selasky etype = htons(ETHERTYPE_ARP); 203*ec52ff6dSHans Petter Selasky break; 204*ec52ff6dSHans Petter Selasky } 205*ec52ff6dSHans Petter Selasky 206*ec52ff6dSHans Petter Selasky if (req->flags & IFENCAP_FLAG_BROADCAST) 207*ec52ff6dSHans Petter Selasky lladdr = ifp->if_broadcastaddr; 208*ec52ff6dSHans Petter Selasky break; 209*ec52ff6dSHans Petter Selasky default: 210*ec52ff6dSHans Petter Selasky return (EAFNOSUPPORT); 211*ec52ff6dSHans Petter Selasky } 212*ec52ff6dSHans Petter Selasky 213*ec52ff6dSHans Petter Selasky ih->ib_protocol = etype; 214*ec52ff6dSHans Petter Selasky ih->ib_reserved = 0; 215*ec52ff6dSHans Petter Selasky memcpy(ih->ib_hwaddr, lladdr, INFINIBAND_ADDR_LEN); 216*ec52ff6dSHans Petter Selasky req->bufsize = sizeof(struct infiniband_header); 217*ec52ff6dSHans Petter Selasky 218*ec52ff6dSHans Petter Selasky return (0); 219*ec52ff6dSHans Petter Selasky } 220*ec52ff6dSHans Petter Selasky 221*ec52ff6dSHans Petter Selasky static int 222*ec52ff6dSHans Petter Selasky infiniband_resolve_addr(struct ifnet *ifp, struct mbuf *m, 223*ec52ff6dSHans Petter Selasky const struct sockaddr *dst, struct route *ro, uint8_t *phdr, 224*ec52ff6dSHans Petter Selasky uint32_t *pflags, struct llentry **plle) 225*ec52ff6dSHans Petter Selasky { 226*ec52ff6dSHans Petter Selasky struct infiniband_header *ih; 227*ec52ff6dSHans Petter Selasky uint32_t lleflags = 0; 228*ec52ff6dSHans Petter Selasky int error = 0; 229*ec52ff6dSHans Petter Selasky 230*ec52ff6dSHans Petter Selasky if (plle) 231*ec52ff6dSHans Petter Selasky *plle = NULL; 232*ec52ff6dSHans Petter Selasky ih = (struct infiniband_header *)phdr; 233*ec52ff6dSHans Petter Selasky 234*ec52ff6dSHans Petter Selasky switch (dst->sa_family) { 235*ec52ff6dSHans Petter Selasky #ifdef INET 236*ec52ff6dSHans Petter Selasky case AF_INET: 237*ec52ff6dSHans Petter Selasky if ((m->m_flags & (M_BCAST | M_MCAST)) == 0) { 238*ec52ff6dSHans Petter Selasky error = arpresolve(ifp, 0, m, dst, phdr, &lleflags, plle); 239*ec52ff6dSHans Petter Selasky } else { 240*ec52ff6dSHans Petter Selasky if (m->m_flags & M_BCAST) { 241*ec52ff6dSHans Petter Selasky memcpy(ih->ib_hwaddr, ifp->if_broadcastaddr, 242*ec52ff6dSHans Petter Selasky INFINIBAND_ADDR_LEN); 243*ec52ff6dSHans Petter Selasky } else { 244*ec52ff6dSHans Petter Selasky infiniband_ipv4_multicast_map( 245*ec52ff6dSHans Petter Selasky ((const struct sockaddr_in *)dst)->sin_addr.s_addr, 246*ec52ff6dSHans Petter Selasky ifp->if_broadcastaddr, ih->ib_hwaddr); 247*ec52ff6dSHans Petter Selasky } 248*ec52ff6dSHans Petter Selasky ih->ib_protocol = htons(ETHERTYPE_IP); 249*ec52ff6dSHans Petter Selasky ih->ib_reserved = 0; 250*ec52ff6dSHans Petter Selasky } 251*ec52ff6dSHans Petter Selasky break; 252*ec52ff6dSHans Petter Selasky #endif 253*ec52ff6dSHans Petter Selasky #ifdef INET6 254*ec52ff6dSHans Petter Selasky case AF_INET6: 255*ec52ff6dSHans Petter Selasky if ((m->m_flags & M_MCAST) == 0) { 256*ec52ff6dSHans Petter Selasky error = nd6_resolve(ifp, 0, m, dst, phdr, &lleflags, plle); 257*ec52ff6dSHans Petter Selasky } else { 258*ec52ff6dSHans Petter Selasky infiniband_ipv6_multicast_map( 259*ec52ff6dSHans Petter Selasky &((const struct sockaddr_in6 *)dst)->sin6_addr, 260*ec52ff6dSHans Petter Selasky ifp->if_broadcastaddr, ih->ib_hwaddr); 261*ec52ff6dSHans Petter Selasky ih->ib_protocol = htons(ETHERTYPE_IPV6); 262*ec52ff6dSHans Petter Selasky ih->ib_reserved = 0; 263*ec52ff6dSHans Petter Selasky } 264*ec52ff6dSHans Petter Selasky break; 265*ec52ff6dSHans Petter Selasky #endif 266*ec52ff6dSHans Petter Selasky default: 267*ec52ff6dSHans Petter Selasky if_printf(ifp, "can't handle af%d\n", dst->sa_family); 268*ec52ff6dSHans Petter Selasky if (m != NULL) 269*ec52ff6dSHans Petter Selasky m_freem(m); 270*ec52ff6dSHans Petter Selasky return (EAFNOSUPPORT); 271*ec52ff6dSHans Petter Selasky } 272*ec52ff6dSHans Petter Selasky 273*ec52ff6dSHans Petter Selasky if (error == EHOSTDOWN) { 274*ec52ff6dSHans Petter Selasky if (ro != NULL && (ro->ro_flags & RT_HAS_GW) != 0) 275*ec52ff6dSHans Petter Selasky error = EHOSTUNREACH; 276*ec52ff6dSHans Petter Selasky } 277*ec52ff6dSHans Petter Selasky 278*ec52ff6dSHans Petter Selasky if (error != 0) 279*ec52ff6dSHans Petter Selasky return (error); 280*ec52ff6dSHans Petter Selasky 281*ec52ff6dSHans Petter Selasky *pflags = RT_MAY_LOOP; 282*ec52ff6dSHans Petter Selasky if (lleflags & LLE_IFADDR) 283*ec52ff6dSHans Petter Selasky *pflags |= RT_L2_ME; 284*ec52ff6dSHans Petter Selasky 285*ec52ff6dSHans Petter Selasky return (0); 286*ec52ff6dSHans Petter Selasky } 287*ec52ff6dSHans Petter Selasky 2889d40cf60SHans Petter Selasky /* 2899d40cf60SHans Petter Selasky * Infiniband output routine. 2909d40cf60SHans Petter Selasky */ 2919d40cf60SHans Petter Selasky static int 292*ec52ff6dSHans Petter Selasky infiniband_output(struct ifnet *ifp, struct mbuf *m, 293*ec52ff6dSHans Petter Selasky const struct sockaddr *dst, struct route *ro) 2949d40cf60SHans Petter Selasky { 295*ec52ff6dSHans Petter Selasky uint8_t linkhdr[INFINIBAND_HDR_LEN]; 296*ec52ff6dSHans Petter Selasky uint8_t *phdr; 2979d40cf60SHans Petter Selasky #if defined(INET) || defined(INET6) 2989d40cf60SHans Petter Selasky struct llentry *lle = NULL; 2999d40cf60SHans Petter Selasky #endif 300*ec52ff6dSHans Petter Selasky struct infiniband_header *ih; 3019d40cf60SHans Petter Selasky int error = 0; 302*ec52ff6dSHans Petter Selasky int hlen; /* link layer header length */ 303*ec52ff6dSHans Petter Selasky uint32_t pflags; 304*ec52ff6dSHans Petter Selasky bool addref; 3059d40cf60SHans Petter Selasky 3069d40cf60SHans Petter Selasky NET_EPOCH_ASSERT(); 3079d40cf60SHans Petter Selasky 308*ec52ff6dSHans Petter Selasky addref = false; 309*ec52ff6dSHans Petter Selasky phdr = NULL; 310*ec52ff6dSHans Petter Selasky pflags = 0; 311*ec52ff6dSHans Petter Selasky if (ro != NULL) { 312*ec52ff6dSHans Petter Selasky /* XXX BPF uses ro_prepend */ 313*ec52ff6dSHans Petter Selasky if (ro->ro_prepend != NULL) { 314*ec52ff6dSHans Petter Selasky phdr = ro->ro_prepend; 315*ec52ff6dSHans Petter Selasky hlen = ro->ro_plen; 316*ec52ff6dSHans Petter Selasky } else if (!(m->m_flags & (M_BCAST | M_MCAST))) { 317*ec52ff6dSHans Petter Selasky if ((ro->ro_flags & RT_LLE_CACHE) != 0) { 318*ec52ff6dSHans Petter Selasky lle = ro->ro_lle; 319*ec52ff6dSHans Petter Selasky if (lle != NULL && 320*ec52ff6dSHans Petter Selasky (lle->la_flags & LLE_VALID) == 0) { 321*ec52ff6dSHans Petter Selasky LLE_FREE(lle); 322*ec52ff6dSHans Petter Selasky lle = NULL; /* redundant */ 323*ec52ff6dSHans Petter Selasky ro->ro_lle = NULL; 324*ec52ff6dSHans Petter Selasky } 325*ec52ff6dSHans Petter Selasky if (lle == NULL) { 326*ec52ff6dSHans Petter Selasky /* if we lookup, keep cache */ 327*ec52ff6dSHans Petter Selasky addref = 1; 328*ec52ff6dSHans Petter Selasky } else 329*ec52ff6dSHans Petter Selasky /* 330*ec52ff6dSHans Petter Selasky * Notify LLE code that 331*ec52ff6dSHans Petter Selasky * the entry was used 332*ec52ff6dSHans Petter Selasky * by datapath. 333*ec52ff6dSHans Petter Selasky */ 334*ec52ff6dSHans Petter Selasky llentry_mark_used(lle); 335*ec52ff6dSHans Petter Selasky } 336*ec52ff6dSHans Petter Selasky if (lle != NULL) { 337*ec52ff6dSHans Petter Selasky phdr = lle->r_linkdata; 338*ec52ff6dSHans Petter Selasky hlen = lle->r_hdrlen; 339*ec52ff6dSHans Petter Selasky pflags = lle->r_flags; 340*ec52ff6dSHans Petter Selasky } 341*ec52ff6dSHans Petter Selasky } 342*ec52ff6dSHans Petter Selasky } 3439d40cf60SHans Petter Selasky 3449d40cf60SHans Petter Selasky #ifdef MAC 3459d40cf60SHans Petter Selasky error = mac_ifnet_check_transmit(ifp, m); 3469d40cf60SHans Petter Selasky if (error) 3479d40cf60SHans Petter Selasky goto bad; 3489d40cf60SHans Petter Selasky #endif 3499d40cf60SHans Petter Selasky 3509d40cf60SHans Petter Selasky M_PROFILE(m); 3519d40cf60SHans Petter Selasky if (ifp->if_flags & IFF_MONITOR) { 3529d40cf60SHans Petter Selasky error = ENETDOWN; 3539d40cf60SHans Petter Selasky goto bad; 3549d40cf60SHans Petter Selasky } 3559d40cf60SHans Petter Selasky if (!((ifp->if_flags & IFF_UP) && 3569d40cf60SHans Petter Selasky (ifp->if_drv_flags & IFF_DRV_RUNNING))) { 3579d40cf60SHans Petter Selasky error = ENETDOWN; 3589d40cf60SHans Petter Selasky goto bad; 3599d40cf60SHans Petter Selasky } 3609d40cf60SHans Petter Selasky 361*ec52ff6dSHans Petter Selasky if (phdr == NULL) { 362*ec52ff6dSHans Petter Selasky /* No prepend data supplied. Try to calculate ourselves. */ 363*ec52ff6dSHans Petter Selasky phdr = linkhdr; 364*ec52ff6dSHans Petter Selasky hlen = INFINIBAND_HDR_LEN; 365*ec52ff6dSHans Petter Selasky error = infiniband_resolve_addr(ifp, m, dst, ro, phdr, &pflags, 366*ec52ff6dSHans Petter Selasky addref ? &lle : NULL); 367*ec52ff6dSHans Petter Selasky if (addref && lle != NULL) 368*ec52ff6dSHans Petter Selasky ro->ro_lle = lle; 369*ec52ff6dSHans Petter Selasky if (error != 0) 370*ec52ff6dSHans Petter Selasky return (error == EWOULDBLOCK ? 0 : error); 3719d40cf60SHans Petter Selasky } 3729d40cf60SHans Petter Selasky 373*ec52ff6dSHans Petter Selasky if ((pflags & RT_L2_ME) != 0) { 374*ec52ff6dSHans Petter Selasky update_mbuf_csumflags(m, m); 375*ec52ff6dSHans Petter Selasky return (if_simloop(ifp, m, dst->sa_family, 0)); 3769d40cf60SHans Petter Selasky } 3779d40cf60SHans Petter Selasky 3789d40cf60SHans Petter Selasky /* 379*ec52ff6dSHans Petter Selasky * Add local infiniband header. If no space in first mbuf, 3809d40cf60SHans Petter Selasky * allocate another. 3819d40cf60SHans Petter Selasky */ 3829d40cf60SHans Petter Selasky M_PREPEND(m, INFINIBAND_HDR_LEN, M_NOWAIT); 3839d40cf60SHans Petter Selasky if (m == NULL) { 3849d40cf60SHans Petter Selasky error = ENOBUFS; 3859d40cf60SHans Petter Selasky goto bad; 3869d40cf60SHans Petter Selasky } 387*ec52ff6dSHans Petter Selasky if ((pflags & RT_HAS_HEADER) == 0) { 388*ec52ff6dSHans Petter Selasky ih = mtod(m, struct infiniband_header *); 389*ec52ff6dSHans Petter Selasky memcpy(ih, phdr, hlen); 390*ec52ff6dSHans Petter Selasky } 3919d40cf60SHans Petter Selasky 3929d40cf60SHans Petter Selasky /* 3939d40cf60SHans Petter Selasky * Queue message on interface, update output statistics if 3949d40cf60SHans Petter Selasky * successful, and start output if interface not yet active. 3959d40cf60SHans Petter Selasky */ 3969d40cf60SHans Petter Selasky return (ifp->if_transmit(ifp, m)); 3979d40cf60SHans Petter Selasky bad: 3989d40cf60SHans Petter Selasky if (m != NULL) 3999d40cf60SHans Petter Selasky m_freem(m); 4009d40cf60SHans Petter Selasky return (error); 4019d40cf60SHans Petter Selasky } 4029d40cf60SHans Petter Selasky 4039d40cf60SHans Petter Selasky /* 4049d40cf60SHans Petter Selasky * Process a received Infiniband packet. 4059d40cf60SHans Petter Selasky */ 4069d40cf60SHans Petter Selasky static void 4079d40cf60SHans Petter Selasky infiniband_input(struct ifnet *ifp, struct mbuf *m) 4089d40cf60SHans Petter Selasky { 4099d40cf60SHans Petter Selasky struct infiniband_header *ibh; 4109d40cf60SHans Petter Selasky struct epoch_tracker et; 4119d40cf60SHans Petter Selasky int isr; 4129d40cf60SHans Petter Selasky 4139d40cf60SHans Petter Selasky CURVNET_SET_QUIET(ifp->if_vnet); 4149d40cf60SHans Petter Selasky 4159d40cf60SHans Petter Selasky if ((ifp->if_flags & IFF_UP) == 0) { 4169d40cf60SHans Petter Selasky if_inc_counter(ifp, IFCOUNTER_IERRORS, 1); 4179d40cf60SHans Petter Selasky m_freem(m); 4189d40cf60SHans Petter Selasky goto done; 4199d40cf60SHans Petter Selasky } 4209d40cf60SHans Petter Selasky 4219d40cf60SHans Petter Selasky ibh = mtod(m, struct infiniband_header *); 4229d40cf60SHans Petter Selasky 4239d40cf60SHans Petter Selasky /* 4249d40cf60SHans Petter Selasky * Reset layer specific mbuf flags to avoid confusing upper 4259d40cf60SHans Petter Selasky * layers: 4269d40cf60SHans Petter Selasky */ 4279d40cf60SHans Petter Selasky m->m_flags &= ~M_VLANTAG; 4289d40cf60SHans Petter Selasky m_clrprotoflags(m); 4299d40cf60SHans Petter Selasky 4309d40cf60SHans Petter Selasky if (INFINIBAND_IS_MULTICAST(ibh->ib_hwaddr)) { 4319d40cf60SHans Petter Selasky if (memcmp(ibh->ib_hwaddr, ifp->if_broadcastaddr, 4329d40cf60SHans Petter Selasky ifp->if_addrlen) == 0) 4339d40cf60SHans Petter Selasky m->m_flags |= M_BCAST; 4349d40cf60SHans Petter Selasky else 4359d40cf60SHans Petter Selasky m->m_flags |= M_MCAST; 4369d40cf60SHans Petter Selasky if_inc_counter(ifp, IFCOUNTER_IMCASTS, 1); 4379d40cf60SHans Petter Selasky } 4389d40cf60SHans Petter Selasky 4399d40cf60SHans Petter Selasky /* Let BPF have it before we strip the header. */ 4409d40cf60SHans Petter Selasky INFINIBAND_BPF_MTAP(ifp, m); 4419d40cf60SHans Petter Selasky 4429d40cf60SHans Petter Selasky /* Allow monitor mode to claim this frame, after stats are updated. */ 4439d40cf60SHans Petter Selasky if (ifp->if_flags & IFF_MONITOR) { 4449d40cf60SHans Petter Selasky m_freem(m); 4459d40cf60SHans Petter Selasky goto done; 4469d40cf60SHans Petter Selasky } 4479d40cf60SHans Petter Selasky 4489d40cf60SHans Petter Selasky /* Direct packet to correct FIB based on interface config. */ 4499d40cf60SHans Petter Selasky M_SETFIB(m, ifp->if_fib); 4509d40cf60SHans Petter Selasky 451a92c4bb6SHans Petter Selasky /* Handle input from a lagg<N> port */ 452a92c4bb6SHans Petter Selasky if (ifp->if_type == IFT_INFINIBANDLAG) { 453a92c4bb6SHans Petter Selasky KASSERT(lagg_input_infiniband_p != NULL, 454a92c4bb6SHans Petter Selasky ("%s: if_lagg not loaded!", __func__)); 455a92c4bb6SHans Petter Selasky m = (*lagg_input_infiniband_p)(ifp, m); 456a92c4bb6SHans Petter Selasky if (__predict_false(m == NULL)) 457a92c4bb6SHans Petter Selasky goto done; 458a92c4bb6SHans Petter Selasky ifp = m->m_pkthdr.rcvif; 459a92c4bb6SHans Petter Selasky } 460a92c4bb6SHans Petter Selasky 4619d40cf60SHans Petter Selasky /* 4629d40cf60SHans Petter Selasky * Dispatch frame to upper layer. 4639d40cf60SHans Petter Selasky */ 4649d40cf60SHans Petter Selasky switch (ibh->ib_protocol) { 4659d40cf60SHans Petter Selasky #ifdef INET 4669d40cf60SHans Petter Selasky case htons(ETHERTYPE_IP): 4679d40cf60SHans Petter Selasky isr = NETISR_IP; 4689d40cf60SHans Petter Selasky break; 4699d40cf60SHans Petter Selasky 4709d40cf60SHans Petter Selasky case htons(ETHERTYPE_ARP): 4719d40cf60SHans Petter Selasky if (ifp->if_flags & IFF_NOARP) { 4729d40cf60SHans Petter Selasky /* Discard packet if ARP is disabled on interface */ 4739d40cf60SHans Petter Selasky m_freem(m); 4749d40cf60SHans Petter Selasky goto done; 4759d40cf60SHans Petter Selasky } 4769d40cf60SHans Petter Selasky isr = NETISR_ARP; 4779d40cf60SHans Petter Selasky break; 4789d40cf60SHans Petter Selasky #endif 4799d40cf60SHans Petter Selasky #ifdef INET6 4809d40cf60SHans Petter Selasky case htons(ETHERTYPE_IPV6): 4819d40cf60SHans Petter Selasky isr = NETISR_IPV6; 4829d40cf60SHans Petter Selasky break; 4839d40cf60SHans Petter Selasky #endif 4849d40cf60SHans Petter Selasky default: 4859d40cf60SHans Petter Selasky if_inc_counter(ifp, IFCOUNTER_IERRORS, 1); 4869d40cf60SHans Petter Selasky m_freem(m); 4879d40cf60SHans Petter Selasky goto done; 4889d40cf60SHans Petter Selasky } 4899d40cf60SHans Petter Selasky 4909d40cf60SHans Petter Selasky /* Strip off the Infiniband header. */ 4919d40cf60SHans Petter Selasky m_adj(m, INFINIBAND_HDR_LEN); 4929d40cf60SHans Petter Selasky 4939d40cf60SHans Petter Selasky #ifdef MAC 4949d40cf60SHans Petter Selasky /* 4959d40cf60SHans Petter Selasky * Tag the mbuf with an appropriate MAC label before any other 4969d40cf60SHans Petter Selasky * consumers can get to it. 4979d40cf60SHans Petter Selasky */ 4989d40cf60SHans Petter Selasky mac_ifnet_create_mbuf(ifp, m); 4999d40cf60SHans Petter Selasky #endif 5009d40cf60SHans Petter Selasky /* Allow monitor mode to claim this frame, after stats are updated. */ 5019d40cf60SHans Petter Selasky NET_EPOCH_ENTER(et); 5029d40cf60SHans Petter Selasky netisr_dispatch(isr, m); 5039d40cf60SHans Petter Selasky NET_EPOCH_EXIT(et); 5049d40cf60SHans Petter Selasky done: 5059d40cf60SHans Petter Selasky CURVNET_RESTORE(); 5069d40cf60SHans Petter Selasky } 5079d40cf60SHans Petter Selasky 5089d40cf60SHans Petter Selasky static int 5091355e2dcSHans Petter Selasky infiniband_resolvemulti(struct ifnet *ifp, struct sockaddr **llsa, 5101355e2dcSHans Petter Selasky struct sockaddr *sa) 5119d40cf60SHans Petter Selasky { 5129d40cf60SHans Petter Selasky struct sockaddr_dl *sdl; 5139d40cf60SHans Petter Selasky #ifdef INET 5149d40cf60SHans Petter Selasky struct sockaddr_in *sin; 5159d40cf60SHans Petter Selasky #endif 5169d40cf60SHans Petter Selasky #ifdef INET6 5179d40cf60SHans Petter Selasky struct sockaddr_in6 *sin6; 5189d40cf60SHans Petter Selasky #endif 5199d40cf60SHans Petter Selasky uint8_t *e_addr; 5209d40cf60SHans Petter Selasky 5219d40cf60SHans Petter Selasky switch (sa->sa_family) { 5229d40cf60SHans Petter Selasky case AF_LINK: 5239d40cf60SHans Petter Selasky /* 5249d40cf60SHans Petter Selasky * No mapping needed. Just check that it's a valid MC address. 5259d40cf60SHans Petter Selasky */ 5269d40cf60SHans Petter Selasky sdl = (struct sockaddr_dl *)sa; 5279d40cf60SHans Petter Selasky e_addr = LLADDR(sdl); 5289d40cf60SHans Petter Selasky if (!INFINIBAND_IS_MULTICAST(e_addr)) 5299d40cf60SHans Petter Selasky return (EADDRNOTAVAIL); 5309d40cf60SHans Petter Selasky *llsa = NULL; 5319d40cf60SHans Petter Selasky return 0; 5329d40cf60SHans Petter Selasky 5339d40cf60SHans Petter Selasky #ifdef INET 5349d40cf60SHans Petter Selasky case AF_INET: 5359d40cf60SHans Petter Selasky sin = (struct sockaddr_in *)sa; 5369d40cf60SHans Petter Selasky if (!IN_MULTICAST(ntohl(sin->sin_addr.s_addr))) 5379d40cf60SHans Petter Selasky return (EADDRNOTAVAIL); 5389d40cf60SHans Petter Selasky sdl = link_init_sdl(ifp, *llsa, IFT_INFINIBAND); 5399d40cf60SHans Petter Selasky sdl->sdl_alen = INFINIBAND_ADDR_LEN; 5409d40cf60SHans Petter Selasky e_addr = LLADDR(sdl); 54101630a49SHans Petter Selasky infiniband_ipv4_multicast_map( 54201630a49SHans Petter Selasky sin->sin_addr.s_addr, ifp->if_broadcastaddr, e_addr); 5439d40cf60SHans Petter Selasky *llsa = (struct sockaddr *)sdl; 5449d40cf60SHans Petter Selasky return (0); 5459d40cf60SHans Petter Selasky #endif 5469d40cf60SHans Petter Selasky #ifdef INET6 5479d40cf60SHans Petter Selasky case AF_INET6: 5489d40cf60SHans Petter Selasky sin6 = (struct sockaddr_in6 *)sa; 5499d40cf60SHans Petter Selasky /* 5509d40cf60SHans Petter Selasky * An IP6 address of 0 means listen to all of the 5519d40cf60SHans Petter Selasky * multicast address used for IP6. This has no meaning 5529d40cf60SHans Petter Selasky * in infiniband. 5539d40cf60SHans Petter Selasky */ 5549d40cf60SHans Petter Selasky if (IN6_IS_ADDR_UNSPECIFIED(&sin6->sin6_addr)) 5559d40cf60SHans Petter Selasky return (EADDRNOTAVAIL); 5569d40cf60SHans Petter Selasky if (!IN6_IS_ADDR_MULTICAST(&sin6->sin6_addr)) 5579d40cf60SHans Petter Selasky return (EADDRNOTAVAIL); 5589d40cf60SHans Petter Selasky sdl = link_init_sdl(ifp, *llsa, IFT_INFINIBAND); 5599d40cf60SHans Petter Selasky sdl->sdl_alen = INFINIBAND_ADDR_LEN; 5609d40cf60SHans Petter Selasky e_addr = LLADDR(sdl); 56101630a49SHans Petter Selasky infiniband_ipv6_multicast_map( 56201630a49SHans Petter Selasky &sin6->sin6_addr, ifp->if_broadcastaddr, e_addr); 5639d40cf60SHans Petter Selasky *llsa = (struct sockaddr *)sdl; 5649d40cf60SHans Petter Selasky return (0); 5659d40cf60SHans Petter Selasky #endif 5669d40cf60SHans Petter Selasky default: 5679d40cf60SHans Petter Selasky return (EAFNOSUPPORT); 5689d40cf60SHans Petter Selasky } 5699d40cf60SHans Petter Selasky } 5709d40cf60SHans Petter Selasky 5719d40cf60SHans Petter Selasky void 5729d40cf60SHans Petter Selasky infiniband_ifattach(struct ifnet *ifp, const uint8_t *lla, const uint8_t *llb) 5739d40cf60SHans Petter Selasky { 5749d40cf60SHans Petter Selasky struct sockaddr_dl *sdl; 5759d40cf60SHans Petter Selasky struct ifaddr *ifa; 5769d40cf60SHans Petter Selasky int i; 5779d40cf60SHans Petter Selasky 5789d40cf60SHans Petter Selasky ifp->if_addrlen = INFINIBAND_ADDR_LEN; 5799d40cf60SHans Petter Selasky ifp->if_hdrlen = INFINIBAND_HDR_LEN; 5809d40cf60SHans Petter Selasky ifp->if_mtu = INFINIBAND_MTU; 5819d40cf60SHans Petter Selasky if_attach(ifp); 5829d40cf60SHans Petter Selasky ifp->if_output = infiniband_output; 5839d40cf60SHans Petter Selasky ifp->if_input = infiniband_input; 5849d40cf60SHans Petter Selasky ifp->if_resolvemulti = infiniband_resolvemulti; 585*ec52ff6dSHans Petter Selasky ifp->if_requestencap = infiniband_requestencap; 5869d40cf60SHans Petter Selasky 5879d40cf60SHans Petter Selasky if (ifp->if_baudrate == 0) 5889d40cf60SHans Petter Selasky ifp->if_baudrate = IF_Gbps(10); /* default value */ 5899d40cf60SHans Petter Selasky if (llb != NULL) 5909d40cf60SHans Petter Selasky ifp->if_broadcastaddr = llb; 5919d40cf60SHans Petter Selasky 5929d40cf60SHans Petter Selasky ifa = ifp->if_addr; 5939d40cf60SHans Petter Selasky KASSERT(ifa != NULL, ("%s: no lladdr!\n", __func__)); 5949d40cf60SHans Petter Selasky sdl = (struct sockaddr_dl *)ifa->ifa_addr; 5959d40cf60SHans Petter Selasky sdl->sdl_type = IFT_INFINIBAND; 5969d40cf60SHans Petter Selasky sdl->sdl_alen = ifp->if_addrlen; 5979d40cf60SHans Petter Selasky 5989d40cf60SHans Petter Selasky if (lla != NULL) { 5999d40cf60SHans Petter Selasky memcpy(LLADDR(sdl), lla, ifp->if_addrlen); 6009d40cf60SHans Petter Selasky 6019d40cf60SHans Petter Selasky if (ifp->if_hw_addr != NULL) 6029d40cf60SHans Petter Selasky memcpy(ifp->if_hw_addr, lla, ifp->if_addrlen); 6039d40cf60SHans Petter Selasky } else { 6049d40cf60SHans Petter Selasky lla = LLADDR(sdl); 6059d40cf60SHans Petter Selasky } 6069d40cf60SHans Petter Selasky 6079d40cf60SHans Petter Selasky /* Attach ethernet compatible network device */ 6089d40cf60SHans Petter Selasky bpfattach(ifp, DLT_EN10MB, ETHER_HDR_LEN); 6099d40cf60SHans Petter Selasky 6109d40cf60SHans Petter Selasky /* Announce Infiniband MAC address if non-zero. */ 6119d40cf60SHans Petter Selasky for (i = 0; i < ifp->if_addrlen; i++) 6129d40cf60SHans Petter Selasky if (lla[i] != 0) 6139d40cf60SHans Petter Selasky break; 6149d40cf60SHans Petter Selasky if (i != ifp->if_addrlen) 6159d40cf60SHans Petter Selasky if_printf(ifp, "Infiniband address: %20D\n", lla, ":"); 6169d40cf60SHans Petter Selasky 6179d40cf60SHans Petter Selasky /* Add necessary bits are setup; announce it now. */ 6189d40cf60SHans Petter Selasky EVENTHANDLER_INVOKE(infiniband_ifattach_event, ifp); 6199d40cf60SHans Petter Selasky 6209d40cf60SHans Petter Selasky if (IS_DEFAULT_VNET(curvnet)) 6219d40cf60SHans Petter Selasky devctl_notify("INFINIBAND", ifp->if_xname, "IFATTACH", NULL); 6229d40cf60SHans Petter Selasky } 6239d40cf60SHans Petter Selasky 6249d40cf60SHans Petter Selasky /* 6259d40cf60SHans Petter Selasky * Perform common duties while detaching an Infiniband interface 6269d40cf60SHans Petter Selasky */ 6279d40cf60SHans Petter Selasky void 6289d40cf60SHans Petter Selasky infiniband_ifdetach(struct ifnet *ifp) 6299d40cf60SHans Petter Selasky { 6309d40cf60SHans Petter Selasky bpfdetach(ifp); 6319d40cf60SHans Petter Selasky if_detach(ifp); 6329d40cf60SHans Petter Selasky } 6339d40cf60SHans Petter Selasky 6349d40cf60SHans Petter Selasky static int 6359d40cf60SHans Petter Selasky infiniband_modevent(module_t mod, int type, void *data) 6369d40cf60SHans Petter Selasky { 6379d40cf60SHans Petter Selasky switch (type) { 6389d40cf60SHans Petter Selasky case MOD_LOAD: 6399d40cf60SHans Petter Selasky case MOD_UNLOAD: 6409d40cf60SHans Petter Selasky return (0); 6419d40cf60SHans Petter Selasky default: 6429d40cf60SHans Petter Selasky return (EOPNOTSUPP); 6439d40cf60SHans Petter Selasky } 6449d40cf60SHans Petter Selasky } 6459d40cf60SHans Petter Selasky 6469d40cf60SHans Petter Selasky static moduledata_t infiniband_mod = { 6479d40cf60SHans Petter Selasky .name = "if_infiniband", 6489d40cf60SHans Petter Selasky .evhand = &infiniband_modevent, 6499d40cf60SHans Petter Selasky }; 6509d40cf60SHans Petter Selasky 6519d40cf60SHans Petter Selasky DECLARE_MODULE(if_infiniband, infiniband_mod, SI_SUB_INIT_IF, SI_ORDER_ANY); 6529d40cf60SHans Petter Selasky MODULE_VERSION(if_infiniband, 1); 653