1 /*- 2 * SPDX-License-Identifier: BSD-3-Clause 3 * 4 * Copyright (C) 1995, 1996, 1997, and 1998 WIDE Project. 5 * All rights reserved. 6 * 7 * Redistribution and use in source and binary forms, with or without 8 * modification, are permitted provided that the following conditions 9 * are met: 10 * 1. Redistributions of source code must retain the above copyright 11 * notice, this list of conditions and the following disclaimer. 12 * 2. Redistributions in binary form must reproduce the above copyright 13 * notice, this list of conditions and the following disclaimer in the 14 * documentation and/or other materials provided with the distribution. 15 * 3. Neither the name of the project nor the names of its contributors 16 * may be used to endorse or promote products derived from this software 17 * without specific prior written permission. 18 * 19 * THIS SOFTWARE IS PROVIDED BY THE PROJECT AND CONTRIBUTORS ``AS IS'' AND 20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 * ARE DISCLAIMED. IN NO EVENT SHALL THE PROJECT OR CONTRIBUTORS BE LIABLE 23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 * SUCH DAMAGE. 30 */ 31 32 /*- 33 * Copyright (c) 1982, 1986, 1988, 1993 34 * The Regents of the University of California. 35 * All rights reserved. 36 * 37 * Redistribution and use in source and binary forms, with or without 38 * modification, are permitted provided that the following conditions 39 * are met: 40 * 1. Redistributions of source code must retain the above copyright 41 * notice, this list of conditions and the following disclaimer. 42 * 2. Redistributions in binary form must reproduce the above copyright 43 * notice, this list of conditions and the following disclaimer in the 44 * documentation and/or other materials provided with the distribution. 45 * 3. Neither the name of the University nor the names of its contributors 46 * may be used to endorse or promote products derived from this software 47 * without specific prior written permission. 48 * 49 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 50 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 51 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 52 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 53 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 54 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 55 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 56 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 57 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 58 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 59 * SUCH DAMAGE. 60 * 61 * @(#)raw_ip.c 8.2 (Berkeley) 1/4/94 62 */ 63 64 #include <sys/cdefs.h> 65 __FBSDID("$FreeBSD$"); 66 67 #include "opt_ipsec.h" 68 #include "opt_inet6.h" 69 #include "opt_route.h" 70 71 #include <sys/param.h> 72 #include <sys/errno.h> 73 #include <sys/jail.h> 74 #include <sys/kernel.h> 75 #include <sys/lock.h> 76 #include <sys/malloc.h> 77 #include <sys/mbuf.h> 78 #include <sys/priv.h> 79 #include <sys/proc.h> 80 #include <sys/protosw.h> 81 #include <sys/signalvar.h> 82 #include <sys/socket.h> 83 #include <sys/socketvar.h> 84 #include <sys/sx.h> 85 #include <sys/syslog.h> 86 87 #include <net/if.h> 88 #include <net/if_var.h> 89 #include <net/if_types.h> 90 #include <net/route.h> 91 #include <net/vnet.h> 92 93 #include <netinet/in.h> 94 #include <netinet/in_var.h> 95 #include <netinet/in_systm.h> 96 #include <netinet/in_pcb.h> 97 98 #include <netinet/icmp6.h> 99 #include <netinet/ip6.h> 100 #include <netinet/ip_var.h> 101 #include <netinet6/ip6protosw.h> 102 #include <netinet6/ip6_mroute.h> 103 #include <netinet6/in6_pcb.h> 104 #include <netinet6/ip6_var.h> 105 #include <netinet6/nd6.h> 106 #include <netinet6/raw_ip6.h> 107 #include <netinet6/in6_fib.h> 108 #include <netinet6/scope6_var.h> 109 #include <netinet6/send.h> 110 111 #include <netipsec/ipsec_support.h> 112 113 #include <machine/stdarg.h> 114 115 #define satosin6(sa) ((struct sockaddr_in6 *)(sa)) 116 #define ifatoia6(ifa) ((struct in6_ifaddr *)(ifa)) 117 118 /* 119 * Raw interface to IP6 protocol. 120 */ 121 122 VNET_DECLARE(struct inpcbinfo, ripcbinfo); 123 #define V_ripcbinfo VNET(ripcbinfo) 124 125 extern u_long rip_sendspace; 126 extern u_long rip_recvspace; 127 128 VNET_PCPUSTAT_DEFINE(struct rip6stat, rip6stat); 129 VNET_PCPUSTAT_SYSINIT(rip6stat); 130 131 #ifdef VIMAGE 132 VNET_PCPUSTAT_SYSUNINIT(rip6stat); 133 #endif /* VIMAGE */ 134 135 /* 136 * Hooks for multicast routing. They all default to NULL, so leave them not 137 * initialized and rely on BSS being set to 0. 138 */ 139 140 /* 141 * The socket used to communicate with the multicast routing daemon. 142 */ 143 VNET_DEFINE(struct socket *, ip6_mrouter); 144 145 /* 146 * The various mrouter functions. 147 */ 148 int (*ip6_mrouter_set)(struct socket *, struct sockopt *); 149 int (*ip6_mrouter_get)(struct socket *, struct sockopt *); 150 int (*ip6_mrouter_done)(void); 151 int (*ip6_mforward)(struct ip6_hdr *, struct ifnet *, struct mbuf *); 152 int (*mrt6_ioctl)(u_long, caddr_t); 153 154 struct rip6_inp_match_ctx { 155 struct ip6_hdr *ip6; 156 int proto; 157 }; 158 159 static bool 160 rip6_inp_match(const struct inpcb *inp, void *v) 161 { 162 struct rip6_inp_match_ctx *c = v; 163 struct ip6_hdr *ip6 = c->ip6; 164 int proto = c->proto; 165 166 /* XXX inp locking */ 167 if ((inp->inp_vflag & INP_IPV6) == 0) 168 return (false); 169 if (inp->inp_ip_p && inp->inp_ip_p != proto) 170 return (false); 171 if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_laddr) && 172 !IN6_ARE_ADDR_EQUAL(&inp->in6p_laddr, &ip6->ip6_dst)) 173 return (false); 174 if (!IN6_IS_ADDR_UNSPECIFIED(&inp->in6p_faddr) && 175 !IN6_ARE_ADDR_EQUAL(&inp->in6p_faddr, &ip6->ip6_src)) 176 return (false); 177 178 return (true); 179 } 180 181 /* 182 * Setup generic address and protocol structures for raw_input routine, then 183 * pass them along with mbuf chain. 184 */ 185 int 186 rip6_input(struct mbuf **mp, int *offp, int proto) 187 { 188 struct ifnet *ifp; 189 struct mbuf *n, *m = *mp; 190 struct ip6_hdr *ip6 = mtod(m, struct ip6_hdr *); 191 struct inpcb *inp; 192 struct mbuf *opts = NULL; 193 struct sockaddr_in6 fromsa; 194 struct rip6_inp_match_ctx ctx = { .ip6 = ip6, .proto = proto }; 195 struct inpcb_iterator inpi = INP_ITERATOR(&V_ripcbinfo, 196 INPLOOKUP_RLOCKPCB, rip6_inp_match, &ctx); 197 int delivered = 0; 198 199 NET_EPOCH_ASSERT(); 200 201 RIP6STAT_INC(rip6s_ipackets); 202 203 init_sin6(&fromsa, m, 0); /* general init */ 204 205 ifp = m->m_pkthdr.rcvif; 206 207 while ((inp = inp_next(&inpi)) != NULL) { 208 INP_RLOCK_ASSERT(inp); 209 #if defined(IPSEC) || defined(IPSEC_SUPPORT) 210 /* 211 * Check AH/ESP integrity. 212 */ 213 if (IPSEC_ENABLED(ipv6) && 214 IPSEC_CHECK_POLICY(ipv6, m, inp) != 0) { 215 /* Do not inject data into pcb. */ 216 continue; 217 } 218 #endif /* IPSEC */ 219 if (jailed_without_vnet(inp->inp_cred) && 220 !IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst) && 221 prison_check_ip6(inp->inp_cred, &ip6->ip6_dst) != 0) 222 /* 223 * Allow raw socket in jail to receive multicast; 224 * assume process had PRIV_NETINET_RAW at attach, 225 * and fall through into normal filter path if so. 226 */ 227 continue; 228 if (inp->in6p_cksum != -1) { 229 RIP6STAT_INC(rip6s_isum); 230 if (m->m_pkthdr.len - (*offp + inp->in6p_cksum) < 2 || 231 in6_cksum(m, proto, *offp, 232 m->m_pkthdr.len - *offp)) { 233 RIP6STAT_INC(rip6s_badsum); 234 /* 235 * Drop the received message, don't send an 236 * ICMP6 message. Set proto to IPPROTO_NONE 237 * to achieve that. 238 */ 239 INP_RUNLOCK(inp); 240 proto = IPPROTO_NONE; 241 break; 242 } 243 } 244 /* 245 * If this raw socket has multicast state, and we 246 * have received a multicast, check if this socket 247 * should receive it, as multicast filtering is now 248 * the responsibility of the transport layer. 249 */ 250 if (inp->in6p_moptions && 251 IN6_IS_ADDR_MULTICAST(&ip6->ip6_dst)) { 252 /* 253 * If the incoming datagram is for MLD, allow it 254 * through unconditionally to the raw socket. 255 * 256 * Use the M_RTALERT_MLD flag to check for MLD 257 * traffic without having to inspect the mbuf chain 258 * more deeply, as all MLDv1/v2 host messages MUST 259 * contain the Router Alert option. 260 * 261 * In the case of MLDv1, we may not have explicitly 262 * joined the group, and may have set IFF_ALLMULTI 263 * on the interface. im6o_mc_filter() may discard 264 * control traffic we actually need to see. 265 * 266 * Userland multicast routing daemons should continue 267 * filter the control traffic appropriately. 268 */ 269 int blocked; 270 271 blocked = MCAST_PASS; 272 if ((m->m_flags & M_RTALERT_MLD) == 0) { 273 struct sockaddr_in6 mcaddr; 274 275 bzero(&mcaddr, sizeof(struct sockaddr_in6)); 276 mcaddr.sin6_len = sizeof(struct sockaddr_in6); 277 mcaddr.sin6_family = AF_INET6; 278 mcaddr.sin6_addr = ip6->ip6_dst; 279 280 blocked = im6o_mc_filter(inp->in6p_moptions, 281 ifp, 282 (struct sockaddr *)&mcaddr, 283 (struct sockaddr *)&fromsa); 284 } 285 if (blocked != MCAST_PASS) { 286 IP6STAT_INC(ip6s_notmember); 287 continue; 288 } 289 } 290 if ((n = m_copym(m, 0, M_COPYALL, M_NOWAIT)) == NULL) 291 continue; 292 if (inp->inp_flags & INP_CONTROLOPTS || 293 inp->inp_socket->so_options & SO_TIMESTAMP) 294 ip6_savecontrol(inp, n, &opts); 295 /* strip intermediate headers */ 296 m_adj(n, *offp); 297 if (sbappendaddr(&inp->inp_socket->so_rcv, 298 (struct sockaddr *)&fromsa, n, opts) == 0) { 299 soroverflow(inp->inp_socket); 300 m_freem(n); 301 if (opts) 302 m_freem(opts); 303 RIP6STAT_INC(rip6s_fullsock); 304 } else { 305 sorwakeup(inp->inp_socket); 306 delivered++; 307 } 308 opts = NULL; 309 } 310 if (delivered == 0) { 311 RIP6STAT_INC(rip6s_nosock); 312 if (m->m_flags & M_MCAST) 313 RIP6STAT_INC(rip6s_nosockmcast); 314 if (proto == IPPROTO_NONE) 315 m_freem(m); 316 else 317 icmp6_error(m, ICMP6_PARAM_PROB, 318 ICMP6_PARAMPROB_NEXTHEADER, 319 ip6_get_prevhdr(m, *offp)); 320 IP6STAT_DEC(ip6s_delivered); 321 } else 322 m_freem(m); 323 return (IPPROTO_DONE); 324 } 325 326 void 327 rip6_ctlinput(int cmd, struct sockaddr *sa, void *d) 328 { 329 struct ip6ctlparam *ip6cp = NULL; 330 const struct sockaddr_in6 *sa6_src = NULL; 331 void *cmdarg; 332 struct inpcb *(*notify)(struct inpcb *, int) = in6_rtchange; 333 334 if (sa->sa_family != AF_INET6 || 335 sa->sa_len != sizeof(struct sockaddr_in6)) 336 return; 337 338 if ((unsigned)cmd >= PRC_NCMDS) 339 return; 340 if (PRC_IS_REDIRECT(cmd)) 341 notify = in6_rtchange, d = NULL; 342 else if (cmd == PRC_HOSTDEAD) 343 d = NULL; 344 else if (inet6ctlerrmap[cmd] == 0) 345 return; 346 347 /* 348 * If the parameter is from icmp6, decode it. 349 */ 350 if (d != NULL) { 351 ip6cp = (struct ip6ctlparam *)d; 352 cmdarg = ip6cp->ip6c_cmdarg; 353 sa6_src = ip6cp->ip6c_src; 354 } else { 355 cmdarg = NULL; 356 sa6_src = &sa6_any; 357 } 358 359 (void) in6_pcbnotify(&V_ripcbinfo, sa, 0, 360 (const struct sockaddr *)sa6_src, 0, cmd, cmdarg, notify); 361 } 362 363 /* 364 * Generate IPv6 header and pass packet to ip6_output. Tack on options user 365 * may have setup with control call. 366 */ 367 int 368 rip6_output(struct mbuf *m, struct socket *so, ...) 369 { 370 struct epoch_tracker et; 371 struct mbuf *control; 372 struct m_tag *mtag; 373 struct sockaddr_in6 *dstsock; 374 struct ip6_hdr *ip6; 375 struct inpcb *inp; 376 u_int plen = m->m_pkthdr.len; 377 int error = 0; 378 struct ip6_pktopts opt, *optp; 379 struct ifnet *oifp = NULL; 380 int type = 0, code = 0; /* for ICMPv6 output statistics only */ 381 int scope_ambiguous = 0; 382 int use_defzone = 0; 383 int hlim = 0; 384 struct in6_addr in6a; 385 va_list ap; 386 387 va_start(ap, so); 388 dstsock = va_arg(ap, struct sockaddr_in6 *); 389 control = va_arg(ap, struct mbuf *); 390 va_end(ap); 391 392 inp = sotoinpcb(so); 393 INP_WLOCK(inp); 394 395 if (control != NULL) { 396 NET_EPOCH_ENTER(et); 397 error = ip6_setpktopts(control, &opt, 398 inp->in6p_outputopts, so->so_cred, 399 so->so_proto->pr_protocol); 400 NET_EPOCH_EXIT(et); 401 402 if (error != 0) { 403 goto bad; 404 } 405 optp = &opt; 406 } else 407 optp = inp->in6p_outputopts; 408 409 /* 410 * Check and convert scope zone ID into internal form. 411 * 412 * XXX: we may still need to determine the zone later. 413 */ 414 if (!(so->so_state & SS_ISCONNECTED)) { 415 if (!optp || !optp->ip6po_pktinfo || 416 !optp->ip6po_pktinfo->ipi6_ifindex) 417 use_defzone = V_ip6_use_defzone; 418 if (dstsock->sin6_scope_id == 0 && !use_defzone) 419 scope_ambiguous = 1; 420 if ((error = sa6_embedscope(dstsock, use_defzone)) != 0) 421 goto bad; 422 } 423 424 /* 425 * For an ICMPv6 packet, we should know its type and code to update 426 * statistics. 427 */ 428 if (so->so_proto->pr_protocol == IPPROTO_ICMPV6) { 429 struct icmp6_hdr *icmp6; 430 if (m->m_len < sizeof(struct icmp6_hdr) && 431 (m = m_pullup(m, sizeof(struct icmp6_hdr))) == NULL) { 432 error = ENOBUFS; 433 goto bad; 434 } 435 icmp6 = mtod(m, struct icmp6_hdr *); 436 type = icmp6->icmp6_type; 437 code = icmp6->icmp6_code; 438 } 439 440 M_PREPEND(m, sizeof(*ip6), M_NOWAIT); 441 if (m == NULL) { 442 error = ENOBUFS; 443 goto bad; 444 } 445 ip6 = mtod(m, struct ip6_hdr *); 446 447 #ifdef ROUTE_MPATH 448 if (CALC_FLOWID_OUTBOUND) { 449 uint32_t hash_type, hash_val; 450 451 hash_val = fib6_calc_software_hash(&inp->in6p_laddr, 452 &dstsock->sin6_addr, 0, 0, so->so_proto->pr_protocol, 453 &hash_type); 454 inp->inp_flowid = hash_val; 455 inp->inp_flowtype = hash_type; 456 } 457 #endif 458 /* 459 * Source address selection. 460 */ 461 NET_EPOCH_ENTER(et); 462 error = in6_selectsrc_socket(dstsock, optp, inp, so->so_cred, 463 scope_ambiguous, &in6a, &hlim); 464 NET_EPOCH_EXIT(et); 465 466 if (error) 467 goto bad; 468 error = prison_check_ip6(inp->inp_cred, &in6a); 469 if (error != 0) 470 goto bad; 471 ip6->ip6_src = in6a; 472 473 ip6->ip6_dst = dstsock->sin6_addr; 474 475 /* 476 * Fill in the rest of the IPv6 header fields. 477 */ 478 ip6->ip6_flow = (ip6->ip6_flow & ~IPV6_FLOWINFO_MASK) | 479 (inp->inp_flow & IPV6_FLOWINFO_MASK); 480 ip6->ip6_vfc = (ip6->ip6_vfc & ~IPV6_VERSION_MASK) | 481 (IPV6_VERSION & IPV6_VERSION_MASK); 482 483 /* 484 * ip6_plen will be filled in ip6_output, so not fill it here. 485 */ 486 ip6->ip6_nxt = inp->inp_ip_p; 487 ip6->ip6_hlim = hlim; 488 489 if (so->so_proto->pr_protocol == IPPROTO_ICMPV6 || 490 inp->in6p_cksum != -1) { 491 struct mbuf *n; 492 int off; 493 u_int16_t *p; 494 495 /* Compute checksum. */ 496 if (so->so_proto->pr_protocol == IPPROTO_ICMPV6) 497 off = offsetof(struct icmp6_hdr, icmp6_cksum); 498 else 499 off = inp->in6p_cksum; 500 if (plen < off + 2) { 501 error = EINVAL; 502 goto bad; 503 } 504 off += sizeof(struct ip6_hdr); 505 506 n = m; 507 while (n && n->m_len <= off) { 508 off -= n->m_len; 509 n = n->m_next; 510 } 511 if (!n) 512 goto bad; 513 p = (u_int16_t *)(mtod(n, caddr_t) + off); 514 *p = 0; 515 *p = in6_cksum(m, ip6->ip6_nxt, sizeof(*ip6), plen); 516 } 517 518 /* 519 * Send RA/RS messages to user land for protection, before sending 520 * them to rtadvd/rtsol. 521 */ 522 if ((send_sendso_input_hook != NULL) && 523 so->so_proto->pr_protocol == IPPROTO_ICMPV6) { 524 switch (type) { 525 case ND_ROUTER_ADVERT: 526 case ND_ROUTER_SOLICIT: 527 mtag = m_tag_get(PACKET_TAG_ND_OUTGOING, 528 sizeof(unsigned short), M_NOWAIT); 529 if (mtag == NULL) 530 goto bad; 531 m_tag_prepend(m, mtag); 532 } 533 } 534 535 NET_EPOCH_ENTER(et); 536 error = ip6_output(m, optp, NULL, 0, inp->in6p_moptions, &oifp, inp); 537 NET_EPOCH_EXIT(et); 538 if (so->so_proto->pr_protocol == IPPROTO_ICMPV6) { 539 if (oifp) 540 icmp6_ifoutstat_inc(oifp, type, code); 541 ICMP6STAT_INC(icp6s_outhist[type]); 542 } else 543 RIP6STAT_INC(rip6s_opackets); 544 545 goto freectl; 546 547 bad: 548 if (m) 549 m_freem(m); 550 551 freectl: 552 if (control != NULL) { 553 ip6_clearpktopts(&opt, -1); 554 m_freem(control); 555 } 556 INP_WUNLOCK(inp); 557 return (error); 558 } 559 560 /* 561 * Raw IPv6 socket option processing. 562 */ 563 int 564 rip6_ctloutput(struct socket *so, struct sockopt *sopt) 565 { 566 struct inpcb *inp; 567 int error; 568 569 if (sopt->sopt_level == IPPROTO_ICMPV6) 570 /* 571 * XXX: is it better to call icmp6_ctloutput() directly 572 * from protosw? 573 */ 574 return (icmp6_ctloutput(so, sopt)); 575 else if (sopt->sopt_level != IPPROTO_IPV6) { 576 if (sopt->sopt_level == SOL_SOCKET && 577 sopt->sopt_name == SO_SETFIB) { 578 inp = sotoinpcb(so); 579 INP_WLOCK(inp); 580 inp->inp_inc.inc_fibnum = so->so_fibnum; 581 INP_WUNLOCK(inp); 582 return (0); 583 } 584 return (EINVAL); 585 } 586 587 error = 0; 588 589 switch (sopt->sopt_dir) { 590 case SOPT_GET: 591 switch (sopt->sopt_name) { 592 case MRT6_INIT: 593 case MRT6_DONE: 594 case MRT6_ADD_MIF: 595 case MRT6_DEL_MIF: 596 case MRT6_ADD_MFC: 597 case MRT6_DEL_MFC: 598 case MRT6_PIM: 599 error = ip6_mrouter_get ? ip6_mrouter_get(so, sopt) : 600 EOPNOTSUPP; 601 break; 602 case IPV6_CHECKSUM: 603 error = ip6_raw_ctloutput(so, sopt); 604 break; 605 default: 606 error = ip6_ctloutput(so, sopt); 607 break; 608 } 609 break; 610 611 case SOPT_SET: 612 switch (sopt->sopt_name) { 613 case MRT6_INIT: 614 case MRT6_DONE: 615 case MRT6_ADD_MIF: 616 case MRT6_DEL_MIF: 617 case MRT6_ADD_MFC: 618 case MRT6_DEL_MFC: 619 case MRT6_PIM: 620 error = ip6_mrouter_set ? ip6_mrouter_set(so, sopt) : 621 EOPNOTSUPP; 622 break; 623 case IPV6_CHECKSUM: 624 error = ip6_raw_ctloutput(so, sopt); 625 break; 626 default: 627 error = ip6_ctloutput(so, sopt); 628 break; 629 } 630 break; 631 } 632 633 return (error); 634 } 635 636 static int 637 rip6_attach(struct socket *so, int proto, struct thread *td) 638 { 639 struct inpcb *inp; 640 struct icmp6_filter *filter; 641 int error; 642 643 inp = sotoinpcb(so); 644 KASSERT(inp == NULL, ("rip6_attach: inp != NULL")); 645 646 error = priv_check(td, PRIV_NETINET_RAW); 647 if (error) 648 return (error); 649 error = soreserve(so, rip_sendspace, rip_recvspace); 650 if (error) 651 return (error); 652 filter = malloc(sizeof(struct icmp6_filter), M_PCB, M_NOWAIT); 653 if (filter == NULL) 654 return (ENOMEM); 655 error = in_pcballoc(so, &V_ripcbinfo); 656 if (error) { 657 free(filter, M_PCB); 658 return (error); 659 } 660 inp = (struct inpcb *)so->so_pcb; 661 inp->inp_vflag |= INP_IPV6; 662 inp->inp_ip_p = (long)proto; 663 inp->in6p_hops = -1; /* use kernel default */ 664 inp->in6p_cksum = -1; 665 inp->in6p_icmp6filt = filter; 666 ICMP6_FILTER_SETPASSALL(inp->in6p_icmp6filt); 667 INP_WUNLOCK(inp); 668 return (0); 669 } 670 671 static void 672 rip6_detach(struct socket *so) 673 { 674 struct inpcb *inp; 675 676 inp = sotoinpcb(so); 677 KASSERT(inp != NULL, ("rip6_detach: inp == NULL")); 678 679 if (so == V_ip6_mrouter && ip6_mrouter_done) 680 ip6_mrouter_done(); 681 /* xxx: RSVP */ 682 INP_WLOCK(inp); 683 free(inp->in6p_icmp6filt, M_PCB); 684 in_pcbdetach(inp); 685 in_pcbfree(inp); 686 } 687 688 /* XXXRW: This can't ever be called. */ 689 static void 690 rip6_abort(struct socket *so) 691 { 692 struct inpcb *inp; 693 694 inp = sotoinpcb(so); 695 KASSERT(inp != NULL, ("rip6_abort: inp == NULL")); 696 697 soisdisconnected(so); 698 } 699 700 static void 701 rip6_close(struct socket *so) 702 { 703 struct inpcb *inp; 704 705 inp = sotoinpcb(so); 706 KASSERT(inp != NULL, ("rip6_close: inp == NULL")); 707 708 soisdisconnected(so); 709 } 710 711 static int 712 rip6_disconnect(struct socket *so) 713 { 714 struct inpcb *inp; 715 716 inp = sotoinpcb(so); 717 KASSERT(inp != NULL, ("rip6_disconnect: inp == NULL")); 718 719 if ((so->so_state & SS_ISCONNECTED) == 0) 720 return (ENOTCONN); 721 inp->in6p_faddr = in6addr_any; 722 rip6_abort(so); 723 return (0); 724 } 725 726 static int 727 rip6_bind(struct socket *so, struct sockaddr *nam, struct thread *td) 728 { 729 struct epoch_tracker et; 730 struct inpcb *inp; 731 struct sockaddr_in6 *addr = (struct sockaddr_in6 *)nam; 732 struct ifaddr *ifa = NULL; 733 int error = 0; 734 735 inp = sotoinpcb(so); 736 KASSERT(inp != NULL, ("rip6_bind: inp == NULL")); 737 738 if (nam->sa_family != AF_INET6) 739 return (EAFNOSUPPORT); 740 if (nam->sa_len != sizeof(*addr)) 741 return (EINVAL); 742 if ((error = prison_check_ip6(td->td_ucred, &addr->sin6_addr)) != 0) 743 return (error); 744 if (CK_STAILQ_EMPTY(&V_ifnet) || addr->sin6_family != AF_INET6) 745 return (EADDRNOTAVAIL); 746 if ((error = sa6_embedscope(addr, V_ip6_use_defzone)) != 0) 747 return (error); 748 749 NET_EPOCH_ENTER(et); 750 if (!IN6_IS_ADDR_UNSPECIFIED(&addr->sin6_addr) && 751 (ifa = ifa_ifwithaddr((struct sockaddr *)addr)) == NULL) { 752 NET_EPOCH_EXIT(et); 753 return (EADDRNOTAVAIL); 754 } 755 if (ifa != NULL && 756 ((struct in6_ifaddr *)ifa)->ia6_flags & 757 (IN6_IFF_ANYCAST|IN6_IFF_NOTREADY| 758 IN6_IFF_DETACHED|IN6_IFF_DEPRECATED)) { 759 NET_EPOCH_EXIT(et); 760 return (EADDRNOTAVAIL); 761 } 762 NET_EPOCH_EXIT(et); 763 INP_INFO_WLOCK(&V_ripcbinfo); 764 INP_WLOCK(inp); 765 inp->in6p_laddr = addr->sin6_addr; 766 INP_WUNLOCK(inp); 767 INP_INFO_WUNLOCK(&V_ripcbinfo); 768 return (0); 769 } 770 771 static int 772 rip6_connect(struct socket *so, struct sockaddr *nam, struct thread *td) 773 { 774 struct inpcb *inp; 775 struct sockaddr_in6 *addr = (struct sockaddr_in6 *)nam; 776 struct in6_addr in6a; 777 struct epoch_tracker et; 778 int error = 0, scope_ambiguous = 0; 779 780 inp = sotoinpcb(so); 781 KASSERT(inp != NULL, ("rip6_connect: inp == NULL")); 782 783 if (nam->sa_len != sizeof(*addr)) 784 return (EINVAL); 785 if (CK_STAILQ_EMPTY(&V_ifnet)) 786 return (EADDRNOTAVAIL); 787 if (addr->sin6_family != AF_INET6) 788 return (EAFNOSUPPORT); 789 790 /* 791 * Application should provide a proper zone ID or the use of default 792 * zone IDs should be enabled. Unfortunately, some applications do 793 * not behave as it should, so we need a workaround. Even if an 794 * appropriate ID is not determined, we'll see if we can determine 795 * the outgoing interface. If we can, determine the zone ID based on 796 * the interface below. 797 */ 798 if (addr->sin6_scope_id == 0 && !V_ip6_use_defzone) 799 scope_ambiguous = 1; 800 if ((error = sa6_embedscope(addr, V_ip6_use_defzone)) != 0) 801 return (error); 802 803 INP_WLOCK(inp); 804 INP_INFO_WLOCK(&V_ripcbinfo); 805 /* Source address selection. XXX: need pcblookup? */ 806 NET_EPOCH_ENTER(et); 807 error = in6_selectsrc_socket(addr, inp->in6p_outputopts, 808 inp, so->so_cred, scope_ambiguous, &in6a, NULL); 809 NET_EPOCH_EXIT(et); 810 if (error) { 811 INP_INFO_WUNLOCK(&V_ripcbinfo); 812 INP_WUNLOCK(inp); 813 return (error); 814 } 815 816 inp->in6p_faddr = addr->sin6_addr; 817 inp->in6p_laddr = in6a; 818 soisconnected(so); 819 INP_INFO_WUNLOCK(&V_ripcbinfo); 820 INP_WUNLOCK(inp); 821 return (0); 822 } 823 824 static int 825 rip6_shutdown(struct socket *so) 826 { 827 struct inpcb *inp; 828 829 inp = sotoinpcb(so); 830 KASSERT(inp != NULL, ("rip6_shutdown: inp == NULL")); 831 832 INP_WLOCK(inp); 833 socantsendmore(so); 834 INP_WUNLOCK(inp); 835 return (0); 836 } 837 838 static int 839 rip6_send(struct socket *so, int flags, struct mbuf *m, struct sockaddr *nam, 840 struct mbuf *control, struct thread *td) 841 { 842 struct inpcb *inp; 843 struct sockaddr_in6 tmp; 844 struct sockaddr_in6 *dst; 845 int error; 846 847 inp = sotoinpcb(so); 848 KASSERT(inp != NULL, ("rip6_send: inp == NULL")); 849 850 /* Always copy sockaddr to avoid overwrites. */ 851 /* Unlocked read. */ 852 if (so->so_state & SS_ISCONNECTED) { 853 if (nam) { 854 error = EISCONN; 855 goto release; 856 } 857 /* XXX */ 858 bzero(&tmp, sizeof(tmp)); 859 tmp.sin6_family = AF_INET6; 860 tmp.sin6_len = sizeof(struct sockaddr_in6); 861 INP_RLOCK(inp); 862 bcopy(&inp->in6p_faddr, &tmp.sin6_addr, 863 sizeof(struct in6_addr)); 864 INP_RUNLOCK(inp); 865 dst = &tmp; 866 } else { 867 error = 0; 868 if (nam == NULL) 869 error = ENOTCONN; 870 else if (nam->sa_family != AF_INET6) 871 error = EAFNOSUPPORT; 872 else if (nam->sa_len != sizeof(struct sockaddr_in6)) 873 error = EINVAL; 874 if (error != 0) 875 goto release; 876 tmp = *(struct sockaddr_in6 *)nam; 877 dst = &tmp; 878 879 if (dst->sin6_family == AF_UNSPEC) { 880 /* 881 * XXX: we allow this case for backward 882 * compatibility to buggy applications that 883 * rely on old (and wrong) kernel behavior. 884 */ 885 log(LOG_INFO, "rip6 SEND: address family is " 886 "unspec. Assume AF_INET6\n"); 887 dst->sin6_family = AF_INET6; 888 } else if (dst->sin6_family != AF_INET6) { 889 error = EAFNOSUPPORT; 890 goto release; 891 } 892 } 893 return (rip6_output(m, so, dst, control)); 894 895 release: 896 if (control != NULL) 897 m_freem(control); 898 m_freem(m); 899 return (error); 900 } 901 902 struct pr_usrreqs rip6_usrreqs = { 903 .pru_abort = rip6_abort, 904 .pru_attach = rip6_attach, 905 .pru_bind = rip6_bind, 906 .pru_connect = rip6_connect, 907 .pru_control = in6_control, 908 .pru_detach = rip6_detach, 909 .pru_disconnect = rip6_disconnect, 910 .pru_peeraddr = in6_getpeeraddr, 911 .pru_send = rip6_send, 912 .pru_shutdown = rip6_shutdown, 913 .pru_sockaddr = in6_getsockaddr, 914 .pru_close = rip6_close, 915 }; 916