1a6663252SAlexander V. Chernikov /*- 2a6663252SAlexander V. Chernikov * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 3a6663252SAlexander V. Chernikov * 4a6663252SAlexander V. Chernikov * Copyright (c) 2020 Alexander V. Chernikov 5a6663252SAlexander V. Chernikov * 6a6663252SAlexander V. Chernikov * Redistribution and use in source and binary forms, with or without 7a6663252SAlexander V. Chernikov * modification, are permitted provided that the following conditions 8a6663252SAlexander V. Chernikov * are met: 9a6663252SAlexander V. Chernikov * 1. Redistributions of source code must retain the above copyright 10a6663252SAlexander V. Chernikov * notice, this list of conditions and the following disclaimer. 11a6663252SAlexander V. Chernikov * 2. Redistributions in binary form must reproduce the above copyright 12a6663252SAlexander V. Chernikov * notice, this list of conditions and the following disclaimer in the 13a6663252SAlexander V. Chernikov * documentation and/or other materials provided with the distribution. 14a6663252SAlexander V. Chernikov * 15a6663252SAlexander V. Chernikov * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 16a6663252SAlexander V. Chernikov * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 17a6663252SAlexander V. Chernikov * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 18a6663252SAlexander V. Chernikov * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 19a6663252SAlexander V. Chernikov * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 20a6663252SAlexander V. Chernikov * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 21a6663252SAlexander V. Chernikov * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 22a6663252SAlexander V. Chernikov * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 23a6663252SAlexander V. Chernikov * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 24a6663252SAlexander V. Chernikov * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 25a6663252SAlexander V. Chernikov * SUCH DAMAGE. 26a6663252SAlexander V. Chernikov * 27a6663252SAlexander V. Chernikov * $FreeBSD$ 28a6663252SAlexander V. Chernikov */ 29a6663252SAlexander V. Chernikov 30a6663252SAlexander V. Chernikov /* 31a6663252SAlexander V. Chernikov * This header file contains public definitions for the nexthop routing subsystem. 32a6663252SAlexander V. Chernikov */ 33a6663252SAlexander V. Chernikov 34a6663252SAlexander V. Chernikov #ifndef _NET_ROUTE_NHOP_H_ 35a6663252SAlexander V. Chernikov #define _NET_ROUTE_NHOP_H_ 36a6663252SAlexander V. Chernikov 37a6663252SAlexander V. Chernikov #include <netinet/in.h> /* sockaddr_in && sockaddr_in6 */ 38a6663252SAlexander V. Chernikov 39a6663252SAlexander V. Chernikov #include <sys/counter.h> 40a6663252SAlexander V. Chernikov 41a6663252SAlexander V. Chernikov enum nhop_type { 42a6663252SAlexander V. Chernikov NH_TYPE_IPV4_ETHER_RSLV = 1, /* IPv4 ethernet without GW */ 43a6663252SAlexander V. Chernikov NH_TYPE_IPV4_ETHER_NHOP = 2, /* IPv4 with pre-calculated ethernet encap */ 44a6663252SAlexander V. Chernikov NH_TYPE_IPV6_ETHER_RSLV = 3, /* IPv6 ethernet, without GW */ 45a6663252SAlexander V. Chernikov NH_TYPE_IPV6_ETHER_NHOP = 4 /* IPv6 with pre-calculated ethernet encap*/ 46a6663252SAlexander V. Chernikov }; 47a6663252SAlexander V. Chernikov 48a6663252SAlexander V. Chernikov #ifdef _KERNEL 49a6663252SAlexander V. Chernikov 50a6663252SAlexander V. Chernikov /* 51a6663252SAlexander V. Chernikov * Define shorter version of AF_LINK sockaddr. 52a6663252SAlexander V. Chernikov * 53a6663252SAlexander V. Chernikov * Currently the only use case of AF_LINK gateway is storing 54a6663252SAlexander V. Chernikov * interface index of the interface of the source IPv6 address. 55a6663252SAlexander V. Chernikov * This is used by the IPv6 code for the connections over loopback 56a6663252SAlexander V. Chernikov * interface. 57a6663252SAlexander V. Chernikov * 58a6663252SAlexander V. Chernikov * The structure below copies 'struct sockaddr_dl', reducing the 59a6663252SAlexander V. Chernikov * size of sdl_data buffer, as it is not used. This change 60a6663252SAlexander V. Chernikov * allows to store the AF_LINK gateways in the nhop gateway itself, 61a6663252SAlexander V. Chernikov * simplifying control plane handling. 62a6663252SAlexander V. Chernikov */ 63a6663252SAlexander V. Chernikov struct sockaddr_dl_short { 64a6663252SAlexander V. Chernikov u_char sdl_len; /* Total length of sockaddr */ 65a6663252SAlexander V. Chernikov u_char sdl_family; /* AF_LINK */ 66a6663252SAlexander V. Chernikov u_short sdl_index; /* if != 0, system given index for interface */ 67a6663252SAlexander V. Chernikov u_char sdl_type; /* interface type */ 68a6663252SAlexander V. Chernikov u_char sdl_nlen; /* interface name length, no trailing 0 reqd. */ 69a6663252SAlexander V. Chernikov u_char sdl_alen; /* link level address length */ 70a6663252SAlexander V. Chernikov u_char sdl_slen; /* link layer selector length */ 71a6663252SAlexander V. Chernikov char sdl_data[8]; /* unused */ 72a6663252SAlexander V. Chernikov }; 73a6663252SAlexander V. Chernikov 74a6663252SAlexander V. Chernikov #define NHOP_RELATED_FLAGS \ 75a6663252SAlexander V. Chernikov (RTF_GATEWAY | RTF_HOST | RTF_REJECT | RTF_BLACKHOLE | \ 76a6663252SAlexander V. Chernikov RTF_FIXEDMTU | RTF_LOCAL | RTF_BROADCAST | RTF_MULTICAST) 77a6663252SAlexander V. Chernikov 78a6663252SAlexander V. Chernikov struct nh_control; 79a6663252SAlexander V. Chernikov struct nhop_priv; 80a6663252SAlexander V. Chernikov 81a6663252SAlexander V. Chernikov /* 82a6663252SAlexander V. Chernikov * Struct 'nhop_object' field description: 83a6663252SAlexander V. Chernikov * 84a6663252SAlexander V. Chernikov * nh_flags: NHF_ flags used in the dataplane code. NHF_GATEWAY or NHF_BLACKHOLE 85a6663252SAlexander V. Chernikov * can be examples of such flags. 86a6663252SAlexander V. Chernikov * nh_mtu: ready-to-use nexthop mtu. Already accounts for the link-level header, 87a6663252SAlexander V. Chernikov * interface MTU and protocol-specific limitations. 88a6663252SAlexander V. Chernikov * nh_prepend_len: link-level prepend length. Currently unused. 89a6663252SAlexander V. Chernikov * nh_ifp: logical transmit interface. The one from which if_transmit() will be 90a6663252SAlexander V. Chernikov * called. Guaranteed to be non-NULL. 91a6663252SAlexander V. Chernikov * nh_aifp: ifnet of the source address. Same as nh_ifp except IPv6 loopback 92a6663252SAlexander V. Chernikov * routes. See the example below. 93a6663252SAlexander V. Chernikov * nh_ifa: interface address to use. Guaranteed to be non-NULL. 94a6663252SAlexander V. Chernikov * nh_pksent: counter(9) reflecting the number of packets transmitted. 95a6663252SAlexander V. Chernikov * 96a6663252SAlexander V. Chernikov * gw_: storage suitable to hold AF_INET, AF_INET6 or AF_LINK gateway. More 97a6663252SAlexander V. Chernikov * details ara available in the examples below. 98a6663252SAlexander V. Chernikov * 99a6663252SAlexander V. Chernikov * Examples: 100a6663252SAlexander V. Chernikov * 101a6663252SAlexander V. Chernikov * Direct routes (routes w/o gateway): 102a6663252SAlexander V. Chernikov * NHF_GATEWAY is NOT set. 103a6663252SAlexander V. Chernikov * nh_ifp denotes the logical transmit interface (). 104a6663252SAlexander V. Chernikov * nh_aifp is the same as nh_ifp 105a6663252SAlexander V. Chernikov * gw_sa contains AF_LINK sa with nh_aifp ifindex (compat) 106a6663252SAlexander V. Chernikov * Loopback routes: 107a6663252SAlexander V. Chernikov * NHF_GATEWAY is NOT set. 108a6663252SAlexander V. Chernikov * nh_ifp points to the loopback interface (lo0). 109a6663252SAlexander V. Chernikov * nh_aifp points to the interface where the destination address belongs to. 110a6663252SAlexander V. Chernikov * This is useful in IPv6 link-local-over-loopback communications. 111a6663252SAlexander V. Chernikov * gw_sa contains AF_LINK sa with nh_aifp ifindex (compat) 112a6663252SAlexander V. Chernikov * GW routes: 113a6663252SAlexander V. Chernikov * NHF_GATEWAY is set. 114a6663252SAlexander V. Chernikov * nh_ifp denotes the logical transmit interface. 115a6663252SAlexander V. Chernikov * nh_aifp is the same as nh_ifp 116a6663252SAlexander V. Chernikov * gw_sa contains L3 address (either AF_INET or AF_INET6). 117a6663252SAlexander V. Chernikov * 118a6663252SAlexander V. Chernikov * 119a6663252SAlexander V. Chernikov * Note: struct nhop_object fields are ordered in a way that 120a6663252SAlexander V. Chernikov * supports memcmp-based comparisons. 121a6663252SAlexander V. Chernikov * 122a6663252SAlexander V. Chernikov */ 123a6663252SAlexander V. Chernikov #define NHOP_END_CMP (__offsetof(struct nhop_object, nh_pksent)) 124a6663252SAlexander V. Chernikov 125a6663252SAlexander V. Chernikov struct nhop_object { 126a6663252SAlexander V. Chernikov uint16_t nh_flags; /* nhop flags */ 127a6663252SAlexander V. Chernikov uint16_t nh_mtu; /* nexthop mtu */ 128a6663252SAlexander V. Chernikov union { 129a6663252SAlexander V. Chernikov struct sockaddr_in gw4_sa; /* GW accessor as IPv4 */ 130a6663252SAlexander V. Chernikov struct sockaddr_in6 gw6_sa; /* GW accessor as IPv6 */ 131a6663252SAlexander V. Chernikov struct sockaddr gw_sa; 132a6663252SAlexander V. Chernikov struct sockaddr_dl_short gwl_sa; /* AF_LINK gw (compat) */ 133a6663252SAlexander V. Chernikov char gw_buf[28]; 134a6663252SAlexander V. Chernikov }; 135a6663252SAlexander V. Chernikov struct ifnet *nh_ifp; /* Logical egress interface. Always != NULL */ 136a6663252SAlexander V. Chernikov struct ifaddr *nh_ifa; /* interface address to use. Always != NULL */ 137a6663252SAlexander V. Chernikov struct ifnet *nh_aifp; /* ifnet of the source address. Always != NULL */ 138a6663252SAlexander V. Chernikov counter_u64_t nh_pksent; /* packets sent using this nhop */ 139a6663252SAlexander V. Chernikov /* 32 bytes + 4xPTR == 64(amd64) / 48(i386) */ 140a6663252SAlexander V. Chernikov uint8_t nh_prepend_len; /* length of prepend data */ 141a6663252SAlexander V. Chernikov uint8_t spare[3]; 142a6663252SAlexander V. Chernikov uint32_t spare1; /* alignment */ 143a6663252SAlexander V. Chernikov char nh_prepend[48]; /* L2 prepend */ 144a6663252SAlexander V. Chernikov struct nhop_priv *nh_priv; /* control plane data */ 145a6663252SAlexander V. Chernikov /* -- 128 bytes -- */ 146a6663252SAlexander V. Chernikov }; 147a6663252SAlexander V. Chernikov 148a6663252SAlexander V. Chernikov /* 149a6663252SAlexander V. Chernikov * Nhop validness. 150a6663252SAlexander V. Chernikov * 151a6663252SAlexander V. Chernikov * Currently we verify whether link is up or not on every packet, which can be 152a6663252SAlexander V. Chernikov * quite costy. 153a6663252SAlexander V. Chernikov * TODO: subscribe for the interface notifications and update the nexthops 154a6663252SAlexander V. Chernikov * with NHF_INVALID flag. 155a6663252SAlexander V. Chernikov */ 156a6663252SAlexander V. Chernikov 157a6663252SAlexander V. Chernikov #define NH_IS_VALID(_nh) RT_LINK_IS_UP((_nh)->nh_ifp) 158fedeb08bSAlexander V. Chernikov #define NH_IS_NHGRP(_nh) ((_nh)->nh_flags & NHF_MULTIPATH) 159a6663252SAlexander V. Chernikov 160a6663252SAlexander V. Chernikov #define NH_FREE(_nh) do { \ 161a6663252SAlexander V. Chernikov nhop_free(_nh); \ 162a6663252SAlexander V. Chernikov /* guard against invalid refs */ \ 163a6663252SAlexander V. Chernikov _nh = NULL; \ 164a6663252SAlexander V. Chernikov } while (0) 165a6663252SAlexander V. Chernikov 166fedeb08bSAlexander V. Chernikov struct weightened_nhop { 167fedeb08bSAlexander V. Chernikov struct nhop_object *nh; 168fedeb08bSAlexander V. Chernikov uint32_t weight; 16976f1ab8eSAlexander V. Chernikov uint32_t storage; 170fedeb08bSAlexander V. Chernikov }; 171fedeb08bSAlexander V. Chernikov 172a6663252SAlexander V. Chernikov void nhop_free(struct nhop_object *nh); 173a6663252SAlexander V. Chernikov 174a6663252SAlexander V. Chernikov struct sysctl_req; 175a6663252SAlexander V. Chernikov struct sockaddr_dl; 176a6663252SAlexander V. Chernikov struct rib_head; 177a6663252SAlexander V. Chernikov 178800c6846SAlexander V. Chernikov /* flags that can be set using nhop_set_rtflags() */ 179800c6846SAlexander V. Chernikov #define RT_SET_RTFLAGS_MASK (RTF_PROTO1 | RTF_PROTO2 | RTF_PROTO3 | RTF_STATIC) 180800c6846SAlexander V. Chernikov #define RT_CHANGE_RTFLAGS_MASK RT_SET_RTFLAGS_MASK 181800c6846SAlexander V. Chernikov 182800c6846SAlexander V. Chernikov struct nhop_object *nhop_alloc(uint32_t fibnum, int family); 183800c6846SAlexander V. Chernikov void nhop_copy(struct nhop_object *nh, const struct nhop_object *nh_orig); 184800c6846SAlexander V. Chernikov struct nhop_object *nhop_get_nhop(struct nhop_object *nh, int *perror); 185800c6846SAlexander V. Chernikov 186800c6846SAlexander V. Chernikov void nhop_set_direct_gw(struct nhop_object *nh, struct ifnet *ifp); 187800c6846SAlexander V. Chernikov bool nhop_set_gw(struct nhop_object *nh, const struct sockaddr *sa, bool is_gw); 188800c6846SAlexander V. Chernikov 189800c6846SAlexander V. Chernikov 190800c6846SAlexander V. Chernikov void nhop_set_mtu(struct nhop_object *nh, uint32_t mtu, bool from_user); 191800c6846SAlexander V. Chernikov void nhop_set_rtflags(struct nhop_object *nh, int rt_flags); 192800c6846SAlexander V. Chernikov void nhop_set_pxtype_flag(struct nhop_object *nh, int nh_flag); 193800c6846SAlexander V. Chernikov void nhop_set_broadcast(struct nhop_object *nh, bool is_broadcast); 194800c6846SAlexander V. Chernikov void nhop_set_blackhole(struct nhop_object *nh, int blackhole_rt_flag); 195800c6846SAlexander V. Chernikov void nhop_set_pinned(struct nhop_object *nh, bool is_pinned); 196800c6846SAlexander V. Chernikov void nhop_set_redirect(struct nhop_object *nh, bool is_redirect); 197800c6846SAlexander V. Chernikov void nhop_set_type(struct nhop_object *nh, enum nhop_type nh_type); 198800c6846SAlexander V. Chernikov void nhop_set_src(struct nhop_object *nh, struct ifaddr *ifa); 199800c6846SAlexander V. Chernikov void nhop_set_transmit_ifp(struct nhop_object *nh, struct ifnet *ifp); 200800c6846SAlexander V. Chernikov 201a6663252SAlexander V. Chernikov uint32_t nhop_get_idx(const struct nhop_object *nh); 202a6663252SAlexander V. Chernikov enum nhop_type nhop_get_type(const struct nhop_object *nh); 203a6663252SAlexander V. Chernikov int nhop_get_rtflags(const struct nhop_object *nh); 2042bbab0afSAlexander V. Chernikov struct vnet *nhop_get_vnet(const struct nhop_object *nh); 2054e19e0d9SAlexander V. Chernikov struct nhop_object *nhop_select_func(struct nhop_object *nh, uint32_t flowid); 206823a08d7SAlexander V. Chernikov int nhop_get_upper_family(const struct nhop_object *nh); 207823a08d7SAlexander V. Chernikov int nhop_get_neigh_family(const struct nhop_object *nh); 208823a08d7SAlexander V. Chernikov uint32_t nhop_get_fibnum(const struct nhop_object *nh); 209*40503b79SAlexander V. Chernikov void nhop_set_fibnum(struct nhop_object *nh, uint32_t fibnum); 2102717e958SAlexander V. Chernikov uint32_t nhop_get_expire(const struct nhop_object *nh); 2112717e958SAlexander V. Chernikov void nhop_set_expire(struct nhop_object *nh, uint32_t expire); 212a6663252SAlexander V. Chernikov 213a6663252SAlexander V. Chernikov #endif /* _KERNEL */ 214a6663252SAlexander V. Chernikov 215a6663252SAlexander V. Chernikov /* Kernel <> userland structures */ 216a6663252SAlexander V. Chernikov 217a6663252SAlexander V. Chernikov /* Structure usage and layout are described in dump_nhop_entry() */ 218a6663252SAlexander V. Chernikov struct nhop_external { 219a6663252SAlexander V. Chernikov uint32_t nh_len; /* length of the datastructure */ 220a6663252SAlexander V. Chernikov uint32_t nh_idx; /* Nexthop index */ 221a6663252SAlexander V. Chernikov uint32_t nh_fib; /* Fib nexhop is attached to */ 222a6663252SAlexander V. Chernikov uint32_t ifindex; /* transmit interface ifindex */ 223a6663252SAlexander V. Chernikov uint32_t aifindex; /* address ifindex */ 224a6663252SAlexander V. Chernikov uint8_t prepend_len; /* length of the prepend */ 225a6663252SAlexander V. Chernikov uint8_t nh_family; /* address family */ 226a6663252SAlexander V. Chernikov uint16_t nh_type; /* nexthop type */ 227a6663252SAlexander V. Chernikov uint16_t nh_mtu; /* nexthop mtu */ 228a6663252SAlexander V. Chernikov 229a6663252SAlexander V. Chernikov uint16_t nh_flags; /* nhop flags */ 230a6663252SAlexander V. Chernikov struct in_addr nh_addr; /* GW/DST IPv4 address */ 231a6663252SAlexander V. Chernikov struct in_addr nh_src; /* default source IPv4 address */ 232a6663252SAlexander V. Chernikov uint64_t nh_pksent; 233a6663252SAlexander V. Chernikov /* control plane */ 234a6663252SAlexander V. Chernikov /* lookup key: address, family, type */ 235a6663252SAlexander V. Chernikov char nh_prepend[64]; /* L2 prepend */ 236a6663252SAlexander V. Chernikov uint64_t nh_refcount; /* number of references */ 237a6663252SAlexander V. Chernikov }; 238a6663252SAlexander V. Chernikov 239a6663252SAlexander V. Chernikov struct nhop_addrs { 240a6663252SAlexander V. Chernikov uint32_t na_len; /* length of the datastructure */ 241a6663252SAlexander V. Chernikov uint16_t gw_sa_off; /* offset of gateway SA */ 242a6663252SAlexander V. Chernikov uint16_t src_sa_off; /* offset of src address SA */ 243a6663252SAlexander V. Chernikov }; 244a6663252SAlexander V. Chernikov 245fedeb08bSAlexander V. Chernikov #define NHG_C_TYPE_CNHOPS 0x1 /* Control plane nhops list */ 246fedeb08bSAlexander V. Chernikov #define NHG_C_TYPE_DNHOPS 0x2 /* Dataplane nhops list */ 247fedeb08bSAlexander V. Chernikov struct nhgrp_container { 248fedeb08bSAlexander V. Chernikov uint32_t nhgc_len; /* container length */ 249fedeb08bSAlexander V. Chernikov uint16_t nhgc_count; /* number of items */ 250fedeb08bSAlexander V. Chernikov uint8_t nhgc_type; /* container type */ 251fedeb08bSAlexander V. Chernikov uint8_t nhgc_subtype; /* container subtype */ 252fedeb08bSAlexander V. Chernikov }; 253fedeb08bSAlexander V. Chernikov 254fedeb08bSAlexander V. Chernikov struct nhgrp_nhop_external { 255a6663252SAlexander V. Chernikov uint32_t nh_idx; 256a6663252SAlexander V. Chernikov uint32_t nh_weight; 257a6663252SAlexander V. Chernikov }; 258a6663252SAlexander V. Chernikov 259fedeb08bSAlexander V. Chernikov /* 260fedeb08bSAlexander V. Chernikov * Layout: 261fedeb08bSAlexander V. Chernikov * - nhgrp_external 262fedeb08bSAlexander V. Chernikov * - nhgrp_container (control plane nhops list) 263fedeb08bSAlexander V. Chernikov * - nhgrp_nhop_external 264fedeb08bSAlexander V. Chernikov * - nhgrp_nhop_external 265fedeb08bSAlexander V. Chernikov * .. 266fedeb08bSAlexander V. Chernikov * - nhgrp_container (dataplane nhops list) 267fedeb08bSAlexander V. Chernikov * - nhgrp_nhop_external 268fedeb08bSAlexander V. Chernikov * - nhgrp_nhop_external 269fedeb08bSAlexander V. Chernikov */ 270fedeb08bSAlexander V. Chernikov struct nhgrp_external { 271fedeb08bSAlexander V. Chernikov uint32_t nhg_idx; /* Nexthop group index */ 272fedeb08bSAlexander V. Chernikov uint32_t nhg_refcount; /* number of references */ 273a6663252SAlexander V. Chernikov }; 274a6663252SAlexander V. Chernikov 275a6663252SAlexander V. Chernikov #endif 276