xref: /freebsd/sys/net/route/nhop.h (revision 40503b792f7ecb9fcb349b2519036f85fa62fb4c)
1a6663252SAlexander V. Chernikov /*-
2a6663252SAlexander V. Chernikov  * SPDX-License-Identifier: BSD-2-Clause-FreeBSD
3a6663252SAlexander V. Chernikov  *
4a6663252SAlexander V. Chernikov  * Copyright (c) 2020 Alexander V. Chernikov
5a6663252SAlexander V. Chernikov  *
6a6663252SAlexander V. Chernikov  * Redistribution and use in source and binary forms, with or without
7a6663252SAlexander V. Chernikov  * modification, are permitted provided that the following conditions
8a6663252SAlexander V. Chernikov  * are met:
9a6663252SAlexander V. Chernikov  * 1. Redistributions of source code must retain the above copyright
10a6663252SAlexander V. Chernikov  *    notice, this list of conditions and the following disclaimer.
11a6663252SAlexander V. Chernikov  * 2. Redistributions in binary form must reproduce the above copyright
12a6663252SAlexander V. Chernikov  *    notice, this list of conditions and the following disclaimer in the
13a6663252SAlexander V. Chernikov  *    documentation and/or other materials provided with the distribution.
14a6663252SAlexander V. Chernikov  *
15a6663252SAlexander V. Chernikov  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
16a6663252SAlexander V. Chernikov  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17a6663252SAlexander V. Chernikov  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18a6663252SAlexander V. Chernikov  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
19a6663252SAlexander V. Chernikov  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
20a6663252SAlexander V. Chernikov  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
21a6663252SAlexander V. Chernikov  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
22a6663252SAlexander V. Chernikov  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
23a6663252SAlexander V. Chernikov  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
24a6663252SAlexander V. Chernikov  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
25a6663252SAlexander V. Chernikov  * SUCH DAMAGE.
26a6663252SAlexander V. Chernikov  *
27a6663252SAlexander V. Chernikov  * $FreeBSD$
28a6663252SAlexander V. Chernikov  */
29a6663252SAlexander V. Chernikov 
30a6663252SAlexander V. Chernikov /*
31a6663252SAlexander V. Chernikov  * This header file contains public definitions for the nexthop routing subsystem.
32a6663252SAlexander V. Chernikov  */
33a6663252SAlexander V. Chernikov 
34a6663252SAlexander V. Chernikov #ifndef	_NET_ROUTE_NHOP_H_
35a6663252SAlexander V. Chernikov #define	_NET_ROUTE_NHOP_H_
36a6663252SAlexander V. Chernikov 
37a6663252SAlexander V. Chernikov #include <netinet/in.h>			/* sockaddr_in && sockaddr_in6 */
38a6663252SAlexander V. Chernikov 
39a6663252SAlexander V. Chernikov #include <sys/counter.h>
40a6663252SAlexander V. Chernikov 
41a6663252SAlexander V. Chernikov enum nhop_type {
42a6663252SAlexander V. Chernikov 	NH_TYPE_IPV4_ETHER_RSLV = 1,	/* IPv4 ethernet without GW */
43a6663252SAlexander V. Chernikov 	NH_TYPE_IPV4_ETHER_NHOP = 2,	/* IPv4 with pre-calculated ethernet encap */
44a6663252SAlexander V. Chernikov 	NH_TYPE_IPV6_ETHER_RSLV = 3,	/* IPv6 ethernet, without GW */
45a6663252SAlexander V. Chernikov 	NH_TYPE_IPV6_ETHER_NHOP = 4	/* IPv6 with pre-calculated ethernet encap*/
46a6663252SAlexander V. Chernikov };
47a6663252SAlexander V. Chernikov 
48a6663252SAlexander V. Chernikov #ifdef _KERNEL
49a6663252SAlexander V. Chernikov 
50a6663252SAlexander V. Chernikov /*
51a6663252SAlexander V. Chernikov  * Define shorter version of AF_LINK sockaddr.
52a6663252SAlexander V. Chernikov  *
53a6663252SAlexander V. Chernikov  * Currently the only use case of AF_LINK gateway is storing
54a6663252SAlexander V. Chernikov  * interface index of the interface of the source IPv6 address.
55a6663252SAlexander V. Chernikov  * This is used by the IPv6 code for the connections over loopback
56a6663252SAlexander V. Chernikov  * interface.
57a6663252SAlexander V. Chernikov  *
58a6663252SAlexander V. Chernikov  * The structure below copies 'struct sockaddr_dl', reducing the
59a6663252SAlexander V. Chernikov  * size of sdl_data buffer, as it is not used. This change
60a6663252SAlexander V. Chernikov  * allows to store the AF_LINK gateways in the nhop gateway itself,
61a6663252SAlexander V. Chernikov  * simplifying control plane handling.
62a6663252SAlexander V. Chernikov  */
63a6663252SAlexander V. Chernikov struct sockaddr_dl_short {
64a6663252SAlexander V. Chernikov 	u_char	sdl_len;	/* Total length of sockaddr */
65a6663252SAlexander V. Chernikov 	u_char	sdl_family;	/* AF_LINK */
66a6663252SAlexander V. Chernikov 	u_short	sdl_index;	/* if != 0, system given index for interface */
67a6663252SAlexander V. Chernikov 	u_char	sdl_type;	/* interface type */
68a6663252SAlexander V. Chernikov 	u_char	sdl_nlen;	/* interface name length, no trailing 0 reqd. */
69a6663252SAlexander V. Chernikov 	u_char	sdl_alen;	/* link level address length */
70a6663252SAlexander V. Chernikov 	u_char	sdl_slen;	/* link layer selector length */
71a6663252SAlexander V. Chernikov 	char	sdl_data[8];	/* unused */
72a6663252SAlexander V. Chernikov };
73a6663252SAlexander V. Chernikov 
74a6663252SAlexander V. Chernikov #define	NHOP_RELATED_FLAGS	\
75a6663252SAlexander V. Chernikov 	(RTF_GATEWAY | RTF_HOST | RTF_REJECT | RTF_BLACKHOLE | \
76a6663252SAlexander V. Chernikov 	 RTF_FIXEDMTU | RTF_LOCAL | RTF_BROADCAST | RTF_MULTICAST)
77a6663252SAlexander V. Chernikov 
78a6663252SAlexander V. Chernikov struct nh_control;
79a6663252SAlexander V. Chernikov struct nhop_priv;
80a6663252SAlexander V. Chernikov 
81a6663252SAlexander V. Chernikov /*
82a6663252SAlexander V. Chernikov  * Struct 'nhop_object' field description:
83a6663252SAlexander V. Chernikov  *
84a6663252SAlexander V. Chernikov  * nh_flags: NHF_ flags used in the dataplane code. NHF_GATEWAY or NHF_BLACKHOLE
85a6663252SAlexander V. Chernikov  *   can be examples of such flags.
86a6663252SAlexander V. Chernikov  * nh_mtu: ready-to-use nexthop mtu. Already accounts for the link-level header,
87a6663252SAlexander V. Chernikov  *   interface MTU and protocol-specific limitations.
88a6663252SAlexander V. Chernikov  * nh_prepend_len: link-level prepend length. Currently unused.
89a6663252SAlexander V. Chernikov  * nh_ifp: logical transmit interface. The one from which if_transmit() will be
90a6663252SAlexander V. Chernikov  *   called. Guaranteed to be non-NULL.
91a6663252SAlexander V. Chernikov  * nh_aifp: ifnet of the source address. Same as nh_ifp except IPv6 loopback
92a6663252SAlexander V. Chernikov  *   routes. See the example below.
93a6663252SAlexander V. Chernikov  * nh_ifa: interface address to use. Guaranteed to be non-NULL.
94a6663252SAlexander V. Chernikov  * nh_pksent: counter(9) reflecting the number of packets transmitted.
95a6663252SAlexander V. Chernikov  *
96a6663252SAlexander V. Chernikov  * gw_: storage suitable to hold AF_INET, AF_INET6 or AF_LINK gateway. More
97a6663252SAlexander V. Chernikov  *   details ara available in the examples below.
98a6663252SAlexander V. Chernikov  *
99a6663252SAlexander V. Chernikov  * Examples:
100a6663252SAlexander V. Chernikov  *
101a6663252SAlexander V. Chernikov  * Direct routes (routes w/o gateway):
102a6663252SAlexander V. Chernikov  *  NHF_GATEWAY is NOT set.
103a6663252SAlexander V. Chernikov  *  nh_ifp denotes the logical transmit interface ().
104a6663252SAlexander V. Chernikov  *  nh_aifp is the same as nh_ifp
105a6663252SAlexander V. Chernikov  *  gw_sa contains AF_LINK sa with nh_aifp ifindex (compat)
106a6663252SAlexander V. Chernikov  * Loopback routes:
107a6663252SAlexander V. Chernikov  *  NHF_GATEWAY is NOT set.
108a6663252SAlexander V. Chernikov  *  nh_ifp points to the loopback interface (lo0).
109a6663252SAlexander V. Chernikov  *  nh_aifp points to the interface where the destination address belongs to.
110a6663252SAlexander V. Chernikov  *    This is useful in IPv6 link-local-over-loopback communications.
111a6663252SAlexander V. Chernikov  *  gw_sa contains AF_LINK sa with nh_aifp ifindex (compat)
112a6663252SAlexander V. Chernikov  * GW routes:
113a6663252SAlexander V. Chernikov  *  NHF_GATEWAY is set.
114a6663252SAlexander V. Chernikov  *  nh_ifp denotes the logical transmit interface.
115a6663252SAlexander V. Chernikov  *  nh_aifp is the same as nh_ifp
116a6663252SAlexander V. Chernikov  *  gw_sa contains L3 address (either AF_INET or AF_INET6).
117a6663252SAlexander V. Chernikov  *
118a6663252SAlexander V. Chernikov  *
119a6663252SAlexander V. Chernikov  * Note: struct nhop_object fields are ordered in a way that
120a6663252SAlexander V. Chernikov  *  supports memcmp-based comparisons.
121a6663252SAlexander V. Chernikov  *
122a6663252SAlexander V. Chernikov  */
123a6663252SAlexander V. Chernikov #define	NHOP_END_CMP	(__offsetof(struct nhop_object, nh_pksent))
124a6663252SAlexander V. Chernikov 
125a6663252SAlexander V. Chernikov struct nhop_object {
126a6663252SAlexander V. Chernikov 	uint16_t		nh_flags;	/* nhop flags */
127a6663252SAlexander V. Chernikov 	uint16_t		nh_mtu;		/* nexthop mtu */
128a6663252SAlexander V. Chernikov 	union {
129a6663252SAlexander V. Chernikov 		struct sockaddr_in		gw4_sa;	/* GW accessor as IPv4 */
130a6663252SAlexander V. Chernikov 		struct sockaddr_in6		gw6_sa; /* GW accessor as IPv6 */
131a6663252SAlexander V. Chernikov 		struct sockaddr			gw_sa;
132a6663252SAlexander V. Chernikov 		struct sockaddr_dl_short	gwl_sa; /* AF_LINK gw (compat) */
133a6663252SAlexander V. Chernikov 		char				gw_buf[28];
134a6663252SAlexander V. Chernikov 	};
135a6663252SAlexander V. Chernikov 	struct ifnet		*nh_ifp;	/* Logical egress interface. Always != NULL */
136a6663252SAlexander V. Chernikov 	struct ifaddr		*nh_ifa;	/* interface address to use. Always != NULL */
137a6663252SAlexander V. Chernikov 	struct ifnet		*nh_aifp;	/* ifnet of the source address. Always != NULL */
138a6663252SAlexander V. Chernikov 	counter_u64_t		nh_pksent;	/* packets sent using this nhop */
139a6663252SAlexander V. Chernikov 	/* 32 bytes + 4xPTR == 64(amd64) / 48(i386)  */
140a6663252SAlexander V. Chernikov 	uint8_t			nh_prepend_len;	/* length of prepend data */
141a6663252SAlexander V. Chernikov 	uint8_t			spare[3];
142a6663252SAlexander V. Chernikov 	uint32_t		spare1;		/* alignment */
143a6663252SAlexander V. Chernikov 	char			nh_prepend[48];	/* L2 prepend */
144a6663252SAlexander V. Chernikov 	struct nhop_priv	*nh_priv;	/* control plane data */
145a6663252SAlexander V. Chernikov 	/* -- 128 bytes -- */
146a6663252SAlexander V. Chernikov };
147a6663252SAlexander V. Chernikov 
148a6663252SAlexander V. Chernikov /*
149a6663252SAlexander V. Chernikov  * Nhop validness.
150a6663252SAlexander V. Chernikov  *
151a6663252SAlexander V. Chernikov  * Currently we verify whether link is up or not on every packet, which can be
152a6663252SAlexander V. Chernikov  *   quite costy.
153a6663252SAlexander V. Chernikov  * TODO: subscribe for the interface notifications and update the nexthops
154a6663252SAlexander V. Chernikov  *  with NHF_INVALID flag.
155a6663252SAlexander V. Chernikov  */
156a6663252SAlexander V. Chernikov 
157a6663252SAlexander V. Chernikov #define	NH_IS_VALID(_nh)	RT_LINK_IS_UP((_nh)->nh_ifp)
158fedeb08bSAlexander V. Chernikov #define	NH_IS_NHGRP(_nh)	((_nh)->nh_flags & NHF_MULTIPATH)
159a6663252SAlexander V. Chernikov 
160a6663252SAlexander V. Chernikov #define	NH_FREE(_nh) do {					\
161a6663252SAlexander V. Chernikov 	nhop_free(_nh);	\
162a6663252SAlexander V. Chernikov 	/* guard against invalid refs */			\
163a6663252SAlexander V. Chernikov 	_nh = NULL;						\
164a6663252SAlexander V. Chernikov } while (0)
165a6663252SAlexander V. Chernikov 
166fedeb08bSAlexander V. Chernikov struct weightened_nhop {
167fedeb08bSAlexander V. Chernikov 	struct nhop_object	*nh;
168fedeb08bSAlexander V. Chernikov 	uint32_t		weight;
16976f1ab8eSAlexander V. Chernikov 	uint32_t		storage;
170fedeb08bSAlexander V. Chernikov };
171fedeb08bSAlexander V. Chernikov 
172a6663252SAlexander V. Chernikov void nhop_free(struct nhop_object *nh);
173a6663252SAlexander V. Chernikov 
174a6663252SAlexander V. Chernikov struct sysctl_req;
175a6663252SAlexander V. Chernikov struct sockaddr_dl;
176a6663252SAlexander V. Chernikov struct rib_head;
177a6663252SAlexander V. Chernikov 
178800c6846SAlexander V. Chernikov /* flags that can be set using nhop_set_rtflags() */
179800c6846SAlexander V. Chernikov #define	RT_SET_RTFLAGS_MASK     (RTF_PROTO1 | RTF_PROTO2 | RTF_PROTO3 | RTF_STATIC)
180800c6846SAlexander V. Chernikov #define	RT_CHANGE_RTFLAGS_MASK	RT_SET_RTFLAGS_MASK
181800c6846SAlexander V. Chernikov 
182800c6846SAlexander V. Chernikov struct nhop_object *nhop_alloc(uint32_t fibnum, int family);
183800c6846SAlexander V. Chernikov void nhop_copy(struct nhop_object *nh, const struct nhop_object *nh_orig);
184800c6846SAlexander V. Chernikov struct nhop_object *nhop_get_nhop(struct nhop_object *nh, int *perror);
185800c6846SAlexander V. Chernikov 
186800c6846SAlexander V. Chernikov void nhop_set_direct_gw(struct nhop_object *nh, struct ifnet *ifp);
187800c6846SAlexander V. Chernikov bool nhop_set_gw(struct nhop_object *nh, const struct sockaddr *sa, bool is_gw);
188800c6846SAlexander V. Chernikov 
189800c6846SAlexander V. Chernikov 
190800c6846SAlexander V. Chernikov void nhop_set_mtu(struct nhop_object *nh, uint32_t mtu, bool from_user);
191800c6846SAlexander V. Chernikov void nhop_set_rtflags(struct nhop_object *nh, int rt_flags);
192800c6846SAlexander V. Chernikov void nhop_set_pxtype_flag(struct nhop_object *nh, int nh_flag);
193800c6846SAlexander V. Chernikov void nhop_set_broadcast(struct nhop_object *nh, bool is_broadcast);
194800c6846SAlexander V. Chernikov void nhop_set_blackhole(struct nhop_object *nh, int blackhole_rt_flag);
195800c6846SAlexander V. Chernikov void nhop_set_pinned(struct nhop_object *nh, bool is_pinned);
196800c6846SAlexander V. Chernikov void nhop_set_redirect(struct nhop_object *nh, bool is_redirect);
197800c6846SAlexander V. Chernikov void nhop_set_type(struct nhop_object *nh, enum nhop_type nh_type);
198800c6846SAlexander V. Chernikov void nhop_set_src(struct nhop_object *nh, struct ifaddr *ifa);
199800c6846SAlexander V. Chernikov void nhop_set_transmit_ifp(struct nhop_object *nh, struct ifnet *ifp);
200800c6846SAlexander V. Chernikov 
201a6663252SAlexander V. Chernikov uint32_t nhop_get_idx(const struct nhop_object *nh);
202a6663252SAlexander V. Chernikov enum nhop_type nhop_get_type(const struct nhop_object *nh);
203a6663252SAlexander V. Chernikov int nhop_get_rtflags(const struct nhop_object *nh);
2042bbab0afSAlexander V. Chernikov struct vnet *nhop_get_vnet(const struct nhop_object *nh);
2054e19e0d9SAlexander V. Chernikov struct nhop_object *nhop_select_func(struct nhop_object *nh, uint32_t flowid);
206823a08d7SAlexander V. Chernikov int nhop_get_upper_family(const struct nhop_object *nh);
207823a08d7SAlexander V. Chernikov int nhop_get_neigh_family(const struct nhop_object *nh);
208823a08d7SAlexander V. Chernikov uint32_t nhop_get_fibnum(const struct nhop_object *nh);
209*40503b79SAlexander V. Chernikov void nhop_set_fibnum(struct nhop_object *nh, uint32_t fibnum);
2102717e958SAlexander V. Chernikov uint32_t nhop_get_expire(const struct nhop_object *nh);
2112717e958SAlexander V. Chernikov void nhop_set_expire(struct nhop_object *nh, uint32_t expire);
212a6663252SAlexander V. Chernikov 
213a6663252SAlexander V. Chernikov #endif /* _KERNEL */
214a6663252SAlexander V. Chernikov 
215a6663252SAlexander V. Chernikov /* Kernel <> userland structures */
216a6663252SAlexander V. Chernikov 
217a6663252SAlexander V. Chernikov /* Structure usage and layout are described in dump_nhop_entry() */
218a6663252SAlexander V. Chernikov struct nhop_external {
219a6663252SAlexander V. Chernikov 	uint32_t	nh_len;		/* length of the datastructure */
220a6663252SAlexander V. Chernikov 	uint32_t	nh_idx;		/* Nexthop index */
221a6663252SAlexander V. Chernikov 	uint32_t	nh_fib;		/* Fib nexhop is attached to */
222a6663252SAlexander V. Chernikov 	uint32_t	ifindex;	/* transmit interface ifindex */
223a6663252SAlexander V. Chernikov 	uint32_t	aifindex;	/* address ifindex */
224a6663252SAlexander V. Chernikov 	uint8_t		prepend_len;	/* length of the prepend */
225a6663252SAlexander V. Chernikov 	uint8_t		nh_family;	/* address family */
226a6663252SAlexander V. Chernikov 	uint16_t	nh_type;	/* nexthop type */
227a6663252SAlexander V. Chernikov 	uint16_t	nh_mtu;		/* nexthop mtu */
228a6663252SAlexander V. Chernikov 
229a6663252SAlexander V. Chernikov 	uint16_t	nh_flags;	/* nhop flags */
230a6663252SAlexander V. Chernikov 	struct in_addr	nh_addr;	/* GW/DST IPv4 address */
231a6663252SAlexander V. Chernikov 	struct in_addr	nh_src;		/* default source IPv4 address */
232a6663252SAlexander V. Chernikov 	uint64_t	nh_pksent;
233a6663252SAlexander V. Chernikov 	/* control plane */
234a6663252SAlexander V. Chernikov 	/* lookup key: address, family, type */
235a6663252SAlexander V. Chernikov 	char		nh_prepend[64];	/* L2 prepend */
236a6663252SAlexander V. Chernikov 	uint64_t	nh_refcount;	/* number of references */
237a6663252SAlexander V. Chernikov };
238a6663252SAlexander V. Chernikov 
239a6663252SAlexander V. Chernikov struct nhop_addrs {
240a6663252SAlexander V. Chernikov 	uint32_t	na_len;		/* length of the datastructure */
241a6663252SAlexander V. Chernikov 	uint16_t	gw_sa_off;	/* offset of gateway SA */
242a6663252SAlexander V. Chernikov 	uint16_t	src_sa_off;	/* offset of src address SA */
243a6663252SAlexander V. Chernikov };
244a6663252SAlexander V. Chernikov 
245fedeb08bSAlexander V. Chernikov #define	NHG_C_TYPE_CNHOPS	0x1	/* Control plane nhops list */
246fedeb08bSAlexander V. Chernikov #define	NHG_C_TYPE_DNHOPS	0x2	/* Dataplane nhops list */
247fedeb08bSAlexander V. Chernikov struct nhgrp_container {
248fedeb08bSAlexander V. Chernikov 	uint32_t	nhgc_len;	/* container length */
249fedeb08bSAlexander V. Chernikov 	uint16_t	nhgc_count;	/* number of items */
250fedeb08bSAlexander V. Chernikov 	uint8_t		nhgc_type;	/* container type */
251fedeb08bSAlexander V. Chernikov 	uint8_t		nhgc_subtype;	/* container subtype */
252fedeb08bSAlexander V. Chernikov };
253fedeb08bSAlexander V. Chernikov 
254fedeb08bSAlexander V. Chernikov struct nhgrp_nhop_external {
255a6663252SAlexander V. Chernikov 	uint32_t	nh_idx;
256a6663252SAlexander V. Chernikov 	uint32_t	nh_weight;
257a6663252SAlexander V. Chernikov };
258a6663252SAlexander V. Chernikov 
259fedeb08bSAlexander V. Chernikov /*
260fedeb08bSAlexander V. Chernikov  * Layout:
261fedeb08bSAlexander V. Chernikov  * - nhgrp_external
262fedeb08bSAlexander V. Chernikov  * - nhgrp_container (control plane nhops list)
263fedeb08bSAlexander V. Chernikov  *   - nhgrp_nhop_external
264fedeb08bSAlexander V. Chernikov  *   - nhgrp_nhop_external
265fedeb08bSAlexander V. Chernikov  *   ..
266fedeb08bSAlexander V. Chernikov  * - nhgrp_container (dataplane nhops list)
267fedeb08bSAlexander V. Chernikov  *   - nhgrp_nhop_external
268fedeb08bSAlexander V. Chernikov  *   - nhgrp_nhop_external
269fedeb08bSAlexander V. Chernikov  */
270fedeb08bSAlexander V. Chernikov struct nhgrp_external {
271fedeb08bSAlexander V. Chernikov 	uint32_t	nhg_idx;	/* Nexthop group index */
272fedeb08bSAlexander V. Chernikov 	uint32_t	nhg_refcount;	/* number of references */
273a6663252SAlexander V. Chernikov };
274a6663252SAlexander V. Chernikov 
275a6663252SAlexander V. Chernikov #endif
276