xref: /linux/include/net/ip6_route.h (revision dfecb0c5af3b07ebfa84be63a7a21bfc9e29a872)
1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _NET_IP6_ROUTE_H
3 #define _NET_IP6_ROUTE_H
4 
5 #include <net/addrconf.h>
6 #include <net/flow.h>
7 #include <net/ip6_fib.h>
8 #include <net/sock.h>
9 #include <net/lwtunnel.h>
10 #include <linux/ip.h>
11 #include <linux/ipv6.h>
12 #include <linux/route.h>
13 #include <net/nexthop.h>
14 
15 struct route_info {
16 	__u8			type;
17 	__u8			length;
18 	__u8			prefix_len;
19 #if defined(__BIG_ENDIAN_BITFIELD)
20 	__u8			reserved_h:3,
21 				route_pref:2,
22 				reserved_l:3;
23 #elif defined(__LITTLE_ENDIAN_BITFIELD)
24 	__u8			reserved_l:3,
25 				route_pref:2,
26 				reserved_h:3;
27 #endif
28 	__be32			lifetime;
29 	__u8			prefix[];	/* 0,8 or 16 */
30 };
31 
/*
 * Bits for the "flags" argument taken by the lookup helpers declared in
 * this header.  Every flag occupies exactly one bit; the three SRCPREF
 * bits start at bit 3.
 */
#define RT6_LOOKUP_F_IFACE		(1 << 0)
#define RT6_LOOKUP_F_REACHABLE		(1 << 1)
#define RT6_LOOKUP_F_HAS_SADDR		(1 << 2)
#define RT6_LOOKUP_F_SRCPREF_TMP	(1 << 3)
#define RT6_LOOKUP_F_SRCPREF_PUBLIC	(1 << 4)
#define RT6_LOOKUP_F_SRCPREF_COA	(1 << 5)
#define RT6_LOOKUP_F_IGNORE_LINKSTATE	(1 << 6)
#define RT6_LOOKUP_F_DST_NOREF		(1 << 7)
40 
/*
 * IPv6 jumbograms (RFC 2675) are not supported (yet ?), so the upper
 * bound is the largest 16-bit length plus the IPv6 header itself:
 * unlike IPv4, hdr->seg_len doesn't include the IPv6 header.
 */
#define IP6_MAX_MTU (sizeof(struct ipv6hdr) + 0xFFFF)
45 
46 /*
47  * rt6_srcprefs2flags() and rt6_flags2srcprefs() translate
48  * between IPV6_ADDR_PREFERENCES socket option values
49  *	IPV6_PREFER_SRC_TMP    = 0x1
50  *	IPV6_PREFER_SRC_PUBLIC = 0x2
51  *	IPV6_PREFER_SRC_COA    = 0x4
52  * and above RT6_LOOKUP_F_SRCPREF_xxx flags.
53  */
54 static inline int rt6_srcprefs2flags(unsigned int srcprefs)
55 {
56 	return (srcprefs & IPV6_PREFER_SRC_MASK) << 3;
57 }
58 
59 static inline unsigned int rt6_flags2srcprefs(int flags)
60 {
61 	return (flags >> 3) & IPV6_PREFER_SRC_MASK;
62 }
63 
64 static inline bool rt6_need_strict(const struct in6_addr *daddr)
65 {
66 	return ipv6_addr_type(daddr) &
67 		(IPV6_ADDR_MULTICAST | IPV6_ADDR_LINKLOCAL | IPV6_ADDR_LOOPBACK);
68 }
69 
70 /* fib entries using a nexthop object can not be coalesced into
71  * a multipath route
72  */
73 static inline bool rt6_qualify_for_ecmp(const struct fib6_info *f6i)
74 {
75 	/* the RTF_ADDRCONF flag filters out RA's */
76 	return !(f6i->fib6_flags & RTF_ADDRCONF) && !f6i->nh &&
77 		f6i->fib6_nh->fib_nh_gw_family;
78 }
79 
80 #if IS_ENABLED(CONFIG_IPV6)
81 void ip6_route_input(struct sk_buff *skb);
82 #else
83 static inline void ip6_route_input(struct sk_buff *skb)
84 {
85 }
86 #endif
87 
/* Lookups that hand back a struct dst_entry; defined outside this header. */
struct dst_entry *
ip6_route_input_lookup(struct net *net, struct net_device *dev,
		       struct flowi6 *fl6, const struct sk_buff *skb,
		       int flags);

struct dst_entry *
ip6_route_output_flags(struct net *net, const struct sock *sk,
		       struct flowi6 *fl6, int flags);
95 
/* Convenience form of ip6_route_output_flags() that passes flags == 0. */
static inline struct dst_entry *
ip6_route_output(struct net *net, const struct sock *sk, struct flowi6 *fl6)
{
	const int no_flags = 0;

	return ip6_route_output_flags(net, sk, fl6, no_flags);
}
102 
103 /* Only conditionally release dst if flags indicates
104  * !RT6_LOOKUP_F_DST_NOREF or dst is in uncached_list.
105  */
106 static inline void ip6_rt_put_flags(struct rt6_info *rt, int flags)
107 {
108 	if (!(flags & RT6_LOOKUP_F_DST_NOREF) ||
109 	    !list_empty(&rt->dst.rt_uncached))
110 		ip6_rt_put(rt);
111 }
112 
/* Lookup entry points defined outside this header. */
struct dst_entry *
ip6_route_lookup(struct net *net, struct flowi6 *fl6,
		 const struct sk_buff *skb, int flags);

struct rt6_info *
ip6_pol_route(struct net *net, struct fib6_table *table, int ifindex,
	      struct flowi6 *fl6, const struct sk_buff *skb, int flags);
118 
/* Init and cleanup hooks; defined outside this header. */
int ip6_route_init(void);
void ip6_route_init_special_entries(void);
void ip6_route_cleanup(void);
122 
123 int ipv6_route_ioctl(struct net *net, unsigned int cmd,
124 		struct in6_rtmsg *rtmsg);
125 
126 int ip6_route_add(struct fib6_config *cfg, gfp_t gfp_flags,
127 		  struct netlink_ext_ack *extack);
128 int ip6_ins_rt(struct net *net, struct fib6_info *f6i);
129 #if IS_ENABLED(CONFIG_IPV6)
130 int ip6_del_rt(struct net *net, struct fib6_info *f6i, bool skip_notify);
131 #else
132 static inline int ip6_del_rt(struct net *net, struct fib6_info *f6i,
133 			     bool skip_notify)
134 {
135 	return -EAFNOSUPPORT;
136 }
137 #endif
138 
/* Per-fib6_info exception handling; defined outside this header. */
void rt6_flush_exceptions(struct fib6_info *f6i);

void rt6_age_exceptions(struct fib6_info *f6i,
			struct fib6_gc_args *gc_args,
			unsigned long now);
142 
143 static inline int ip6_route_get_saddr(struct net *net, struct fib6_info *f6i,
144 				      const struct in6_addr *daddr,
145 				      unsigned int prefs, int l3mdev_index,
146 				      struct in6_addr *saddr)
147 {
148 	struct net_device *l3mdev;
149 	struct net_device *dev;
150 	bool same_vrf;
151 	int err = 0;
152 
153 	rcu_read_lock();
154 
155 	l3mdev = dev_get_by_index_rcu(net, l3mdev_index);
156 	if (!f6i || !f6i->fib6_prefsrc.plen || l3mdev)
157 		dev = f6i ? fib6_info_nh_dev(f6i) : NULL;
158 	same_vrf = !l3mdev || l3mdev_master_dev_rcu(dev) == l3mdev;
159 	if (f6i && f6i->fib6_prefsrc.plen && same_vrf)
160 		*saddr = f6i->fib6_prefsrc.addr;
161 	else
162 		err = ipv6_dev_get_saddr(net, same_vrf ? dev : l3mdev, daddr, prefs, saddr);
163 
164 	rcu_read_unlock();
165 
166 	return err;
167 }
168 
169 struct rt6_info *rt6_lookup(struct net *net, const struct in6_addr *daddr,
170 			    const struct in6_addr *saddr, int oif,
171 			    const struct sk_buff *skb, int flags);
172 u32 rt6_multipath_hash(const struct net *net, const struct flowi6 *fl6,
173 		       const struct sk_buff *skb, struct flow_keys *hkeys);
174 
/* Defined outside this header. */
struct dst_entry *icmp6_dst_alloc(struct net_device *dev,
				  struct flowi6 *fl6);

void fib6_force_start_gc(struct net *net);
178 
179 struct fib6_info *addrconf_f6i_alloc(struct net *net, struct inet6_dev *idev,
180 				     const struct in6_addr *addr, bool anycast,
181 				     gfp_t gfp_flags, struct netlink_ext_ack *extack);
182 
183 struct rt6_info *ip6_dst_alloc(struct net *net, struct net_device *dev,
184 			       int flags);
185 
186 /*
187  *	support functions for ND
188  *
189  */
190 struct fib6_info *rt6_get_dflt_router(struct net *net,
191 				     const struct in6_addr *addr,
192 				     struct net_device *dev);
193 struct fib6_info *rt6_add_dflt_router(struct net *net,
194 				     const struct in6_addr *gwaddr,
195 				     struct net_device *dev, unsigned int pref,
196 				     u32 defrtr_usr_metric,
197 				     int lifetime);
198 
199 void rt6_purge_dflt_routers(struct net *net);
200 
201 int rt6_route_rcv(struct net_device *dev, u8 *opt, int len,
202 		  const struct in6_addr *gwaddr);
203 
204 void ip6_update_pmtu(struct sk_buff *skb, struct net *net, __be32 mtu, int oif,
205 		     u32 mark, kuid_t uid);
206 void ip6_sk_update_pmtu(struct sk_buff *skb, struct sock *sk, __be32 mtu);
207 void ip6_redirect(struct sk_buff *skb, struct net *net, int oif, u32 mark,
208 		  kuid_t uid);
209 void ip6_redirect_no_header(struct sk_buff *skb, struct net *net, int oif);
210 void ip6_sk_redirect(struct sk_buff *skb, struct sock *sk);
211 
212 struct netlink_callback;
213 
214 struct rt6_rtnl_dump_arg {
215 	struct sk_buff *skb;
216 	struct netlink_callback *cb;
217 	struct net *net;
218 	struct fib_dump_filter filter;
219 };
220 
/* Dump, MTU, prefsrc and device-state hooks; defined outside this header. */
int rt6_dump_route(struct fib6_info *f6i, void *p_arg, unsigned int skip);

void rt6_mtu_change(struct net_device *dev, unsigned int mtu);
void rt6_remove_prefsrc(struct inet6_ifaddr *ifp);
void rt6_clean_tohost(struct net *net, struct in6_addr *gateway);

void rt6_sync_up(struct net_device *dev, unsigned char nh_flags);
void rt6_disable_ip(struct net_device *dev, unsigned long event);
void rt6_sync_down_dev(struct net_device *dev, unsigned long event);

void rt6_multipath_rebalance(struct fib6_info *f6i);
229 
/* Uncached-list add/del pair; defined outside this header. */
void rt6_uncached_list_add(struct rt6_info *rt);
void rt6_uncached_list_del(struct rt6_info *rt);
232 
233 static inline const struct rt6_info *skb_rt6_info(const struct sk_buff *skb)
234 {
235 	const struct dst_entry *dst = skb_dst(skb);
236 
237 	if (dst)
238 		return dst_rt6_info(dst);
239 
240 	return NULL;
241 }
242 
243 /*
244  *	Store a destination cache entry in a socket
245  */
246 static inline void ip6_dst_store(struct sock *sk, struct dst_entry *dst,
247 				 bool daddr_set,
248 				 bool saddr_set)
249 {
250 	struct ipv6_pinfo *np = inet6_sk(sk);
251 
252 	np->dst_cookie = rt6_get_cookie(dst_rt6_info(dst));
253 	sk_setup_caps(sk, dst);
254 	np->daddr_cache = daddr_set;
255 #ifdef CONFIG_IPV6_SUBTREES
256 	np->saddr_cache = saddr_set;
257 #endif
258 }
259 
/* Defined outside this header. */
void ip6_sk_dst_store_flow(struct sock *sk,
			   struct dst_entry *dst,
			   const struct flowi6 *fl6);
262 
263 static inline bool ipv6_unicast_destination(const struct sk_buff *skb)
264 {
265 	const struct rt6_info *rt = dst_rt6_info(skb_dst(skb));
266 
267 	return rt->rt6i_flags & RTF_LOCAL;
268 }
269 
270 static inline bool __ipv6_anycast_destination(const struct rt6key *rt6i_dst,
271 					      u32 rt6i_flags,
272 					      const struct in6_addr *daddr)
273 {
274 	return rt6i_flags & RTF_ANYCAST ||
275 	       (rt6i_dst->plen < 127 &&
276 	       !(rt6i_flags & (RTF_GATEWAY | RTF_NONEXTHOP)) &&
277 	       ipv6_addr_equal(&rt6i_dst->addr, daddr));
278 }
279 
280 static inline bool ipv6_anycast_destination(const struct dst_entry *dst,
281 					    const struct in6_addr *daddr)
282 {
283 	const struct rt6_info *rt = dst_rt6_info(dst);
284 
285 	return __ipv6_anycast_destination(&rt->rt6i_dst, rt->rt6i_flags, daddr);
286 }
287 
288 #if IS_ENABLED(CONFIG_IPV6)
289 int ip6_fragment(struct net *net, struct sock *sk, struct sk_buff *skb,
290 		 int (*output)(struct net *, struct sock *, struct sk_buff *));
291 #else
292 static inline int ip6_fragment(struct net *net, struct sock *sk,
293 			       struct sk_buff *skb,
294 			       int (*output)(struct net *, struct sock *,
295 					     struct sk_buff *))
296 {
297 	kfree_skb(skb);
298 	return -EAFNOSUPPORT;
299 }
300 #endif
301 
302 /* Variant of dst_mtu() for IPv6 users */
303 static inline u32 dst6_mtu(const struct dst_entry *dst)
304 {
305 	return INDIRECT_CALL_1(dst->ops->mtu, ip6_mtu, dst);
306 }
307 
308 static inline unsigned int ip6_skb_dst_mtu(const struct sk_buff *skb)
309 {
310 	const struct ipv6_pinfo *np = skb->sk && !dev_recursion_level() ?
311 				inet6_sk(skb->sk) : NULL;
312 	const struct dst_entry *dst = skb_dst(skb);
313 	unsigned int mtu;
314 
315 	if (np && READ_ONCE(np->pmtudisc) >= IPV6_PMTUDISC_PROBE) {
316 		mtu = READ_ONCE(dst_dev(dst)->mtu);
317 		mtu -= lwtunnel_headroom(dst->lwtstate, mtu);
318 	} else {
319 		mtu = dst_mtu(dst);
320 	}
321 	return mtu;
322 }
323 
324 static inline bool ip6_sk_accept_pmtu(const struct sock *sk)
325 {
326 	u8 pmtudisc = READ_ONCE(inet6_sk(sk)->pmtudisc);
327 
328 	return pmtudisc != IPV6_PMTUDISC_INTERFACE &&
329 	       pmtudisc != IPV6_PMTUDISC_OMIT;
330 }
331 
332 static inline bool ip6_sk_ignore_df(const struct sock *sk)
333 {
334 	u8 pmtudisc = READ_ONCE(inet6_sk(sk)->pmtudisc);
335 
336 	return pmtudisc < IPV6_PMTUDISC_DO ||
337 	       pmtudisc == IPV6_PMTUDISC_OMIT;
338 }
339 
340 static inline const struct in6_addr *rt6_nexthop(const struct rt6_info *rt,
341 						 const struct in6_addr *daddr)
342 {
343 	if (rt->rt6i_flags & RTF_GATEWAY)
344 		return &rt->rt6i_gateway;
345 	else if (unlikely(rt->rt6i_flags & RTF_CACHE))
346 		return &rt->rt6i_dst.addr;
347 	else
348 		return daddr;
349 }
350 
351 static inline bool rt6_duplicate_nexthop(struct fib6_info *a, struct fib6_info *b)
352 {
353 	struct fib6_nh *nha, *nhb;
354 
355 	if (a->nh || b->nh)
356 		return nexthop_cmp(a->nh, b->nh);
357 
358 	nha = a->fib6_nh;
359 	nhb = b->fib6_nh;
360 	return nha->fib_nh_dev == nhb->fib_nh_dev &&
361 	       ipv6_addr_equal(&nha->fib_nh_gw6, &nhb->fib_nh_gw6) &&
362 	       !lwtunnel_cmp_encap(nha->fib_nh_lws, nhb->fib_nh_lws);
363 }
364 
365 static inline unsigned int ip6_dst_mtu_maybe_forward(const struct dst_entry *dst,
366 						     bool forwarding)
367 {
368 	struct inet6_dev *idev;
369 	unsigned int mtu;
370 
371 	if (!forwarding || dst_metric_locked(dst, RTAX_MTU)) {
372 		mtu = dst_metric_raw(dst, RTAX_MTU);
373 		if (mtu)
374 			goto out;
375 	}
376 
377 	mtu = IPV6_MIN_MTU;
378 	rcu_read_lock();
379 	idev = __in6_dev_get(dst_dev_rcu(dst));
380 	if (idev)
381 		mtu = READ_ONCE(idev->cnf.mtu6);
382 	rcu_read_unlock();
383 
384 out:
385 	return mtu - lwtunnel_headroom(dst->lwtstate, mtu);
386 }
387 
388 u32 ip6_mtu_from_fib6(const struct fib6_result *res,
389 		      const struct in6_addr *daddr,
390 		      const struct in6_addr *saddr);
391 
392 struct neighbour *ip6_neigh_lookup(const struct in6_addr *gw,
393 				   struct net_device *dev, struct sk_buff *skb,
394 				   const void *daddr);
395 #endif
396