1 /* SPDX-License-Identifier: GPL-2.0 */ 2 #ifndef _NET_IP6_ROUTE_H 3 #define _NET_IP6_ROUTE_H 4 5 #include <net/addrconf.h> 6 #include <net/flow.h> 7 #include <net/ip6_fib.h> 8 #include <net/sock.h> 9 #include <net/lwtunnel.h> 10 #include <linux/ip.h> 11 #include <linux/ipv6.h> 12 #include <linux/route.h> 13 #include <net/nexthop.h> 14 15 struct route_info { 16 __u8 type; 17 __u8 length; 18 __u8 prefix_len; 19 #if defined(__BIG_ENDIAN_BITFIELD) 20 __u8 reserved_h:3, 21 route_pref:2, 22 reserved_l:3; 23 #elif defined(__LITTLE_ENDIAN_BITFIELD) 24 __u8 reserved_l:3, 25 route_pref:2, 26 reserved_h:3; 27 #endif 28 __be32 lifetime; 29 __u8 prefix[]; /* 0,8 or 16 */ 30 }; 31 32 #define RT6_LOOKUP_F_IFACE 0x00000001 33 #define RT6_LOOKUP_F_REACHABLE 0x00000002 34 #define RT6_LOOKUP_F_HAS_SADDR 0x00000004 35 #define RT6_LOOKUP_F_SRCPREF_TMP 0x00000008 36 #define RT6_LOOKUP_F_SRCPREF_PUBLIC 0x00000010 37 #define RT6_LOOKUP_F_SRCPREF_COA 0x00000020 38 #define RT6_LOOKUP_F_IGNORE_LINKSTATE 0x00000040 39 #define RT6_LOOKUP_F_DST_NOREF 0x00000080 40 41 /* We do not (yet ?) support IPv6 jumbograms (RFC 2675) 42 * Unlike IPv4, hdr->seg_len doesn't include the IPv6 header 43 */ 44 #define IP6_MAX_MTU (0xFFFF + sizeof(struct ipv6hdr)) 45 46 /* 47 * rt6_srcprefs2flags() and rt6_flags2srcprefs() translate 48 * between IPV6_ADDR_PREFERENCES socket option values 49 * IPV6_PREFER_SRC_TMP = 0x1 50 * IPV6_PREFER_SRC_PUBLIC = 0x2 51 * IPV6_PREFER_SRC_COA = 0x4 52 * and above RT6_LOOKUP_F_SRCPREF_xxx flags. 53 */ 54 static inline int rt6_srcprefs2flags(unsigned int srcprefs) 55 { 56 return (srcprefs & IPV6_PREFER_SRC_MASK) << 3; 57 } 58 59 static inline unsigned int rt6_flags2srcprefs(int flags) 60 { 61 return (flags >> 3) & IPV6_PREFER_SRC_MASK; 62 } 63 64 static inline bool rt6_need_strict(const struct in6_addr *daddr) 65 { 66 return ipv6_addr_type(daddr) & 67 (IPV6_ADDR_MULTICAST | IPV6_ADDR_LINKLOCAL | IPV6_ADDR_LOOPBACK); 68 } 69 70 /* fib entries using a nexthop object can not be coalesced into 71 * a multipath route 72 */ 73 static inline bool rt6_qualify_for_ecmp(const struct fib6_info *f6i) 74 { 75 /* the RTF_ADDRCONF flag filters out RA's */ 76 return !(f6i->fib6_flags & RTF_ADDRCONF) && !f6i->nh && 77 f6i->fib6_nh->fib_nh_gw_family; 78 } 79 80 #if IS_ENABLED(CONFIG_IPV6) 81 void ip6_route_input(struct sk_buff *skb); 82 #else 83 static inline void ip6_route_input(struct sk_buff *skb) 84 { 85 } 86 #endif 87 88 struct dst_entry *ip6_route_input_lookup(struct net *net, 89 struct net_device *dev, 90 struct flowi6 *fl6, 91 const struct sk_buff *skb, int flags); 92 93 struct dst_entry *ip6_route_output_flags(struct net *net, const struct sock *sk, 94 struct flowi6 *fl6, int flags); 95 96 static inline struct dst_entry *ip6_route_output(struct net *net, 97 const struct sock *sk, 98 struct flowi6 *fl6) 99 { 100 return ip6_route_output_flags(net, sk, fl6, 0); 101 } 102 103 /* Only conditionally release dst if flags indicates 104 * !RT6_LOOKUP_F_DST_NOREF or dst is in uncached_list. 105 */ 106 static inline void ip6_rt_put_flags(struct rt6_info *rt, int flags) 107 { 108 if (!(flags & RT6_LOOKUP_F_DST_NOREF) || 109 !list_empty(&rt->dst.rt_uncached)) 110 ip6_rt_put(rt); 111 } 112 113 struct dst_entry *ip6_route_lookup(struct net *net, struct flowi6 *fl6, 114 const struct sk_buff *skb, int flags); 115 struct rt6_info *ip6_pol_route(struct net *net, struct fib6_table *table, 116 int ifindex, struct flowi6 *fl6, 117 const struct sk_buff *skb, int flags); 118 119 void ip6_route_init_special_entries(void); 120 int ip6_route_init(void); 121 void ip6_route_cleanup(void); 122 123 int ipv6_route_ioctl(struct net *net, unsigned int cmd, 124 struct in6_rtmsg *rtmsg); 125 126 int ip6_route_add(struct fib6_config *cfg, gfp_t gfp_flags, 127 struct netlink_ext_ack *extack); 128 int ip6_ins_rt(struct net *net, struct fib6_info *f6i); 129 #if IS_ENABLED(CONFIG_IPV6) 130 int ip6_del_rt(struct net *net, struct fib6_info *f6i, bool skip_notify); 131 #else 132 static inline int ip6_del_rt(struct net *net, struct fib6_info *f6i, 133 bool skip_notify) 134 { 135 return -EAFNOSUPPORT; 136 } 137 #endif 138 139 void rt6_flush_exceptions(struct fib6_info *f6i); 140 void rt6_age_exceptions(struct fib6_info *f6i, struct fib6_gc_args *gc_args, 141 unsigned long now); 142 143 static inline int ip6_route_get_saddr(struct net *net, struct fib6_info *f6i, 144 const struct in6_addr *daddr, 145 unsigned int prefs, int l3mdev_index, 146 struct in6_addr *saddr) 147 { 148 struct net_device *l3mdev; 149 struct net_device *dev; 150 bool same_vrf; 151 int err = 0; 152 153 rcu_read_lock(); 154 155 l3mdev = dev_get_by_index_rcu(net, l3mdev_index); 156 if (!f6i || !f6i->fib6_prefsrc.plen || l3mdev) 157 dev = f6i ? fib6_info_nh_dev(f6i) : NULL; 158 same_vrf = !l3mdev || l3mdev_master_dev_rcu(dev) == l3mdev; 159 if (f6i && f6i->fib6_prefsrc.plen && same_vrf) 160 *saddr = f6i->fib6_prefsrc.addr; 161 else 162 err = ipv6_dev_get_saddr(net, same_vrf ? dev : l3mdev, daddr, prefs, saddr); 163 164 rcu_read_unlock(); 165 166 return err; 167 } 168 169 struct rt6_info *rt6_lookup(struct net *net, const struct in6_addr *daddr, 170 const struct in6_addr *saddr, int oif, 171 const struct sk_buff *skb, int flags); 172 u32 rt6_multipath_hash(const struct net *net, const struct flowi6 *fl6, 173 const struct sk_buff *skb, struct flow_keys *hkeys); 174 175 struct dst_entry *icmp6_dst_alloc(struct net_device *dev, struct flowi6 *fl6); 176 177 void fib6_force_start_gc(struct net *net); 178 179 struct fib6_info *addrconf_f6i_alloc(struct net *net, struct inet6_dev *idev, 180 const struct in6_addr *addr, bool anycast, 181 gfp_t gfp_flags, struct netlink_ext_ack *extack); 182 183 struct rt6_info *ip6_dst_alloc(struct net *net, struct net_device *dev, 184 int flags); 185 186 /* 187 * support functions for ND 188 * 189 */ 190 struct fib6_info *rt6_get_dflt_router(struct net *net, 191 const struct in6_addr *addr, 192 struct net_device *dev); 193 struct fib6_info *rt6_add_dflt_router(struct net *net, 194 const struct in6_addr *gwaddr, 195 struct net_device *dev, unsigned int pref, 196 u32 defrtr_usr_metric, 197 int lifetime); 198 199 void rt6_purge_dflt_routers(struct net *net); 200 201 int rt6_route_rcv(struct net_device *dev, u8 *opt, int len, 202 const struct in6_addr *gwaddr); 203 204 void ip6_update_pmtu(struct sk_buff *skb, struct net *net, __be32 mtu, int oif, 205 u32 mark, kuid_t uid); 206 void ip6_sk_update_pmtu(struct sk_buff *skb, struct sock *sk, __be32 mtu); 207 void ip6_redirect(struct sk_buff *skb, struct net *net, int oif, u32 mark, 208 kuid_t uid); 209 void ip6_redirect_no_header(struct sk_buff *skb, struct net *net, int oif); 210 void ip6_sk_redirect(struct sk_buff *skb, struct sock *sk); 211 212 struct netlink_callback; 213 214 struct rt6_rtnl_dump_arg { 215 struct sk_buff *skb; 216 struct netlink_callback *cb; 217 struct net *net; 218 struct fib_dump_filter filter; 219 }; 220 221 int rt6_dump_route(struct fib6_info *f6i, void *p_arg, unsigned int skip); 222 void rt6_mtu_change(struct net_device *dev, unsigned int mtu); 223 void rt6_remove_prefsrc(struct inet6_ifaddr *ifp); 224 void rt6_clean_tohost(struct net *net, struct in6_addr *gateway); 225 void rt6_sync_up(struct net_device *dev, unsigned char nh_flags); 226 void rt6_disable_ip(struct net_device *dev, unsigned long event); 227 void rt6_sync_down_dev(struct net_device *dev, unsigned long event); 228 void rt6_multipath_rebalance(struct fib6_info *f6i); 229 230 void rt6_uncached_list_add(struct rt6_info *rt); 231 void rt6_uncached_list_del(struct rt6_info *rt); 232 233 static inline const struct rt6_info *skb_rt6_info(const struct sk_buff *skb) 234 { 235 const struct dst_entry *dst = skb_dst(skb); 236 237 if (dst) 238 return dst_rt6_info(dst); 239 240 return NULL; 241 } 242 243 /* 244 * Store a destination cache entry in a socket 245 */ 246 static inline void ip6_dst_store(struct sock *sk, struct dst_entry *dst, 247 bool daddr_set, 248 bool saddr_set) 249 { 250 struct ipv6_pinfo *np = inet6_sk(sk); 251 252 np->dst_cookie = rt6_get_cookie(dst_rt6_info(dst)); 253 sk_setup_caps(sk, dst); 254 np->daddr_cache = daddr_set; 255 #ifdef CONFIG_IPV6_SUBTREES 256 np->saddr_cache = saddr_set; 257 #endif 258 } 259 260 void ip6_sk_dst_store_flow(struct sock *sk, struct dst_entry *dst, 261 const struct flowi6 *fl6); 262 263 static inline bool ipv6_unicast_destination(const struct sk_buff *skb) 264 { 265 const struct rt6_info *rt = dst_rt6_info(skb_dst(skb)); 266 267 return rt->rt6i_flags & RTF_LOCAL; 268 } 269 270 static inline bool __ipv6_anycast_destination(const struct rt6key *rt6i_dst, 271 u32 rt6i_flags, 272 const struct in6_addr *daddr) 273 { 274 return rt6i_flags & RTF_ANYCAST || 275 (rt6i_dst->plen < 127 && 276 !(rt6i_flags & (RTF_GATEWAY | RTF_NONEXTHOP)) && 277 ipv6_addr_equal(&rt6i_dst->addr, daddr)); 278 } 279 280 static inline bool ipv6_anycast_destination(const struct dst_entry *dst, 281 const struct in6_addr *daddr) 282 { 283 const struct rt6_info *rt = dst_rt6_info(dst); 284 285 return __ipv6_anycast_destination(&rt->rt6i_dst, rt->rt6i_flags, daddr); 286 } 287 288 #if IS_ENABLED(CONFIG_IPV6) 289 int ip6_fragment(struct net *net, struct sock *sk, struct sk_buff *skb, 290 int (*output)(struct net *, struct sock *, struct sk_buff *)); 291 #else 292 static inline int ip6_fragment(struct net *net, struct sock *sk, 293 struct sk_buff *skb, 294 int (*output)(struct net *, struct sock *, 295 struct sk_buff *)) 296 { 297 kfree_skb(skb); 298 return -EAFNOSUPPORT; 299 } 300 #endif 301 302 /* Variant of dst_mtu() for IPv6 users */ 303 static inline u32 dst6_mtu(const struct dst_entry *dst) 304 { 305 return INDIRECT_CALL_1(dst->ops->mtu, ip6_mtu, dst); 306 } 307 308 static inline unsigned int ip6_skb_dst_mtu(const struct sk_buff *skb) 309 { 310 const struct ipv6_pinfo *np = skb->sk && !dev_recursion_level() ? 311 inet6_sk(skb->sk) : NULL; 312 const struct dst_entry *dst = skb_dst(skb); 313 unsigned int mtu; 314 315 if (np && READ_ONCE(np->pmtudisc) >= IPV6_PMTUDISC_PROBE) { 316 mtu = READ_ONCE(dst_dev(dst)->mtu); 317 mtu -= lwtunnel_headroom(dst->lwtstate, mtu); 318 } else { 319 mtu = dst_mtu(dst); 320 } 321 return mtu; 322 } 323 324 static inline bool ip6_sk_accept_pmtu(const struct sock *sk) 325 { 326 u8 pmtudisc = READ_ONCE(inet6_sk(sk)->pmtudisc); 327 328 return pmtudisc != IPV6_PMTUDISC_INTERFACE && 329 pmtudisc != IPV6_PMTUDISC_OMIT; 330 } 331 332 static inline bool ip6_sk_ignore_df(const struct sock *sk) 333 { 334 u8 pmtudisc = READ_ONCE(inet6_sk(sk)->pmtudisc); 335 336 return pmtudisc < IPV6_PMTUDISC_DO || 337 pmtudisc == IPV6_PMTUDISC_OMIT; 338 } 339 340 static inline const struct in6_addr *rt6_nexthop(const struct rt6_info *rt, 341 const struct in6_addr *daddr) 342 { 343 if (rt->rt6i_flags & RTF_GATEWAY) 344 return &rt->rt6i_gateway; 345 else if (unlikely(rt->rt6i_flags & RTF_CACHE)) 346 return &rt->rt6i_dst.addr; 347 else 348 return daddr; 349 } 350 351 static inline bool rt6_duplicate_nexthop(struct fib6_info *a, struct fib6_info *b) 352 { 353 struct fib6_nh *nha, *nhb; 354 355 if (a->nh || b->nh) 356 return nexthop_cmp(a->nh, b->nh); 357 358 nha = a->fib6_nh; 359 nhb = b->fib6_nh; 360 return nha->fib_nh_dev == nhb->fib_nh_dev && 361 ipv6_addr_equal(&nha->fib_nh_gw6, &nhb->fib_nh_gw6) && 362 !lwtunnel_cmp_encap(nha->fib_nh_lws, nhb->fib_nh_lws); 363 } 364 365 static inline unsigned int ip6_dst_mtu_maybe_forward(const struct dst_entry *dst, 366 bool forwarding) 367 { 368 struct inet6_dev *idev; 369 unsigned int mtu; 370 371 if (!forwarding || dst_metric_locked(dst, RTAX_MTU)) { 372 mtu = dst_metric_raw(dst, RTAX_MTU); 373 if (mtu) 374 goto out; 375 } 376 377 mtu = IPV6_MIN_MTU; 378 rcu_read_lock(); 379 idev = __in6_dev_get(dst_dev_rcu(dst)); 380 if (idev) 381 mtu = READ_ONCE(idev->cnf.mtu6); 382 rcu_read_unlock(); 383 384 out: 385 return mtu - lwtunnel_headroom(dst->lwtstate, mtu); 386 } 387 388 u32 ip6_mtu_from_fib6(const struct fib6_result *res, 389 const struct in6_addr *daddr, 390 const struct in6_addr *saddr); 391 392 struct neighbour *ip6_neigh_lookup(const struct in6_addr *gw, 393 struct net_device *dev, struct sk_buff *skb, 394 const void *daddr); 395 #endif 396