xref: /linux/net/ipv4/udp_tunnel_core.c (revision 9410645520e9b820069761f3450ef6661418e279)
1cc4e3835SJakub Kicinski // SPDX-License-Identifier: GPL-2.0-only
2cc4e3835SJakub Kicinski #include <linux/module.h>
3cc4e3835SJakub Kicinski #include <linux/errno.h>
4cc4e3835SJakub Kicinski #include <linux/socket.h>
5cc4e3835SJakub Kicinski #include <linux/kernel.h>
6cc4e3835SJakub Kicinski #include <net/dst_metadata.h>
7cc4e3835SJakub Kicinski #include <net/udp.h>
8cc4e3835SJakub Kicinski #include <net/udp_tunnel.h>
9*2c60fc9cSIdo Schimmel #include <net/inet_dscp.h>
10cc4e3835SJakub Kicinski 
udp_sock_create4(struct net * net,struct udp_port_cfg * cfg,struct socket ** sockp)11cc4e3835SJakub Kicinski int udp_sock_create4(struct net *net, struct udp_port_cfg *cfg,
12cc4e3835SJakub Kicinski 		     struct socket **sockp)
13cc4e3835SJakub Kicinski {
14cc4e3835SJakub Kicinski 	int err;
15cc4e3835SJakub Kicinski 	struct socket *sock = NULL;
16cc4e3835SJakub Kicinski 	struct sockaddr_in udp_addr;
17cc4e3835SJakub Kicinski 
18cc4e3835SJakub Kicinski 	err = sock_create_kern(net, AF_INET, SOCK_DGRAM, 0, &sock);
19cc4e3835SJakub Kicinski 	if (err < 0)
20cc4e3835SJakub Kicinski 		goto error;
21cc4e3835SJakub Kicinski 
22cc4e3835SJakub Kicinski 	if (cfg->bind_ifindex) {
23cc4e3835SJakub Kicinski 		err = sock_bindtoindex(sock->sk, cfg->bind_ifindex, true);
24cc4e3835SJakub Kicinski 		if (err < 0)
25cc4e3835SJakub Kicinski 			goto error;
26cc4e3835SJakub Kicinski 	}
27cc4e3835SJakub Kicinski 
28cc4e3835SJakub Kicinski 	udp_addr.sin_family = AF_INET;
29cc4e3835SJakub Kicinski 	udp_addr.sin_addr = cfg->local_ip;
30cc4e3835SJakub Kicinski 	udp_addr.sin_port = cfg->local_udp_port;
31cc4e3835SJakub Kicinski 	err = kernel_bind(sock, (struct sockaddr *)&udp_addr,
32cc4e3835SJakub Kicinski 			  sizeof(udp_addr));
33cc4e3835SJakub Kicinski 	if (err < 0)
34cc4e3835SJakub Kicinski 		goto error;
35cc4e3835SJakub Kicinski 
36cc4e3835SJakub Kicinski 	if (cfg->peer_udp_port) {
37cc4e3835SJakub Kicinski 		udp_addr.sin_family = AF_INET;
38cc4e3835SJakub Kicinski 		udp_addr.sin_addr = cfg->peer_ip;
39cc4e3835SJakub Kicinski 		udp_addr.sin_port = cfg->peer_udp_port;
40cc4e3835SJakub Kicinski 		err = kernel_connect(sock, (struct sockaddr *)&udp_addr,
41cc4e3835SJakub Kicinski 				     sizeof(udp_addr), 0);
42cc4e3835SJakub Kicinski 		if (err < 0)
43cc4e3835SJakub Kicinski 			goto error;
44cc4e3835SJakub Kicinski 	}
45cc4e3835SJakub Kicinski 
46cc4e3835SJakub Kicinski 	sock->sk->sk_no_check_tx = !cfg->use_udp_checksums;
47cc4e3835SJakub Kicinski 
48cc4e3835SJakub Kicinski 	*sockp = sock;
49cc4e3835SJakub Kicinski 	return 0;
50cc4e3835SJakub Kicinski 
51cc4e3835SJakub Kicinski error:
52cc4e3835SJakub Kicinski 	if (sock) {
53cc4e3835SJakub Kicinski 		kernel_sock_shutdown(sock, SHUT_RDWR);
54cc4e3835SJakub Kicinski 		sock_release(sock);
55cc4e3835SJakub Kicinski 	}
56cc4e3835SJakub Kicinski 	*sockp = NULL;
57cc4e3835SJakub Kicinski 	return err;
58cc4e3835SJakub Kicinski }
59cc4e3835SJakub Kicinski EXPORT_SYMBOL(udp_sock_create4);
60cc4e3835SJakub Kicinski 
setup_udp_tunnel_sock(struct net * net,struct socket * sock,struct udp_tunnel_sock_cfg * cfg)61cc4e3835SJakub Kicinski void setup_udp_tunnel_sock(struct net *net, struct socket *sock,
62cc4e3835SJakub Kicinski 			   struct udp_tunnel_sock_cfg *cfg)
63cc4e3835SJakub Kicinski {
64cc4e3835SJakub Kicinski 	struct sock *sk = sock->sk;
65cc4e3835SJakub Kicinski 
66cc4e3835SJakub Kicinski 	/* Disable multicast loopback */
67b09bde5cSEric Dumazet 	inet_clear_bit(MC_LOOP, sk);
68cc4e3835SJakub Kicinski 
69cc4e3835SJakub Kicinski 	/* Enable CHECKSUM_UNNECESSARY to CHECKSUM_COMPLETE conversion */
70cc4e3835SJakub Kicinski 	inet_inc_convert_csum(sk);
71cc4e3835SJakub Kicinski 
72cc4e3835SJakub Kicinski 	rcu_assign_sk_user_data(sk, cfg->sk_user_data);
73cc4e3835SJakub Kicinski 
74cc4e3835SJakub Kicinski 	udp_sk(sk)->encap_type = cfg->encap_type;
75cc4e3835SJakub Kicinski 	udp_sk(sk)->encap_rcv = cfg->encap_rcv;
76ac56a0b4SDavid Howells 	udp_sk(sk)->encap_err_rcv = cfg->encap_err_rcv;
77cc4e3835SJakub Kicinski 	udp_sk(sk)->encap_err_lookup = cfg->encap_err_lookup;
78cc4e3835SJakub Kicinski 	udp_sk(sk)->encap_destroy = cfg->encap_destroy;
79cc4e3835SJakub Kicinski 	udp_sk(sk)->gro_receive = cfg->gro_receive;
80cc4e3835SJakub Kicinski 	udp_sk(sk)->gro_complete = cfg->gro_complete;
81cc4e3835SJakub Kicinski 
82ac9a7f4cSEric Dumazet 	udp_tunnel_encap_enable(sk);
83cc4e3835SJakub Kicinski }
84cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(setup_udp_tunnel_sock);
85cc4e3835SJakub Kicinski 
udp_tunnel_push_rx_port(struct net_device * dev,struct socket * sock,unsigned short type)86cc4e3835SJakub Kicinski void udp_tunnel_push_rx_port(struct net_device *dev, struct socket *sock,
87cc4e3835SJakub Kicinski 			     unsigned short type)
88cc4e3835SJakub Kicinski {
89cc4e3835SJakub Kicinski 	struct sock *sk = sock->sk;
90cc4e3835SJakub Kicinski 	struct udp_tunnel_info ti;
91cc4e3835SJakub Kicinski 
92cc4e3835SJakub Kicinski 	ti.type = type;
93cc4e3835SJakub Kicinski 	ti.sa_family = sk->sk_family;
94cc4e3835SJakub Kicinski 	ti.port = inet_sk(sk)->inet_sport;
95cc4e3835SJakub Kicinski 
96876c4384SJakub Kicinski 	udp_tunnel_nic_add_port(dev, &ti);
97cc4e3835SJakub Kicinski }
98cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(udp_tunnel_push_rx_port);
99cc4e3835SJakub Kicinski 
udp_tunnel_drop_rx_port(struct net_device * dev,struct socket * sock,unsigned short type)100cc4e3835SJakub Kicinski void udp_tunnel_drop_rx_port(struct net_device *dev, struct socket *sock,
101cc4e3835SJakub Kicinski 			     unsigned short type)
102cc4e3835SJakub Kicinski {
103cc4e3835SJakub Kicinski 	struct sock *sk = sock->sk;
104cc4e3835SJakub Kicinski 	struct udp_tunnel_info ti;
105cc4e3835SJakub Kicinski 
106cc4e3835SJakub Kicinski 	ti.type = type;
107cc4e3835SJakub Kicinski 	ti.sa_family = sk->sk_family;
108cc4e3835SJakub Kicinski 	ti.port = inet_sk(sk)->inet_sport;
109cc4e3835SJakub Kicinski 
110876c4384SJakub Kicinski 	udp_tunnel_nic_del_port(dev, &ti);
111cc4e3835SJakub Kicinski }
112cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(udp_tunnel_drop_rx_port);
113cc4e3835SJakub Kicinski 
114cc4e3835SJakub Kicinski /* Notify netdevs that UDP port started listening */
udp_tunnel_notify_add_rx_port(struct socket * sock,unsigned short type)115cc4e3835SJakub Kicinski void udp_tunnel_notify_add_rx_port(struct socket *sock, unsigned short type)
116cc4e3835SJakub Kicinski {
117cc4e3835SJakub Kicinski 	struct sock *sk = sock->sk;
118cc4e3835SJakub Kicinski 	struct net *net = sock_net(sk);
119cc4e3835SJakub Kicinski 	struct udp_tunnel_info ti;
120cc4e3835SJakub Kicinski 	struct net_device *dev;
121cc4e3835SJakub Kicinski 
122cc4e3835SJakub Kicinski 	ti.type = type;
123cc4e3835SJakub Kicinski 	ti.sa_family = sk->sk_family;
124cc4e3835SJakub Kicinski 	ti.port = inet_sk(sk)->inet_sport;
125cc4e3835SJakub Kicinski 
126cc4e3835SJakub Kicinski 	rcu_read_lock();
127cc4e3835SJakub Kicinski 	for_each_netdev_rcu(net, dev) {
128876c4384SJakub Kicinski 		udp_tunnel_nic_add_port(dev, &ti);
129cc4e3835SJakub Kicinski 	}
130cc4e3835SJakub Kicinski 	rcu_read_unlock();
131cc4e3835SJakub Kicinski }
132cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(udp_tunnel_notify_add_rx_port);
133cc4e3835SJakub Kicinski 
134cc4e3835SJakub Kicinski /* Notify netdevs that UDP port is no more listening */
udp_tunnel_notify_del_rx_port(struct socket * sock,unsigned short type)135cc4e3835SJakub Kicinski void udp_tunnel_notify_del_rx_port(struct socket *sock, unsigned short type)
136cc4e3835SJakub Kicinski {
137cc4e3835SJakub Kicinski 	struct sock *sk = sock->sk;
138cc4e3835SJakub Kicinski 	struct net *net = sock_net(sk);
139cc4e3835SJakub Kicinski 	struct udp_tunnel_info ti;
140cc4e3835SJakub Kicinski 	struct net_device *dev;
141cc4e3835SJakub Kicinski 
142cc4e3835SJakub Kicinski 	ti.type = type;
143cc4e3835SJakub Kicinski 	ti.sa_family = sk->sk_family;
144cc4e3835SJakub Kicinski 	ti.port = inet_sk(sk)->inet_sport;
145cc4e3835SJakub Kicinski 
146cc4e3835SJakub Kicinski 	rcu_read_lock();
147cc4e3835SJakub Kicinski 	for_each_netdev_rcu(net, dev) {
148876c4384SJakub Kicinski 		udp_tunnel_nic_del_port(dev, &ti);
149cc4e3835SJakub Kicinski 	}
150cc4e3835SJakub Kicinski 	rcu_read_unlock();
151cc4e3835SJakub Kicinski }
152cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(udp_tunnel_notify_del_rx_port);
153cc4e3835SJakub Kicinski 
/**
 * udp_tunnel_xmit_skb - add a UDP header to @skb and pass it to iptunnel_xmit()
 * @rt: route, forwarded to iptunnel_xmit()
 * @sk: socket, forwarded to iptunnel_xmit()
 * @skb: packet; a UDP header is pushed in front of its current data
 * @src: source IPv4 address (used for the checksum and the outer header)
 * @dst: destination IPv4 address (used for the checksum and the outer header)
 * @tos: forwarded to iptunnel_xmit()
 * @ttl: forwarded to iptunnel_xmit()
 * @df: forwarded to iptunnel_xmit()
 * @src_port: value written to the UDP source port field
 * @dst_port: value written to the UDP destination port field
 * @xnet: forwarded to iptunnel_xmit()
 * @nocheck: forwarded to udp_set_csum() as its first argument
 */
void udp_tunnel_xmit_skb(struct rtable *rt, struct sock *sk, struct sk_buff *skb,
			 __be32 src, __be32 dst, __u8 tos, __u8 ttl,
			 __be16 df, __be16 src_port, __be16 dst_port,
			 bool xnet, bool nocheck)
{
	struct udphdr *udph;

	/* Make room for the UDP header and mark it as the transport header */
	__skb_push(skb, sizeof(*udph));
	skb_reset_transport_header(skb);
	udph = udp_hdr(skb);

	udph->source = src_port;
	udph->dest = dst_port;
	/* skb->len is read after the push, so it includes the UDP header */
	udph->len = htons(skb->len);

	/* Clear the IP options held in the skb control block */
	memset(&(IPCB(skb)->opt), 0, sizeof(IPCB(skb)->opt));

	udp_set_csum(nocheck, skb, src, dst, skb->len);

	iptunnel_xmit(sk, rt, skb, src, dst, IPPROTO_UDP, tos, ttl, df, xnet);
}
175cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(udp_tunnel_xmit_skb);
176cc4e3835SJakub Kicinski 
udp_tunnel_sock_release(struct socket * sock)177cc4e3835SJakub Kicinski void udp_tunnel_sock_release(struct socket *sock)
178cc4e3835SJakub Kicinski {
179cc4e3835SJakub Kicinski 	rcu_assign_sk_user_data(sock->sk, NULL);
1803cf7203cSHangbin Liu 	synchronize_rcu();
181cc4e3835SJakub Kicinski 	kernel_sock_shutdown(sock, SHUT_RDWR);
182cc4e3835SJakub Kicinski 	sock_release(sock);
183cc4e3835SJakub Kicinski }
184cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(udp_tunnel_sock_release);
185cc4e3835SJakub Kicinski 
/**
 * udp_tun_rx_dst - build receive-side tunnel metadata for a UDP tunnel packet
 * @skb: received packet; its UDP header supplies ports and checksum field
 * @family: AF_INET selects ip_tun_rx_dst(); any other value selects
 *          ipv6_tun_rx_dst()
 * @flags: forwarded to the selected *_tun_rx_dst() helper
 * @tunnel_id: forwarded to the selected *_tun_rx_dst() helper
 * @md_size: forwarded to the selected *_tun_rx_dst() helper
 *
 * After the helper succeeds, the tunnel key's tp_src/tp_dst are filled from
 * the UDP header, and IP_TUNNEL_CSUM_BIT is set in the key's flags when the
 * UDP checksum field is non-zero.
 *
 * Return: the metadata dst, or NULL when the helper returned NULL.
 */
struct metadata_dst *udp_tun_rx_dst(struct sk_buff *skb,  unsigned short family,
				    const unsigned long *flags,
				    __be64 tunnel_id, int md_size)
{
	const struct udphdr *uh;
	struct ip_tunnel_key *key;
	struct metadata_dst *md;

	md = (family == AF_INET) ?
		ip_tun_rx_dst(skb, flags, tunnel_id, md_size) :
		ipv6_tun_rx_dst(skb, flags, tunnel_id, md_size);
	if (!md)
		return NULL;

	uh = udp_hdr(skb);
	key = &md->u.tun_info.key;

	key->tp_src = uh->source;
	key->tp_dst = uh->dest;
	/* A non-zero checksum field is recorded as a tunnel flag */
	if (uh->check)
		__set_bit(IP_TUNNEL_CSUM_BIT, key->tun_flags);

	return md;
}
207cc4e3835SJakub Kicinski EXPORT_SYMBOL_GPL(udp_tun_rx_dst);
208cc4e3835SJakub Kicinski 
/**
 * udp_tunnel_dst_lookup - find the IPv4 output route for a UDP tunnel packet
 * @skb: packet being sent; only its mark is read here
 * @dev: tunnel device; used for debug messages and the loop check
 * @net: network namespace for the route lookup
 * @oif: output interface index placed in the flow key
 * @saddr: output; on a fresh lookup it receives the flow's source address.
 *         On a cache hit it is passed to dst_cache_get_ip4(), which is
 *         presumably what fills it in - confirm against dst_cache.
 * @key: tunnel key supplying the IPv4 endpoints and flow flags
 * @sport: UDP source port for the flow key
 * @dport: UDP destination port for the flow key
 * @tos: TOS value; masked with INET_DSCP_MASK before the lookup
 * @dst_cache: optional route cache; consulted and updated only when
 *             CONFIG_DST_CACHE is enabled and the pointer is non-NULL
 *
 * Return: the route on success, ERR_PTR(-ENETUNREACH) when the lookup
 * fails, or ERR_PTR(-ELOOP) when the route's output device is @dev itself.
 */
struct rtable *udp_tunnel_dst_lookup(struct sk_buff *skb,
				     struct net_device *dev,
				     struct net *net, int oif,
				     __be32 *saddr,
				     const struct ip_tunnel_key *key,
				     __be16 sport, __be16 dport, u8 tos,
				     struct dst_cache *dst_cache)
{
	struct flowi4 flow;
	struct rtable *route = NULL;

#ifdef CONFIG_DST_CACHE
	/* Fast path: reuse a cached route when one is available */
	if (dst_cache) {
		route = dst_cache_get_ip4(dst_cache, saddr);
		if (route)
			return route;
	}
#endif

	/* Build the flow key from scratch */
	memset(&flow, 0, sizeof(flow));
	flow.flowi4_proto = IPPROTO_UDP;
	flow.flowi4_oif = oif;
	flow.flowi4_mark = skb->mark;
	flow.flowi4_tos = tos & INET_DSCP_MASK;
	flow.flowi4_flags = key->flow_flags;
	flow.saddr = key->u.ipv4.src;
	flow.daddr = key->u.ipv4.dst;
	flow.fl4_sport = sport;
	flow.fl4_dport = dport;

	route = ip_route_output_key(net, &flow);
	if (IS_ERR(route)) {
		/* The specific lookup error is replaced by -ENETUNREACH */
		netdev_dbg(dev, "no route to %pI4\n", &flow.daddr);
		return ERR_PTR(-ENETUNREACH);
	}

	/* Refuse a route that would send the packet back out through @dev */
	if (route->dst.dev == dev) { /* is this necessary? */
		netdev_dbg(dev, "circular route to %pI4\n", &flow.daddr);
		ip_rt_put(route);
		return ERR_PTR(-ELOOP);
	}

#ifdef CONFIG_DST_CACHE
	if (dst_cache)
		dst_cache_set_ip4(dst_cache, &route->dst, flow.saddr);
#endif

	*saddr = flow.saddr;
	return route;
}
256bf3fcbf7SBeniamino Galvani EXPORT_SYMBOL_GPL(udp_tunnel_dst_lookup);
257bf3fcbf7SBeniamino Galvani 
258b058a5d2SBreno Leitao MODULE_DESCRIPTION("IPv4 Foo over UDP tunnel driver");
259cc4e3835SJakub Kicinski MODULE_LICENSE("GPL");
260