xref: /linux/net/ipv6/datagram.c (revision 13abf8130139c2ccd4962a7e5a8902be5e6cb5a7)
1 /*
2  *	common UDP/RAW code
3  *	Linux INET6 implementation
4  *
5  *	Authors:
6  *	Pedro Roque		<roque@di.fc.ul.pt>
7  *
8  *	$Id: datagram.c,v 1.24 2002/02/01 22:01:04 davem Exp $
9  *
10  *	This program is free software; you can redistribute it and/or
11  *      modify it under the terms of the GNU General Public License
12  *      as published by the Free Software Foundation; either version
13  *      2 of the License, or (at your option) any later version.
14  */
15 
16 #include <linux/errno.h>
17 #include <linux/types.h>
18 #include <linux/kernel.h>
19 #include <linux/sched.h>
20 #include <linux/interrupt.h>
21 #include <linux/socket.h>
22 #include <linux/sockios.h>
23 #include <linux/in6.h>
24 #include <linux/ipv6.h>
25 #include <linux/route.h>
26 
27 #include <net/ipv6.h>
28 #include <net/ndisc.h>
29 #include <net/addrconf.h>
30 #include <net/transp_v6.h>
31 #include <net/ip6_route.h>
32 #include <net/tcp_states.h>
33 
34 #include <linux/errqueue.h>
35 #include <asm/uaccess.h>
36 
37 int ip6_datagram_connect(struct sock *sk, struct sockaddr *uaddr, int addr_len)
38 {
39 	struct sockaddr_in6	*usin = (struct sockaddr_in6 *) uaddr;
40 	struct inet_sock      	*inet = inet_sk(sk);
41 	struct ipv6_pinfo      	*np = inet6_sk(sk);
42 	struct in6_addr		*daddr, *final_p = NULL, final;
43 	struct dst_entry	*dst;
44 	struct flowi		fl;
45 	struct ip6_flowlabel	*flowlabel = NULL;
46 	int			addr_type;
47 	int			err;
48 
49 	if (usin->sin6_family == AF_INET) {
50 		if (__ipv6_only_sock(sk))
51 			return -EAFNOSUPPORT;
52 		err = ip4_datagram_connect(sk, uaddr, addr_len);
53 		goto ipv4_connected;
54 	}
55 
56 	if (addr_len < SIN6_LEN_RFC2133)
57 	  	return -EINVAL;
58 
59 	if (usin->sin6_family != AF_INET6)
60 	  	return -EAFNOSUPPORT;
61 
62 	memset(&fl, 0, sizeof(fl));
63 	if (np->sndflow) {
64 		fl.fl6_flowlabel = usin->sin6_flowinfo&IPV6_FLOWINFO_MASK;
65 		if (fl.fl6_flowlabel&IPV6_FLOWLABEL_MASK) {
66 			flowlabel = fl6_sock_lookup(sk, fl.fl6_flowlabel);
67 			if (flowlabel == NULL)
68 				return -EINVAL;
69 			ipv6_addr_copy(&usin->sin6_addr, &flowlabel->dst);
70 		}
71 	}
72 
73 	addr_type = ipv6_addr_type(&usin->sin6_addr);
74 
75 	if (addr_type == IPV6_ADDR_ANY) {
76 		/*
77 		 *	connect to self
78 		 */
79 		usin->sin6_addr.s6_addr[15] = 0x01;
80 	}
81 
82 	daddr = &usin->sin6_addr;
83 
84 	if (addr_type == IPV6_ADDR_MAPPED) {
85 		struct sockaddr_in sin;
86 
87 		if (__ipv6_only_sock(sk)) {
88 			err = -ENETUNREACH;
89 			goto out;
90 		}
91 		sin.sin_family = AF_INET;
92 		sin.sin_addr.s_addr = daddr->s6_addr32[3];
93 		sin.sin_port = usin->sin6_port;
94 
95 		err = ip4_datagram_connect(sk,
96 					   (struct sockaddr*) &sin,
97 					   sizeof(sin));
98 
99 ipv4_connected:
100 		if (err)
101 			goto out;
102 
103 		ipv6_addr_set(&np->daddr, 0, 0, htonl(0x0000ffff), inet->daddr);
104 
105 		if (ipv6_addr_any(&np->saddr)) {
106 			ipv6_addr_set(&np->saddr, 0, 0, htonl(0x0000ffff),
107 				      inet->saddr);
108 		}
109 
110 		if (ipv6_addr_any(&np->rcv_saddr)) {
111 			ipv6_addr_set(&np->rcv_saddr, 0, 0, htonl(0x0000ffff),
112 				      inet->rcv_saddr);
113 		}
114 		goto out;
115 	}
116 
117 	if (addr_type&IPV6_ADDR_LINKLOCAL) {
118 		if (addr_len >= sizeof(struct sockaddr_in6) &&
119 		    usin->sin6_scope_id) {
120 			if (sk->sk_bound_dev_if &&
121 			    sk->sk_bound_dev_if != usin->sin6_scope_id) {
122 				err = -EINVAL;
123 				goto out;
124 			}
125 			sk->sk_bound_dev_if = usin->sin6_scope_id;
126 			if (!sk->sk_bound_dev_if &&
127 			    (addr_type & IPV6_ADDR_MULTICAST))
128 				fl.oif = np->mcast_oif;
129 		}
130 
131 		/* Connect to link-local address requires an interface */
132 		if (!sk->sk_bound_dev_if) {
133 			err = -EINVAL;
134 			goto out;
135 		}
136 	}
137 
138 	ipv6_addr_copy(&np->daddr, daddr);
139 	np->flow_label = fl.fl6_flowlabel;
140 
141 	inet->dport = usin->sin6_port;
142 
143 	/*
144 	 *	Check for a route to destination an obtain the
145 	 *	destination cache for it.
146 	 */
147 
148 	fl.proto = sk->sk_protocol;
149 	ipv6_addr_copy(&fl.fl6_dst, &np->daddr);
150 	ipv6_addr_copy(&fl.fl6_src, &np->saddr);
151 	fl.oif = sk->sk_bound_dev_if;
152 	fl.fl_ip_dport = inet->dport;
153 	fl.fl_ip_sport = inet->sport;
154 
155 	if (!fl.oif && (addr_type&IPV6_ADDR_MULTICAST))
156 		fl.oif = np->mcast_oif;
157 
158 	if (flowlabel) {
159 		if (flowlabel->opt && flowlabel->opt->srcrt) {
160 			struct rt0_hdr *rt0 = (struct rt0_hdr *) flowlabel->opt->srcrt;
161 			ipv6_addr_copy(&final, &fl.fl6_dst);
162 			ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
163 			final_p = &final;
164 		}
165 	} else if (np->opt && np->opt->srcrt) {
166 		struct rt0_hdr *rt0 = (struct rt0_hdr *)np->opt->srcrt;
167 		ipv6_addr_copy(&final, &fl.fl6_dst);
168 		ipv6_addr_copy(&fl.fl6_dst, rt0->addr);
169 		final_p = &final;
170 	}
171 
172 	err = ip6_dst_lookup(sk, &dst, &fl);
173 	if (err)
174 		goto out;
175 	if (final_p)
176 		ipv6_addr_copy(&fl.fl6_dst, final_p);
177 
178 	if ((err = xfrm_lookup(&dst, &fl, sk, 0)) < 0) {
179 		dst_release(dst);
180 		goto out;
181 	}
182 
183 	/* source address lookup done in ip6_dst_lookup */
184 
185 	if (ipv6_addr_any(&np->saddr))
186 		ipv6_addr_copy(&np->saddr, &fl.fl6_src);
187 
188 	if (ipv6_addr_any(&np->rcv_saddr)) {
189 		ipv6_addr_copy(&np->rcv_saddr, &fl.fl6_src);
190 		inet->rcv_saddr = LOOPBACK4_IPV6;
191 	}
192 
193 	ip6_dst_store(sk, dst,
194 		      ipv6_addr_equal(&fl.fl6_dst, &np->daddr) ?
195 		      &np->daddr : NULL);
196 
197 	sk->sk_state = TCP_ESTABLISHED;
198 out:
199 	fl6_sock_release(flowlabel);
200 	return err;
201 }
202 
203 void ipv6_icmp_error(struct sock *sk, struct sk_buff *skb, int err,
204 		     u16 port, u32 info, u8 *payload)
205 {
206 	struct ipv6_pinfo *np  = inet6_sk(sk);
207 	struct icmp6hdr *icmph = (struct icmp6hdr *)skb->h.raw;
208 	struct sock_exterr_skb *serr;
209 
210 	if (!np->recverr)
211 		return;
212 
213 	skb = skb_clone(skb, GFP_ATOMIC);
214 	if (!skb)
215 		return;
216 
217 	serr = SKB_EXT_ERR(skb);
218 	serr->ee.ee_errno = err;
219 	serr->ee.ee_origin = SO_EE_ORIGIN_ICMP6;
220 	serr->ee.ee_type = icmph->icmp6_type;
221 	serr->ee.ee_code = icmph->icmp6_code;
222 	serr->ee.ee_pad = 0;
223 	serr->ee.ee_info = info;
224 	serr->ee.ee_data = 0;
225 	serr->addr_offset = (u8*)&(((struct ipv6hdr*)(icmph+1))->daddr) - skb->nh.raw;
226 	serr->port = port;
227 
228 	skb->h.raw = payload;
229 	__skb_pull(skb, payload - skb->data);
230 
231 	if (sock_queue_err_skb(sk, skb))
232 		kfree_skb(skb);
233 }
234 
235 void ipv6_local_error(struct sock *sk, int err, struct flowi *fl, u32 info)
236 {
237 	struct ipv6_pinfo *np = inet6_sk(sk);
238 	struct sock_exterr_skb *serr;
239 	struct ipv6hdr *iph;
240 	struct sk_buff *skb;
241 
242 	if (!np->recverr)
243 		return;
244 
245 	skb = alloc_skb(sizeof(struct ipv6hdr), GFP_ATOMIC);
246 	if (!skb)
247 		return;
248 
249 	iph = (struct ipv6hdr*)skb_put(skb, sizeof(struct ipv6hdr));
250 	skb->nh.ipv6h = iph;
251 	ipv6_addr_copy(&iph->daddr, &fl->fl6_dst);
252 
253 	serr = SKB_EXT_ERR(skb);
254 	serr->ee.ee_errno = err;
255 	serr->ee.ee_origin = SO_EE_ORIGIN_LOCAL;
256 	serr->ee.ee_type = 0;
257 	serr->ee.ee_code = 0;
258 	serr->ee.ee_pad = 0;
259 	serr->ee.ee_info = info;
260 	serr->ee.ee_data = 0;
261 	serr->addr_offset = (u8*)&iph->daddr - skb->nh.raw;
262 	serr->port = fl->fl_ip_dport;
263 
264 	skb->h.raw = skb->tail;
265 	__skb_pull(skb, skb->tail - skb->data);
266 
267 	if (sock_queue_err_skb(sk, skb))
268 		kfree_skb(skb);
269 }
270 
271 /*
272  *	Handle MSG_ERRQUEUE
273  */
274 int ipv6_recv_error(struct sock *sk, struct msghdr *msg, int len)
275 {
276 	struct ipv6_pinfo *np = inet6_sk(sk);
277 	struct sock_exterr_skb *serr;
278 	struct sk_buff *skb, *skb2;
279 	struct sockaddr_in6 *sin;
280 	struct {
281 		struct sock_extended_err ee;
282 		struct sockaddr_in6	 offender;
283 	} errhdr;
284 	int err;
285 	int copied;
286 
287 	err = -EAGAIN;
288 	skb = skb_dequeue(&sk->sk_error_queue);
289 	if (skb == NULL)
290 		goto out;
291 
292 	copied = skb->len;
293 	if (copied > len) {
294 		msg->msg_flags |= MSG_TRUNC;
295 		copied = len;
296 	}
297 	err = skb_copy_datagram_iovec(skb, 0, msg->msg_iov, copied);
298 	if (err)
299 		goto out_free_skb;
300 
301 	sock_recv_timestamp(msg, sk, skb);
302 
303 	serr = SKB_EXT_ERR(skb);
304 
305 	sin = (struct sockaddr_in6 *)msg->msg_name;
306 	if (sin) {
307 		sin->sin6_family = AF_INET6;
308 		sin->sin6_flowinfo = 0;
309 		sin->sin6_port = serr->port;
310 		sin->sin6_scope_id = 0;
311 		if (serr->ee.ee_origin == SO_EE_ORIGIN_ICMP6) {
312 			ipv6_addr_copy(&sin->sin6_addr,
313 			  (struct in6_addr *)(skb->nh.raw + serr->addr_offset));
314 			if (np->sndflow)
315 				sin->sin6_flowinfo = *(u32*)(skb->nh.raw + serr->addr_offset - 24) & IPV6_FLOWINFO_MASK;
316 			if (ipv6_addr_type(&sin->sin6_addr) & IPV6_ADDR_LINKLOCAL)
317 				sin->sin6_scope_id = IP6CB(skb)->iif;
318 		} else {
319 			ipv6_addr_set(&sin->sin6_addr, 0, 0,
320 				      htonl(0xffff),
321 				      *(u32*)(skb->nh.raw + serr->addr_offset));
322 		}
323 	}
324 
325 	memcpy(&errhdr.ee, &serr->ee, sizeof(struct sock_extended_err));
326 	sin = &errhdr.offender;
327 	sin->sin6_family = AF_UNSPEC;
328 	if (serr->ee.ee_origin != SO_EE_ORIGIN_LOCAL) {
329 		sin->sin6_family = AF_INET6;
330 		sin->sin6_flowinfo = 0;
331 		sin->sin6_scope_id = 0;
332 		if (serr->ee.ee_origin == SO_EE_ORIGIN_ICMP6) {
333 			ipv6_addr_copy(&sin->sin6_addr, &skb->nh.ipv6h->saddr);
334 			if (np->rxopt.all)
335 				datagram_recv_ctl(sk, msg, skb);
336 			if (ipv6_addr_type(&sin->sin6_addr) & IPV6_ADDR_LINKLOCAL)
337 				sin->sin6_scope_id = IP6CB(skb)->iif;
338 		} else {
339 			struct inet_sock *inet = inet_sk(sk);
340 
341 			ipv6_addr_set(&sin->sin6_addr, 0, 0,
342 				      htonl(0xffff),
343 				      skb->nh.iph->saddr);
344 			if (inet->cmsg_flags)
345 				ip_cmsg_recv(msg, skb);
346 		}
347 	}
348 
349 	put_cmsg(msg, SOL_IPV6, IPV6_RECVERR, sizeof(errhdr), &errhdr);
350 
351 	/* Now we could try to dump offended packet options */
352 
353 	msg->msg_flags |= MSG_ERRQUEUE;
354 	err = copied;
355 
356 	/* Reset and regenerate socket error */
357 	spin_lock_bh(&sk->sk_error_queue.lock);
358 	sk->sk_err = 0;
359 	if ((skb2 = skb_peek(&sk->sk_error_queue)) != NULL) {
360 		sk->sk_err = SKB_EXT_ERR(skb2)->ee.ee_errno;
361 		spin_unlock_bh(&sk->sk_error_queue.lock);
362 		sk->sk_error_report(sk);
363 	} else {
364 		spin_unlock_bh(&sk->sk_error_queue.lock);
365 	}
366 
367 out_free_skb:
368 	kfree_skb(skb);
369 out:
370 	return err;
371 }
372 
373 
374 
375 int datagram_recv_ctl(struct sock *sk, struct msghdr *msg, struct sk_buff *skb)
376 {
377 	struct ipv6_pinfo *np = inet6_sk(sk);
378 	struct inet6_skb_parm *opt = IP6CB(skb);
379 
380 	if (np->rxopt.bits.rxinfo) {
381 		struct in6_pktinfo src_info;
382 
383 		src_info.ipi6_ifindex = opt->iif;
384 		ipv6_addr_copy(&src_info.ipi6_addr, &skb->nh.ipv6h->daddr);
385 		put_cmsg(msg, SOL_IPV6, IPV6_PKTINFO, sizeof(src_info), &src_info);
386 	}
387 
388 	if (np->rxopt.bits.rxhlim) {
389 		int hlim = skb->nh.ipv6h->hop_limit;
390 		put_cmsg(msg, SOL_IPV6, IPV6_HOPLIMIT, sizeof(hlim), &hlim);
391 	}
392 
393 	if (np->rxopt.bits.rxflow && (*(u32*)skb->nh.raw & IPV6_FLOWINFO_MASK)) {
394 		u32 flowinfo = *(u32*)skb->nh.raw & IPV6_FLOWINFO_MASK;
395 		put_cmsg(msg, SOL_IPV6, IPV6_FLOWINFO, sizeof(flowinfo), &flowinfo);
396 	}
397 	if (np->rxopt.bits.hopopts && opt->hop) {
398 		u8 *ptr = skb->nh.raw + opt->hop;
399 		put_cmsg(msg, SOL_IPV6, IPV6_HOPOPTS, (ptr[1]+1)<<3, ptr);
400 	}
401 	if (np->rxopt.bits.dstopts && opt->dst0) {
402 		u8 *ptr = skb->nh.raw + opt->dst0;
403 		put_cmsg(msg, SOL_IPV6, IPV6_DSTOPTS, (ptr[1]+1)<<3, ptr);
404 	}
405 	if (np->rxopt.bits.srcrt && opt->srcrt) {
406 		struct ipv6_rt_hdr *rthdr = (struct ipv6_rt_hdr *)(skb->nh.raw + opt->srcrt);
407 		put_cmsg(msg, SOL_IPV6, IPV6_RTHDR, (rthdr->hdrlen+1) << 3, rthdr);
408 	}
409 	if (np->rxopt.bits.dstopts && opt->dst1) {
410 		u8 *ptr = skb->nh.raw + opt->dst1;
411 		put_cmsg(msg, SOL_IPV6, IPV6_DSTOPTS, (ptr[1]+1)<<3, ptr);
412 	}
413 	return 0;
414 }
415 
416 int datagram_send_ctl(struct msghdr *msg, struct flowi *fl,
417 		      struct ipv6_txoptions *opt,
418 		      int *hlimit)
419 {
420 	struct in6_pktinfo *src_info;
421 	struct cmsghdr *cmsg;
422 	struct ipv6_rt_hdr *rthdr;
423 	struct ipv6_opt_hdr *hdr;
424 	int len;
425 	int err = 0;
426 
427 	for (cmsg = CMSG_FIRSTHDR(msg); cmsg; cmsg = CMSG_NXTHDR(msg, cmsg)) {
428 		int addr_type;
429 		struct net_device *dev = NULL;
430 
431 		if (!CMSG_OK(msg, cmsg)) {
432 			err = -EINVAL;
433 			goto exit_f;
434 		}
435 
436 		if (cmsg->cmsg_level != SOL_IPV6)
437 			continue;
438 
439 		switch (cmsg->cmsg_type) {
440  		case IPV6_PKTINFO:
441  			if (cmsg->cmsg_len < CMSG_LEN(sizeof(struct in6_pktinfo))) {
442 				err = -EINVAL;
443 				goto exit_f;
444 			}
445 
446 			src_info = (struct in6_pktinfo *)CMSG_DATA(cmsg);
447 
448 			if (src_info->ipi6_ifindex) {
449 				if (fl->oif && src_info->ipi6_ifindex != fl->oif)
450 					return -EINVAL;
451 				fl->oif = src_info->ipi6_ifindex;
452 			}
453 
454 			addr_type = ipv6_addr_type(&src_info->ipi6_addr);
455 
456 			if (addr_type == IPV6_ADDR_ANY)
457 				break;
458 
459 			if (addr_type & IPV6_ADDR_LINKLOCAL) {
460 				if (!src_info->ipi6_ifindex)
461 					return -EINVAL;
462 				else {
463 					dev = dev_get_by_index(src_info->ipi6_ifindex);
464 					if (!dev)
465 						return -ENODEV;
466 				}
467 			}
468 			if (!ipv6_chk_addr(&src_info->ipi6_addr, dev, 0)) {
469 				if (dev)
470 					dev_put(dev);
471 				err = -EINVAL;
472 				goto exit_f;
473 			}
474 			if (dev)
475 				dev_put(dev);
476 
477 			ipv6_addr_copy(&fl->fl6_src, &src_info->ipi6_addr);
478 			break;
479 
480 		case IPV6_FLOWINFO:
481                         if (cmsg->cmsg_len < CMSG_LEN(4)) {
482 				err = -EINVAL;
483 				goto exit_f;
484 			}
485 
486 			if (fl->fl6_flowlabel&IPV6_FLOWINFO_MASK) {
487 				if ((fl->fl6_flowlabel^*(u32 *)CMSG_DATA(cmsg))&~IPV6_FLOWINFO_MASK) {
488 					err = -EINVAL;
489 					goto exit_f;
490 				}
491 			}
492 			fl->fl6_flowlabel = IPV6_FLOWINFO_MASK & *(u32 *)CMSG_DATA(cmsg);
493 			break;
494 
495 		case IPV6_HOPOPTS:
496                         if (opt->hopopt || cmsg->cmsg_len < CMSG_LEN(sizeof(struct ipv6_opt_hdr))) {
497 				err = -EINVAL;
498 				goto exit_f;
499 			}
500 
501 			hdr = (struct ipv6_opt_hdr *)CMSG_DATA(cmsg);
502 			len = ((hdr->hdrlen + 1) << 3);
503 			if (cmsg->cmsg_len < CMSG_LEN(len)) {
504 				err = -EINVAL;
505 				goto exit_f;
506 			}
507 			if (!capable(CAP_NET_RAW)) {
508 				err = -EPERM;
509 				goto exit_f;
510 			}
511 			opt->opt_nflen += len;
512 			opt->hopopt = hdr;
513 			break;
514 
515 		case IPV6_DSTOPTS:
516                         if (cmsg->cmsg_len < CMSG_LEN(sizeof(struct ipv6_opt_hdr))) {
517 				err = -EINVAL;
518 				goto exit_f;
519 			}
520 
521 			hdr = (struct ipv6_opt_hdr *)CMSG_DATA(cmsg);
522 			len = ((hdr->hdrlen + 1) << 3);
523 			if (cmsg->cmsg_len < CMSG_LEN(len)) {
524 				err = -EINVAL;
525 				goto exit_f;
526 			}
527 			if (!capable(CAP_NET_RAW)) {
528 				err = -EPERM;
529 				goto exit_f;
530 			}
531 			if (opt->dst1opt) {
532 				err = -EINVAL;
533 				goto exit_f;
534 			}
535 			opt->opt_flen += len;
536 			opt->dst1opt = hdr;
537 			break;
538 
539 		case IPV6_RTHDR:
540                         if (cmsg->cmsg_len < CMSG_LEN(sizeof(struct ipv6_rt_hdr))) {
541 				err = -EINVAL;
542 				goto exit_f;
543 			}
544 
545 			rthdr = (struct ipv6_rt_hdr *)CMSG_DATA(cmsg);
546 
547 			/*
548 			 *	TYPE 0
549 			 */
550 			if (rthdr->type) {
551 				err = -EINVAL;
552 				goto exit_f;
553 			}
554 
555 			len = ((rthdr->hdrlen + 1) << 3);
556 
557                         if (cmsg->cmsg_len < CMSG_LEN(len)) {
558 				err = -EINVAL;
559 				goto exit_f;
560 			}
561 
562 			/* segments left must also match */
563 			if ((rthdr->hdrlen >> 1) != rthdr->segments_left) {
564 				err = -EINVAL;
565 				goto exit_f;
566 			}
567 
568 			opt->opt_nflen += len;
569 			opt->srcrt = rthdr;
570 
571 			if (opt->dst1opt) {
572 				int dsthdrlen = ((opt->dst1opt->hdrlen+1)<<3);
573 
574 				opt->opt_nflen += dsthdrlen;
575 				opt->dst0opt = opt->dst1opt;
576 				opt->dst1opt = NULL;
577 				opt->opt_flen -= dsthdrlen;
578 			}
579 
580 			break;
581 
582 		case IPV6_HOPLIMIT:
583 			if (cmsg->cmsg_len != CMSG_LEN(sizeof(int))) {
584 				err = -EINVAL;
585 				goto exit_f;
586 			}
587 
588 			*hlimit = *(int *)CMSG_DATA(cmsg);
589 			break;
590 
591 		default:
592 			LIMIT_NETDEBUG(KERN_DEBUG "invalid cmsg type: %d\n",
593 			               cmsg->cmsg_type);
594 			err = -EINVAL;
595 			break;
596 		};
597 	}
598 
599 exit_f:
600 	return err;
601 }
602