xref: /linux/net/sctp/socket.c (revision 9baa0b0364103dd726384c71db30b74044754743)
1 /* SCTP kernel implementation
2  * (C) Copyright IBM Corp. 2001, 2004
3  * Copyright (c) 1999-2000 Cisco, Inc.
4  * Copyright (c) 1999-2001 Motorola, Inc.
5  * Copyright (c) 2001-2003 Intel Corp.
6  * Copyright (c) 2001-2002 Nokia, Inc.
7  * Copyright (c) 2001 La Monte H.P. Yarroll
8  *
9  * This file is part of the SCTP kernel implementation
10  *
11  * These functions interface with the sockets layer to implement the
12  * SCTP Extensions for the Sockets API.
13  *
14  * Note that the descriptions from the specification are USER level
15  * functions--this file is the functions which populate the struct proto
16  * for SCTP which is the BOTTOM of the sockets interface.
17  *
18  * This SCTP implementation is free software;
19  * you can redistribute it and/or modify it under the terms of
20  * the GNU General Public License as published by
21  * the Free Software Foundation; either version 2, or (at your option)
22  * any later version.
23  *
24  * This SCTP implementation is distributed in the hope that it
25  * will be useful, but WITHOUT ANY WARRANTY; without even the implied
26  *                 ************************
27  * warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
28  * See the GNU General Public License for more details.
29  *
30  * You should have received a copy of the GNU General Public License
31  * along with GNU CC; see the file COPYING.  If not, write to
32  * the Free Software Foundation, 59 Temple Place - Suite 330,
33  * Boston, MA 02111-1307, USA.
34  *
35  * Please send any bug reports or fixes you make to the
36  * email address(es):
37  *    lksctp developers <lksctp-developers@lists.sourceforge.net>
38  *
39  * Or submit a bug report through the following website:
40  *    http://www.sf.net/projects/lksctp
41  *
42  * Written or modified by:
43  *    La Monte H.P. Yarroll <piggy@acm.org>
44  *    Narasimha Budihal     <narsi@refcode.org>
45  *    Karl Knutson          <karl@athena.chicago.il.us>
46  *    Jon Grimm             <jgrimm@us.ibm.com>
47  *    Xingang Guo           <xingang.guo@intel.com>
48  *    Daisy Chang           <daisyc@us.ibm.com>
49  *    Sridhar Samudrala     <samudrala@us.ibm.com>
50  *    Inaky Perez-Gonzalez  <inaky.gonzalez@intel.com>
51  *    Ardelle Fan	    <ardelle.fan@intel.com>
52  *    Ryan Layer	    <rmlayer@us.ibm.com>
53  *    Anup Pemmaiah         <pemmaiah@cc.usu.edu>
54  *    Kevin Gao             <kevin.gao@intel.com>
55  *
56  * Any bugs reported given to us we will try to fix... any fixes shared will
57  * be incorporated into the next SCTP release.
58  */
59 
60 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
61 
62 #include <linux/types.h>
63 #include <linux/kernel.h>
64 #include <linux/wait.h>
65 #include <linux/time.h>
66 #include <linux/ip.h>
67 #include <linux/capability.h>
68 #include <linux/fcntl.h>
69 #include <linux/poll.h>
70 #include <linux/init.h>
71 #include <linux/crypto.h>
72 #include <linux/slab.h>
73 
74 #include <net/ip.h>
75 #include <net/icmp.h>
76 #include <net/route.h>
77 #include <net/ipv6.h>
78 #include <net/inet_common.h>
79 
80 #include <linux/socket.h> /* for sa_family_t */
81 #include <linux/export.h>
82 #include <net/sock.h>
83 #include <net/sctp/sctp.h>
84 #include <net/sctp/sm.h>
85 
86 /* WARNING:  Please do not remove the SCTP_STATIC attribute to
87  * any of the functions below as they are used to export functions
88  * used by a project regression testsuite.
89  */
90 
91 /* Forward declarations for internal helper functions. */
92 static int sctp_writeable(struct sock *sk);
93 static void sctp_wfree(struct sk_buff *skb);
94 static int sctp_wait_for_sndbuf(struct sctp_association *, long *timeo_p,
95 				size_t msg_len);
96 static int sctp_wait_for_packet(struct sock * sk, int *err, long *timeo_p);
97 static int sctp_wait_for_connect(struct sctp_association *, long *timeo_p);
98 static int sctp_wait_for_accept(struct sock *sk, long timeo);
99 static void sctp_wait_for_close(struct sock *sk, long timeo);
100 static struct sctp_af *sctp_sockaddr_af(struct sctp_sock *opt,
101 					union sctp_addr *addr, int len);
102 static int sctp_bindx_add(struct sock *, struct sockaddr *, int);
103 static int sctp_bindx_rem(struct sock *, struct sockaddr *, int);
104 static int sctp_send_asconf_add_ip(struct sock *, struct sockaddr *, int);
105 static int sctp_send_asconf_del_ip(struct sock *, struct sockaddr *, int);
106 static int sctp_send_asconf(struct sctp_association *asoc,
107 			    struct sctp_chunk *chunk);
108 static int sctp_do_bind(struct sock *, union sctp_addr *, int);
109 static int sctp_autobind(struct sock *sk);
110 static void sctp_sock_migrate(struct sock *, struct sock *,
111 			      struct sctp_association *, sctp_socket_type_t);
112 static char *sctp_hmac_alg = SCTP_COOKIE_HMAC_ALG;
113 
114 extern struct kmem_cache *sctp_bucket_cachep;
115 extern long sysctl_sctp_mem[3];
116 extern int sysctl_sctp_rmem[3];
117 extern int sysctl_sctp_wmem[3];
118 
119 static int sctp_memory_pressure;
120 static atomic_long_t sctp_memory_allocated;
121 struct percpu_counter sctp_sockets_allocated;
122 
123 static void sctp_enter_memory_pressure(struct sock *sk)
124 {
125 	sctp_memory_pressure = 1;
126 }
127 
128 
129 /* Get the sndbuf space available at the time on the association.  */
130 static inline int sctp_wspace(struct sctp_association *asoc)
131 {
132 	int amt;
133 
134 	if (asoc->ep->sndbuf_policy)
135 		amt = asoc->sndbuf_used;
136 	else
137 		amt = sk_wmem_alloc_get(asoc->base.sk);
138 
139 	if (amt >= asoc->base.sk->sk_sndbuf) {
140 		if (asoc->base.sk->sk_userlocks & SOCK_SNDBUF_LOCK)
141 			amt = 0;
142 		else {
143 			amt = sk_stream_wspace(asoc->base.sk);
144 			if (amt < 0)
145 				amt = 0;
146 		}
147 	} else {
148 		amt = asoc->base.sk->sk_sndbuf - amt;
149 	}
150 	return amt;
151 }
152 
153 /* Increment the used sndbuf space count of the corresponding association by
154  * the size of the outgoing data chunk.
155  * Also, set the skb destructor for sndbuf accounting later.
156  *
157  * Since it is always 1-1 between chunk and skb, and also a new skb is always
158  * allocated for chunk bundling in sctp_packet_transmit(), we can use the
159  * destructor in the data chunk skb for the purpose of the sndbuf space
160  * tracking.
161  */
162 static inline void sctp_set_owner_w(struct sctp_chunk *chunk)
163 {
164 	struct sctp_association *asoc = chunk->asoc;
165 	struct sock *sk = asoc->base.sk;
166 
167 	/* The sndbuf space is tracked per association.  */
168 	sctp_association_hold(asoc);
169 
170 	skb_set_owner_w(chunk->skb, sk);
171 
172 	chunk->skb->destructor = sctp_wfree;
173 	/* Save the chunk pointer in skb for sctp_wfree to use later.  */
174 	*((struct sctp_chunk **)(chunk->skb->cb)) = chunk;
175 
176 	asoc->sndbuf_used += SCTP_DATA_SNDSIZE(chunk) +
177 				sizeof(struct sk_buff) +
178 				sizeof(struct sctp_chunk);
179 
180 	atomic_add(sizeof(struct sctp_chunk), &sk->sk_wmem_alloc);
181 	sk->sk_wmem_queued += chunk->skb->truesize;
182 	sk_mem_charge(sk, chunk->skb->truesize);
183 }
184 
185 /* Verify that this is a valid address. */
186 static inline int sctp_verify_addr(struct sock *sk, union sctp_addr *addr,
187 				   int len)
188 {
189 	struct sctp_af *af;
190 
191 	/* Verify basic sockaddr. */
192 	af = sctp_sockaddr_af(sctp_sk(sk), addr, len);
193 	if (!af)
194 		return -EINVAL;
195 
196 	/* Is this a valid SCTP address?  */
197 	if (!af->addr_valid(addr, sctp_sk(sk), NULL))
198 		return -EINVAL;
199 
200 	if (!sctp_sk(sk)->pf->send_verify(sctp_sk(sk), (addr)))
201 		return -EINVAL;
202 
203 	return 0;
204 }
205 
206 /* Look up the association by its id.  If this is not a UDP-style
207  * socket, the ID field is always ignored.
208  */
209 struct sctp_association *sctp_id2assoc(struct sock *sk, sctp_assoc_t id)
210 {
211 	struct sctp_association *asoc = NULL;
212 
213 	/* If this is not a UDP-style socket, assoc id should be ignored. */
214 	if (!sctp_style(sk, UDP)) {
215 		/* Return NULL if the socket state is not ESTABLISHED. It
216 		 * could be a TCP-style listening socket or a socket which
217 		 * hasn't yet called connect() to establish an association.
218 		 */
219 		if (!sctp_sstate(sk, ESTABLISHED))
220 			return NULL;
221 
222 		/* Get the first and the only association from the list. */
223 		if (!list_empty(&sctp_sk(sk)->ep->asocs))
224 			asoc = list_entry(sctp_sk(sk)->ep->asocs.next,
225 					  struct sctp_association, asocs);
226 		return asoc;
227 	}
228 
229 	/* Otherwise this is a UDP-style socket. */
230 	if (!id || (id == (sctp_assoc_t)-1))
231 		return NULL;
232 
233 	spin_lock_bh(&sctp_assocs_id_lock);
234 	asoc = (struct sctp_association *)idr_find(&sctp_assocs_id, (int)id);
235 	spin_unlock_bh(&sctp_assocs_id_lock);
236 
237 	if (!asoc || (asoc->base.sk != sk) || asoc->base.dead)
238 		return NULL;
239 
240 	return asoc;
241 }
242 
243 /* Look up the transport from an address and an assoc id. If both address and
244  * id are specified, the associations matching the address and the id should be
245  * the same.
246  */
247 static struct sctp_transport *sctp_addr_id2transport(struct sock *sk,
248 					      struct sockaddr_storage *addr,
249 					      sctp_assoc_t id)
250 {
251 	struct sctp_association *addr_asoc = NULL, *id_asoc = NULL;
252 	struct sctp_transport *transport;
253 	union sctp_addr *laddr = (union sctp_addr *)addr;
254 
255 	addr_asoc = sctp_endpoint_lookup_assoc(sctp_sk(sk)->ep,
256 					       laddr,
257 					       &transport);
258 
259 	if (!addr_asoc)
260 		return NULL;
261 
262 	id_asoc = sctp_id2assoc(sk, id);
263 	if (id_asoc && (id_asoc != addr_asoc))
264 		return NULL;
265 
266 	sctp_get_pf_specific(sk->sk_family)->addr_v4map(sctp_sk(sk),
267 						(union sctp_addr *)addr);
268 
269 	return transport;
270 }
271 
272 /* API 3.1.2 bind() - UDP Style Syntax
273  * The syntax of bind() is,
274  *
275  *   ret = bind(int sd, struct sockaddr *addr, int addrlen);
276  *
277  *   sd      - the socket descriptor returned by socket().
278  *   addr    - the address structure (struct sockaddr_in or struct
279  *             sockaddr_in6 [RFC 2553]),
280  *   addr_len - the size of the address structure.
281  */
282 SCTP_STATIC int sctp_bind(struct sock *sk, struct sockaddr *addr, int addr_len)
283 {
284 	int retval = 0;
285 
286 	sctp_lock_sock(sk);
287 
288 	SCTP_DEBUG_PRINTK("sctp_bind(sk: %p, addr: %p, addr_len: %d)\n",
289 			  sk, addr, addr_len);
290 
291 	/* Disallow binding twice. */
292 	if (!sctp_sk(sk)->ep->base.bind_addr.port)
293 		retval = sctp_do_bind(sk, (union sctp_addr *)addr,
294 				      addr_len);
295 	else
296 		retval = -EINVAL;
297 
298 	sctp_release_sock(sk);
299 
300 	return retval;
301 }
302 
303 static long sctp_get_port_local(struct sock *, union sctp_addr *);
304 
305 /* Verify this is a valid sockaddr. */
306 static struct sctp_af *sctp_sockaddr_af(struct sctp_sock *opt,
307 					union sctp_addr *addr, int len)
308 {
309 	struct sctp_af *af;
310 
311 	/* Check minimum size.  */
312 	if (len < sizeof (struct sockaddr))
313 		return NULL;
314 
315 	/* V4 mapped address are really of AF_INET family */
316 	if (addr->sa.sa_family == AF_INET6 &&
317 	    ipv6_addr_v4mapped(&addr->v6.sin6_addr)) {
318 		if (!opt->pf->af_supported(AF_INET, opt))
319 			return NULL;
320 	} else {
321 		/* Does this PF support this AF? */
322 		if (!opt->pf->af_supported(addr->sa.sa_family, opt))
323 			return NULL;
324 	}
325 
326 	/* If we get this far, af is valid. */
327 	af = sctp_get_af_specific(addr->sa.sa_family);
328 
329 	if (len < af->sockaddr_len)
330 		return NULL;
331 
332 	return af;
333 }
334 
335 /* Bind a local address either to an endpoint or to an association.  */
336 SCTP_STATIC int sctp_do_bind(struct sock *sk, union sctp_addr *addr, int len)
337 {
338 	struct sctp_sock *sp = sctp_sk(sk);
339 	struct sctp_endpoint *ep = sp->ep;
340 	struct sctp_bind_addr *bp = &ep->base.bind_addr;
341 	struct sctp_af *af;
342 	unsigned short snum;
343 	int ret = 0;
344 
345 	/* Common sockaddr verification. */
346 	af = sctp_sockaddr_af(sp, addr, len);
347 	if (!af) {
348 		SCTP_DEBUG_PRINTK("sctp_do_bind(sk: %p, newaddr: %p, len: %d) EINVAL\n",
349 				  sk, addr, len);
350 		return -EINVAL;
351 	}
352 
353 	snum = ntohs(addr->v4.sin_port);
354 
355 	SCTP_DEBUG_PRINTK_IPADDR("sctp_do_bind(sk: %p, new addr: ",
356 				 ", port: %d, new port: %d, len: %d)\n",
357 				 sk,
358 				 addr,
359 				 bp->port, snum,
360 				 len);
361 
362 	/* PF specific bind() address verification. */
363 	if (!sp->pf->bind_verify(sp, addr))
364 		return -EADDRNOTAVAIL;
365 
366 	/* We must either be unbound, or bind to the same port.
367 	 * It's OK to allow 0 ports if we are already bound.
368 	 * We'll just inhert an already bound port in this case
369 	 */
370 	if (bp->port) {
371 		if (!snum)
372 			snum = bp->port;
373 		else if (snum != bp->port) {
374 			SCTP_DEBUG_PRINTK("sctp_do_bind:"
375 				  " New port %d does not match existing port "
376 				  "%d.\n", snum, bp->port);
377 			return -EINVAL;
378 		}
379 	}
380 
381 	if (snum && snum < PROT_SOCK && !capable(CAP_NET_BIND_SERVICE))
382 		return -EACCES;
383 
384 	/* See if the address matches any of the addresses we may have
385 	 * already bound before checking against other endpoints.
386 	 */
387 	if (sctp_bind_addr_match(bp, addr, sp))
388 		return -EINVAL;
389 
390 	/* Make sure we are allowed to bind here.
391 	 * The function sctp_get_port_local() does duplicate address
392 	 * detection.
393 	 */
394 	addr->v4.sin_port = htons(snum);
395 	if ((ret = sctp_get_port_local(sk, addr))) {
396 		return -EADDRINUSE;
397 	}
398 
399 	/* Refresh ephemeral port.  */
400 	if (!bp->port)
401 		bp->port = inet_sk(sk)->inet_num;
402 
403 	/* Add the address to the bind address list.
404 	 * Use GFP_ATOMIC since BHs will be disabled.
405 	 */
406 	ret = sctp_add_bind_addr(bp, addr, SCTP_ADDR_SRC, GFP_ATOMIC);
407 
408 	/* Copy back into socket for getsockname() use. */
409 	if (!ret) {
410 		inet_sk(sk)->inet_sport = htons(inet_sk(sk)->inet_num);
411 		af->to_sk_saddr(addr, sk);
412 	}
413 
414 	return ret;
415 }
416 
417  /* ADDIP Section 4.1.1 Congestion Control of ASCONF Chunks
418  *
419  * R1) One and only one ASCONF Chunk MAY be in transit and unacknowledged
420  * at any one time.  If a sender, after sending an ASCONF chunk, decides
421  * it needs to transfer another ASCONF Chunk, it MUST wait until the
422  * ASCONF-ACK Chunk returns from the previous ASCONF Chunk before sending a
423  * subsequent ASCONF. Note this restriction binds each side, so at any
424  * time two ASCONF may be in-transit on any given association (one sent
425  * from each endpoint).
426  */
427 static int sctp_send_asconf(struct sctp_association *asoc,
428 			    struct sctp_chunk *chunk)
429 {
430 	struct net 	*net = sock_net(asoc->base.sk);
431 	int		retval = 0;
432 
433 	/* If there is an outstanding ASCONF chunk, queue it for later
434 	 * transmission.
435 	 */
436 	if (asoc->addip_last_asconf) {
437 		list_add_tail(&chunk->list, &asoc->addip_chunk_list);
438 		goto out;
439 	}
440 
441 	/* Hold the chunk until an ASCONF_ACK is received. */
442 	sctp_chunk_hold(chunk);
443 	retval = sctp_primitive_ASCONF(net, asoc, chunk);
444 	if (retval)
445 		sctp_chunk_free(chunk);
446 	else
447 		asoc->addip_last_asconf = chunk;
448 
449 out:
450 	return retval;
451 }
452 
453 /* Add a list of addresses as bind addresses to local endpoint or
454  * association.
455  *
456  * Basically run through each address specified in the addrs/addrcnt
457  * array/length pair, determine if it is IPv6 or IPv4 and call
458  * sctp_do_bind() on it.
459  *
460  * If any of them fails, then the operation will be reversed and the
461  * ones that were added will be removed.
462  *
463  * Only sctp_setsockopt_bindx() is supposed to call this function.
464  */
465 static int sctp_bindx_add(struct sock *sk, struct sockaddr *addrs, int addrcnt)
466 {
467 	int cnt;
468 	int retval = 0;
469 	void *addr_buf;
470 	struct sockaddr *sa_addr;
471 	struct sctp_af *af;
472 
473 	SCTP_DEBUG_PRINTK("sctp_bindx_add (sk: %p, addrs: %p, addrcnt: %d)\n",
474 			  sk, addrs, addrcnt);
475 
476 	addr_buf = addrs;
477 	for (cnt = 0; cnt < addrcnt; cnt++) {
478 		/* The list may contain either IPv4 or IPv6 address;
479 		 * determine the address length for walking thru the list.
480 		 */
481 		sa_addr = addr_buf;
482 		af = sctp_get_af_specific(sa_addr->sa_family);
483 		if (!af) {
484 			retval = -EINVAL;
485 			goto err_bindx_add;
486 		}
487 
488 		retval = sctp_do_bind(sk, (union sctp_addr *)sa_addr,
489 				      af->sockaddr_len);
490 
491 		addr_buf += af->sockaddr_len;
492 
493 err_bindx_add:
494 		if (retval < 0) {
495 			/* Failed. Cleanup the ones that have been added */
496 			if (cnt > 0)
497 				sctp_bindx_rem(sk, addrs, cnt);
498 			return retval;
499 		}
500 	}
501 
502 	return retval;
503 }
504 
505 /* Send an ASCONF chunk with Add IP address parameters to all the peers of the
506  * associations that are part of the endpoint indicating that a list of local
507  * addresses are added to the endpoint.
508  *
509  * If any of the addresses is already in the bind address list of the
510  * association, we do not send the chunk for that association.  But it will not
511  * affect other associations.
512  *
513  * Only sctp_setsockopt_bindx() is supposed to call this function.
514  */
515 static int sctp_send_asconf_add_ip(struct sock		*sk,
516 				   struct sockaddr	*addrs,
517 				   int 			addrcnt)
518 {
519 	struct net *net = sock_net(sk);
520 	struct sctp_sock		*sp;
521 	struct sctp_endpoint		*ep;
522 	struct sctp_association		*asoc;
523 	struct sctp_bind_addr		*bp;
524 	struct sctp_chunk		*chunk;
525 	struct sctp_sockaddr_entry	*laddr;
526 	union sctp_addr			*addr;
527 	union sctp_addr			saveaddr;
528 	void				*addr_buf;
529 	struct sctp_af			*af;
530 	struct list_head		*p;
531 	int 				i;
532 	int 				retval = 0;
533 
534 	if (!net->sctp.addip_enable)
535 		return retval;
536 
537 	sp = sctp_sk(sk);
538 	ep = sp->ep;
539 
540 	SCTP_DEBUG_PRINTK("%s: (sk: %p, addrs: %p, addrcnt: %d)\n",
541 			  __func__, sk, addrs, addrcnt);
542 
543 	list_for_each_entry(asoc, &ep->asocs, asocs) {
544 
545 		if (!asoc->peer.asconf_capable)
546 			continue;
547 
548 		if (asoc->peer.addip_disabled_mask & SCTP_PARAM_ADD_IP)
549 			continue;
550 
551 		if (!sctp_state(asoc, ESTABLISHED))
552 			continue;
553 
554 		/* Check if any address in the packed array of addresses is
555 		 * in the bind address list of the association. If so,
556 		 * do not send the asconf chunk to its peer, but continue with
557 		 * other associations.
558 		 */
559 		addr_buf = addrs;
560 		for (i = 0; i < addrcnt; i++) {
561 			addr = addr_buf;
562 			af = sctp_get_af_specific(addr->v4.sin_family);
563 			if (!af) {
564 				retval = -EINVAL;
565 				goto out;
566 			}
567 
568 			if (sctp_assoc_lookup_laddr(asoc, addr))
569 				break;
570 
571 			addr_buf += af->sockaddr_len;
572 		}
573 		if (i < addrcnt)
574 			continue;
575 
576 		/* Use the first valid address in bind addr list of
577 		 * association as Address Parameter of ASCONF CHUNK.
578 		 */
579 		bp = &asoc->base.bind_addr;
580 		p = bp->address_list.next;
581 		laddr = list_entry(p, struct sctp_sockaddr_entry, list);
582 		chunk = sctp_make_asconf_update_ip(asoc, &laddr->a, addrs,
583 						   addrcnt, SCTP_PARAM_ADD_IP);
584 		if (!chunk) {
585 			retval = -ENOMEM;
586 			goto out;
587 		}
588 
589 		/* Add the new addresses to the bind address list with
590 		 * use_as_src set to 0.
591 		 */
592 		addr_buf = addrs;
593 		for (i = 0; i < addrcnt; i++) {
594 			addr = addr_buf;
595 			af = sctp_get_af_specific(addr->v4.sin_family);
596 			memcpy(&saveaddr, addr, af->sockaddr_len);
597 			retval = sctp_add_bind_addr(bp, &saveaddr,
598 						    SCTP_ADDR_NEW, GFP_ATOMIC);
599 			addr_buf += af->sockaddr_len;
600 		}
601 		if (asoc->src_out_of_asoc_ok) {
602 			struct sctp_transport *trans;
603 
604 			list_for_each_entry(trans,
605 			    &asoc->peer.transport_addr_list, transports) {
606 				/* Clear the source and route cache */
607 				dst_release(trans->dst);
608 				trans->cwnd = min(4*asoc->pathmtu, max_t(__u32,
609 				    2*asoc->pathmtu, 4380));
610 				trans->ssthresh = asoc->peer.i.a_rwnd;
611 				trans->rto = asoc->rto_initial;
612 				trans->rtt = trans->srtt = trans->rttvar = 0;
613 				sctp_transport_route(trans, NULL,
614 				    sctp_sk(asoc->base.sk));
615 			}
616 		}
617 		retval = sctp_send_asconf(asoc, chunk);
618 	}
619 
620 out:
621 	return retval;
622 }
623 
624 /* Remove a list of addresses from bind addresses list.  Do not remove the
625  * last address.
626  *
627  * Basically run through each address specified in the addrs/addrcnt
628  * array/length pair, determine if it is IPv6 or IPv4 and call
629  * sctp_del_bind() on it.
630  *
631  * If any of them fails, then the operation will be reversed and the
632  * ones that were removed will be added back.
633  *
634  * At least one address has to be left; if only one address is
635  * available, the operation will return -EBUSY.
636  *
637  * Only sctp_setsockopt_bindx() is supposed to call this function.
638  */
639 static int sctp_bindx_rem(struct sock *sk, struct sockaddr *addrs, int addrcnt)
640 {
641 	struct sctp_sock *sp = sctp_sk(sk);
642 	struct sctp_endpoint *ep = sp->ep;
643 	int cnt;
644 	struct sctp_bind_addr *bp = &ep->base.bind_addr;
645 	int retval = 0;
646 	void *addr_buf;
647 	union sctp_addr *sa_addr;
648 	struct sctp_af *af;
649 
650 	SCTP_DEBUG_PRINTK("sctp_bindx_rem (sk: %p, addrs: %p, addrcnt: %d)\n",
651 			  sk, addrs, addrcnt);
652 
653 	addr_buf = addrs;
654 	for (cnt = 0; cnt < addrcnt; cnt++) {
655 		/* If the bind address list is empty or if there is only one
656 		 * bind address, there is nothing more to be removed (we need
657 		 * at least one address here).
658 		 */
659 		if (list_empty(&bp->address_list) ||
660 		    (sctp_list_single_entry(&bp->address_list))) {
661 			retval = -EBUSY;
662 			goto err_bindx_rem;
663 		}
664 
665 		sa_addr = addr_buf;
666 		af = sctp_get_af_specific(sa_addr->sa.sa_family);
667 		if (!af) {
668 			retval = -EINVAL;
669 			goto err_bindx_rem;
670 		}
671 
672 		if (!af->addr_valid(sa_addr, sp, NULL)) {
673 			retval = -EADDRNOTAVAIL;
674 			goto err_bindx_rem;
675 		}
676 
677 		if (sa_addr->v4.sin_port &&
678 		    sa_addr->v4.sin_port != htons(bp->port)) {
679 			retval = -EINVAL;
680 			goto err_bindx_rem;
681 		}
682 
683 		if (!sa_addr->v4.sin_port)
684 			sa_addr->v4.sin_port = htons(bp->port);
685 
686 		/* FIXME - There is probably a need to check if sk->sk_saddr and
687 		 * sk->sk_rcv_addr are currently set to one of the addresses to
688 		 * be removed. This is something which needs to be looked into
689 		 * when we are fixing the outstanding issues with multi-homing
690 		 * socket routing and failover schemes. Refer to comments in
691 		 * sctp_do_bind(). -daisy
692 		 */
693 		retval = sctp_del_bind_addr(bp, sa_addr);
694 
695 		addr_buf += af->sockaddr_len;
696 err_bindx_rem:
697 		if (retval < 0) {
698 			/* Failed. Add the ones that has been removed back */
699 			if (cnt > 0)
700 				sctp_bindx_add(sk, addrs, cnt);
701 			return retval;
702 		}
703 	}
704 
705 	return retval;
706 }
707 
708 /* Send an ASCONF chunk with Delete IP address parameters to all the peers of
709  * the associations that are part of the endpoint indicating that a list of
710  * local addresses are removed from the endpoint.
711  *
712  * If any of the addresses is already in the bind address list of the
713  * association, we do not send the chunk for that association.  But it will not
714  * affect other associations.
715  *
716  * Only sctp_setsockopt_bindx() is supposed to call this function.
717  */
718 static int sctp_send_asconf_del_ip(struct sock		*sk,
719 				   struct sockaddr	*addrs,
720 				   int			addrcnt)
721 {
722 	struct net *net = sock_net(sk);
723 	struct sctp_sock	*sp;
724 	struct sctp_endpoint	*ep;
725 	struct sctp_association	*asoc;
726 	struct sctp_transport	*transport;
727 	struct sctp_bind_addr	*bp;
728 	struct sctp_chunk	*chunk;
729 	union sctp_addr		*laddr;
730 	void			*addr_buf;
731 	struct sctp_af		*af;
732 	struct sctp_sockaddr_entry *saddr;
733 	int 			i;
734 	int 			retval = 0;
735 	int			stored = 0;
736 
737 	chunk = NULL;
738 	if (!net->sctp.addip_enable)
739 		return retval;
740 
741 	sp = sctp_sk(sk);
742 	ep = sp->ep;
743 
744 	SCTP_DEBUG_PRINTK("%s: (sk: %p, addrs: %p, addrcnt: %d)\n",
745 			  __func__, sk, addrs, addrcnt);
746 
747 	list_for_each_entry(asoc, &ep->asocs, asocs) {
748 
749 		if (!asoc->peer.asconf_capable)
750 			continue;
751 
752 		if (asoc->peer.addip_disabled_mask & SCTP_PARAM_DEL_IP)
753 			continue;
754 
755 		if (!sctp_state(asoc, ESTABLISHED))
756 			continue;
757 
758 		/* Check if any address in the packed array of addresses is
759 		 * not present in the bind address list of the association.
760 		 * If so, do not send the asconf chunk to its peer, but
761 		 * continue with other associations.
762 		 */
763 		addr_buf = addrs;
764 		for (i = 0; i < addrcnt; i++) {
765 			laddr = addr_buf;
766 			af = sctp_get_af_specific(laddr->v4.sin_family);
767 			if (!af) {
768 				retval = -EINVAL;
769 				goto out;
770 			}
771 
772 			if (!sctp_assoc_lookup_laddr(asoc, laddr))
773 				break;
774 
775 			addr_buf += af->sockaddr_len;
776 		}
777 		if (i < addrcnt)
778 			continue;
779 
780 		/* Find one address in the association's bind address list
781 		 * that is not in the packed array of addresses. This is to
782 		 * make sure that we do not delete all the addresses in the
783 		 * association.
784 		 */
785 		bp = &asoc->base.bind_addr;
786 		laddr = sctp_find_unmatch_addr(bp, (union sctp_addr *)addrs,
787 					       addrcnt, sp);
788 		if ((laddr == NULL) && (addrcnt == 1)) {
789 			if (asoc->asconf_addr_del_pending)
790 				continue;
791 			asoc->asconf_addr_del_pending =
792 			    kzalloc(sizeof(union sctp_addr), GFP_ATOMIC);
793 			if (asoc->asconf_addr_del_pending == NULL) {
794 				retval = -ENOMEM;
795 				goto out;
796 			}
797 			asoc->asconf_addr_del_pending->sa.sa_family =
798 				    addrs->sa_family;
799 			asoc->asconf_addr_del_pending->v4.sin_port =
800 				    htons(bp->port);
801 			if (addrs->sa_family == AF_INET) {
802 				struct sockaddr_in *sin;
803 
804 				sin = (struct sockaddr_in *)addrs;
805 				asoc->asconf_addr_del_pending->v4.sin_addr.s_addr = sin->sin_addr.s_addr;
806 			} else if (addrs->sa_family == AF_INET6) {
807 				struct sockaddr_in6 *sin6;
808 
809 				sin6 = (struct sockaddr_in6 *)addrs;
810 				asoc->asconf_addr_del_pending->v6.sin6_addr = sin6->sin6_addr;
811 			}
812 			SCTP_DEBUG_PRINTK_IPADDR("send_asconf_del_ip: keep the last address asoc: %p ",
813 			    " at %p\n", asoc, asoc->asconf_addr_del_pending,
814 			    asoc->asconf_addr_del_pending);
815 			asoc->src_out_of_asoc_ok = 1;
816 			stored = 1;
817 			goto skip_mkasconf;
818 		}
819 
820 		/* We do not need RCU protection throughout this loop
821 		 * because this is done under a socket lock from the
822 		 * setsockopt call.
823 		 */
824 		chunk = sctp_make_asconf_update_ip(asoc, laddr, addrs, addrcnt,
825 						   SCTP_PARAM_DEL_IP);
826 		if (!chunk) {
827 			retval = -ENOMEM;
828 			goto out;
829 		}
830 
831 skip_mkasconf:
832 		/* Reset use_as_src flag for the addresses in the bind address
833 		 * list that are to be deleted.
834 		 */
835 		addr_buf = addrs;
836 		for (i = 0; i < addrcnt; i++) {
837 			laddr = addr_buf;
838 			af = sctp_get_af_specific(laddr->v4.sin_family);
839 			list_for_each_entry(saddr, &bp->address_list, list) {
840 				if (sctp_cmp_addr_exact(&saddr->a, laddr))
841 					saddr->state = SCTP_ADDR_DEL;
842 			}
843 			addr_buf += af->sockaddr_len;
844 		}
845 
846 		/* Update the route and saddr entries for all the transports
847 		 * as some of the addresses in the bind address list are
848 		 * about to be deleted and cannot be used as source addresses.
849 		 */
850 		list_for_each_entry(transport, &asoc->peer.transport_addr_list,
851 					transports) {
852 			dst_release(transport->dst);
853 			sctp_transport_route(transport, NULL,
854 					     sctp_sk(asoc->base.sk));
855 		}
856 
857 		if (stored)
858 			/* We don't need to transmit ASCONF */
859 			continue;
860 		retval = sctp_send_asconf(asoc, chunk);
861 	}
862 out:
863 	return retval;
864 }
865 
866 /* set addr events to assocs in the endpoint.  ep and addr_wq must be locked */
867 int sctp_asconf_mgmt(struct sctp_sock *sp, struct sctp_sockaddr_entry *addrw)
868 {
869 	struct sock *sk = sctp_opt2sk(sp);
870 	union sctp_addr *addr;
871 	struct sctp_af *af;
872 
873 	/* It is safe to write port space in caller. */
874 	addr = &addrw->a;
875 	addr->v4.sin_port = htons(sp->ep->base.bind_addr.port);
876 	af = sctp_get_af_specific(addr->sa.sa_family);
877 	if (!af)
878 		return -EINVAL;
879 	if (sctp_verify_addr(sk, addr, af->sockaddr_len))
880 		return -EINVAL;
881 
882 	if (addrw->state == SCTP_ADDR_NEW)
883 		return sctp_send_asconf_add_ip(sk, (struct sockaddr *)addr, 1);
884 	else
885 		return sctp_send_asconf_del_ip(sk, (struct sockaddr *)addr, 1);
886 }
887 
888 /* Helper for tunneling sctp_bindx() requests through sctp_setsockopt()
889  *
890  * API 8.1
891  * int sctp_bindx(int sd, struct sockaddr *addrs, int addrcnt,
892  *                int flags);
893  *
894  * If sd is an IPv4 socket, the addresses passed must be IPv4 addresses.
895  * If the sd is an IPv6 socket, the addresses passed can either be IPv4
896  * or IPv6 addresses.
897  *
898  * A single address may be specified as INADDR_ANY or IN6ADDR_ANY, see
899  * Section 3.1.2 for this usage.
900  *
901  * addrs is a pointer to an array of one or more socket addresses. Each
902  * address is contained in its appropriate structure (i.e. struct
903  * sockaddr_in or struct sockaddr_in6) the family of the address type
904  * must be used to distinguish the address length (note that this
905  * representation is termed a "packed array" of addresses). The caller
906  * specifies the number of addresses in the array with addrcnt.
907  *
908  * On success, sctp_bindx() returns 0. On failure, sctp_bindx() returns
909  * -1, and sets errno to the appropriate error code.
910  *
911  * For SCTP, the port given in each socket address must be the same, or
912  * sctp_bindx() will fail, setting errno to EINVAL.
913  *
914  * The flags parameter is formed from the bitwise OR of zero or more of
915  * the following currently defined flags:
916  *
917  * SCTP_BINDX_ADD_ADDR
918  *
919  * SCTP_BINDX_REM_ADDR
920  *
921  * SCTP_BINDX_ADD_ADDR directs SCTP to add the given addresses to the
922  * association, and SCTP_BINDX_REM_ADDR directs SCTP to remove the given
923  * addresses from the association. The two flags are mutually exclusive;
924  * if both are given, sctp_bindx() will fail with EINVAL. A caller may
925  * not remove all addresses from an association; sctp_bindx() will
926  * reject such an attempt with EINVAL.
927  *
928  * An application can use sctp_bindx(SCTP_BINDX_ADD_ADDR) to associate
929  * additional addresses with an endpoint after calling bind().  Or use
930  * sctp_bindx(SCTP_BINDX_REM_ADDR) to remove some addresses a listening
931  * socket is associated with so that no new association accepted will be
932  * associated with those addresses. If the endpoint supports dynamic
933  * address a SCTP_BINDX_REM_ADDR or SCTP_BINDX_ADD_ADDR may cause a
934  * endpoint to send the appropriate message to the peer to change the
935  * peers address lists.
936  *
937  * Adding and removing addresses from a connected association is
938  * optional functionality. Implementations that do not support this
939  * functionality should return EOPNOTSUPP.
940  *
941  * Basically do nothing but copying the addresses from user to kernel
942  * land and invoking either sctp_bindx_add() or sctp_bindx_rem() on the sk.
943  * This is used for tunneling the sctp_bindx() request through sctp_setsockopt()
944  * from userspace.
945  *
946  * We don't use copy_from_user() for optimization: we first do the
947  * sanity checks (buffer size -fast- and access check-healthy
948  * pointer); if all of those succeed, then we can alloc the memory
949  * (expensive operation) needed to copy the data to kernel. Then we do
950  * the copying without checking the user space area
951  * (__copy_from_user()).
952  *
953  * On exit there is no need to do sockfd_put(), sys_setsockopt() does
954  * it.
955  *
956  * sk        The sk of the socket
957  * addrs     The pointer to the addresses in user land
958  * addrssize Size of the addrs buffer
959  * op        Operation to perform (add or remove, see the flags of
960  *           sctp_bindx)
961  *
962  * Returns 0 if ok, <0 errno code on error.
963  */
964 SCTP_STATIC int sctp_setsockopt_bindx(struct sock* sk,
965 				      struct sockaddr __user *addrs,
966 				      int addrs_size, int op)
967 {
968 	struct sockaddr *kaddrs;
969 	int err;
970 	int addrcnt = 0;
971 	int walk_size = 0;
972 	struct sockaddr *sa_addr;
973 	void *addr_buf;
974 	struct sctp_af *af;
975 
976 	SCTP_DEBUG_PRINTK("sctp_setsocktopt_bindx: sk %p addrs %p"
977 			  " addrs_size %d opt %d\n", sk, addrs, addrs_size, op);
978 
979 	if (unlikely(addrs_size <= 0))
980 		return -EINVAL;
981 
982 	/* Check the user passed a healthy pointer.  */
983 	if (unlikely(!access_ok(VERIFY_READ, addrs, addrs_size)))
984 		return -EFAULT;
985 
986 	/* Alloc space for the address array in kernel memory.  */
987 	kaddrs = kmalloc(addrs_size, GFP_KERNEL);
988 	if (unlikely(!kaddrs))
989 		return -ENOMEM;
990 
991 	if (__copy_from_user(kaddrs, addrs, addrs_size)) {
992 		kfree(kaddrs);
993 		return -EFAULT;
994 	}
995 
996 	/* Walk through the addrs buffer and count the number of addresses. */
997 	addr_buf = kaddrs;
998 	while (walk_size < addrs_size) {
999 		if (walk_size + sizeof(sa_family_t) > addrs_size) {
1000 			kfree(kaddrs);
1001 			return -EINVAL;
1002 		}
1003 
1004 		sa_addr = addr_buf;
1005 		af = sctp_get_af_specific(sa_addr->sa_family);
1006 
1007 		/* If the address family is not supported or if this address
1008 		 * causes the address buffer to overflow return EINVAL.
1009 		 */
1010 		if (!af || (walk_size + af->sockaddr_len) > addrs_size) {
1011 			kfree(kaddrs);
1012 			return -EINVAL;
1013 		}
1014 		addrcnt++;
1015 		addr_buf += af->sockaddr_len;
1016 		walk_size += af->sockaddr_len;
1017 	}
1018 
1019 	/* Do the work. */
1020 	switch (op) {
1021 	case SCTP_BINDX_ADD_ADDR:
1022 		err = sctp_bindx_add(sk, kaddrs, addrcnt);
1023 		if (err)
1024 			goto out;
1025 		err = sctp_send_asconf_add_ip(sk, kaddrs, addrcnt);
1026 		break;
1027 
1028 	case SCTP_BINDX_REM_ADDR:
1029 		err = sctp_bindx_rem(sk, kaddrs, addrcnt);
1030 		if (err)
1031 			goto out;
1032 		err = sctp_send_asconf_del_ip(sk, kaddrs, addrcnt);
1033 		break;
1034 
1035 	default:
1036 		err = -EINVAL;
1037 		break;
1038 	}
1039 
1040 out:
1041 	kfree(kaddrs);
1042 
1043 	return err;
1044 }
1045 
1046 /* __sctp_connect(struct sock* sk, struct sockaddr *kaddrs, int addrs_size)
1047  *
1048  * Common routine for handling connect() and sctp_connectx().
1049  * Connect will come in with just a single address.
1050  */
1051 static int __sctp_connect(struct sock* sk,
1052 			  struct sockaddr *kaddrs,
1053 			  int addrs_size,
1054 			  sctp_assoc_t *assoc_id)
1055 {
1056 	struct net *net = sock_net(sk);
1057 	struct sctp_sock *sp;
1058 	struct sctp_endpoint *ep;
1059 	struct sctp_association *asoc = NULL;
1060 	struct sctp_association *asoc2;
1061 	struct sctp_transport *transport;
1062 	union sctp_addr to;
1063 	struct sctp_af *af;
1064 	sctp_scope_t scope;
1065 	long timeo;
1066 	int err = 0;
1067 	int addrcnt = 0;
1068 	int walk_size = 0;
1069 	union sctp_addr *sa_addr = NULL;
1070 	void *addr_buf;
1071 	unsigned short port;
1072 	unsigned int f_flags = 0;
1073 
1074 	sp = sctp_sk(sk);
1075 	ep = sp->ep;
1076 
1077 	/* connect() cannot be done on a socket that is already in ESTABLISHED
1078 	 * state - UDP-style peeled off socket or a TCP-style socket that
1079 	 * is already connected.
1080 	 * It cannot be done even on a TCP-style listening socket.
1081 	 */
1082 	if (sctp_sstate(sk, ESTABLISHED) ||
1083 	    (sctp_style(sk, TCP) && sctp_sstate(sk, LISTENING))) {
1084 		err = -EISCONN;
1085 		goto out_free;
1086 	}
1087 
1088 	/* Walk through the addrs buffer and count the number of addresses. */
1089 	addr_buf = kaddrs;
1090 	while (walk_size < addrs_size) {
1091 		if (walk_size + sizeof(sa_family_t) > addrs_size) {
1092 			err = -EINVAL;
1093 			goto out_free;
1094 		}
1095 
1096 		sa_addr = addr_buf;
1097 		af = sctp_get_af_specific(sa_addr->sa.sa_family);
1098 
1099 		/* If the address family is not supported or if this address
1100 		 * causes the address buffer to overflow return EINVAL.
1101 		 */
1102 		if (!af || (walk_size + af->sockaddr_len) > addrs_size) {
1103 			err = -EINVAL;
1104 			goto out_free;
1105 		}
1106 
1107 		port = ntohs(sa_addr->v4.sin_port);
1108 
1109 		/* Save current address so we can work with it */
1110 		memcpy(&to, sa_addr, af->sockaddr_len);
1111 
1112 		err = sctp_verify_addr(sk, &to, af->sockaddr_len);
1113 		if (err)
1114 			goto out_free;
1115 
1116 		/* Make sure the destination port is correctly set
1117 		 * in all addresses.
1118 		 */
1119 		if (asoc && asoc->peer.port && asoc->peer.port != port)
1120 			goto out_free;
1121 
1122 
1123 		/* Check if there already is a matching association on the
1124 		 * endpoint (other than the one created here).
1125 		 */
1126 		asoc2 = sctp_endpoint_lookup_assoc(ep, &to, &transport);
1127 		if (asoc2 && asoc2 != asoc) {
1128 			if (asoc2->state >= SCTP_STATE_ESTABLISHED)
1129 				err = -EISCONN;
1130 			else
1131 				err = -EALREADY;
1132 			goto out_free;
1133 		}
1134 
1135 		/* If we could not find a matching association on the endpoint,
1136 		 * make sure that there is no peeled-off association matching
1137 		 * the peer address even on another socket.
1138 		 */
1139 		if (sctp_endpoint_is_peeled_off(ep, &to)) {
1140 			err = -EADDRNOTAVAIL;
1141 			goto out_free;
1142 		}
1143 
1144 		if (!asoc) {
1145 			/* If a bind() or sctp_bindx() is not called prior to
1146 			 * an sctp_connectx() call, the system picks an
1147 			 * ephemeral port and will choose an address set
1148 			 * equivalent to binding with a wildcard address.
1149 			 */
1150 			if (!ep->base.bind_addr.port) {
1151 				if (sctp_autobind(sk)) {
1152 					err = -EAGAIN;
1153 					goto out_free;
1154 				}
1155 			} else {
1156 				/*
1157 				 * If an unprivileged user inherits a 1-many
1158 				 * style socket with open associations on a
1159 				 * privileged port, it MAY be permitted to
1160 				 * accept new associations, but it SHOULD NOT
1161 				 * be permitted to open new associations.
1162 				 */
1163 				if (ep->base.bind_addr.port < PROT_SOCK &&
1164 				    !capable(CAP_NET_BIND_SERVICE)) {
1165 					err = -EACCES;
1166 					goto out_free;
1167 				}
1168 			}
1169 
1170 			scope = sctp_scope(&to);
1171 			asoc = sctp_association_new(ep, sk, scope, GFP_KERNEL);
1172 			if (!asoc) {
1173 				err = -ENOMEM;
1174 				goto out_free;
1175 			}
1176 
1177 			err = sctp_assoc_set_bind_addr_from_ep(asoc, scope,
1178 							      GFP_KERNEL);
1179 			if (err < 0) {
1180 				goto out_free;
1181 			}
1182 
1183 		}
1184 
1185 		/* Prime the peer's transport structures.  */
1186 		transport = sctp_assoc_add_peer(asoc, &to, GFP_KERNEL,
1187 						SCTP_UNKNOWN);
1188 		if (!transport) {
1189 			err = -ENOMEM;
1190 			goto out_free;
1191 		}
1192 
1193 		addrcnt++;
1194 		addr_buf += af->sockaddr_len;
1195 		walk_size += af->sockaddr_len;
1196 	}
1197 
1198 	/* In case the user of sctp_connectx() wants an association
1199 	 * id back, assign one now.
1200 	 */
1201 	if (assoc_id) {
1202 		err = sctp_assoc_set_id(asoc, GFP_KERNEL);
1203 		if (err < 0)
1204 			goto out_free;
1205 	}
1206 
1207 	err = sctp_primitive_ASSOCIATE(net, asoc, NULL);
1208 	if (err < 0) {
1209 		goto out_free;
1210 	}
1211 
1212 	/* Initialize sk's dport and daddr for getpeername() */
1213 	inet_sk(sk)->inet_dport = htons(asoc->peer.port);
1214 	af = sctp_get_af_specific(sa_addr->sa.sa_family);
1215 	af->to_sk_daddr(sa_addr, sk);
1216 	sk->sk_err = 0;
1217 
1218 	/* in-kernel sockets don't generally have a file allocated to them
1219 	 * if all they do is call sock_create_kern().
1220 	 */
1221 	if (sk->sk_socket->file)
1222 		f_flags = sk->sk_socket->file->f_flags;
1223 
1224 	timeo = sock_sndtimeo(sk, f_flags & O_NONBLOCK);
1225 
1226 	err = sctp_wait_for_connect(asoc, &timeo);
1227 	if ((err == 0 || err == -EINPROGRESS) && assoc_id)
1228 		*assoc_id = asoc->assoc_id;
1229 
1230 	/* Don't free association on exit. */
1231 	asoc = NULL;
1232 
1233 out_free:
1234 
1235 	SCTP_DEBUG_PRINTK("About to exit __sctp_connect() free asoc: %p"
1236 			  " kaddrs: %p err: %d\n",
1237 			  asoc, kaddrs, err);
1238 	if (asoc) {
1239 		/* sctp_primitive_ASSOCIATE may have added this association
1240 		 * To the hash table, try to unhash it, just in case, its a noop
1241 		 * if it wasn't hashed so we're safe
1242 		 */
1243 		sctp_unhash_established(asoc);
1244 		sctp_association_free(asoc);
1245 	}
1246 	return err;
1247 }
1248 
1249 /* Helper for tunneling sctp_connectx() requests through sctp_setsockopt()
1250  *
1251  * API 8.9
1252  * int sctp_connectx(int sd, struct sockaddr *addrs, int addrcnt,
1253  * 			sctp_assoc_t *asoc);
1254  *
1255  * If sd is an IPv4 socket, the addresses passed must be IPv4 addresses.
1256  * If the sd is an IPv6 socket, the addresses passed can either be IPv4
1257  * or IPv6 addresses.
1258  *
1259  * A single address may be specified as INADDR_ANY or IN6ADDR_ANY, see
1260  * Section 3.1.2 for this usage.
1261  *
1262  * addrs is a pointer to an array of one or more socket addresses. Each
1263  * address is contained in its appropriate structure (i.e. struct
1264  * sockaddr_in or struct sockaddr_in6) the family of the address type
1265  * must be used to distengish the address length (note that this
1266  * representation is termed a "packed array" of addresses). The caller
1267  * specifies the number of addresses in the array with addrcnt.
1268  *
1269  * On success, sctp_connectx() returns 0. It also sets the assoc_id to
1270  * the association id of the new association.  On failure, sctp_connectx()
1271  * returns -1, and sets errno to the appropriate error code.  The assoc_id
1272  * is not touched by the kernel.
1273  *
1274  * For SCTP, the port given in each socket address must be the same, or
1275  * sctp_connectx() will fail, setting errno to EINVAL.
1276  *
1277  * An application can use sctp_connectx to initiate an association with
1278  * an endpoint that is multi-homed.  Much like sctp_bindx() this call
1279  * allows a caller to specify multiple addresses at which a peer can be
1280  * reached.  The way the SCTP stack uses the list of addresses to set up
1281  * the association is implementation dependent.  This function only
1282  * specifies that the stack will try to make use of all the addresses in
1283  * the list when needed.
1284  *
1285  * Note that the list of addresses passed in is only used for setting up
1286  * the association.  It does not necessarily equal the set of addresses
1287  * the peer uses for the resulting association.  If the caller wants to
1288  * find out the set of peer addresses, it must use sctp_getpaddrs() to
1289  * retrieve them after the association has been set up.
1290  *
1291  * Basically do nothing but copying the addresses from user to kernel
1292  * land and invoking either sctp_connectx(). This is used for tunneling
1293  * the sctp_connectx() request through sctp_setsockopt() from userspace.
1294  *
1295  * We don't use copy_from_user() for optimization: we first do the
1296  * sanity checks (buffer size -fast- and access check-healthy
1297  * pointer); if all of those succeed, then we can alloc the memory
1298  * (expensive operation) needed to copy the data to kernel. Then we do
1299  * the copying without checking the user space area
1300  * (__copy_from_user()).
1301  *
1302  * On exit there is no need to do sockfd_put(), sys_setsockopt() does
1303  * it.
1304  *
1305  * sk        The sk of the socket
1306  * addrs     The pointer to the addresses in user land
1307  * addrssize Size of the addrs buffer
1308  *
1309  * Returns >=0 if ok, <0 errno code on error.
1310  */
1311 SCTP_STATIC int __sctp_setsockopt_connectx(struct sock* sk,
1312 				      struct sockaddr __user *addrs,
1313 				      int addrs_size,
1314 				      sctp_assoc_t *assoc_id)
1315 {
1316 	int err = 0;
1317 	struct sockaddr *kaddrs;
1318 
1319 	SCTP_DEBUG_PRINTK("%s - sk %p addrs %p addrs_size %d\n",
1320 			  __func__, sk, addrs, addrs_size);
1321 
1322 	if (unlikely(addrs_size <= 0))
1323 		return -EINVAL;
1324 
1325 	/* Check the user passed a healthy pointer.  */
1326 	if (unlikely(!access_ok(VERIFY_READ, addrs, addrs_size)))
1327 		return -EFAULT;
1328 
1329 	/* Alloc space for the address array in kernel memory.  */
1330 	kaddrs = kmalloc(addrs_size, GFP_KERNEL);
1331 	if (unlikely(!kaddrs))
1332 		return -ENOMEM;
1333 
1334 	if (__copy_from_user(kaddrs, addrs, addrs_size)) {
1335 		err = -EFAULT;
1336 	} else {
1337 		err = __sctp_connect(sk, kaddrs, addrs_size, assoc_id);
1338 	}
1339 
1340 	kfree(kaddrs);
1341 
1342 	return err;
1343 }
1344 
1345 /*
1346  * This is an older interface.  It's kept for backward compatibility
1347  * to the option that doesn't provide association id.
1348  */
1349 SCTP_STATIC int sctp_setsockopt_connectx_old(struct sock* sk,
1350 				      struct sockaddr __user *addrs,
1351 				      int addrs_size)
1352 {
1353 	return __sctp_setsockopt_connectx(sk, addrs, addrs_size, NULL);
1354 }
1355 
1356 /*
1357  * New interface for the API.  The since the API is done with a socket
1358  * option, to make it simple we feed back the association id is as a return
1359  * indication to the call.  Error is always negative and association id is
1360  * always positive.
1361  */
1362 SCTP_STATIC int sctp_setsockopt_connectx(struct sock* sk,
1363 				      struct sockaddr __user *addrs,
1364 				      int addrs_size)
1365 {
1366 	sctp_assoc_t assoc_id = 0;
1367 	int err = 0;
1368 
1369 	err = __sctp_setsockopt_connectx(sk, addrs, addrs_size, &assoc_id);
1370 
1371 	if (err)
1372 		return err;
1373 	else
1374 		return assoc_id;
1375 }
1376 
1377 /*
1378  * New (hopefully final) interface for the API.
1379  * We use the sctp_getaddrs_old structure so that use-space library
1380  * can avoid any unnecessary allocations.   The only defferent part
1381  * is that we store the actual length of the address buffer into the
1382  * addrs_num structure member.  That way we can re-use the existing
1383  * code.
1384  */
1385 SCTP_STATIC int sctp_getsockopt_connectx3(struct sock* sk, int len,
1386 					char __user *optval,
1387 					int __user *optlen)
1388 {
1389 	struct sctp_getaddrs_old param;
1390 	sctp_assoc_t assoc_id = 0;
1391 	int err = 0;
1392 
1393 	if (len < sizeof(param))
1394 		return -EINVAL;
1395 
1396 	if (copy_from_user(&param, optval, sizeof(param)))
1397 		return -EFAULT;
1398 
1399 	err = __sctp_setsockopt_connectx(sk,
1400 			(struct sockaddr __user *)param.addrs,
1401 			param.addr_num, &assoc_id);
1402 
1403 	if (err == 0 || err == -EINPROGRESS) {
1404 		if (copy_to_user(optval, &assoc_id, sizeof(assoc_id)))
1405 			return -EFAULT;
1406 		if (put_user(sizeof(assoc_id), optlen))
1407 			return -EFAULT;
1408 	}
1409 
1410 	return err;
1411 }
1412 
1413 /* API 3.1.4 close() - UDP Style Syntax
1414  * Applications use close() to perform graceful shutdown (as described in
1415  * Section 10.1 of [SCTP]) on ALL the associations currently represented
1416  * by a UDP-style socket.
1417  *
1418  * The syntax is
1419  *
1420  *   ret = close(int sd);
1421  *
1422  *   sd      - the socket descriptor of the associations to be closed.
1423  *
1424  * To gracefully shutdown a specific association represented by the
1425  * UDP-style socket, an application should use the sendmsg() call,
1426  * passing no user data, but including the appropriate flag in the
1427  * ancillary data (see Section xxxx).
1428  *
1429  * If sd in the close() call is a branched-off socket representing only
1430  * one association, the shutdown is performed on that association only.
1431  *
1432  * 4.1.6 close() - TCP Style Syntax
1433  *
1434  * Applications use close() to gracefully close down an association.
1435  *
1436  * The syntax is:
1437  *
1438  *    int close(int sd);
1439  *
1440  *      sd      - the socket descriptor of the association to be closed.
1441  *
1442  * After an application calls close() on a socket descriptor, no further
1443  * socket operations will succeed on that descriptor.
1444  *
1445  * API 7.1.4 SO_LINGER
1446  *
1447  * An application using the TCP-style socket can use this option to
1448  * perform the SCTP ABORT primitive.  The linger option structure is:
1449  *
1450  *  struct  linger {
1451  *     int     l_onoff;                // option on/off
1452  *     int     l_linger;               // linger time
1453  * };
1454  *
1455  * To enable the option, set l_onoff to 1.  If the l_linger value is set
1456  * to 0, calling close() is the same as the ABORT primitive.  If the
1457  * value is set to a negative value, the setsockopt() call will return
1458  * an error.  If the value is set to a positive value linger_time, the
1459  * close() can be blocked for at most linger_time ms.  If the graceful
1460  * shutdown phase does not finish during this period, close() will
1461  * return but the graceful shutdown phase continues in the system.
1462  */
1463 SCTP_STATIC void sctp_close(struct sock *sk, long timeout)
1464 {
1465 	struct net *net = sock_net(sk);
1466 	struct sctp_endpoint *ep;
1467 	struct sctp_association *asoc;
1468 	struct list_head *pos, *temp;
1469 	unsigned int data_was_unread;
1470 
1471 	SCTP_DEBUG_PRINTK("sctp_close(sk: 0x%p, timeout:%ld)\n", sk, timeout);
1472 
1473 	sctp_lock_sock(sk);
1474 	sk->sk_shutdown = SHUTDOWN_MASK;
1475 	sk->sk_state = SCTP_SS_CLOSING;
1476 
1477 	ep = sctp_sk(sk)->ep;
1478 
1479 	/* Clean up any skbs sitting on the receive queue.  */
1480 	data_was_unread = sctp_queue_purge_ulpevents(&sk->sk_receive_queue);
1481 	data_was_unread += sctp_queue_purge_ulpevents(&sctp_sk(sk)->pd_lobby);
1482 
1483 	/* Walk all associations on an endpoint.  */
1484 	list_for_each_safe(pos, temp, &ep->asocs) {
1485 		asoc = list_entry(pos, struct sctp_association, asocs);
1486 
1487 		if (sctp_style(sk, TCP)) {
1488 			/* A closed association can still be in the list if
1489 			 * it belongs to a TCP-style listening socket that is
1490 			 * not yet accepted. If so, free it. If not, send an
1491 			 * ABORT or SHUTDOWN based on the linger options.
1492 			 */
1493 			if (sctp_state(asoc, CLOSED)) {
1494 				sctp_unhash_established(asoc);
1495 				sctp_association_free(asoc);
1496 				continue;
1497 			}
1498 		}
1499 
1500 		if (data_was_unread || !skb_queue_empty(&asoc->ulpq.lobby) ||
1501 		    !skb_queue_empty(&asoc->ulpq.reasm) ||
1502 		    (sock_flag(sk, SOCK_LINGER) && !sk->sk_lingertime)) {
1503 			struct sctp_chunk *chunk;
1504 
1505 			chunk = sctp_make_abort_user(asoc, NULL, 0);
1506 			if (chunk)
1507 				sctp_primitive_ABORT(net, asoc, chunk);
1508 		} else
1509 			sctp_primitive_SHUTDOWN(net, asoc, NULL);
1510 	}
1511 
1512 	/* On a TCP-style socket, block for at most linger_time if set. */
1513 	if (sctp_style(sk, TCP) && timeout)
1514 		sctp_wait_for_close(sk, timeout);
1515 
1516 	/* This will run the backlog queue.  */
1517 	sctp_release_sock(sk);
1518 
1519 	/* Supposedly, no process has access to the socket, but
1520 	 * the net layers still may.
1521 	 */
1522 	sctp_local_bh_disable();
1523 	sctp_bh_lock_sock(sk);
1524 
1525 	/* Hold the sock, since sk_common_release() will put sock_put()
1526 	 * and we have just a little more cleanup.
1527 	 */
1528 	sock_hold(sk);
1529 	sk_common_release(sk);
1530 
1531 	sctp_bh_unlock_sock(sk);
1532 	sctp_local_bh_enable();
1533 
1534 	sock_put(sk);
1535 
1536 	SCTP_DBG_OBJCNT_DEC(sock);
1537 }
1538 
1539 /* Handle EPIPE error. */
1540 static int sctp_error(struct sock *sk, int flags, int err)
1541 {
1542 	if (err == -EPIPE)
1543 		err = sock_error(sk) ? : -EPIPE;
1544 	if (err == -EPIPE && !(flags & MSG_NOSIGNAL))
1545 		send_sig(SIGPIPE, current, 0);
1546 	return err;
1547 }
1548 
1549 /* API 3.1.3 sendmsg() - UDP Style Syntax
1550  *
1551  * An application uses sendmsg() and recvmsg() calls to transmit data to
1552  * and receive data from its peer.
1553  *
1554  *  ssize_t sendmsg(int socket, const struct msghdr *message,
1555  *                  int flags);
1556  *
1557  *  socket  - the socket descriptor of the endpoint.
1558  *  message - pointer to the msghdr structure which contains a single
1559  *            user message and possibly some ancillary data.
1560  *
1561  *            See Section 5 for complete description of the data
1562  *            structures.
1563  *
1564  *  flags   - flags sent or received with the user message, see Section
1565  *            5 for complete description of the flags.
1566  *
1567  * Note:  This function could use a rewrite especially when explicit
1568  * connect support comes in.
1569  */
1570 /* BUG:  We do not implement the equivalent of sk_stream_wait_memory(). */
1571 
1572 SCTP_STATIC int sctp_msghdr_parse(const struct msghdr *, sctp_cmsgs_t *);
1573 
1574 SCTP_STATIC int sctp_sendmsg(struct kiocb *iocb, struct sock *sk,
1575 			     struct msghdr *msg, size_t msg_len)
1576 {
1577 	struct net *net = sock_net(sk);
1578 	struct sctp_sock *sp;
1579 	struct sctp_endpoint *ep;
1580 	struct sctp_association *new_asoc=NULL, *asoc=NULL;
1581 	struct sctp_transport *transport, *chunk_tp;
1582 	struct sctp_chunk *chunk;
1583 	union sctp_addr to;
1584 	struct sockaddr *msg_name = NULL;
1585 	struct sctp_sndrcvinfo default_sinfo;
1586 	struct sctp_sndrcvinfo *sinfo;
1587 	struct sctp_initmsg *sinit;
1588 	sctp_assoc_t associd = 0;
1589 	sctp_cmsgs_t cmsgs = { NULL };
1590 	int err;
1591 	sctp_scope_t scope;
1592 	long timeo;
1593 	__u16 sinfo_flags = 0;
1594 	struct sctp_datamsg *datamsg;
1595 	int msg_flags = msg->msg_flags;
1596 
1597 	SCTP_DEBUG_PRINTK("sctp_sendmsg(sk: %p, msg: %p, msg_len: %zu)\n",
1598 			  sk, msg, msg_len);
1599 
1600 	err = 0;
1601 	sp = sctp_sk(sk);
1602 	ep = sp->ep;
1603 
1604 	SCTP_DEBUG_PRINTK("Using endpoint: %p.\n", ep);
1605 
1606 	/* We cannot send a message over a TCP-style listening socket. */
1607 	if (sctp_style(sk, TCP) && sctp_sstate(sk, LISTENING)) {
1608 		err = -EPIPE;
1609 		goto out_nounlock;
1610 	}
1611 
1612 	/* Parse out the SCTP CMSGs.  */
1613 	err = sctp_msghdr_parse(msg, &cmsgs);
1614 
1615 	if (err) {
1616 		SCTP_DEBUG_PRINTK("msghdr parse err = %x\n", err);
1617 		goto out_nounlock;
1618 	}
1619 
1620 	/* Fetch the destination address for this packet.  This
1621 	 * address only selects the association--it is not necessarily
1622 	 * the address we will send to.
1623 	 * For a peeled-off socket, msg_name is ignored.
1624 	 */
1625 	if (!sctp_style(sk, UDP_HIGH_BANDWIDTH) && msg->msg_name) {
1626 		int msg_namelen = msg->msg_namelen;
1627 
1628 		err = sctp_verify_addr(sk, (union sctp_addr *)msg->msg_name,
1629 				       msg_namelen);
1630 		if (err)
1631 			return err;
1632 
1633 		if (msg_namelen > sizeof(to))
1634 			msg_namelen = sizeof(to);
1635 		memcpy(&to, msg->msg_name, msg_namelen);
1636 		msg_name = msg->msg_name;
1637 	}
1638 
1639 	sinfo = cmsgs.info;
1640 	sinit = cmsgs.init;
1641 
1642 	/* Did the user specify SNDRCVINFO?  */
1643 	if (sinfo) {
1644 		sinfo_flags = sinfo->sinfo_flags;
1645 		associd = sinfo->sinfo_assoc_id;
1646 	}
1647 
1648 	SCTP_DEBUG_PRINTK("msg_len: %zu, sinfo_flags: 0x%x\n",
1649 			  msg_len, sinfo_flags);
1650 
1651 	/* SCTP_EOF or SCTP_ABORT cannot be set on a TCP-style socket. */
1652 	if (sctp_style(sk, TCP) && (sinfo_flags & (SCTP_EOF | SCTP_ABORT))) {
1653 		err = -EINVAL;
1654 		goto out_nounlock;
1655 	}
1656 
1657 	/* If SCTP_EOF is set, no data can be sent. Disallow sending zero
1658 	 * length messages when SCTP_EOF|SCTP_ABORT is not set.
1659 	 * If SCTP_ABORT is set, the message length could be non zero with
1660 	 * the msg_iov set to the user abort reason.
1661 	 */
1662 	if (((sinfo_flags & SCTP_EOF) && (msg_len > 0)) ||
1663 	    (!(sinfo_flags & (SCTP_EOF|SCTP_ABORT)) && (msg_len == 0))) {
1664 		err = -EINVAL;
1665 		goto out_nounlock;
1666 	}
1667 
1668 	/* If SCTP_ADDR_OVER is set, there must be an address
1669 	 * specified in msg_name.
1670 	 */
1671 	if ((sinfo_flags & SCTP_ADDR_OVER) && (!msg->msg_name)) {
1672 		err = -EINVAL;
1673 		goto out_nounlock;
1674 	}
1675 
1676 	transport = NULL;
1677 
1678 	SCTP_DEBUG_PRINTK("About to look up association.\n");
1679 
1680 	sctp_lock_sock(sk);
1681 
1682 	/* If a msg_name has been specified, assume this is to be used.  */
1683 	if (msg_name) {
1684 		/* Look for a matching association on the endpoint. */
1685 		asoc = sctp_endpoint_lookup_assoc(ep, &to, &transport);
1686 		if (!asoc) {
1687 			/* If we could not find a matching association on the
1688 			 * endpoint, make sure that it is not a TCP-style
1689 			 * socket that already has an association or there is
1690 			 * no peeled-off association on another socket.
1691 			 */
1692 			if ((sctp_style(sk, TCP) &&
1693 			     sctp_sstate(sk, ESTABLISHED)) ||
1694 			    sctp_endpoint_is_peeled_off(ep, &to)) {
1695 				err = -EADDRNOTAVAIL;
1696 				goto out_unlock;
1697 			}
1698 		}
1699 	} else {
1700 		asoc = sctp_id2assoc(sk, associd);
1701 		if (!asoc) {
1702 			err = -EPIPE;
1703 			goto out_unlock;
1704 		}
1705 	}
1706 
1707 	if (asoc) {
1708 		SCTP_DEBUG_PRINTK("Just looked up association: %p.\n", asoc);
1709 
1710 		/* We cannot send a message on a TCP-style SCTP_SS_ESTABLISHED
1711 		 * socket that has an association in CLOSED state. This can
1712 		 * happen when an accepted socket has an association that is
1713 		 * already CLOSED.
1714 		 */
1715 		if (sctp_state(asoc, CLOSED) && sctp_style(sk, TCP)) {
1716 			err = -EPIPE;
1717 			goto out_unlock;
1718 		}
1719 
1720 		if (sinfo_flags & SCTP_EOF) {
1721 			SCTP_DEBUG_PRINTK("Shutting down association: %p\n",
1722 					  asoc);
1723 			sctp_primitive_SHUTDOWN(net, asoc, NULL);
1724 			err = 0;
1725 			goto out_unlock;
1726 		}
1727 		if (sinfo_flags & SCTP_ABORT) {
1728 
1729 			chunk = sctp_make_abort_user(asoc, msg, msg_len);
1730 			if (!chunk) {
1731 				err = -ENOMEM;
1732 				goto out_unlock;
1733 			}
1734 
1735 			SCTP_DEBUG_PRINTK("Aborting association: %p\n", asoc);
1736 			sctp_primitive_ABORT(net, asoc, chunk);
1737 			err = 0;
1738 			goto out_unlock;
1739 		}
1740 	}
1741 
1742 	/* Do we need to create the association?  */
1743 	if (!asoc) {
1744 		SCTP_DEBUG_PRINTK("There is no association yet.\n");
1745 
1746 		if (sinfo_flags & (SCTP_EOF | SCTP_ABORT)) {
1747 			err = -EINVAL;
1748 			goto out_unlock;
1749 		}
1750 
1751 		/* Check for invalid stream against the stream counts,
1752 		 * either the default or the user specified stream counts.
1753 		 */
1754 		if (sinfo) {
1755 			if (!sinit || (sinit && !sinit->sinit_num_ostreams)) {
1756 				/* Check against the defaults. */
1757 				if (sinfo->sinfo_stream >=
1758 				    sp->initmsg.sinit_num_ostreams) {
1759 					err = -EINVAL;
1760 					goto out_unlock;
1761 				}
1762 			} else {
1763 				/* Check against the requested.  */
1764 				if (sinfo->sinfo_stream >=
1765 				    sinit->sinit_num_ostreams) {
1766 					err = -EINVAL;
1767 					goto out_unlock;
1768 				}
1769 			}
1770 		}
1771 
1772 		/*
1773 		 * API 3.1.2 bind() - UDP Style Syntax
1774 		 * If a bind() or sctp_bindx() is not called prior to a
1775 		 * sendmsg() call that initiates a new association, the
1776 		 * system picks an ephemeral port and will choose an address
1777 		 * set equivalent to binding with a wildcard address.
1778 		 */
1779 		if (!ep->base.bind_addr.port) {
1780 			if (sctp_autobind(sk)) {
1781 				err = -EAGAIN;
1782 				goto out_unlock;
1783 			}
1784 		} else {
1785 			/*
1786 			 * If an unprivileged user inherits a one-to-many
1787 			 * style socket with open associations on a privileged
1788 			 * port, it MAY be permitted to accept new associations,
1789 			 * but it SHOULD NOT be permitted to open new
1790 			 * associations.
1791 			 */
1792 			if (ep->base.bind_addr.port < PROT_SOCK &&
1793 			    !capable(CAP_NET_BIND_SERVICE)) {
1794 				err = -EACCES;
1795 				goto out_unlock;
1796 			}
1797 		}
1798 
1799 		scope = sctp_scope(&to);
1800 		new_asoc = sctp_association_new(ep, sk, scope, GFP_KERNEL);
1801 		if (!new_asoc) {
1802 			err = -ENOMEM;
1803 			goto out_unlock;
1804 		}
1805 		asoc = new_asoc;
1806 		err = sctp_assoc_set_bind_addr_from_ep(asoc, scope, GFP_KERNEL);
1807 		if (err < 0) {
1808 			err = -ENOMEM;
1809 			goto out_free;
1810 		}
1811 
1812 		/* If the SCTP_INIT ancillary data is specified, set all
1813 		 * the association init values accordingly.
1814 		 */
1815 		if (sinit) {
1816 			if (sinit->sinit_num_ostreams) {
1817 				asoc->c.sinit_num_ostreams =
1818 					sinit->sinit_num_ostreams;
1819 			}
1820 			if (sinit->sinit_max_instreams) {
1821 				asoc->c.sinit_max_instreams =
1822 					sinit->sinit_max_instreams;
1823 			}
1824 			if (sinit->sinit_max_attempts) {
1825 				asoc->max_init_attempts
1826 					= sinit->sinit_max_attempts;
1827 			}
1828 			if (sinit->sinit_max_init_timeo) {
1829 				asoc->max_init_timeo =
1830 				 msecs_to_jiffies(sinit->sinit_max_init_timeo);
1831 			}
1832 		}
1833 
1834 		/* Prime the peer's transport structures.  */
1835 		transport = sctp_assoc_add_peer(asoc, &to, GFP_KERNEL, SCTP_UNKNOWN);
1836 		if (!transport) {
1837 			err = -ENOMEM;
1838 			goto out_free;
1839 		}
1840 	}
1841 
1842 	/* ASSERT: we have a valid association at this point.  */
1843 	SCTP_DEBUG_PRINTK("We have a valid association.\n");
1844 
1845 	if (!sinfo) {
1846 		/* If the user didn't specify SNDRCVINFO, make up one with
1847 		 * some defaults.
1848 		 */
1849 		memset(&default_sinfo, 0, sizeof(default_sinfo));
1850 		default_sinfo.sinfo_stream = asoc->default_stream;
1851 		default_sinfo.sinfo_flags = asoc->default_flags;
1852 		default_sinfo.sinfo_ppid = asoc->default_ppid;
1853 		default_sinfo.sinfo_context = asoc->default_context;
1854 		default_sinfo.sinfo_timetolive = asoc->default_timetolive;
1855 		default_sinfo.sinfo_assoc_id = sctp_assoc2id(asoc);
1856 		sinfo = &default_sinfo;
1857 	}
1858 
1859 	/* API 7.1.7, the sndbuf size per association bounds the
1860 	 * maximum size of data that can be sent in a single send call.
1861 	 */
1862 	if (msg_len > sk->sk_sndbuf) {
1863 		err = -EMSGSIZE;
1864 		goto out_free;
1865 	}
1866 
1867 	if (asoc->pmtu_pending)
1868 		sctp_assoc_pending_pmtu(sk, asoc);
1869 
1870 	/* If fragmentation is disabled and the message length exceeds the
1871 	 * association fragmentation point, return EMSGSIZE.  The I-D
1872 	 * does not specify what this error is, but this looks like
1873 	 * a great fit.
1874 	 */
1875 	if (sctp_sk(sk)->disable_fragments && (msg_len > asoc->frag_point)) {
1876 		err = -EMSGSIZE;
1877 		goto out_free;
1878 	}
1879 
1880 	/* Check for invalid stream. */
1881 	if (sinfo->sinfo_stream >= asoc->c.sinit_num_ostreams) {
1882 		err = -EINVAL;
1883 		goto out_free;
1884 	}
1885 
1886 	timeo = sock_sndtimeo(sk, msg->msg_flags & MSG_DONTWAIT);
1887 	if (!sctp_wspace(asoc)) {
1888 		err = sctp_wait_for_sndbuf(asoc, &timeo, msg_len);
1889 		if (err)
1890 			goto out_free;
1891 	}
1892 
1893 	/* If an address is passed with the sendto/sendmsg call, it is used
1894 	 * to override the primary destination address in the TCP model, or
1895 	 * when SCTP_ADDR_OVER flag is set in the UDP model.
1896 	 */
1897 	if ((sctp_style(sk, TCP) && msg_name) ||
1898 	    (sinfo_flags & SCTP_ADDR_OVER)) {
1899 		chunk_tp = sctp_assoc_lookup_paddr(asoc, &to);
1900 		if (!chunk_tp) {
1901 			err = -EINVAL;
1902 			goto out_free;
1903 		}
1904 	} else
1905 		chunk_tp = NULL;
1906 
1907 	/* Auto-connect, if we aren't connected already. */
1908 	if (sctp_state(asoc, CLOSED)) {
1909 		err = sctp_primitive_ASSOCIATE(net, asoc, NULL);
1910 		if (err < 0)
1911 			goto out_free;
1912 		SCTP_DEBUG_PRINTK("We associated primitively.\n");
1913 	}
1914 
1915 	/* Break the message into multiple chunks of maximum size. */
1916 	datamsg = sctp_datamsg_from_user(asoc, sinfo, msg, msg_len);
1917 	if (!datamsg) {
1918 		err = -ENOMEM;
1919 		goto out_free;
1920 	}
1921 
1922 	/* Now send the (possibly) fragmented message. */
1923 	list_for_each_entry(chunk, &datamsg->chunks, frag_list) {
1924 		sctp_chunk_hold(chunk);
1925 
1926 		/* Do accounting for the write space.  */
1927 		sctp_set_owner_w(chunk);
1928 
1929 		chunk->transport = chunk_tp;
1930 	}
1931 
1932 	/* Send it to the lower layers.  Note:  all chunks
1933 	 * must either fail or succeed.   The lower layer
1934 	 * works that way today.  Keep it that way or this
1935 	 * breaks.
1936 	 */
1937 	err = sctp_primitive_SEND(net, asoc, datamsg);
1938 	/* Did the lower layer accept the chunk? */
1939 	if (err)
1940 		sctp_datamsg_free(datamsg);
1941 	else
1942 		sctp_datamsg_put(datamsg);
1943 
1944 	SCTP_DEBUG_PRINTK("We sent primitively.\n");
1945 
1946 	if (err)
1947 		goto out_free;
1948 	else
1949 		err = msg_len;
1950 
1951 	/* If we are already past ASSOCIATE, the lower
1952 	 * layers are responsible for association cleanup.
1953 	 */
1954 	goto out_unlock;
1955 
1956 out_free:
1957 	if (new_asoc) {
1958 		sctp_unhash_established(asoc);
1959 		sctp_association_free(asoc);
1960 	}
1961 out_unlock:
1962 	sctp_release_sock(sk);
1963 
1964 out_nounlock:
1965 	return sctp_error(sk, msg_flags, err);
1966 
1967 #if 0
1968 do_sock_err:
1969 	if (msg_len)
1970 		err = msg_len;
1971 	else
1972 		err = sock_error(sk);
1973 	goto out;
1974 
1975 do_interrupted:
1976 	if (msg_len)
1977 		err = msg_len;
1978 	goto out;
1979 #endif /* 0 */
1980 }
1981 
1982 /* This is an extended version of skb_pull() that removes the data from the
1983  * start of a skb even when data is spread across the list of skb's in the
1984  * frag_list. len specifies the total amount of data that needs to be removed.
1985  * when 'len' bytes could be removed from the skb, it returns 0.
1986  * If 'len' exceeds the total skb length,  it returns the no. of bytes that
1987  * could not be removed.
1988  */
1989 static int sctp_skb_pull(struct sk_buff *skb, int len)
1990 {
1991 	struct sk_buff *list;
1992 	int skb_len = skb_headlen(skb);
1993 	int rlen;
1994 
1995 	if (len <= skb_len) {
1996 		__skb_pull(skb, len);
1997 		return 0;
1998 	}
1999 	len -= skb_len;
2000 	__skb_pull(skb, skb_len);
2001 
2002 	skb_walk_frags(skb, list) {
2003 		rlen = sctp_skb_pull(list, len);
2004 		skb->len -= (len-rlen);
2005 		skb->data_len -= (len-rlen);
2006 
2007 		if (!rlen)
2008 			return 0;
2009 
2010 		len = rlen;
2011 	}
2012 
2013 	return len;
2014 }
2015 
2016 /* API 3.1.3  recvmsg() - UDP Style Syntax
2017  *
2018  *  ssize_t recvmsg(int socket, struct msghdr *message,
2019  *                    int flags);
2020  *
2021  *  socket  - the socket descriptor of the endpoint.
2022  *  message - pointer to the msghdr structure which contains a single
2023  *            user message and possibly some ancillary data.
2024  *
2025  *            See Section 5 for complete description of the data
2026  *            structures.
2027  *
2028  *  flags   - flags sent or received with the user message, see Section
2029  *            5 for complete description of the flags.
2030  */
2031 static struct sk_buff *sctp_skb_recv_datagram(struct sock *, int, int, int *);
2032 
2033 SCTP_STATIC int sctp_recvmsg(struct kiocb *iocb, struct sock *sk,
2034 			     struct msghdr *msg, size_t len, int noblock,
2035 			     int flags, int *addr_len)
2036 {
2037 	struct sctp_ulpevent *event = NULL;
2038 	struct sctp_sock *sp = sctp_sk(sk);
2039 	struct sk_buff *skb;
2040 	int copied;
2041 	int err = 0;
2042 	int skb_len;
2043 
2044 	SCTP_DEBUG_PRINTK("sctp_recvmsg(%s: %p, %s: %p, %s: %zd, %s: %d, %s: "
2045 			  "0x%x, %s: %p)\n", "sk", sk, "msghdr", msg,
2046 			  "len", len, "knoblauch", noblock,
2047 			  "flags", flags, "addr_len", addr_len);
2048 
2049 	sctp_lock_sock(sk);
2050 
2051 	if (sctp_style(sk, TCP) && !sctp_sstate(sk, ESTABLISHED)) {
2052 		err = -ENOTCONN;
2053 		goto out;
2054 	}
2055 
2056 	skb = sctp_skb_recv_datagram(sk, flags, noblock, &err);
2057 	if (!skb)
2058 		goto out;
2059 
2060 	/* Get the total length of the skb including any skb's in the
2061 	 * frag_list.
2062 	 */
2063 	skb_len = skb->len;
2064 
2065 	copied = skb_len;
2066 	if (copied > len)
2067 		copied = len;
2068 
2069 	err = skb_copy_datagram_iovec(skb, 0, msg->msg_iov, copied);
2070 
2071 	event = sctp_skb2event(skb);
2072 
2073 	if (err)
2074 		goto out_free;
2075 
2076 	sock_recv_ts_and_drops(msg, sk, skb);
2077 	if (sctp_ulpevent_is_notification(event)) {
2078 		msg->msg_flags |= MSG_NOTIFICATION;
2079 		sp->pf->event_msgname(event, msg->msg_name, addr_len);
2080 	} else {
2081 		sp->pf->skb_msgname(skb, msg->msg_name, addr_len);
2082 	}
2083 
2084 	/* Check if we allow SCTP_SNDRCVINFO. */
2085 	if (sp->subscribe.sctp_data_io_event)
2086 		sctp_ulpevent_read_sndrcvinfo(event, msg);
2087 #if 0
2088 	/* FIXME: we should be calling IP/IPv6 layers.  */
2089 	if (sk->sk_protinfo.af_inet.cmsg_flags)
2090 		ip_cmsg_recv(msg, skb);
2091 #endif
2092 
2093 	err = copied;
2094 
2095 	/* If skb's length exceeds the user's buffer, update the skb and
2096 	 * push it back to the receive_queue so that the next call to
2097 	 * recvmsg() will return the remaining data. Don't set MSG_EOR.
2098 	 */
2099 	if (skb_len > copied) {
2100 		msg->msg_flags &= ~MSG_EOR;
2101 		if (flags & MSG_PEEK)
2102 			goto out_free;
2103 		sctp_skb_pull(skb, copied);
2104 		skb_queue_head(&sk->sk_receive_queue, skb);
2105 
2106 		/* When only partial message is copied to the user, increase
2107 		 * rwnd by that amount. If all the data in the skb is read,
2108 		 * rwnd is updated when the event is freed.
2109 		 */
2110 		if (!sctp_ulpevent_is_notification(event))
2111 			sctp_assoc_rwnd_increase(event->asoc, copied);
2112 		goto out;
2113 	} else if ((event->msg_flags & MSG_NOTIFICATION) ||
2114 		   (event->msg_flags & MSG_EOR))
2115 		msg->msg_flags |= MSG_EOR;
2116 	else
2117 		msg->msg_flags &= ~MSG_EOR;
2118 
2119 out_free:
2120 	if (flags & MSG_PEEK) {
2121 		/* Release the skb reference acquired after peeking the skb in
2122 		 * sctp_skb_recv_datagram().
2123 		 */
2124 		kfree_skb(skb);
2125 	} else {
2126 		/* Free the event which includes releasing the reference to
2127 		 * the owner of the skb, freeing the skb and updating the
2128 		 * rwnd.
2129 		 */
2130 		sctp_ulpevent_free(event);
2131 	}
2132 out:
2133 	sctp_release_sock(sk);
2134 	return err;
2135 }
2136 
2137 /* 7.1.12 Enable/Disable message fragmentation (SCTP_DISABLE_FRAGMENTS)
2138  *
2139  * This option is a on/off flag.  If enabled no SCTP message
2140  * fragmentation will be performed.  Instead if a message being sent
2141  * exceeds the current PMTU size, the message will NOT be sent and
2142  * instead a error will be indicated to the user.
2143  */
2144 static int sctp_setsockopt_disable_fragments(struct sock *sk,
2145 					     char __user *optval,
2146 					     unsigned int optlen)
2147 {
2148 	int val;
2149 
2150 	if (optlen < sizeof(int))
2151 		return -EINVAL;
2152 
2153 	if (get_user(val, (int __user *)optval))
2154 		return -EFAULT;
2155 
2156 	sctp_sk(sk)->disable_fragments = (val == 0) ? 0 : 1;
2157 
2158 	return 0;
2159 }
2160 
2161 static int sctp_setsockopt_events(struct sock *sk, char __user *optval,
2162 				  unsigned int optlen)
2163 {
2164 	struct sctp_association *asoc;
2165 	struct sctp_ulpevent *event;
2166 
2167 	if (optlen > sizeof(struct sctp_event_subscribe))
2168 		return -EINVAL;
2169 	if (copy_from_user(&sctp_sk(sk)->subscribe, optval, optlen))
2170 		return -EFAULT;
2171 
2172 	/*
2173 	 * At the time when a user app subscribes to SCTP_SENDER_DRY_EVENT,
2174 	 * if there is no data to be sent or retransmit, the stack will
2175 	 * immediately send up this notification.
2176 	 */
2177 	if (sctp_ulpevent_type_enabled(SCTP_SENDER_DRY_EVENT,
2178 				       &sctp_sk(sk)->subscribe)) {
2179 		asoc = sctp_id2assoc(sk, 0);
2180 
2181 		if (asoc && sctp_outq_is_empty(&asoc->outqueue)) {
2182 			event = sctp_ulpevent_make_sender_dry_event(asoc,
2183 					GFP_ATOMIC);
2184 			if (!event)
2185 				return -ENOMEM;
2186 
2187 			sctp_ulpq_tail_event(&asoc->ulpq, event);
2188 		}
2189 	}
2190 
2191 	return 0;
2192 }
2193 
2194 /* 7.1.8 Automatic Close of associations (SCTP_AUTOCLOSE)
2195  *
2196  * This socket option is applicable to the UDP-style socket only.  When
2197  * set it will cause associations that are idle for more than the
2198  * specified number of seconds to automatically close.  An association
2199  * being idle is defined an association that has NOT sent or received
2200  * user data.  The special value of '0' indicates that no automatic
2201  * close of any associations should be performed.  The option expects an
2202  * integer defining the number of seconds of idle time before an
2203  * association is closed.
2204  */
2205 static int sctp_setsockopt_autoclose(struct sock *sk, char __user *optval,
2206 				     unsigned int optlen)
2207 {
2208 	struct sctp_sock *sp = sctp_sk(sk);
2209 
2210 	/* Applicable to UDP-style socket only */
2211 	if (sctp_style(sk, TCP))
2212 		return -EOPNOTSUPP;
2213 	if (optlen != sizeof(int))
2214 		return -EINVAL;
2215 	if (copy_from_user(&sp->autoclose, optval, optlen))
2216 		return -EFAULT;
2217 
2218 	return 0;
2219 }
2220 
2221 /* 7.1.13 Peer Address Parameters (SCTP_PEER_ADDR_PARAMS)
2222  *
2223  * Applications can enable or disable heartbeats for any peer address of
2224  * an association, modify an address's heartbeat interval, force a
2225  * heartbeat to be sent immediately, and adjust the address's maximum
2226  * number of retransmissions sent before an address is considered
2227  * unreachable.  The following structure is used to access and modify an
2228  * address's parameters:
2229  *
2230  *  struct sctp_paddrparams {
2231  *     sctp_assoc_t            spp_assoc_id;
2232  *     struct sockaddr_storage spp_address;
2233  *     uint32_t                spp_hbinterval;
2234  *     uint16_t                spp_pathmaxrxt;
2235  *     uint32_t                spp_pathmtu;
2236  *     uint32_t                spp_sackdelay;
2237  *     uint32_t                spp_flags;
2238  * };
2239  *
2240  *   spp_assoc_id    - (one-to-many style socket) This is filled in the
2241  *                     application, and identifies the association for
2242  *                     this query.
2243  *   spp_address     - This specifies which address is of interest.
2244  *   spp_hbinterval  - This contains the value of the heartbeat interval,
2245  *                     in milliseconds.  If a  value of zero
2246  *                     is present in this field then no changes are to
2247  *                     be made to this parameter.
2248  *   spp_pathmaxrxt  - This contains the maximum number of
2249  *                     retransmissions before this address shall be
2250  *                     considered unreachable. If a  value of zero
2251  *                     is present in this field then no changes are to
2252  *                     be made to this parameter.
2253  *   spp_pathmtu     - When Path MTU discovery is disabled the value
2254  *                     specified here will be the "fixed" path mtu.
2255  *                     Note that if the spp_address field is empty
2256  *                     then all associations on this address will
2257  *                     have this fixed path mtu set upon them.
2258  *
2259  *   spp_sackdelay   - When delayed sack is enabled, this value specifies
2260  *                     the number of milliseconds that sacks will be delayed
2261  *                     for. This value will apply to all addresses of an
2262  *                     association if the spp_address field is empty. Note
2263  *                     also, that if delayed sack is enabled and this
2264  *                     value is set to 0, no change is made to the last
2265  *                     recorded delayed sack timer value.
2266  *
2267  *   spp_flags       - These flags are used to control various features
2268  *                     on an association. The flag field may contain
2269  *                     zero or more of the following options.
2270  *
2271  *                     SPP_HB_ENABLE  - Enable heartbeats on the
2272  *                     specified address. Note that if the address
2273  *                     field is empty all addresses for the association
2274  *                     have heartbeats enabled upon them.
2275  *
2276  *                     SPP_HB_DISABLE - Disable heartbeats on the
2277  *                     speicifed address. Note that if the address
2278  *                     field is empty all addresses for the association
2279  *                     will have their heartbeats disabled. Note also
2280  *                     that SPP_HB_ENABLE and SPP_HB_DISABLE are
2281  *                     mutually exclusive, only one of these two should
2282  *                     be specified. Enabling both fields will have
2283  *                     undetermined results.
2284  *
2285  *                     SPP_HB_DEMAND - Request a user initiated heartbeat
2286  *                     to be made immediately.
2287  *
2288  *                     SPP_HB_TIME_IS_ZERO - Specify's that the time for
2289  *                     heartbeat delayis to be set to the value of 0
2290  *                     milliseconds.
2291  *
2292  *                     SPP_PMTUD_ENABLE - This field will enable PMTU
2293  *                     discovery upon the specified address. Note that
2294  *                     if the address feild is empty then all addresses
2295  *                     on the association are effected.
2296  *
2297  *                     SPP_PMTUD_DISABLE - This field will disable PMTU
2298  *                     discovery upon the specified address. Note that
2299  *                     if the address feild is empty then all addresses
2300  *                     on the association are effected. Not also that
2301  *                     SPP_PMTUD_ENABLE and SPP_PMTUD_DISABLE are mutually
2302  *                     exclusive. Enabling both will have undetermined
2303  *                     results.
2304  *
2305  *                     SPP_SACKDELAY_ENABLE - Setting this flag turns
2306  *                     on delayed sack. The time specified in spp_sackdelay
2307  *                     is used to specify the sack delay for this address. Note
2308  *                     that if spp_address is empty then all addresses will
2309  *                     enable delayed sack and take on the sack delay
2310  *                     value specified in spp_sackdelay.
2311  *                     SPP_SACKDELAY_DISABLE - Setting this flag turns
2312  *                     off delayed sack. If the spp_address field is blank then
2313  *                     delayed sack is disabled for the entire association. Note
2314  *                     also that this field is mutually exclusive to
2315  *                     SPP_SACKDELAY_ENABLE, setting both will have undefined
2316  *                     results.
2317  */
2318 static int sctp_apply_peer_addr_params(struct sctp_paddrparams *params,
2319 				       struct sctp_transport   *trans,
2320 				       struct sctp_association *asoc,
2321 				       struct sctp_sock        *sp,
2322 				       int                      hb_change,
2323 				       int                      pmtud_change,
2324 				       int                      sackdelay_change)
2325 {
2326 	int error;
2327 
2328 	if (params->spp_flags & SPP_HB_DEMAND && trans) {
2329 		struct net *net = sock_net(trans->asoc->base.sk);
2330 
2331 		error = sctp_primitive_REQUESTHEARTBEAT(net, trans->asoc, trans);
2332 		if (error)
2333 			return error;
2334 	}
2335 
2336 	/* Note that unless the spp_flag is set to SPP_HB_ENABLE the value of
2337 	 * this field is ignored.  Note also that a value of zero indicates
2338 	 * the current setting should be left unchanged.
2339 	 */
2340 	if (params->spp_flags & SPP_HB_ENABLE) {
2341 
2342 		/* Re-zero the interval if the SPP_HB_TIME_IS_ZERO is
2343 		 * set.  This lets us use 0 value when this flag
2344 		 * is set.
2345 		 */
2346 		if (params->spp_flags & SPP_HB_TIME_IS_ZERO)
2347 			params->spp_hbinterval = 0;
2348 
2349 		if (params->spp_hbinterval ||
2350 		    (params->spp_flags & SPP_HB_TIME_IS_ZERO)) {
2351 			if (trans) {
2352 				trans->hbinterval =
2353 				    msecs_to_jiffies(params->spp_hbinterval);
2354 			} else if (asoc) {
2355 				asoc->hbinterval =
2356 				    msecs_to_jiffies(params->spp_hbinterval);
2357 			} else {
2358 				sp->hbinterval = params->spp_hbinterval;
2359 			}
2360 		}
2361 	}
2362 
2363 	if (hb_change) {
2364 		if (trans) {
2365 			trans->param_flags =
2366 				(trans->param_flags & ~SPP_HB) | hb_change;
2367 		} else if (asoc) {
2368 			asoc->param_flags =
2369 				(asoc->param_flags & ~SPP_HB) | hb_change;
2370 		} else {
2371 			sp->param_flags =
2372 				(sp->param_flags & ~SPP_HB) | hb_change;
2373 		}
2374 	}
2375 
2376 	/* When Path MTU discovery is disabled the value specified here will
2377 	 * be the "fixed" path mtu (i.e. the value of the spp_flags field must
2378 	 * include the flag SPP_PMTUD_DISABLE for this field to have any
2379 	 * effect).
2380 	 */
2381 	if ((params->spp_flags & SPP_PMTUD_DISABLE) && params->spp_pathmtu) {
2382 		if (trans) {
2383 			trans->pathmtu = params->spp_pathmtu;
2384 			sctp_assoc_sync_pmtu(sctp_opt2sk(sp), asoc);
2385 		} else if (asoc) {
2386 			asoc->pathmtu = params->spp_pathmtu;
2387 			sctp_frag_point(asoc, params->spp_pathmtu);
2388 		} else {
2389 			sp->pathmtu = params->spp_pathmtu;
2390 		}
2391 	}
2392 
2393 	if (pmtud_change) {
2394 		if (trans) {
2395 			int update = (trans->param_flags & SPP_PMTUD_DISABLE) &&
2396 				(params->spp_flags & SPP_PMTUD_ENABLE);
2397 			trans->param_flags =
2398 				(trans->param_flags & ~SPP_PMTUD) | pmtud_change;
2399 			if (update) {
2400 				sctp_transport_pmtu(trans, sctp_opt2sk(sp));
2401 				sctp_assoc_sync_pmtu(sctp_opt2sk(sp), asoc);
2402 			}
2403 		} else if (asoc) {
2404 			asoc->param_flags =
2405 				(asoc->param_flags & ~SPP_PMTUD) | pmtud_change;
2406 		} else {
2407 			sp->param_flags =
2408 				(sp->param_flags & ~SPP_PMTUD) | pmtud_change;
2409 		}
2410 	}
2411 
2412 	/* Note that unless the spp_flag is set to SPP_SACKDELAY_ENABLE the
2413 	 * value of this field is ignored.  Note also that a value of zero
2414 	 * indicates the current setting should be left unchanged.
2415 	 */
2416 	if ((params->spp_flags & SPP_SACKDELAY_ENABLE) && params->spp_sackdelay) {
2417 		if (trans) {
2418 			trans->sackdelay =
2419 				msecs_to_jiffies(params->spp_sackdelay);
2420 		} else if (asoc) {
2421 			asoc->sackdelay =
2422 				msecs_to_jiffies(params->spp_sackdelay);
2423 		} else {
2424 			sp->sackdelay = params->spp_sackdelay;
2425 		}
2426 	}
2427 
2428 	if (sackdelay_change) {
2429 		if (trans) {
2430 			trans->param_flags =
2431 				(trans->param_flags & ~SPP_SACKDELAY) |
2432 				sackdelay_change;
2433 		} else if (asoc) {
2434 			asoc->param_flags =
2435 				(asoc->param_flags & ~SPP_SACKDELAY) |
2436 				sackdelay_change;
2437 		} else {
2438 			sp->param_flags =
2439 				(sp->param_flags & ~SPP_SACKDELAY) |
2440 				sackdelay_change;
2441 		}
2442 	}
2443 
2444 	/* Note that a value of zero indicates the current setting should be
2445 	   left unchanged.
2446 	 */
2447 	if (params->spp_pathmaxrxt) {
2448 		if (trans) {
2449 			trans->pathmaxrxt = params->spp_pathmaxrxt;
2450 		} else if (asoc) {
2451 			asoc->pathmaxrxt = params->spp_pathmaxrxt;
2452 		} else {
2453 			sp->pathmaxrxt = params->spp_pathmaxrxt;
2454 		}
2455 	}
2456 
2457 	return 0;
2458 }
2459 
2460 static int sctp_setsockopt_peer_addr_params(struct sock *sk,
2461 					    char __user *optval,
2462 					    unsigned int optlen)
2463 {
2464 	struct sctp_paddrparams  params;
2465 	struct sctp_transport   *trans = NULL;
2466 	struct sctp_association *asoc = NULL;
2467 	struct sctp_sock        *sp = sctp_sk(sk);
2468 	int error;
2469 	int hb_change, pmtud_change, sackdelay_change;
2470 
2471 	if (optlen != sizeof(struct sctp_paddrparams))
2472 		return - EINVAL;
2473 
2474 	if (copy_from_user(&params, optval, optlen))
2475 		return -EFAULT;
2476 
2477 	/* Validate flags and value parameters. */
2478 	hb_change        = params.spp_flags & SPP_HB;
2479 	pmtud_change     = params.spp_flags & SPP_PMTUD;
2480 	sackdelay_change = params.spp_flags & SPP_SACKDELAY;
2481 
2482 	if (hb_change        == SPP_HB ||
2483 	    pmtud_change     == SPP_PMTUD ||
2484 	    sackdelay_change == SPP_SACKDELAY ||
2485 	    params.spp_sackdelay > 500 ||
2486 	    (params.spp_pathmtu &&
2487 	     params.spp_pathmtu < SCTP_DEFAULT_MINSEGMENT))
2488 		return -EINVAL;
2489 
2490 	/* If an address other than INADDR_ANY is specified, and
2491 	 * no transport is found, then the request is invalid.
2492 	 */
2493 	if (!sctp_is_any(sk, ( union sctp_addr *)&params.spp_address)) {
2494 		trans = sctp_addr_id2transport(sk, &params.spp_address,
2495 					       params.spp_assoc_id);
2496 		if (!trans)
2497 			return -EINVAL;
2498 	}
2499 
2500 	/* Get association, if assoc_id != 0 and the socket is a one
2501 	 * to many style socket, and an association was not found, then
2502 	 * the id was invalid.
2503 	 */
2504 	asoc = sctp_id2assoc(sk, params.spp_assoc_id);
2505 	if (!asoc && params.spp_assoc_id && sctp_style(sk, UDP))
2506 		return -EINVAL;
2507 
2508 	/* Heartbeat demand can only be sent on a transport or
2509 	 * association, but not a socket.
2510 	 */
2511 	if (params.spp_flags & SPP_HB_DEMAND && !trans && !asoc)
2512 		return -EINVAL;
2513 
2514 	/* Process parameters. */
2515 	error = sctp_apply_peer_addr_params(&params, trans, asoc, sp,
2516 					    hb_change, pmtud_change,
2517 					    sackdelay_change);
2518 
2519 	if (error)
2520 		return error;
2521 
2522 	/* If changes are for association, also apply parameters to each
2523 	 * transport.
2524 	 */
2525 	if (!trans && asoc) {
2526 		list_for_each_entry(trans, &asoc->peer.transport_addr_list,
2527 				transports) {
2528 			sctp_apply_peer_addr_params(&params, trans, asoc, sp,
2529 						    hb_change, pmtud_change,
2530 						    sackdelay_change);
2531 		}
2532 	}
2533 
2534 	return 0;
2535 }
2536 
2537 /*
2538  * 7.1.23.  Get or set delayed ack timer (SCTP_DELAYED_SACK)
2539  *
2540  * This option will effect the way delayed acks are performed.  This
2541  * option allows you to get or set the delayed ack time, in
2542  * milliseconds.  It also allows changing the delayed ack frequency.
2543  * Changing the frequency to 1 disables the delayed sack algorithm.  If
2544  * the assoc_id is 0, then this sets or gets the endpoints default
2545  * values.  If the assoc_id field is non-zero, then the set or get
2546  * effects the specified association for the one to many model (the
2547  * assoc_id field is ignored by the one to one model).  Note that if
2548  * sack_delay or sack_freq are 0 when setting this option, then the
2549  * current values will remain unchanged.
2550  *
2551  * struct sctp_sack_info {
2552  *     sctp_assoc_t            sack_assoc_id;
2553  *     uint32_t                sack_delay;
2554  *     uint32_t                sack_freq;
2555  * };
2556  *
2557  * sack_assoc_id -  This parameter, indicates which association the user
2558  *    is performing an action upon.  Note that if this field's value is
2559  *    zero then the endpoints default value is changed (effecting future
2560  *    associations only).
2561  *
2562  * sack_delay -  This parameter contains the number of milliseconds that
2563  *    the user is requesting the delayed ACK timer be set to.  Note that
2564  *    this value is defined in the standard to be between 200 and 500
2565  *    milliseconds.
2566  *
2567  * sack_freq -  This parameter contains the number of packets that must
2568  *    be received before a sack is sent without waiting for the delay
2569  *    timer to expire.  The default value for this is 2, setting this
2570  *    value to 1 will disable the delayed sack algorithm.
2571  */
2572 
2573 static int sctp_setsockopt_delayed_ack(struct sock *sk,
2574 				       char __user *optval, unsigned int optlen)
2575 {
2576 	struct sctp_sack_info    params;
2577 	struct sctp_transport   *trans = NULL;
2578 	struct sctp_association *asoc = NULL;
2579 	struct sctp_sock        *sp = sctp_sk(sk);
2580 
2581 	if (optlen == sizeof(struct sctp_sack_info)) {
2582 		if (copy_from_user(&params, optval, optlen))
2583 			return -EFAULT;
2584 
2585 		if (params.sack_delay == 0 && params.sack_freq == 0)
2586 			return 0;
2587 	} else if (optlen == sizeof(struct sctp_assoc_value)) {
2588 		pr_warn("Use of struct sctp_assoc_value in delayed_ack socket option deprecated\n");
2589 		pr_warn("Use struct sctp_sack_info instead\n");
2590 		if (copy_from_user(&params, optval, optlen))
2591 			return -EFAULT;
2592 
2593 		if (params.sack_delay == 0)
2594 			params.sack_freq = 1;
2595 		else
2596 			params.sack_freq = 0;
2597 	} else
2598 		return - EINVAL;
2599 
2600 	/* Validate value parameter. */
2601 	if (params.sack_delay > 500)
2602 		return -EINVAL;
2603 
2604 	/* Get association, if sack_assoc_id != 0 and the socket is a one
2605 	 * to many style socket, and an association was not found, then
2606 	 * the id was invalid.
2607 	 */
2608 	asoc = sctp_id2assoc(sk, params.sack_assoc_id);
2609 	if (!asoc && params.sack_assoc_id && sctp_style(sk, UDP))
2610 		return -EINVAL;
2611 
2612 	if (params.sack_delay) {
2613 		if (asoc) {
2614 			asoc->sackdelay =
2615 				msecs_to_jiffies(params.sack_delay);
2616 			asoc->param_flags =
2617 				(asoc->param_flags & ~SPP_SACKDELAY) |
2618 				SPP_SACKDELAY_ENABLE;
2619 		} else {
2620 			sp->sackdelay = params.sack_delay;
2621 			sp->param_flags =
2622 				(sp->param_flags & ~SPP_SACKDELAY) |
2623 				SPP_SACKDELAY_ENABLE;
2624 		}
2625 	}
2626 
2627 	if (params.sack_freq == 1) {
2628 		if (asoc) {
2629 			asoc->param_flags =
2630 				(asoc->param_flags & ~SPP_SACKDELAY) |
2631 				SPP_SACKDELAY_DISABLE;
2632 		} else {
2633 			sp->param_flags =
2634 				(sp->param_flags & ~SPP_SACKDELAY) |
2635 				SPP_SACKDELAY_DISABLE;
2636 		}
2637 	} else if (params.sack_freq > 1) {
2638 		if (asoc) {
2639 			asoc->sackfreq = params.sack_freq;
2640 			asoc->param_flags =
2641 				(asoc->param_flags & ~SPP_SACKDELAY) |
2642 				SPP_SACKDELAY_ENABLE;
2643 		} else {
2644 			sp->sackfreq = params.sack_freq;
2645 			sp->param_flags =
2646 				(sp->param_flags & ~SPP_SACKDELAY) |
2647 				SPP_SACKDELAY_ENABLE;
2648 		}
2649 	}
2650 
2651 	/* If change is for association, also apply to each transport. */
2652 	if (asoc) {
2653 		list_for_each_entry(trans, &asoc->peer.transport_addr_list,
2654 				transports) {
2655 			if (params.sack_delay) {
2656 				trans->sackdelay =
2657 					msecs_to_jiffies(params.sack_delay);
2658 				trans->param_flags =
2659 					(trans->param_flags & ~SPP_SACKDELAY) |
2660 					SPP_SACKDELAY_ENABLE;
2661 			}
2662 			if (params.sack_freq == 1) {
2663 				trans->param_flags =
2664 					(trans->param_flags & ~SPP_SACKDELAY) |
2665 					SPP_SACKDELAY_DISABLE;
2666 			} else if (params.sack_freq > 1) {
2667 				trans->sackfreq = params.sack_freq;
2668 				trans->param_flags =
2669 					(trans->param_flags & ~SPP_SACKDELAY) |
2670 					SPP_SACKDELAY_ENABLE;
2671 			}
2672 		}
2673 	}
2674 
2675 	return 0;
2676 }
2677 
2678 /* 7.1.3 Initialization Parameters (SCTP_INITMSG)
2679  *
2680  * Applications can specify protocol parameters for the default association
2681  * initialization.  The option name argument to setsockopt() and getsockopt()
2682  * is SCTP_INITMSG.
2683  *
2684  * Setting initialization parameters is effective only on an unconnected
2685  * socket (for UDP-style sockets only future associations are effected
2686  * by the change).  With TCP-style sockets, this option is inherited by
2687  * sockets derived from a listener socket.
2688  */
2689 static int sctp_setsockopt_initmsg(struct sock *sk, char __user *optval, unsigned int optlen)
2690 {
2691 	struct sctp_initmsg sinit;
2692 	struct sctp_sock *sp = sctp_sk(sk);
2693 
2694 	if (optlen != sizeof(struct sctp_initmsg))
2695 		return -EINVAL;
2696 	if (copy_from_user(&sinit, optval, optlen))
2697 		return -EFAULT;
2698 
2699 	if (sinit.sinit_num_ostreams)
2700 		sp->initmsg.sinit_num_ostreams = sinit.sinit_num_ostreams;
2701 	if (sinit.sinit_max_instreams)
2702 		sp->initmsg.sinit_max_instreams = sinit.sinit_max_instreams;
2703 	if (sinit.sinit_max_attempts)
2704 		sp->initmsg.sinit_max_attempts = sinit.sinit_max_attempts;
2705 	if (sinit.sinit_max_init_timeo)
2706 		sp->initmsg.sinit_max_init_timeo = sinit.sinit_max_init_timeo;
2707 
2708 	return 0;
2709 }
2710 
2711 /*
2712  * 7.1.14 Set default send parameters (SCTP_DEFAULT_SEND_PARAM)
2713  *
2714  *   Applications that wish to use the sendto() system call may wish to
2715  *   specify a default set of parameters that would normally be supplied
2716  *   through the inclusion of ancillary data.  This socket option allows
2717  *   such an application to set the default sctp_sndrcvinfo structure.
2718  *   The application that wishes to use this socket option simply passes
2719  *   in to this call the sctp_sndrcvinfo structure defined in Section
2720  *   5.2.2) The input parameters accepted by this call include
2721  *   sinfo_stream, sinfo_flags, sinfo_ppid, sinfo_context,
2722  *   sinfo_timetolive.  The user must provide the sinfo_assoc_id field in
2723  *   to this call if the caller is using the UDP model.
2724  */
2725 static int sctp_setsockopt_default_send_param(struct sock *sk,
2726 					      char __user *optval,
2727 					      unsigned int optlen)
2728 {
2729 	struct sctp_sndrcvinfo info;
2730 	struct sctp_association *asoc;
2731 	struct sctp_sock *sp = sctp_sk(sk);
2732 
2733 	if (optlen != sizeof(struct sctp_sndrcvinfo))
2734 		return -EINVAL;
2735 	if (copy_from_user(&info, optval, optlen))
2736 		return -EFAULT;
2737 
2738 	asoc = sctp_id2assoc(sk, info.sinfo_assoc_id);
2739 	if (!asoc && info.sinfo_assoc_id && sctp_style(sk, UDP))
2740 		return -EINVAL;
2741 
2742 	if (asoc) {
2743 		asoc->default_stream = info.sinfo_stream;
2744 		asoc->default_flags = info.sinfo_flags;
2745 		asoc->default_ppid = info.sinfo_ppid;
2746 		asoc->default_context = info.sinfo_context;
2747 		asoc->default_timetolive = info.sinfo_timetolive;
2748 	} else {
2749 		sp->default_stream = info.sinfo_stream;
2750 		sp->default_flags = info.sinfo_flags;
2751 		sp->default_ppid = info.sinfo_ppid;
2752 		sp->default_context = info.sinfo_context;
2753 		sp->default_timetolive = info.sinfo_timetolive;
2754 	}
2755 
2756 	return 0;
2757 }
2758 
2759 /* 7.1.10 Set Primary Address (SCTP_PRIMARY_ADDR)
2760  *
2761  * Requests that the local SCTP stack use the enclosed peer address as
2762  * the association primary.  The enclosed address must be one of the
2763  * association peer's addresses.
2764  */
2765 static int sctp_setsockopt_primary_addr(struct sock *sk, char __user *optval,
2766 					unsigned int optlen)
2767 {
2768 	struct sctp_prim prim;
2769 	struct sctp_transport *trans;
2770 
2771 	if (optlen != sizeof(struct sctp_prim))
2772 		return -EINVAL;
2773 
2774 	if (copy_from_user(&prim, optval, sizeof(struct sctp_prim)))
2775 		return -EFAULT;
2776 
2777 	trans = sctp_addr_id2transport(sk, &prim.ssp_addr, prim.ssp_assoc_id);
2778 	if (!trans)
2779 		return -EINVAL;
2780 
2781 	sctp_assoc_set_primary(trans->asoc, trans);
2782 
2783 	return 0;
2784 }
2785 
2786 /*
2787  * 7.1.5 SCTP_NODELAY
2788  *
2789  * Turn on/off any Nagle-like algorithm.  This means that packets are
2790  * generally sent as soon as possible and no unnecessary delays are
2791  * introduced, at the cost of more packets in the network.  Expects an
2792  *  integer boolean flag.
2793  */
2794 static int sctp_setsockopt_nodelay(struct sock *sk, char __user *optval,
2795 				   unsigned int optlen)
2796 {
2797 	int val;
2798 
2799 	if (optlen < sizeof(int))
2800 		return -EINVAL;
2801 	if (get_user(val, (int __user *)optval))
2802 		return -EFAULT;
2803 
2804 	sctp_sk(sk)->nodelay = (val == 0) ? 0 : 1;
2805 	return 0;
2806 }
2807 
2808 /*
2809  *
2810  * 7.1.1 SCTP_RTOINFO
2811  *
2812  * The protocol parameters used to initialize and bound retransmission
2813  * timeout (RTO) are tunable. sctp_rtoinfo structure is used to access
2814  * and modify these parameters.
2815  * All parameters are time values, in milliseconds.  A value of 0, when
2816  * modifying the parameters, indicates that the current value should not
2817  * be changed.
2818  *
2819  */
2820 static int sctp_setsockopt_rtoinfo(struct sock *sk, char __user *optval, unsigned int optlen)
2821 {
2822 	struct sctp_rtoinfo rtoinfo;
2823 	struct sctp_association *asoc;
2824 
2825 	if (optlen != sizeof (struct sctp_rtoinfo))
2826 		return -EINVAL;
2827 
2828 	if (copy_from_user(&rtoinfo, optval, optlen))
2829 		return -EFAULT;
2830 
2831 	asoc = sctp_id2assoc(sk, rtoinfo.srto_assoc_id);
2832 
2833 	/* Set the values to the specific association */
2834 	if (!asoc && rtoinfo.srto_assoc_id && sctp_style(sk, UDP))
2835 		return -EINVAL;
2836 
2837 	if (asoc) {
2838 		if (rtoinfo.srto_initial != 0)
2839 			asoc->rto_initial =
2840 				msecs_to_jiffies(rtoinfo.srto_initial);
2841 		if (rtoinfo.srto_max != 0)
2842 			asoc->rto_max = msecs_to_jiffies(rtoinfo.srto_max);
2843 		if (rtoinfo.srto_min != 0)
2844 			asoc->rto_min = msecs_to_jiffies(rtoinfo.srto_min);
2845 	} else {
2846 		/* If there is no association or the association-id = 0
2847 		 * set the values to the endpoint.
2848 		 */
2849 		struct sctp_sock *sp = sctp_sk(sk);
2850 
2851 		if (rtoinfo.srto_initial != 0)
2852 			sp->rtoinfo.srto_initial = rtoinfo.srto_initial;
2853 		if (rtoinfo.srto_max != 0)
2854 			sp->rtoinfo.srto_max = rtoinfo.srto_max;
2855 		if (rtoinfo.srto_min != 0)
2856 			sp->rtoinfo.srto_min = rtoinfo.srto_min;
2857 	}
2858 
2859 	return 0;
2860 }
2861 
2862 /*
2863  *
2864  * 7.1.2 SCTP_ASSOCINFO
2865  *
2866  * This option is used to tune the maximum retransmission attempts
2867  * of the association.
2868  * Returns an error if the new association retransmission value is
2869  * greater than the sum of the retransmission value  of the peer.
2870  * See [SCTP] for more information.
2871  *
2872  */
2873 static int sctp_setsockopt_associnfo(struct sock *sk, char __user *optval, unsigned int optlen)
2874 {
2875 
2876 	struct sctp_assocparams assocparams;
2877 	struct sctp_association *asoc;
2878 
2879 	if (optlen != sizeof(struct sctp_assocparams))
2880 		return -EINVAL;
2881 	if (copy_from_user(&assocparams, optval, optlen))
2882 		return -EFAULT;
2883 
2884 	asoc = sctp_id2assoc(sk, assocparams.sasoc_assoc_id);
2885 
2886 	if (!asoc && assocparams.sasoc_assoc_id && sctp_style(sk, UDP))
2887 		return -EINVAL;
2888 
2889 	/* Set the values to the specific association */
2890 	if (asoc) {
2891 		if (assocparams.sasoc_asocmaxrxt != 0) {
2892 			__u32 path_sum = 0;
2893 			int   paths = 0;
2894 			struct sctp_transport *peer_addr;
2895 
2896 			list_for_each_entry(peer_addr, &asoc->peer.transport_addr_list,
2897 					transports) {
2898 				path_sum += peer_addr->pathmaxrxt;
2899 				paths++;
2900 			}
2901 
2902 			/* Only validate asocmaxrxt if we have more than
2903 			 * one path/transport.  We do this because path
2904 			 * retransmissions are only counted when we have more
2905 			 * then one path.
2906 			 */
2907 			if (paths > 1 &&
2908 			    assocparams.sasoc_asocmaxrxt > path_sum)
2909 				return -EINVAL;
2910 
2911 			asoc->max_retrans = assocparams.sasoc_asocmaxrxt;
2912 		}
2913 
2914 		if (assocparams.sasoc_cookie_life != 0) {
2915 			asoc->cookie_life.tv_sec =
2916 					assocparams.sasoc_cookie_life / 1000;
2917 			asoc->cookie_life.tv_usec =
2918 					(assocparams.sasoc_cookie_life % 1000)
2919 					* 1000;
2920 		}
2921 	} else {
2922 		/* Set the values to the endpoint */
2923 		struct sctp_sock *sp = sctp_sk(sk);
2924 
2925 		if (assocparams.sasoc_asocmaxrxt != 0)
2926 			sp->assocparams.sasoc_asocmaxrxt =
2927 						assocparams.sasoc_asocmaxrxt;
2928 		if (assocparams.sasoc_cookie_life != 0)
2929 			sp->assocparams.sasoc_cookie_life =
2930 						assocparams.sasoc_cookie_life;
2931 	}
2932 	return 0;
2933 }
2934 
2935 /*
2936  * 7.1.16 Set/clear IPv4 mapped addresses (SCTP_I_WANT_MAPPED_V4_ADDR)
2937  *
2938  * This socket option is a boolean flag which turns on or off mapped V4
2939  * addresses.  If this option is turned on and the socket is type
2940  * PF_INET6, then IPv4 addresses will be mapped to V6 representation.
2941  * If this option is turned off, then no mapping will be done of V4
2942  * addresses and a user will receive both PF_INET6 and PF_INET type
2943  * addresses on the socket.
2944  */
2945 static int sctp_setsockopt_mappedv4(struct sock *sk, char __user *optval, unsigned int optlen)
2946 {
2947 	int val;
2948 	struct sctp_sock *sp = sctp_sk(sk);
2949 
2950 	if (optlen < sizeof(int))
2951 		return -EINVAL;
2952 	if (get_user(val, (int __user *)optval))
2953 		return -EFAULT;
2954 	if (val)
2955 		sp->v4mapped = 1;
2956 	else
2957 		sp->v4mapped = 0;
2958 
2959 	return 0;
2960 }
2961 
2962 /*
2963  * 8.1.16.  Get or Set the Maximum Fragmentation Size (SCTP_MAXSEG)
2964  * This option will get or set the maximum size to put in any outgoing
2965  * SCTP DATA chunk.  If a message is larger than this size it will be
2966  * fragmented by SCTP into the specified size.  Note that the underlying
2967  * SCTP implementation may fragment into smaller sized chunks when the
2968  * PMTU of the underlying association is smaller than the value set by
2969  * the user.  The default value for this option is '0' which indicates
2970  * the user is NOT limiting fragmentation and only the PMTU will effect
2971  * SCTP's choice of DATA chunk size.  Note also that values set larger
2972  * than the maximum size of an IP datagram will effectively let SCTP
2973  * control fragmentation (i.e. the same as setting this option to 0).
2974  *
2975  * The following structure is used to access and modify this parameter:
2976  *
2977  * struct sctp_assoc_value {
2978  *   sctp_assoc_t assoc_id;
2979  *   uint32_t assoc_value;
2980  * };
2981  *
2982  * assoc_id:  This parameter is ignored for one-to-one style sockets.
2983  *    For one-to-many style sockets this parameter indicates which
2984  *    association the user is performing an action upon.  Note that if
2985  *    this field's value is zero then the endpoints default value is
2986  *    changed (effecting future associations only).
2987  * assoc_value:  This parameter specifies the maximum size in bytes.
2988  */
2989 static int sctp_setsockopt_maxseg(struct sock *sk, char __user *optval, unsigned int optlen)
2990 {
2991 	struct sctp_assoc_value params;
2992 	struct sctp_association *asoc;
2993 	struct sctp_sock *sp = sctp_sk(sk);
2994 	int val;
2995 
2996 	if (optlen == sizeof(int)) {
2997 		pr_warn("Use of int in maxseg socket option deprecated\n");
2998 		pr_warn("Use struct sctp_assoc_value instead\n");
2999 		if (copy_from_user(&val, optval, optlen))
3000 			return -EFAULT;
3001 		params.assoc_id = 0;
3002 	} else if (optlen == sizeof(struct sctp_assoc_value)) {
3003 		if (copy_from_user(&params, optval, optlen))
3004 			return -EFAULT;
3005 		val = params.assoc_value;
3006 	} else
3007 		return -EINVAL;
3008 
3009 	if ((val != 0) && ((val < 8) || (val > SCTP_MAX_CHUNK_LEN)))
3010 		return -EINVAL;
3011 
3012 	asoc = sctp_id2assoc(sk, params.assoc_id);
3013 	if (!asoc && params.assoc_id && sctp_style(sk, UDP))
3014 		return -EINVAL;
3015 
3016 	if (asoc) {
3017 		if (val == 0) {
3018 			val = asoc->pathmtu;
3019 			val -= sp->pf->af->net_header_len;
3020 			val -= sizeof(struct sctphdr) +
3021 					sizeof(struct sctp_data_chunk);
3022 		}
3023 		asoc->user_frag = val;
3024 		asoc->frag_point = sctp_frag_point(asoc, asoc->pathmtu);
3025 	} else {
3026 		sp->user_frag = val;
3027 	}
3028 
3029 	return 0;
3030 }
3031 
3032 
3033 /*
3034  *  7.1.9 Set Peer Primary Address (SCTP_SET_PEER_PRIMARY_ADDR)
3035  *
3036  *   Requests that the peer mark the enclosed address as the association
3037  *   primary. The enclosed address must be one of the association's
3038  *   locally bound addresses. The following structure is used to make a
3039  *   set primary request:
3040  */
3041 static int sctp_setsockopt_peer_primary_addr(struct sock *sk, char __user *optval,
3042 					     unsigned int optlen)
3043 {
3044 	struct net *net = sock_net(sk);
3045 	struct sctp_sock	*sp;
3046 	struct sctp_association	*asoc = NULL;
3047 	struct sctp_setpeerprim	prim;
3048 	struct sctp_chunk	*chunk;
3049 	struct sctp_af		*af;
3050 	int 			err;
3051 
3052 	sp = sctp_sk(sk);
3053 
3054 	if (!net->sctp.addip_enable)
3055 		return -EPERM;
3056 
3057 	if (optlen != sizeof(struct sctp_setpeerprim))
3058 		return -EINVAL;
3059 
3060 	if (copy_from_user(&prim, optval, optlen))
3061 		return -EFAULT;
3062 
3063 	asoc = sctp_id2assoc(sk, prim.sspp_assoc_id);
3064 	if (!asoc)
3065 		return -EINVAL;
3066 
3067 	if (!asoc->peer.asconf_capable)
3068 		return -EPERM;
3069 
3070 	if (asoc->peer.addip_disabled_mask & SCTP_PARAM_SET_PRIMARY)
3071 		return -EPERM;
3072 
3073 	if (!sctp_state(asoc, ESTABLISHED))
3074 		return -ENOTCONN;
3075 
3076 	af = sctp_get_af_specific(prim.sspp_addr.ss_family);
3077 	if (!af)
3078 		return -EINVAL;
3079 
3080 	if (!af->addr_valid((union sctp_addr *)&prim.sspp_addr, sp, NULL))
3081 		return -EADDRNOTAVAIL;
3082 
3083 	if (!sctp_assoc_lookup_laddr(asoc, (union sctp_addr *)&prim.sspp_addr))
3084 		return -EADDRNOTAVAIL;
3085 
3086 	/* Create an ASCONF chunk with SET_PRIMARY parameter	*/
3087 	chunk = sctp_make_asconf_set_prim(asoc,
3088 					  (union sctp_addr *)&prim.sspp_addr);
3089 	if (!chunk)
3090 		return -ENOMEM;
3091 
3092 	err = sctp_send_asconf(asoc, chunk);
3093 
3094 	SCTP_DEBUG_PRINTK("We set peer primary addr primitively.\n");
3095 
3096 	return err;
3097 }
3098 
3099 static int sctp_setsockopt_adaptation_layer(struct sock *sk, char __user *optval,
3100 					    unsigned int optlen)
3101 {
3102 	struct sctp_setadaptation adaptation;
3103 
3104 	if (optlen != sizeof(struct sctp_setadaptation))
3105 		return -EINVAL;
3106 	if (copy_from_user(&adaptation, optval, optlen))
3107 		return -EFAULT;
3108 
3109 	sctp_sk(sk)->adaptation_ind = adaptation.ssb_adaptation_ind;
3110 
3111 	return 0;
3112 }
3113 
3114 /*
3115  * 7.1.29.  Set or Get the default context (SCTP_CONTEXT)
3116  *
3117  * The context field in the sctp_sndrcvinfo structure is normally only
3118  * used when a failed message is retrieved holding the value that was
3119  * sent down on the actual send call.  This option allows the setting of
3120  * a default context on an association basis that will be received on
3121  * reading messages from the peer.  This is especially helpful in the
3122  * one-2-many model for an application to keep some reference to an
3123  * internal state machine that is processing messages on the
3124  * association.  Note that the setting of this value only effects
3125  * received messages from the peer and does not effect the value that is
3126  * saved with outbound messages.
3127  */
3128 static int sctp_setsockopt_context(struct sock *sk, char __user *optval,
3129 				   unsigned int optlen)
3130 {
3131 	struct sctp_assoc_value params;
3132 	struct sctp_sock *sp;
3133 	struct sctp_association *asoc;
3134 
3135 	if (optlen != sizeof(struct sctp_assoc_value))
3136 		return -EINVAL;
3137 	if (copy_from_user(&params, optval, optlen))
3138 		return -EFAULT;
3139 
3140 	sp = sctp_sk(sk);
3141 
3142 	if (params.assoc_id != 0) {
3143 		asoc = sctp_id2assoc(sk, params.assoc_id);
3144 		if (!asoc)
3145 			return -EINVAL;
3146 		asoc->default_rcv_context = params.assoc_value;
3147 	} else {
3148 		sp->default_rcv_context = params.assoc_value;
3149 	}
3150 
3151 	return 0;
3152 }
3153 
3154 /*
3155  * 7.1.24.  Get or set fragmented interleave (SCTP_FRAGMENT_INTERLEAVE)
3156  *
3157  * This options will at a minimum specify if the implementation is doing
3158  * fragmented interleave.  Fragmented interleave, for a one to many
3159  * socket, is when subsequent calls to receive a message may return
3160  * parts of messages from different associations.  Some implementations
3161  * may allow you to turn this value on or off.  If so, when turned off,
3162  * no fragment interleave will occur (which will cause a head of line
3163  * blocking amongst multiple associations sharing the same one to many
3164  * socket).  When this option is turned on, then each receive call may
3165  * come from a different association (thus the user must receive data
3166  * with the extended calls (e.g. sctp_recvmsg) to keep track of which
3167  * association each receive belongs to.
3168  *
3169  * This option takes a boolean value.  A non-zero value indicates that
3170  * fragmented interleave is on.  A value of zero indicates that
3171  * fragmented interleave is off.
3172  *
3173  * Note that it is important that an implementation that allows this
3174  * option to be turned on, have it off by default.  Otherwise an unaware
3175  * application using the one to many model may become confused and act
3176  * incorrectly.
3177  */
3178 static int sctp_setsockopt_fragment_interleave(struct sock *sk,
3179 					       char __user *optval,
3180 					       unsigned int optlen)
3181 {
3182 	int val;
3183 
3184 	if (optlen != sizeof(int))
3185 		return -EINVAL;
3186 	if (get_user(val, (int __user *)optval))
3187 		return -EFAULT;
3188 
3189 	sctp_sk(sk)->frag_interleave = (val == 0) ? 0 : 1;
3190 
3191 	return 0;
3192 }
3193 
3194 /*
3195  * 8.1.21.  Set or Get the SCTP Partial Delivery Point
3196  *       (SCTP_PARTIAL_DELIVERY_POINT)
3197  *
3198  * This option will set or get the SCTP partial delivery point.  This
3199  * point is the size of a message where the partial delivery API will be
3200  * invoked to help free up rwnd space for the peer.  Setting this to a
3201  * lower value will cause partial deliveries to happen more often.  The
3202  * calls argument is an integer that sets or gets the partial delivery
3203  * point.  Note also that the call will fail if the user attempts to set
3204  * this value larger than the socket receive buffer size.
3205  *
3206  * Note that any single message having a length smaller than or equal to
3207  * the SCTP partial delivery point will be delivered in one single read
3208  * call as long as the user provided buffer is large enough to hold the
3209  * message.
3210  */
3211 static int sctp_setsockopt_partial_delivery_point(struct sock *sk,
3212 						  char __user *optval,
3213 						  unsigned int optlen)
3214 {
3215 	u32 val;
3216 
3217 	if (optlen != sizeof(u32))
3218 		return -EINVAL;
3219 	if (get_user(val, (int __user *)optval))
3220 		return -EFAULT;
3221 
3222 	/* Note: We double the receive buffer from what the user sets
3223 	 * it to be, also initial rwnd is based on rcvbuf/2.
3224 	 */
3225 	if (val > (sk->sk_rcvbuf >> 1))
3226 		return -EINVAL;
3227 
3228 	sctp_sk(sk)->pd_point = val;
3229 
3230 	return 0; /* is this the right error code? */
3231 }
3232 
3233 /*
3234  * 7.1.28.  Set or Get the maximum burst (SCTP_MAX_BURST)
3235  *
3236  * This option will allow a user to change the maximum burst of packets
3237  * that can be emitted by this association.  Note that the default value
3238  * is 4, and some implementations may restrict this setting so that it
3239  * can only be lowered.
3240  *
3241  * NOTE: This text doesn't seem right.  Do this on a socket basis with
3242  * future associations inheriting the socket value.
3243  */
3244 static int sctp_setsockopt_maxburst(struct sock *sk,
3245 				    char __user *optval,
3246 				    unsigned int optlen)
3247 {
3248 	struct sctp_assoc_value params;
3249 	struct sctp_sock *sp;
3250 	struct sctp_association *asoc;
3251 	int val;
3252 	int assoc_id = 0;
3253 
3254 	if (optlen == sizeof(int)) {
3255 		pr_warn("Use of int in max_burst socket option deprecated\n");
3256 		pr_warn("Use struct sctp_assoc_value instead\n");
3257 		if (copy_from_user(&val, optval, optlen))
3258 			return -EFAULT;
3259 	} else if (optlen == sizeof(struct sctp_assoc_value)) {
3260 		if (copy_from_user(&params, optval, optlen))
3261 			return -EFAULT;
3262 		val = params.assoc_value;
3263 		assoc_id = params.assoc_id;
3264 	} else
3265 		return -EINVAL;
3266 
3267 	sp = sctp_sk(sk);
3268 
3269 	if (assoc_id != 0) {
3270 		asoc = sctp_id2assoc(sk, assoc_id);
3271 		if (!asoc)
3272 			return -EINVAL;
3273 		asoc->max_burst = val;
3274 	} else
3275 		sp->max_burst = val;
3276 
3277 	return 0;
3278 }
3279 
3280 /*
3281  * 7.1.18.  Add a chunk that must be authenticated (SCTP_AUTH_CHUNK)
3282  *
3283  * This set option adds a chunk type that the user is requesting to be
3284  * received only in an authenticated way.  Changes to the list of chunks
3285  * will only effect future associations on the socket.
3286  */
3287 static int sctp_setsockopt_auth_chunk(struct sock *sk,
3288 				      char __user *optval,
3289 				      unsigned int optlen)
3290 {
3291 	struct net *net = sock_net(sk);
3292 	struct sctp_authchunk val;
3293 
3294 	if (!net->sctp.auth_enable)
3295 		return -EACCES;
3296 
3297 	if (optlen != sizeof(struct sctp_authchunk))
3298 		return -EINVAL;
3299 	if (copy_from_user(&val, optval, optlen))
3300 		return -EFAULT;
3301 
3302 	switch (val.sauth_chunk) {
3303 	case SCTP_CID_INIT:
3304 	case SCTP_CID_INIT_ACK:
3305 	case SCTP_CID_SHUTDOWN_COMPLETE:
3306 	case SCTP_CID_AUTH:
3307 		return -EINVAL;
3308 	}
3309 
3310 	/* add this chunk id to the endpoint */
3311 	return sctp_auth_ep_add_chunkid(sctp_sk(sk)->ep, val.sauth_chunk);
3312 }
3313 
3314 /*
3315  * 7.1.19.  Get or set the list of supported HMAC Identifiers (SCTP_HMAC_IDENT)
3316  *
3317  * This option gets or sets the list of HMAC algorithms that the local
3318  * endpoint requires the peer to use.
3319  */
3320 static int sctp_setsockopt_hmac_ident(struct sock *sk,
3321 				      char __user *optval,
3322 				      unsigned int optlen)
3323 {
3324 	struct net *net = sock_net(sk);
3325 	struct sctp_hmacalgo *hmacs;
3326 	u32 idents;
3327 	int err;
3328 
3329 	if (!net->sctp.auth_enable)
3330 		return -EACCES;
3331 
3332 	if (optlen < sizeof(struct sctp_hmacalgo))
3333 		return -EINVAL;
3334 
3335 	hmacs= memdup_user(optval, optlen);
3336 	if (IS_ERR(hmacs))
3337 		return PTR_ERR(hmacs);
3338 
3339 	idents = hmacs->shmac_num_idents;
3340 	if (idents == 0 || idents > SCTP_AUTH_NUM_HMACS ||
3341 	    (idents * sizeof(u16)) > (optlen - sizeof(struct sctp_hmacalgo))) {
3342 		err = -EINVAL;
3343 		goto out;
3344 	}
3345 
3346 	err = sctp_auth_ep_set_hmacs(sctp_sk(sk)->ep, hmacs);
3347 out:
3348 	kfree(hmacs);
3349 	return err;
3350 }
3351 
3352 /*
3353  * 7.1.20.  Set a shared key (SCTP_AUTH_KEY)
3354  *
3355  * This option will set a shared secret key which is used to build an
3356  * association shared key.
3357  */
3358 static int sctp_setsockopt_auth_key(struct sock *sk,
3359 				    char __user *optval,
3360 				    unsigned int optlen)
3361 {
3362 	struct net *net = sock_net(sk);
3363 	struct sctp_authkey *authkey;
3364 	struct sctp_association *asoc;
3365 	int ret;
3366 
3367 	if (!net->sctp.auth_enable)
3368 		return -EACCES;
3369 
3370 	if (optlen <= sizeof(struct sctp_authkey))
3371 		return -EINVAL;
3372 
3373 	authkey= memdup_user(optval, optlen);
3374 	if (IS_ERR(authkey))
3375 		return PTR_ERR(authkey);
3376 
3377 	if (authkey->sca_keylength > optlen - sizeof(struct sctp_authkey)) {
3378 		ret = -EINVAL;
3379 		goto out;
3380 	}
3381 
3382 	asoc = sctp_id2assoc(sk, authkey->sca_assoc_id);
3383 	if (!asoc && authkey->sca_assoc_id && sctp_style(sk, UDP)) {
3384 		ret = -EINVAL;
3385 		goto out;
3386 	}
3387 
3388 	ret = sctp_auth_set_key(sctp_sk(sk)->ep, asoc, authkey);
3389 out:
3390 	kfree(authkey);
3391 	return ret;
3392 }
3393 
3394 /*
3395  * 7.1.21.  Get or set the active shared key (SCTP_AUTH_ACTIVE_KEY)
3396  *
3397  * This option will get or set the active shared key to be used to build
3398  * the association shared key.
3399  */
3400 static int sctp_setsockopt_active_key(struct sock *sk,
3401 				      char __user *optval,
3402 				      unsigned int optlen)
3403 {
3404 	struct net *net = sock_net(sk);
3405 	struct sctp_authkeyid val;
3406 	struct sctp_association *asoc;
3407 
3408 	if (!net->sctp.auth_enable)
3409 		return -EACCES;
3410 
3411 	if (optlen != sizeof(struct sctp_authkeyid))
3412 		return -EINVAL;
3413 	if (copy_from_user(&val, optval, optlen))
3414 		return -EFAULT;
3415 
3416 	asoc = sctp_id2assoc(sk, val.scact_assoc_id);
3417 	if (!asoc && val.scact_assoc_id && sctp_style(sk, UDP))
3418 		return -EINVAL;
3419 
3420 	return sctp_auth_set_active_key(sctp_sk(sk)->ep, asoc,
3421 					val.scact_keynumber);
3422 }
3423 
3424 /*
3425  * 7.1.22.  Delete a shared key (SCTP_AUTH_DELETE_KEY)
3426  *
3427  * This set option will delete a shared secret key from use.
3428  */
3429 static int sctp_setsockopt_del_key(struct sock *sk,
3430 				   char __user *optval,
3431 				   unsigned int optlen)
3432 {
3433 	struct net *net = sock_net(sk);
3434 	struct sctp_authkeyid val;
3435 	struct sctp_association *asoc;
3436 
3437 	if (!net->sctp.auth_enable)
3438 		return -EACCES;
3439 
3440 	if (optlen != sizeof(struct sctp_authkeyid))
3441 		return -EINVAL;
3442 	if (copy_from_user(&val, optval, optlen))
3443 		return -EFAULT;
3444 
3445 	asoc = sctp_id2assoc(sk, val.scact_assoc_id);
3446 	if (!asoc && val.scact_assoc_id && sctp_style(sk, UDP))
3447 		return -EINVAL;
3448 
3449 	return sctp_auth_del_key_id(sctp_sk(sk)->ep, asoc,
3450 				    val.scact_keynumber);
3451 
3452 }
3453 
3454 /*
3455  * 8.1.23 SCTP_AUTO_ASCONF
3456  *
3457  * This option will enable or disable the use of the automatic generation of
3458  * ASCONF chunks to add and delete addresses to an existing association.  Note
3459  * that this option has two caveats namely: a) it only affects sockets that
3460  * are bound to all addresses available to the SCTP stack, and b) the system
3461  * administrator may have an overriding control that turns the ASCONF feature
3462  * off no matter what setting the socket option may have.
3463  * This option expects an integer boolean flag, where a non-zero value turns on
3464  * the option, and a zero value turns off the option.
3465  * Note. In this implementation, socket operation overrides default parameter
3466  * being set by sysctl as well as FreeBSD implementation
3467  */
3468 static int sctp_setsockopt_auto_asconf(struct sock *sk, char __user *optval,
3469 					unsigned int optlen)
3470 {
3471 	int val;
3472 	struct sctp_sock *sp = sctp_sk(sk);
3473 
3474 	if (optlen < sizeof(int))
3475 		return -EINVAL;
3476 	if (get_user(val, (int __user *)optval))
3477 		return -EFAULT;
3478 	if (!sctp_is_ep_boundall(sk) && val)
3479 		return -EINVAL;
3480 	if ((val && sp->do_auto_asconf) || (!val && !sp->do_auto_asconf))
3481 		return 0;
3482 
3483 	if (val == 0 && sp->do_auto_asconf) {
3484 		list_del(&sp->auto_asconf_list);
3485 		sp->do_auto_asconf = 0;
3486 	} else if (val && !sp->do_auto_asconf) {
3487 		list_add_tail(&sp->auto_asconf_list,
3488 		    &sock_net(sk)->sctp.auto_asconf_splist);
3489 		sp->do_auto_asconf = 1;
3490 	}
3491 	return 0;
3492 }
3493 
3494 
3495 /*
3496  * SCTP_PEER_ADDR_THLDS
3497  *
3498  * This option allows us to alter the partially failed threshold for one or all
3499  * transports in an association.  See Section 6.1 of:
3500  * http://www.ietf.org/id/draft-nishida-tsvwg-sctp-failover-05.txt
3501  */
3502 static int sctp_setsockopt_paddr_thresholds(struct sock *sk,
3503 					    char __user *optval,
3504 					    unsigned int optlen)
3505 {
3506 	struct sctp_paddrthlds val;
3507 	struct sctp_transport *trans;
3508 	struct sctp_association *asoc;
3509 
3510 	if (optlen < sizeof(struct sctp_paddrthlds))
3511 		return -EINVAL;
3512 	if (copy_from_user(&val, (struct sctp_paddrthlds __user *)optval,
3513 			   sizeof(struct sctp_paddrthlds)))
3514 		return -EFAULT;
3515 
3516 
3517 	if (sctp_is_any(sk, (const union sctp_addr *)&val.spt_address)) {
3518 		asoc = sctp_id2assoc(sk, val.spt_assoc_id);
3519 		if (!asoc)
3520 			return -ENOENT;
3521 		list_for_each_entry(trans, &asoc->peer.transport_addr_list,
3522 				    transports) {
3523 			if (val.spt_pathmaxrxt)
3524 				trans->pathmaxrxt = val.spt_pathmaxrxt;
3525 			trans->pf_retrans = val.spt_pathpfthld;
3526 		}
3527 
3528 		if (val.spt_pathmaxrxt)
3529 			asoc->pathmaxrxt = val.spt_pathmaxrxt;
3530 		asoc->pf_retrans = val.spt_pathpfthld;
3531 	} else {
3532 		trans = sctp_addr_id2transport(sk, &val.spt_address,
3533 					       val.spt_assoc_id);
3534 		if (!trans)
3535 			return -ENOENT;
3536 
3537 		if (val.spt_pathmaxrxt)
3538 			trans->pathmaxrxt = val.spt_pathmaxrxt;
3539 		trans->pf_retrans = val.spt_pathpfthld;
3540 	}
3541 
3542 	return 0;
3543 }
3544 
3545 /* API 6.2 setsockopt(), getsockopt()
3546  *
3547  * Applications use setsockopt() and getsockopt() to set or retrieve
3548  * socket options.  Socket options are used to change the default
3549  * behavior of sockets calls.  They are described in Section 7.
3550  *
3551  * The syntax is:
3552  *
3553  *   ret = getsockopt(int sd, int level, int optname, void __user *optval,
3554  *                    int __user *optlen);
3555  *   ret = setsockopt(int sd, int level, int optname, const void __user *optval,
3556  *                    int optlen);
3557  *
3558  *   sd      - the socket descript.
3559  *   level   - set to IPPROTO_SCTP for all SCTP options.
3560  *   optname - the option name.
3561  *   optval  - the buffer to store the value of the option.
3562  *   optlen  - the size of the buffer.
3563  */
3564 SCTP_STATIC int sctp_setsockopt(struct sock *sk, int level, int optname,
3565 				char __user *optval, unsigned int optlen)
3566 {
3567 	int retval = 0;
3568 
3569 	SCTP_DEBUG_PRINTK("sctp_setsockopt(sk: %p... optname: %d)\n",
3570 			  sk, optname);
3571 
3572 	/* I can hardly begin to describe how wrong this is.  This is
3573 	 * so broken as to be worse than useless.  The API draft
3574 	 * REALLY is NOT helpful here...  I am not convinced that the
3575 	 * semantics of setsockopt() with a level OTHER THAN SOL_SCTP
3576 	 * are at all well-founded.
3577 	 */
3578 	if (level != SOL_SCTP) {
3579 		struct sctp_af *af = sctp_sk(sk)->pf->af;
3580 		retval = af->setsockopt(sk, level, optname, optval, optlen);
3581 		goto out_nounlock;
3582 	}
3583 
3584 	sctp_lock_sock(sk);
3585 
3586 	switch (optname) {
3587 	case SCTP_SOCKOPT_BINDX_ADD:
3588 		/* 'optlen' is the size of the addresses buffer. */
3589 		retval = sctp_setsockopt_bindx(sk, (struct sockaddr __user *)optval,
3590 					       optlen, SCTP_BINDX_ADD_ADDR);
3591 		break;
3592 
3593 	case SCTP_SOCKOPT_BINDX_REM:
3594 		/* 'optlen' is the size of the addresses buffer. */
3595 		retval = sctp_setsockopt_bindx(sk, (struct sockaddr __user *)optval,
3596 					       optlen, SCTP_BINDX_REM_ADDR);
3597 		break;
3598 
3599 	case SCTP_SOCKOPT_CONNECTX_OLD:
3600 		/* 'optlen' is the size of the addresses buffer. */
3601 		retval = sctp_setsockopt_connectx_old(sk,
3602 					    (struct sockaddr __user *)optval,
3603 					    optlen);
3604 		break;
3605 
3606 	case SCTP_SOCKOPT_CONNECTX:
3607 		/* 'optlen' is the size of the addresses buffer. */
3608 		retval = sctp_setsockopt_connectx(sk,
3609 					    (struct sockaddr __user *)optval,
3610 					    optlen);
3611 		break;
3612 
3613 	case SCTP_DISABLE_FRAGMENTS:
3614 		retval = sctp_setsockopt_disable_fragments(sk, optval, optlen);
3615 		break;
3616 
3617 	case SCTP_EVENTS:
3618 		retval = sctp_setsockopt_events(sk, optval, optlen);
3619 		break;
3620 
3621 	case SCTP_AUTOCLOSE:
3622 		retval = sctp_setsockopt_autoclose(sk, optval, optlen);
3623 		break;
3624 
3625 	case SCTP_PEER_ADDR_PARAMS:
3626 		retval = sctp_setsockopt_peer_addr_params(sk, optval, optlen);
3627 		break;
3628 
3629 	case SCTP_DELAYED_SACK:
3630 		retval = sctp_setsockopt_delayed_ack(sk, optval, optlen);
3631 		break;
3632 	case SCTP_PARTIAL_DELIVERY_POINT:
3633 		retval = sctp_setsockopt_partial_delivery_point(sk, optval, optlen);
3634 		break;
3635 
3636 	case SCTP_INITMSG:
3637 		retval = sctp_setsockopt_initmsg(sk, optval, optlen);
3638 		break;
3639 	case SCTP_DEFAULT_SEND_PARAM:
3640 		retval = sctp_setsockopt_default_send_param(sk, optval,
3641 							    optlen);
3642 		break;
3643 	case SCTP_PRIMARY_ADDR:
3644 		retval = sctp_setsockopt_primary_addr(sk, optval, optlen);
3645 		break;
3646 	case SCTP_SET_PEER_PRIMARY_ADDR:
3647 		retval = sctp_setsockopt_peer_primary_addr(sk, optval, optlen);
3648 		break;
3649 	case SCTP_NODELAY:
3650 		retval = sctp_setsockopt_nodelay(sk, optval, optlen);
3651 		break;
3652 	case SCTP_RTOINFO:
3653 		retval = sctp_setsockopt_rtoinfo(sk, optval, optlen);
3654 		break;
3655 	case SCTP_ASSOCINFO:
3656 		retval = sctp_setsockopt_associnfo(sk, optval, optlen);
3657 		break;
3658 	case SCTP_I_WANT_MAPPED_V4_ADDR:
3659 		retval = sctp_setsockopt_mappedv4(sk, optval, optlen);
3660 		break;
3661 	case SCTP_MAXSEG:
3662 		retval = sctp_setsockopt_maxseg(sk, optval, optlen);
3663 		break;
3664 	case SCTP_ADAPTATION_LAYER:
3665 		retval = sctp_setsockopt_adaptation_layer(sk, optval, optlen);
3666 		break;
3667 	case SCTP_CONTEXT:
3668 		retval = sctp_setsockopt_context(sk, optval, optlen);
3669 		break;
3670 	case SCTP_FRAGMENT_INTERLEAVE:
3671 		retval = sctp_setsockopt_fragment_interleave(sk, optval, optlen);
3672 		break;
3673 	case SCTP_MAX_BURST:
3674 		retval = sctp_setsockopt_maxburst(sk, optval, optlen);
3675 		break;
3676 	case SCTP_AUTH_CHUNK:
3677 		retval = sctp_setsockopt_auth_chunk(sk, optval, optlen);
3678 		break;
3679 	case SCTP_HMAC_IDENT:
3680 		retval = sctp_setsockopt_hmac_ident(sk, optval, optlen);
3681 		break;
3682 	case SCTP_AUTH_KEY:
3683 		retval = sctp_setsockopt_auth_key(sk, optval, optlen);
3684 		break;
3685 	case SCTP_AUTH_ACTIVE_KEY:
3686 		retval = sctp_setsockopt_active_key(sk, optval, optlen);
3687 		break;
3688 	case SCTP_AUTH_DELETE_KEY:
3689 		retval = sctp_setsockopt_del_key(sk, optval, optlen);
3690 		break;
3691 	case SCTP_AUTO_ASCONF:
3692 		retval = sctp_setsockopt_auto_asconf(sk, optval, optlen);
3693 		break;
3694 	case SCTP_PEER_ADDR_THLDS:
3695 		retval = sctp_setsockopt_paddr_thresholds(sk, optval, optlen);
3696 		break;
3697 	default:
3698 		retval = -ENOPROTOOPT;
3699 		break;
3700 	}
3701 
3702 	sctp_release_sock(sk);
3703 
3704 out_nounlock:
3705 	return retval;
3706 }
3707 
3708 /* API 3.1.6 connect() - UDP Style Syntax
3709  *
3710  * An application may use the connect() call in the UDP model to initiate an
3711  * association without sending data.
3712  *
3713  * The syntax is:
3714  *
3715  * ret = connect(int sd, const struct sockaddr *nam, socklen_t len);
3716  *
3717  * sd: the socket descriptor to have a new association added to.
3718  *
3719  * nam: the address structure (either struct sockaddr_in or struct
3720  *    sockaddr_in6 defined in RFC2553 [7]).
3721  *
3722  * len: the size of the address.
3723  */
3724 SCTP_STATIC int sctp_connect(struct sock *sk, struct sockaddr *addr,
3725 			     int addr_len)
3726 {
3727 	int err = 0;
3728 	struct sctp_af *af;
3729 
3730 	sctp_lock_sock(sk);
3731 
3732 	SCTP_DEBUG_PRINTK("%s - sk: %p, sockaddr: %p, addr_len: %d\n",
3733 			  __func__, sk, addr, addr_len);
3734 
3735 	/* Validate addr_len before calling common connect/connectx routine. */
3736 	af = sctp_get_af_specific(addr->sa_family);
3737 	if (!af || addr_len < af->sockaddr_len) {
3738 		err = -EINVAL;
3739 	} else {
3740 		/* Pass correct addr len to common routine (so it knows there
3741 		 * is only one address being passed.
3742 		 */
3743 		err = __sctp_connect(sk, addr, af->sockaddr_len, NULL);
3744 	}
3745 
3746 	sctp_release_sock(sk);
3747 	return err;
3748 }
3749 
3750 /* FIXME: Write comments. */
3751 SCTP_STATIC int sctp_disconnect(struct sock *sk, int flags)
3752 {
3753 	return -EOPNOTSUPP; /* STUB */
3754 }
3755 
3756 /* 4.1.4 accept() - TCP Style Syntax
3757  *
3758  * Applications use accept() call to remove an established SCTP
3759  * association from the accept queue of the endpoint.  A new socket
3760  * descriptor will be returned from accept() to represent the newly
3761  * formed association.
3762  */
3763 SCTP_STATIC struct sock *sctp_accept(struct sock *sk, int flags, int *err)
3764 {
3765 	struct sctp_sock *sp;
3766 	struct sctp_endpoint *ep;
3767 	struct sock *newsk = NULL;
3768 	struct sctp_association *asoc;
3769 	long timeo;
3770 	int error = 0;
3771 
3772 	sctp_lock_sock(sk);
3773 
3774 	sp = sctp_sk(sk);
3775 	ep = sp->ep;
3776 
3777 	if (!sctp_style(sk, TCP)) {
3778 		error = -EOPNOTSUPP;
3779 		goto out;
3780 	}
3781 
3782 	if (!sctp_sstate(sk, LISTENING)) {
3783 		error = -EINVAL;
3784 		goto out;
3785 	}
3786 
3787 	timeo = sock_rcvtimeo(sk, flags & O_NONBLOCK);
3788 
3789 	error = sctp_wait_for_accept(sk, timeo);
3790 	if (error)
3791 		goto out;
3792 
3793 	/* We treat the list of associations on the endpoint as the accept
3794 	 * queue and pick the first association on the list.
3795 	 */
3796 	asoc = list_entry(ep->asocs.next, struct sctp_association, asocs);
3797 
3798 	newsk = sp->pf->create_accept_sk(sk, asoc);
3799 	if (!newsk) {
3800 		error = -ENOMEM;
3801 		goto out;
3802 	}
3803 
3804 	/* Populate the fields of the newsk from the oldsk and migrate the
3805 	 * asoc to the newsk.
3806 	 */
3807 	sctp_sock_migrate(sk, newsk, asoc, SCTP_SOCKET_TCP);
3808 
3809 out:
3810 	sctp_release_sock(sk);
3811 	*err = error;
3812 	return newsk;
3813 }
3814 
3815 /* The SCTP ioctl handler. */
3816 SCTP_STATIC int sctp_ioctl(struct sock *sk, int cmd, unsigned long arg)
3817 {
3818 	int rc = -ENOTCONN;
3819 
3820 	sctp_lock_sock(sk);
3821 
3822 	/*
3823 	 * SEQPACKET-style sockets in LISTENING state are valid, for
3824 	 * SCTP, so only discard TCP-style sockets in LISTENING state.
3825 	 */
3826 	if (sctp_style(sk, TCP) && sctp_sstate(sk, LISTENING))
3827 		goto out;
3828 
3829 	switch (cmd) {
3830 	case SIOCINQ: {
3831 		struct sk_buff *skb;
3832 		unsigned int amount = 0;
3833 
3834 		skb = skb_peek(&sk->sk_receive_queue);
3835 		if (skb != NULL) {
3836 			/*
3837 			 * We will only return the amount of this packet since
3838 			 * that is all that will be read.
3839 			 */
3840 			amount = skb->len;
3841 		}
3842 		rc = put_user(amount, (int __user *)arg);
3843 		break;
3844 	}
3845 	default:
3846 		rc = -ENOIOCTLCMD;
3847 		break;
3848 	}
3849 out:
3850 	sctp_release_sock(sk);
3851 	return rc;
3852 }
3853 
3854 /* This is the function which gets called during socket creation to
3855  * initialized the SCTP-specific portion of the sock.
3856  * The sock structure should already be zero-filled memory.
3857  */
3858 SCTP_STATIC int sctp_init_sock(struct sock *sk)
3859 {
3860 	struct net *net = sock_net(sk);
3861 	struct sctp_endpoint *ep;
3862 	struct sctp_sock *sp;
3863 
3864 	SCTP_DEBUG_PRINTK("sctp_init_sock(sk: %p)\n", sk);
3865 
3866 	sp = sctp_sk(sk);
3867 
3868 	/* Initialize the SCTP per socket area.  */
3869 	switch (sk->sk_type) {
3870 	case SOCK_SEQPACKET:
3871 		sp->type = SCTP_SOCKET_UDP;
3872 		break;
3873 	case SOCK_STREAM:
3874 		sp->type = SCTP_SOCKET_TCP;
3875 		break;
3876 	default:
3877 		return -ESOCKTNOSUPPORT;
3878 	}
3879 
3880 	/* Initialize default send parameters. These parameters can be
3881 	 * modified with the SCTP_DEFAULT_SEND_PARAM socket option.
3882 	 */
3883 	sp->default_stream = 0;
3884 	sp->default_ppid = 0;
3885 	sp->default_flags = 0;
3886 	sp->default_context = 0;
3887 	sp->default_timetolive = 0;
3888 
3889 	sp->default_rcv_context = 0;
3890 	sp->max_burst = net->sctp.max_burst;
3891 
3892 	/* Initialize default setup parameters. These parameters
3893 	 * can be modified with the SCTP_INITMSG socket option or
3894 	 * overridden by the SCTP_INIT CMSG.
3895 	 */
3896 	sp->initmsg.sinit_num_ostreams   = sctp_max_outstreams;
3897 	sp->initmsg.sinit_max_instreams  = sctp_max_instreams;
3898 	sp->initmsg.sinit_max_attempts   = net->sctp.max_retrans_init;
3899 	sp->initmsg.sinit_max_init_timeo = net->sctp.rto_max;
3900 
3901 	/* Initialize default RTO related parameters.  These parameters can
3902 	 * be modified for with the SCTP_RTOINFO socket option.
3903 	 */
3904 	sp->rtoinfo.srto_initial = net->sctp.rto_initial;
3905 	sp->rtoinfo.srto_max     = net->sctp.rto_max;
3906 	sp->rtoinfo.srto_min     = net->sctp.rto_min;
3907 
3908 	/* Initialize default association related parameters. These parameters
3909 	 * can be modified with the SCTP_ASSOCINFO socket option.
3910 	 */
3911 	sp->assocparams.sasoc_asocmaxrxt = net->sctp.max_retrans_association;
3912 	sp->assocparams.sasoc_number_peer_destinations = 0;
3913 	sp->assocparams.sasoc_peer_rwnd = 0;
3914 	sp->assocparams.sasoc_local_rwnd = 0;
3915 	sp->assocparams.sasoc_cookie_life = net->sctp.valid_cookie_life;
3916 
3917 	/* Initialize default event subscriptions. By default, all the
3918 	 * options are off.
3919 	 */
3920 	memset(&sp->subscribe, 0, sizeof(struct sctp_event_subscribe));
3921 
3922 	/* Default Peer Address Parameters.  These defaults can
3923 	 * be modified via SCTP_PEER_ADDR_PARAMS
3924 	 */
3925 	sp->hbinterval  = net->sctp.hb_interval;
3926 	sp->pathmaxrxt  = net->sctp.max_retrans_path;
3927 	sp->pathmtu     = 0; // allow default discovery
3928 	sp->sackdelay   = net->sctp.sack_timeout;
3929 	sp->sackfreq	= 2;
3930 	sp->param_flags = SPP_HB_ENABLE |
3931 			  SPP_PMTUD_ENABLE |
3932 			  SPP_SACKDELAY_ENABLE;
3933 
3934 	/* If enabled no SCTP message fragmentation will be performed.
3935 	 * Configure through SCTP_DISABLE_FRAGMENTS socket option.
3936 	 */
3937 	sp->disable_fragments = 0;
3938 
3939 	/* Enable Nagle algorithm by default.  */
3940 	sp->nodelay           = 0;
3941 
3942 	/* Enable by default. */
3943 	sp->v4mapped          = 1;
3944 
3945 	/* Auto-close idle associations after the configured
3946 	 * number of seconds.  A value of 0 disables this
3947 	 * feature.  Configure through the SCTP_AUTOCLOSE socket option,
3948 	 * for UDP-style sockets only.
3949 	 */
3950 	sp->autoclose         = 0;
3951 
3952 	/* User specified fragmentation limit. */
3953 	sp->user_frag         = 0;
3954 
3955 	sp->adaptation_ind = 0;
3956 
3957 	sp->pf = sctp_get_pf_specific(sk->sk_family);
3958 
3959 	/* Control variables for partial data delivery. */
3960 	atomic_set(&sp->pd_mode, 0);
3961 	skb_queue_head_init(&sp->pd_lobby);
3962 	sp->frag_interleave = 0;
3963 
3964 	/* Create a per socket endpoint structure.  Even if we
3965 	 * change the data structure relationships, this may still
3966 	 * be useful for storing pre-connect address information.
3967 	 */
3968 	ep = sctp_endpoint_new(sk, GFP_KERNEL);
3969 	if (!ep)
3970 		return -ENOMEM;
3971 
3972 	sp->ep = ep;
3973 	sp->hmac = NULL;
3974 
3975 	SCTP_DBG_OBJCNT_INC(sock);
3976 
3977 	local_bh_disable();
3978 	percpu_counter_inc(&sctp_sockets_allocated);
3979 	sock_prot_inuse_add(net, sk->sk_prot, 1);
3980 	if (net->sctp.default_auto_asconf) {
3981 		list_add_tail(&sp->auto_asconf_list,
3982 		    &net->sctp.auto_asconf_splist);
3983 		sp->do_auto_asconf = 1;
3984 	} else
3985 		sp->do_auto_asconf = 0;
3986 	local_bh_enable();
3987 
3988 	return 0;
3989 }
3990 
3991 /* Cleanup any SCTP per socket resources.  */
3992 SCTP_STATIC void sctp_destroy_sock(struct sock *sk)
3993 {
3994 	struct sctp_sock *sp;
3995 
3996 	SCTP_DEBUG_PRINTK("sctp_destroy_sock(sk: %p)\n", sk);
3997 
3998 	/* Release our hold on the endpoint. */
3999 	sp = sctp_sk(sk);
4000 	if (sp->do_auto_asconf) {
4001 		sp->do_auto_asconf = 0;
4002 		list_del(&sp->auto_asconf_list);
4003 	}
4004 	sctp_endpoint_free(sp->ep);
4005 	local_bh_disable();
4006 	percpu_counter_dec(&sctp_sockets_allocated);
4007 	sock_prot_inuse_add(sock_net(sk), sk->sk_prot, -1);
4008 	local_bh_enable();
4009 }
4010 
4011 /* API 4.1.7 shutdown() - TCP Style Syntax
4012  *     int shutdown(int socket, int how);
4013  *
4014  *     sd      - the socket descriptor of the association to be closed.
4015  *     how     - Specifies the type of shutdown.  The  values  are
4016  *               as follows:
4017  *               SHUT_RD
4018  *                     Disables further receive operations. No SCTP
4019  *                     protocol action is taken.
4020  *               SHUT_WR
4021  *                     Disables further send operations, and initiates
4022  *                     the SCTP shutdown sequence.
4023  *               SHUT_RDWR
4024  *                     Disables further send  and  receive  operations
4025  *                     and initiates the SCTP shutdown sequence.
4026  */
4027 SCTP_STATIC void sctp_shutdown(struct sock *sk, int how)
4028 {
4029 	struct net *net = sock_net(sk);
4030 	struct sctp_endpoint *ep;
4031 	struct sctp_association *asoc;
4032 
4033 	if (!sctp_style(sk, TCP))
4034 		return;
4035 
4036 	if (how & SEND_SHUTDOWN) {
4037 		ep = sctp_sk(sk)->ep;
4038 		if (!list_empty(&ep->asocs)) {
4039 			asoc = list_entry(ep->asocs.next,
4040 					  struct sctp_association, asocs);
4041 			sctp_primitive_SHUTDOWN(net, asoc, NULL);
4042 		}
4043 	}
4044 }
4045 
4046 /* 7.2.1 Association Status (SCTP_STATUS)
4047 
4048  * Applications can retrieve current status information about an
4049  * association, including association state, peer receiver window size,
4050  * number of unacked data chunks, and number of data chunks pending
4051  * receipt.  This information is read-only.
4052  */
4053 static int sctp_getsockopt_sctp_status(struct sock *sk, int len,
4054 				       char __user *optval,
4055 				       int __user *optlen)
4056 {
4057 	struct sctp_status status;
4058 	struct sctp_association *asoc = NULL;
4059 	struct sctp_transport *transport;
4060 	sctp_assoc_t associd;
4061 	int retval = 0;
4062 
4063 	if (len < sizeof(status)) {
4064 		retval = -EINVAL;
4065 		goto out;
4066 	}
4067 
4068 	len = sizeof(status);
4069 	if (copy_from_user(&status, optval, len)) {
4070 		retval = -EFAULT;
4071 		goto out;
4072 	}
4073 
4074 	associd = status.sstat_assoc_id;
4075 	asoc = sctp_id2assoc(sk, associd);
4076 	if (!asoc) {
4077 		retval = -EINVAL;
4078 		goto out;
4079 	}
4080 
4081 	transport = asoc->peer.primary_path;
4082 
4083 	status.sstat_assoc_id = sctp_assoc2id(asoc);
4084 	status.sstat_state = asoc->state;
4085 	status.sstat_rwnd =  asoc->peer.rwnd;
4086 	status.sstat_unackdata = asoc->unack_data;
4087 
4088 	status.sstat_penddata = sctp_tsnmap_pending(&asoc->peer.tsn_map);
4089 	status.sstat_instrms = asoc->c.sinit_max_instreams;
4090 	status.sstat_outstrms = asoc->c.sinit_num_ostreams;
4091 	status.sstat_fragmentation_point = asoc->frag_point;
4092 	status.sstat_primary.spinfo_assoc_id = sctp_assoc2id(transport->asoc);
4093 	memcpy(&status.sstat_primary.spinfo_address, &transport->ipaddr,
4094 			transport->af_specific->sockaddr_len);
4095 	/* Map ipv4 address into v4-mapped-on-v6 address.  */
4096 	sctp_get_pf_specific(sk->sk_family)->addr_v4map(sctp_sk(sk),
4097 		(union sctp_addr *)&status.sstat_primary.spinfo_address);
4098 	status.sstat_primary.spinfo_state = transport->state;
4099 	status.sstat_primary.spinfo_cwnd = transport->cwnd;
4100 	status.sstat_primary.spinfo_srtt = transport->srtt;
4101 	status.sstat_primary.spinfo_rto = jiffies_to_msecs(transport->rto);
4102 	status.sstat_primary.spinfo_mtu = transport->pathmtu;
4103 
4104 	if (status.sstat_primary.spinfo_state == SCTP_UNKNOWN)
4105 		status.sstat_primary.spinfo_state = SCTP_ACTIVE;
4106 
4107 	if (put_user(len, optlen)) {
4108 		retval = -EFAULT;
4109 		goto out;
4110 	}
4111 
4112 	SCTP_DEBUG_PRINTK("sctp_getsockopt_sctp_status(%d): %d %d %d\n",
4113 			  len, status.sstat_state, status.sstat_rwnd,
4114 			  status.sstat_assoc_id);
4115 
4116 	if (copy_to_user(optval, &status, len)) {
4117 		retval = -EFAULT;
4118 		goto out;
4119 	}
4120 
4121 out:
4122 	return retval;
4123 }
4124 
4125 
4126 /* 7.2.2 Peer Address Information (SCTP_GET_PEER_ADDR_INFO)
4127  *
4128  * Applications can retrieve information about a specific peer address
4129  * of an association, including its reachability state, congestion
4130  * window, and retransmission timer values.  This information is
4131  * read-only.
4132  */
4133 static int sctp_getsockopt_peer_addr_info(struct sock *sk, int len,
4134 					  char __user *optval,
4135 					  int __user *optlen)
4136 {
4137 	struct sctp_paddrinfo pinfo;
4138 	struct sctp_transport *transport;
4139 	int retval = 0;
4140 
4141 	if (len < sizeof(pinfo)) {
4142 		retval = -EINVAL;
4143 		goto out;
4144 	}
4145 
4146 	len = sizeof(pinfo);
4147 	if (copy_from_user(&pinfo, optval, len)) {
4148 		retval = -EFAULT;
4149 		goto out;
4150 	}
4151 
4152 	transport = sctp_addr_id2transport(sk, &pinfo.spinfo_address,
4153 					   pinfo.spinfo_assoc_id);
4154 	if (!transport)
4155 		return -EINVAL;
4156 
4157 	pinfo.spinfo_assoc_id = sctp_assoc2id(transport->asoc);
4158 	pinfo.spinfo_state = transport->state;
4159 	pinfo.spinfo_cwnd = transport->cwnd;
4160 	pinfo.spinfo_srtt = transport->srtt;
4161 	pinfo.spinfo_rto = jiffies_to_msecs(transport->rto);
4162 	pinfo.spinfo_mtu = transport->pathmtu;
4163 
4164 	if (pinfo.spinfo_state == SCTP_UNKNOWN)
4165 		pinfo.spinfo_state = SCTP_ACTIVE;
4166 
4167 	if (put_user(len, optlen)) {
4168 		retval = -EFAULT;
4169 		goto out;
4170 	}
4171 
4172 	if (copy_to_user(optval, &pinfo, len)) {
4173 		retval = -EFAULT;
4174 		goto out;
4175 	}
4176 
4177 out:
4178 	return retval;
4179 }
4180 
4181 /* 7.1.12 Enable/Disable message fragmentation (SCTP_DISABLE_FRAGMENTS)
4182  *
4183  * This option is a on/off flag.  If enabled no SCTP message
4184  * fragmentation will be performed.  Instead if a message being sent
4185  * exceeds the current PMTU size, the message will NOT be sent and
4186  * instead a error will be indicated to the user.
4187  */
4188 static int sctp_getsockopt_disable_fragments(struct sock *sk, int len,
4189 					char __user *optval, int __user *optlen)
4190 {
4191 	int val;
4192 
4193 	if (len < sizeof(int))
4194 		return -EINVAL;
4195 
4196 	len = sizeof(int);
4197 	val = (sctp_sk(sk)->disable_fragments == 1);
4198 	if (put_user(len, optlen))
4199 		return -EFAULT;
4200 	if (copy_to_user(optval, &val, len))
4201 		return -EFAULT;
4202 	return 0;
4203 }
4204 
4205 /* 7.1.15 Set notification and ancillary events (SCTP_EVENTS)
4206  *
4207  * This socket option is used to specify various notifications and
4208  * ancillary data the user wishes to receive.
4209  */
4210 static int sctp_getsockopt_events(struct sock *sk, int len, char __user *optval,
4211 				  int __user *optlen)
4212 {
4213 	if (len <= 0)
4214 		return -EINVAL;
4215 	if (len > sizeof(struct sctp_event_subscribe))
4216 		len = sizeof(struct sctp_event_subscribe);
4217 	if (put_user(len, optlen))
4218 		return -EFAULT;
4219 	if (copy_to_user(optval, &sctp_sk(sk)->subscribe, len))
4220 		return -EFAULT;
4221 	return 0;
4222 }
4223 
4224 /* 7.1.8 Automatic Close of associations (SCTP_AUTOCLOSE)
4225  *
4226  * This socket option is applicable to the UDP-style socket only.  When
4227  * set it will cause associations that are idle for more than the
4228  * specified number of seconds to automatically close.  An association
4229  * being idle is defined an association that has NOT sent or received
4230  * user data.  The special value of '0' indicates that no automatic
4231  * close of any associations should be performed.  The option expects an
4232  * integer defining the number of seconds of idle time before an
4233  * association is closed.
4234  */
4235 static int sctp_getsockopt_autoclose(struct sock *sk, int len, char __user *optval, int __user *optlen)
4236 {
4237 	/* Applicable to UDP-style socket only */
4238 	if (sctp_style(sk, TCP))
4239 		return -EOPNOTSUPP;
4240 	if (len < sizeof(int))
4241 		return -EINVAL;
4242 	len = sizeof(int);
4243 	if (put_user(len, optlen))
4244 		return -EFAULT;
4245 	if (copy_to_user(optval, &sctp_sk(sk)->autoclose, sizeof(int)))
4246 		return -EFAULT;
4247 	return 0;
4248 }
4249 
4250 /* Helper routine to branch off an association to a new socket.  */
4251 int sctp_do_peeloff(struct sock *sk, sctp_assoc_t id, struct socket **sockp)
4252 {
4253 	struct sctp_association *asoc = sctp_id2assoc(sk, id);
4254 	struct socket *sock;
4255 	struct sctp_af *af;
4256 	int err = 0;
4257 
4258 	if (!asoc)
4259 		return -EINVAL;
4260 
4261 	/* An association cannot be branched off from an already peeled-off
4262 	 * socket, nor is this supported for tcp style sockets.
4263 	 */
4264 	if (!sctp_style(sk, UDP))
4265 		return -EINVAL;
4266 
4267 	/* Create a new socket.  */
4268 	err = sock_create(sk->sk_family, SOCK_SEQPACKET, IPPROTO_SCTP, &sock);
4269 	if (err < 0)
4270 		return err;
4271 
4272 	sctp_copy_sock(sock->sk, sk, asoc);
4273 
4274 	/* Make peeled-off sockets more like 1-1 accepted sockets.
4275 	 * Set the daddr and initialize id to something more random
4276 	 */
4277 	af = sctp_get_af_specific(asoc->peer.primary_addr.sa.sa_family);
4278 	af->to_sk_daddr(&asoc->peer.primary_addr, sk);
4279 
4280 	/* Populate the fields of the newsk from the oldsk and migrate the
4281 	 * asoc to the newsk.
4282 	 */
4283 	sctp_sock_migrate(sk, sock->sk, asoc, SCTP_SOCKET_UDP_HIGH_BANDWIDTH);
4284 
4285 	*sockp = sock;
4286 
4287 	return err;
4288 }
4289 EXPORT_SYMBOL(sctp_do_peeloff);
4290 
4291 static int sctp_getsockopt_peeloff(struct sock *sk, int len, char __user *optval, int __user *optlen)
4292 {
4293 	sctp_peeloff_arg_t peeloff;
4294 	struct socket *newsock;
4295 	int retval = 0;
4296 
4297 	if (len < sizeof(sctp_peeloff_arg_t))
4298 		return -EINVAL;
4299 	len = sizeof(sctp_peeloff_arg_t);
4300 	if (copy_from_user(&peeloff, optval, len))
4301 		return -EFAULT;
4302 
4303 	retval = sctp_do_peeloff(sk, peeloff.associd, &newsock);
4304 	if (retval < 0)
4305 		goto out;
4306 
4307 	/* Map the socket to an unused fd that can be returned to the user.  */
4308 	retval = sock_map_fd(newsock, 0);
4309 	if (retval < 0) {
4310 		sock_release(newsock);
4311 		goto out;
4312 	}
4313 
4314 	SCTP_DEBUG_PRINTK("%s: sk: %p newsk: %p sd: %d\n",
4315 			  __func__, sk, newsock->sk, retval);
4316 
4317 	/* Return the fd mapped to the new socket.  */
4318 	peeloff.sd = retval;
4319 	if (put_user(len, optlen))
4320 		return -EFAULT;
4321 	if (copy_to_user(optval, &peeloff, len))
4322 		retval = -EFAULT;
4323 
4324 out:
4325 	return retval;
4326 }
4327 
4328 /* 7.1.13 Peer Address Parameters (SCTP_PEER_ADDR_PARAMS)
4329  *
4330  * Applications can enable or disable heartbeats for any peer address of
4331  * an association, modify an address's heartbeat interval, force a
4332  * heartbeat to be sent immediately, and adjust the address's maximum
4333  * number of retransmissions sent before an address is considered
4334  * unreachable.  The following structure is used to access and modify an
4335  * address's parameters:
4336  *
4337  *  struct sctp_paddrparams {
4338  *     sctp_assoc_t            spp_assoc_id;
4339  *     struct sockaddr_storage spp_address;
4340  *     uint32_t                spp_hbinterval;
4341  *     uint16_t                spp_pathmaxrxt;
4342  *     uint32_t                spp_pathmtu;
4343  *     uint32_t                spp_sackdelay;
4344  *     uint32_t                spp_flags;
4345  * };
4346  *
4347  *   spp_assoc_id    - (one-to-many style socket) This is filled in the
4348  *                     application, and identifies the association for
4349  *                     this query.
4350  *   spp_address     - This specifies which address is of interest.
4351  *   spp_hbinterval  - This contains the value of the heartbeat interval,
4352  *                     in milliseconds.  If a  value of zero
4353  *                     is present in this field then no changes are to
4354  *                     be made to this parameter.
4355  *   spp_pathmaxrxt  - This contains the maximum number of
4356  *                     retransmissions before this address shall be
4357  *                     considered unreachable. If a  value of zero
4358  *                     is present in this field then no changes are to
4359  *                     be made to this parameter.
4360  *   spp_pathmtu     - When Path MTU discovery is disabled the value
4361  *                     specified here will be the "fixed" path mtu.
4362  *                     Note that if the spp_address field is empty
4363  *                     then all associations on this address will
4364  *                     have this fixed path mtu set upon them.
4365  *
4366  *   spp_sackdelay   - When delayed sack is enabled, this value specifies
4367  *                     the number of milliseconds that sacks will be delayed
4368  *                     for. This value will apply to all addresses of an
4369  *                     association if the spp_address field is empty. Note
4370  *                     also, that if delayed sack is enabled and this
4371  *                     value is set to 0, no change is made to the last
4372  *                     recorded delayed sack timer value.
4373  *
4374  *   spp_flags       - These flags are used to control various features
4375  *                     on an association. The flag field may contain
4376  *                     zero or more of the following options.
4377  *
4378  *                     SPP_HB_ENABLE  - Enable heartbeats on the
4379  *                     specified address. Note that if the address
4380  *                     field is empty all addresses for the association
4381  *                     have heartbeats enabled upon them.
4382  *
4383  *                     SPP_HB_DISABLE - Disable heartbeats on the
4384  *                     speicifed address. Note that if the address
4385  *                     field is empty all addresses for the association
4386  *                     will have their heartbeats disabled. Note also
4387  *                     that SPP_HB_ENABLE and SPP_HB_DISABLE are
4388  *                     mutually exclusive, only one of these two should
4389  *                     be specified. Enabling both fields will have
4390  *                     undetermined results.
4391  *
4392  *                     SPP_HB_DEMAND - Request a user initiated heartbeat
4393  *                     to be made immediately.
4394  *
4395  *                     SPP_PMTUD_ENABLE - This field will enable PMTU
4396  *                     discovery upon the specified address. Note that
4397  *                     if the address feild is empty then all addresses
4398  *                     on the association are effected.
4399  *
4400  *                     SPP_PMTUD_DISABLE - This field will disable PMTU
4401  *                     discovery upon the specified address. Note that
4402  *                     if the address feild is empty then all addresses
4403  *                     on the association are effected. Not also that
4404  *                     SPP_PMTUD_ENABLE and SPP_PMTUD_DISABLE are mutually
4405  *                     exclusive. Enabling both will have undetermined
4406  *                     results.
4407  *
4408  *                     SPP_SACKDELAY_ENABLE - Setting this flag turns
4409  *                     on delayed sack. The time specified in spp_sackdelay
4410  *                     is used to specify the sack delay for this address. Note
4411  *                     that if spp_address is empty then all addresses will
4412  *                     enable delayed sack and take on the sack delay
4413  *                     value specified in spp_sackdelay.
4414  *                     SPP_SACKDELAY_DISABLE - Setting this flag turns
4415  *                     off delayed sack. If the spp_address field is blank then
4416  *                     delayed sack is disabled for the entire association. Note
4417  *                     also that this field is mutually exclusive to
4418  *                     SPP_SACKDELAY_ENABLE, setting both will have undefined
4419  *                     results.
4420  */
4421 static int sctp_getsockopt_peer_addr_params(struct sock *sk, int len,
4422 					    char __user *optval, int __user *optlen)
4423 {
4424 	struct sctp_paddrparams  params;
4425 	struct sctp_transport   *trans = NULL;
4426 	struct sctp_association *asoc = NULL;
4427 	struct sctp_sock        *sp = sctp_sk(sk);
4428 
4429 	if (len < sizeof(struct sctp_paddrparams))
4430 		return -EINVAL;
4431 	len = sizeof(struct sctp_paddrparams);
4432 	if (copy_from_user(&params, optval, len))
4433 		return -EFAULT;
4434 
4435 	/* If an address other than INADDR_ANY is specified, and
4436 	 * no transport is found, then the request is invalid.
4437 	 */
4438 	if (!sctp_is_any(sk, ( union sctp_addr *)&params.spp_address)) {
4439 		trans = sctp_addr_id2transport(sk, &params.spp_address,
4440 					       params.spp_assoc_id);
4441 		if (!trans) {
4442 			SCTP_DEBUG_PRINTK("Failed no transport\n");
4443 			return -EINVAL;
4444 		}
4445 	}
4446 
4447 	/* Get association, if assoc_id != 0 and the socket is a one
4448 	 * to many style socket, and an association was not found, then
4449 	 * the id was invalid.
4450 	 */
4451 	asoc = sctp_id2assoc(sk, params.spp_assoc_id);
4452 	if (!asoc && params.spp_assoc_id && sctp_style(sk, UDP)) {
4453 		SCTP_DEBUG_PRINTK("Failed no association\n");
4454 		return -EINVAL;
4455 	}
4456 
4457 	if (trans) {
4458 		/* Fetch transport values. */
4459 		params.spp_hbinterval = jiffies_to_msecs(trans->hbinterval);
4460 		params.spp_pathmtu    = trans->pathmtu;
4461 		params.spp_pathmaxrxt = trans->pathmaxrxt;
4462 		params.spp_sackdelay  = jiffies_to_msecs(trans->sackdelay);
4463 
4464 		/*draft-11 doesn't say what to return in spp_flags*/
4465 		params.spp_flags      = trans->param_flags;
4466 	} else if (asoc) {
4467 		/* Fetch association values. */
4468 		params.spp_hbinterval = jiffies_to_msecs(asoc->hbinterval);
4469 		params.spp_pathmtu    = asoc->pathmtu;
4470 		params.spp_pathmaxrxt = asoc->pathmaxrxt;
4471 		params.spp_sackdelay  = jiffies_to_msecs(asoc->sackdelay);
4472 
4473 		/*draft-11 doesn't say what to return in spp_flags*/
4474 		params.spp_flags      = asoc->param_flags;
4475 	} else {
4476 		/* Fetch socket values. */
4477 		params.spp_hbinterval = sp->hbinterval;
4478 		params.spp_pathmtu    = sp->pathmtu;
4479 		params.spp_sackdelay  = sp->sackdelay;
4480 		params.spp_pathmaxrxt = sp->pathmaxrxt;
4481 
4482 		/*draft-11 doesn't say what to return in spp_flags*/
4483 		params.spp_flags      = sp->param_flags;
4484 	}
4485 
4486 	if (copy_to_user(optval, &params, len))
4487 		return -EFAULT;
4488 
4489 	if (put_user(len, optlen))
4490 		return -EFAULT;
4491 
4492 	return 0;
4493 }
4494 
4495 /*
4496  * 7.1.23.  Get or set delayed ack timer (SCTP_DELAYED_SACK)
4497  *
4498  * This option will effect the way delayed acks are performed.  This
4499  * option allows you to get or set the delayed ack time, in
4500  * milliseconds.  It also allows changing the delayed ack frequency.
4501  * Changing the frequency to 1 disables the delayed sack algorithm.  If
4502  * the assoc_id is 0, then this sets or gets the endpoints default
4503  * values.  If the assoc_id field is non-zero, then the set or get
4504  * effects the specified association for the one to many model (the
4505  * assoc_id field is ignored by the one to one model).  Note that if
4506  * sack_delay or sack_freq are 0 when setting this option, then the
4507  * current values will remain unchanged.
4508  *
4509  * struct sctp_sack_info {
4510  *     sctp_assoc_t            sack_assoc_id;
4511  *     uint32_t                sack_delay;
4512  *     uint32_t                sack_freq;
4513  * };
4514  *
4515  * sack_assoc_id -  This parameter, indicates which association the user
4516  *    is performing an action upon.  Note that if this field's value is
4517  *    zero then the endpoints default value is changed (effecting future
4518  *    associations only).
4519  *
4520  * sack_delay -  This parameter contains the number of milliseconds that
4521  *    the user is requesting the delayed ACK timer be set to.  Note that
4522  *    this value is defined in the standard to be between 200 and 500
4523  *    milliseconds.
4524  *
4525  * sack_freq -  This parameter contains the number of packets that must
4526  *    be received before a sack is sent without waiting for the delay
4527  *    timer to expire.  The default value for this is 2, setting this
4528  *    value to 1 will disable the delayed sack algorithm.
4529  */
4530 static int sctp_getsockopt_delayed_ack(struct sock *sk, int len,
4531 					    char __user *optval,
4532 					    int __user *optlen)
4533 {
4534 	struct sctp_sack_info    params;
4535 	struct sctp_association *asoc = NULL;
4536 	struct sctp_sock        *sp = sctp_sk(sk);
4537 
4538 	if (len >= sizeof(struct sctp_sack_info)) {
4539 		len = sizeof(struct sctp_sack_info);
4540 
4541 		if (copy_from_user(&params, optval, len))
4542 			return -EFAULT;
4543 	} else if (len == sizeof(struct sctp_assoc_value)) {
4544 		pr_warn("Use of struct sctp_assoc_value in delayed_ack socket option deprecated\n");
4545 		pr_warn("Use struct sctp_sack_info instead\n");
4546 		if (copy_from_user(&params, optval, len))
4547 			return -EFAULT;
4548 	} else
4549 		return - EINVAL;
4550 
4551 	/* Get association, if sack_assoc_id != 0 and the socket is a one
4552 	 * to many style socket, and an association was not found, then
4553 	 * the id was invalid.
4554 	 */
4555 	asoc = sctp_id2assoc(sk, params.sack_assoc_id);
4556 	if (!asoc && params.sack_assoc_id && sctp_style(sk, UDP))
4557 		return -EINVAL;
4558 
4559 	if (asoc) {
4560 		/* Fetch association values. */
4561 		if (asoc->param_flags & SPP_SACKDELAY_ENABLE) {
4562 			params.sack_delay = jiffies_to_msecs(
4563 				asoc->sackdelay);
4564 			params.sack_freq = asoc->sackfreq;
4565 
4566 		} else {
4567 			params.sack_delay = 0;
4568 			params.sack_freq = 1;
4569 		}
4570 	} else {
4571 		/* Fetch socket values. */
4572 		if (sp->param_flags & SPP_SACKDELAY_ENABLE) {
4573 			params.sack_delay  = sp->sackdelay;
4574 			params.sack_freq = sp->sackfreq;
4575 		} else {
4576 			params.sack_delay  = 0;
4577 			params.sack_freq = 1;
4578 		}
4579 	}
4580 
4581 	if (copy_to_user(optval, &params, len))
4582 		return -EFAULT;
4583 
4584 	if (put_user(len, optlen))
4585 		return -EFAULT;
4586 
4587 	return 0;
4588 }
4589 
4590 /* 7.1.3 Initialization Parameters (SCTP_INITMSG)
4591  *
4592  * Applications can specify protocol parameters for the default association
4593  * initialization.  The option name argument to setsockopt() and getsockopt()
4594  * is SCTP_INITMSG.
4595  *
4596  * Setting initialization parameters is effective only on an unconnected
4597  * socket (for UDP-style sockets only future associations are effected
4598  * by the change).  With TCP-style sockets, this option is inherited by
4599  * sockets derived from a listener socket.
4600  */
4601 static int sctp_getsockopt_initmsg(struct sock *sk, int len, char __user *optval, int __user *optlen)
4602 {
4603 	if (len < sizeof(struct sctp_initmsg))
4604 		return -EINVAL;
4605 	len = sizeof(struct sctp_initmsg);
4606 	if (put_user(len, optlen))
4607 		return -EFAULT;
4608 	if (copy_to_user(optval, &sctp_sk(sk)->initmsg, len))
4609 		return -EFAULT;
4610 	return 0;
4611 }
4612 
4613 
4614 static int sctp_getsockopt_peer_addrs(struct sock *sk, int len,
4615 				      char __user *optval, int __user *optlen)
4616 {
4617 	struct sctp_association *asoc;
4618 	int cnt = 0;
4619 	struct sctp_getaddrs getaddrs;
4620 	struct sctp_transport *from;
4621 	void __user *to;
4622 	union sctp_addr temp;
4623 	struct sctp_sock *sp = sctp_sk(sk);
4624 	int addrlen;
4625 	size_t space_left;
4626 	int bytes_copied;
4627 
4628 	if (len < sizeof(struct sctp_getaddrs))
4629 		return -EINVAL;
4630 
4631 	if (copy_from_user(&getaddrs, optval, sizeof(struct sctp_getaddrs)))
4632 		return -EFAULT;
4633 
4634 	/* For UDP-style sockets, id specifies the association to query.  */
4635 	asoc = sctp_id2assoc(sk, getaddrs.assoc_id);
4636 	if (!asoc)
4637 		return -EINVAL;
4638 
4639 	to = optval + offsetof(struct sctp_getaddrs,addrs);
4640 	space_left = len - offsetof(struct sctp_getaddrs,addrs);
4641 
4642 	list_for_each_entry(from, &asoc->peer.transport_addr_list,
4643 				transports) {
4644 		memcpy(&temp, &from->ipaddr, sizeof(temp));
4645 		sctp_get_pf_specific(sk->sk_family)->addr_v4map(sp, &temp);
4646 		addrlen = sctp_get_af_specific(temp.sa.sa_family)->sockaddr_len;
4647 		if (space_left < addrlen)
4648 			return -ENOMEM;
4649 		if (copy_to_user(to, &temp, addrlen))
4650 			return -EFAULT;
4651 		to += addrlen;
4652 		cnt++;
4653 		space_left -= addrlen;
4654 	}
4655 
4656 	if (put_user(cnt, &((struct sctp_getaddrs __user *)optval)->addr_num))
4657 		return -EFAULT;
4658 	bytes_copied = ((char __user *)to) - optval;
4659 	if (put_user(bytes_copied, optlen))
4660 		return -EFAULT;
4661 
4662 	return 0;
4663 }
4664 
4665 static int sctp_copy_laddrs(struct sock *sk, __u16 port, void *to,
4666 			    size_t space_left, int *bytes_copied)
4667 {
4668 	struct sctp_sockaddr_entry *addr;
4669 	union sctp_addr temp;
4670 	int cnt = 0;
4671 	int addrlen;
4672 	struct net *net = sock_net(sk);
4673 
4674 	rcu_read_lock();
4675 	list_for_each_entry_rcu(addr, &net->sctp.local_addr_list, list) {
4676 		if (!addr->valid)
4677 			continue;
4678 
4679 		if ((PF_INET == sk->sk_family) &&
4680 		    (AF_INET6 == addr->a.sa.sa_family))
4681 			continue;
4682 		if ((PF_INET6 == sk->sk_family) &&
4683 		    inet_v6_ipv6only(sk) &&
4684 		    (AF_INET == addr->a.sa.sa_family))
4685 			continue;
4686 		memcpy(&temp, &addr->a, sizeof(temp));
4687 		if (!temp.v4.sin_port)
4688 			temp.v4.sin_port = htons(port);
4689 
4690 		sctp_get_pf_specific(sk->sk_family)->addr_v4map(sctp_sk(sk),
4691 								&temp);
4692 		addrlen = sctp_get_af_specific(temp.sa.sa_family)->sockaddr_len;
4693 		if (space_left < addrlen) {
4694 			cnt =  -ENOMEM;
4695 			break;
4696 		}
4697 		memcpy(to, &temp, addrlen);
4698 
4699 		to += addrlen;
4700 		cnt ++;
4701 		space_left -= addrlen;
4702 		*bytes_copied += addrlen;
4703 	}
4704 	rcu_read_unlock();
4705 
4706 	return cnt;
4707 }
4708 
4709 
4710 static int sctp_getsockopt_local_addrs(struct sock *sk, int len,
4711 				       char __user *optval, int __user *optlen)
4712 {
4713 	struct sctp_bind_addr *bp;
4714 	struct sctp_association *asoc;
4715 	int cnt = 0;
4716 	struct sctp_getaddrs getaddrs;
4717 	struct sctp_sockaddr_entry *addr;
4718 	void __user *to;
4719 	union sctp_addr temp;
4720 	struct sctp_sock *sp = sctp_sk(sk);
4721 	int addrlen;
4722 	int err = 0;
4723 	size_t space_left;
4724 	int bytes_copied = 0;
4725 	void *addrs;
4726 	void *buf;
4727 
4728 	if (len < sizeof(struct sctp_getaddrs))
4729 		return -EINVAL;
4730 
4731 	if (copy_from_user(&getaddrs, optval, sizeof(struct sctp_getaddrs)))
4732 		return -EFAULT;
4733 
4734 	/*
4735 	 *  For UDP-style sockets, id specifies the association to query.
4736 	 *  If the id field is set to the value '0' then the locally bound
4737 	 *  addresses are returned without regard to any particular
4738 	 *  association.
4739 	 */
4740 	if (0 == getaddrs.assoc_id) {
4741 		bp = &sctp_sk(sk)->ep->base.bind_addr;
4742 	} else {
4743 		asoc = sctp_id2assoc(sk, getaddrs.assoc_id);
4744 		if (!asoc)
4745 			return -EINVAL;
4746 		bp = &asoc->base.bind_addr;
4747 	}
4748 
4749 	to = optval + offsetof(struct sctp_getaddrs,addrs);
4750 	space_left = len - offsetof(struct sctp_getaddrs,addrs);
4751 
4752 	addrs = kmalloc(space_left, GFP_KERNEL);
4753 	if (!addrs)
4754 		return -ENOMEM;
4755 
4756 	/* If the endpoint is bound to 0.0.0.0 or ::0, get the valid
4757 	 * addresses from the global local address list.
4758 	 */
4759 	if (sctp_list_single_entry(&bp->address_list)) {
4760 		addr = list_entry(bp->address_list.next,
4761 				  struct sctp_sockaddr_entry, list);
4762 		if (sctp_is_any(sk, &addr->a)) {
4763 			cnt = sctp_copy_laddrs(sk, bp->port, addrs,
4764 						space_left, &bytes_copied);
4765 			if (cnt < 0) {
4766 				err = cnt;
4767 				goto out;
4768 			}
4769 			goto copy_getaddrs;
4770 		}
4771 	}
4772 
4773 	buf = addrs;
4774 	/* Protection on the bound address list is not needed since
4775 	 * in the socket option context we hold a socket lock and
4776 	 * thus the bound address list can't change.
4777 	 */
4778 	list_for_each_entry(addr, &bp->address_list, list) {
4779 		memcpy(&temp, &addr->a, sizeof(temp));
4780 		sctp_get_pf_specific(sk->sk_family)->addr_v4map(sp, &temp);
4781 		addrlen = sctp_get_af_specific(temp.sa.sa_family)->sockaddr_len;
4782 		if (space_left < addrlen) {
4783 			err =  -ENOMEM; /*fixme: right error?*/
4784 			goto out;
4785 		}
4786 		memcpy(buf, &temp, addrlen);
4787 		buf += addrlen;
4788 		bytes_copied += addrlen;
4789 		cnt ++;
4790 		space_left -= addrlen;
4791 	}
4792 
4793 copy_getaddrs:
4794 	if (copy_to_user(to, addrs, bytes_copied)) {
4795 		err = -EFAULT;
4796 		goto out;
4797 	}
4798 	if (put_user(cnt, &((struct sctp_getaddrs __user *)optval)->addr_num)) {
4799 		err = -EFAULT;
4800 		goto out;
4801 	}
4802 	if (put_user(bytes_copied, optlen))
4803 		err = -EFAULT;
4804 out:
4805 	kfree(addrs);
4806 	return err;
4807 }
4808 
4809 /* 7.1.10 Set Primary Address (SCTP_PRIMARY_ADDR)
4810  *
4811  * Requests that the local SCTP stack use the enclosed peer address as
4812  * the association primary.  The enclosed address must be one of the
4813  * association peer's addresses.
4814  */
4815 static int sctp_getsockopt_primary_addr(struct sock *sk, int len,
4816 					char __user *optval, int __user *optlen)
4817 {
4818 	struct sctp_prim prim;
4819 	struct sctp_association *asoc;
4820 	struct sctp_sock *sp = sctp_sk(sk);
4821 
4822 	if (len < sizeof(struct sctp_prim))
4823 		return -EINVAL;
4824 
4825 	len = sizeof(struct sctp_prim);
4826 
4827 	if (copy_from_user(&prim, optval, len))
4828 		return -EFAULT;
4829 
4830 	asoc = sctp_id2assoc(sk, prim.ssp_assoc_id);
4831 	if (!asoc)
4832 		return -EINVAL;
4833 
4834 	if (!asoc->peer.primary_path)
4835 		return -ENOTCONN;
4836 
4837 	memcpy(&prim.ssp_addr, &asoc->peer.primary_path->ipaddr,
4838 		asoc->peer.primary_path->af_specific->sockaddr_len);
4839 
4840 	sctp_get_pf_specific(sk->sk_family)->addr_v4map(sp,
4841 			(union sctp_addr *)&prim.ssp_addr);
4842 
4843 	if (put_user(len, optlen))
4844 		return -EFAULT;
4845 	if (copy_to_user(optval, &prim, len))
4846 		return -EFAULT;
4847 
4848 	return 0;
4849 }
4850 
4851 /*
4852  * 7.1.11  Set Adaptation Layer Indicator (SCTP_ADAPTATION_LAYER)
4853  *
4854  * Requests that the local endpoint set the specified Adaptation Layer
4855  * Indication parameter for all future INIT and INIT-ACK exchanges.
4856  */
4857 static int sctp_getsockopt_adaptation_layer(struct sock *sk, int len,
4858 				  char __user *optval, int __user *optlen)
4859 {
4860 	struct sctp_setadaptation adaptation;
4861 
4862 	if (len < sizeof(struct sctp_setadaptation))
4863 		return -EINVAL;
4864 
4865 	len = sizeof(struct sctp_setadaptation);
4866 
4867 	adaptation.ssb_adaptation_ind = sctp_sk(sk)->adaptation_ind;
4868 
4869 	if (put_user(len, optlen))
4870 		return -EFAULT;
4871 	if (copy_to_user(optval, &adaptation, len))
4872 		return -EFAULT;
4873 
4874 	return 0;
4875 }
4876 
4877 /*
4878  *
4879  * 7.1.14 Set default send parameters (SCTP_DEFAULT_SEND_PARAM)
4880  *
4881  *   Applications that wish to use the sendto() system call may wish to
4882  *   specify a default set of parameters that would normally be supplied
4883  *   through the inclusion of ancillary data.  This socket option allows
4884  *   such an application to set the default sctp_sndrcvinfo structure.
4885 
4886 
4887  *   The application that wishes to use this socket option simply passes
4888  *   in to this call the sctp_sndrcvinfo structure defined in Section
4889  *   5.2.2) The input parameters accepted by this call include
4890  *   sinfo_stream, sinfo_flags, sinfo_ppid, sinfo_context,
4891  *   sinfo_timetolive.  The user must provide the sinfo_assoc_id field in
4892  *   to this call if the caller is using the UDP model.
4893  *
4894  *   For getsockopt, it get the default sctp_sndrcvinfo structure.
4895  */
4896 static int sctp_getsockopt_default_send_param(struct sock *sk,
4897 					int len, char __user *optval,
4898 					int __user *optlen)
4899 {
4900 	struct sctp_sndrcvinfo info;
4901 	struct sctp_association *asoc;
4902 	struct sctp_sock *sp = sctp_sk(sk);
4903 
4904 	if (len < sizeof(struct sctp_sndrcvinfo))
4905 		return -EINVAL;
4906 
4907 	len = sizeof(struct sctp_sndrcvinfo);
4908 
4909 	if (copy_from_user(&info, optval, len))
4910 		return -EFAULT;
4911 
4912 	asoc = sctp_id2assoc(sk, info.sinfo_assoc_id);
4913 	if (!asoc && info.sinfo_assoc_id && sctp_style(sk, UDP))
4914 		return -EINVAL;
4915 
4916 	if (asoc) {
4917 		info.sinfo_stream = asoc->default_stream;
4918 		info.sinfo_flags = asoc->default_flags;
4919 		info.sinfo_ppid = asoc->default_ppid;
4920 		info.sinfo_context = asoc->default_context;
4921 		info.sinfo_timetolive = asoc->default_timetolive;
4922 	} else {
4923 		info.sinfo_stream = sp->default_stream;
4924 		info.sinfo_flags = sp->default_flags;
4925 		info.sinfo_ppid = sp->default_ppid;
4926 		info.sinfo_context = sp->default_context;
4927 		info.sinfo_timetolive = sp->default_timetolive;
4928 	}
4929 
4930 	if (put_user(len, optlen))
4931 		return -EFAULT;
4932 	if (copy_to_user(optval, &info, len))
4933 		return -EFAULT;
4934 
4935 	return 0;
4936 }
4937 
4938 /*
4939  *
4940  * 7.1.5 SCTP_NODELAY
4941  *
4942  * Turn on/off any Nagle-like algorithm.  This means that packets are
4943  * generally sent as soon as possible and no unnecessary delays are
4944  * introduced, at the cost of more packets in the network.  Expects an
4945  * integer boolean flag.
4946  */
4947 
4948 static int sctp_getsockopt_nodelay(struct sock *sk, int len,
4949 				   char __user *optval, int __user *optlen)
4950 {
4951 	int val;
4952 
4953 	if (len < sizeof(int))
4954 		return -EINVAL;
4955 
4956 	len = sizeof(int);
4957 	val = (sctp_sk(sk)->nodelay == 1);
4958 	if (put_user(len, optlen))
4959 		return -EFAULT;
4960 	if (copy_to_user(optval, &val, len))
4961 		return -EFAULT;
4962 	return 0;
4963 }
4964 
4965 /*
4966  *
4967  * 7.1.1 SCTP_RTOINFO
4968  *
4969  * The protocol parameters used to initialize and bound retransmission
4970  * timeout (RTO) are tunable. sctp_rtoinfo structure is used to access
4971  * and modify these parameters.
4972  * All parameters are time values, in milliseconds.  A value of 0, when
4973  * modifying the parameters, indicates that the current value should not
4974  * be changed.
4975  *
4976  */
4977 static int sctp_getsockopt_rtoinfo(struct sock *sk, int len,
4978 				char __user *optval,
4979 				int __user *optlen) {
4980 	struct sctp_rtoinfo rtoinfo;
4981 	struct sctp_association *asoc;
4982 
4983 	if (len < sizeof (struct sctp_rtoinfo))
4984 		return -EINVAL;
4985 
4986 	len = sizeof(struct sctp_rtoinfo);
4987 
4988 	if (copy_from_user(&rtoinfo, optval, len))
4989 		return -EFAULT;
4990 
4991 	asoc = sctp_id2assoc(sk, rtoinfo.srto_assoc_id);
4992 
4993 	if (!asoc && rtoinfo.srto_assoc_id && sctp_style(sk, UDP))
4994 		return -EINVAL;
4995 
4996 	/* Values corresponding to the specific association. */
4997 	if (asoc) {
4998 		rtoinfo.srto_initial = jiffies_to_msecs(asoc->rto_initial);
4999 		rtoinfo.srto_max = jiffies_to_msecs(asoc->rto_max);
5000 		rtoinfo.srto_min = jiffies_to_msecs(asoc->rto_min);
5001 	} else {
5002 		/* Values corresponding to the endpoint. */
5003 		struct sctp_sock *sp = sctp_sk(sk);
5004 
5005 		rtoinfo.srto_initial = sp->rtoinfo.srto_initial;
5006 		rtoinfo.srto_max = sp->rtoinfo.srto_max;
5007 		rtoinfo.srto_min = sp->rtoinfo.srto_min;
5008 	}
5009 
5010 	if (put_user(len, optlen))
5011 		return -EFAULT;
5012 
5013 	if (copy_to_user(optval, &rtoinfo, len))
5014 		return -EFAULT;
5015 
5016 	return 0;
5017 }
5018 
5019 /*
5020  *
5021  * 7.1.2 SCTP_ASSOCINFO
5022  *
5023  * This option is used to tune the maximum retransmission attempts
5024  * of the association.
5025  * Returns an error if the new association retransmission value is
5026  * greater than the sum of the retransmission value  of the peer.
5027  * See [SCTP] for more information.
5028  *
5029  */
5030 static int sctp_getsockopt_associnfo(struct sock *sk, int len,
5031 				     char __user *optval,
5032 				     int __user *optlen)
5033 {
5034 
5035 	struct sctp_assocparams assocparams;
5036 	struct sctp_association *asoc;
5037 	struct list_head *pos;
5038 	int cnt = 0;
5039 
5040 	if (len < sizeof (struct sctp_assocparams))
5041 		return -EINVAL;
5042 
5043 	len = sizeof(struct sctp_assocparams);
5044 
5045 	if (copy_from_user(&assocparams, optval, len))
5046 		return -EFAULT;
5047 
5048 	asoc = sctp_id2assoc(sk, assocparams.sasoc_assoc_id);
5049 
5050 	if (!asoc && assocparams.sasoc_assoc_id && sctp_style(sk, UDP))
5051 		return -EINVAL;
5052 
5053 	/* Values correspoinding to the specific association */
5054 	if (asoc) {
5055 		assocparams.sasoc_asocmaxrxt = asoc->max_retrans;
5056 		assocparams.sasoc_peer_rwnd = asoc->peer.rwnd;
5057 		assocparams.sasoc_local_rwnd = asoc->a_rwnd;
5058 		assocparams.sasoc_cookie_life = (asoc->cookie_life.tv_sec
5059 						* 1000) +
5060 						(asoc->cookie_life.tv_usec
5061 						/ 1000);
5062 
5063 		list_for_each(pos, &asoc->peer.transport_addr_list) {
5064 			cnt ++;
5065 		}
5066 
5067 		assocparams.sasoc_number_peer_destinations = cnt;
5068 	} else {
5069 		/* Values corresponding to the endpoint */
5070 		struct sctp_sock *sp = sctp_sk(sk);
5071 
5072 		assocparams.sasoc_asocmaxrxt = sp->assocparams.sasoc_asocmaxrxt;
5073 		assocparams.sasoc_peer_rwnd = sp->assocparams.sasoc_peer_rwnd;
5074 		assocparams.sasoc_local_rwnd = sp->assocparams.sasoc_local_rwnd;
5075 		assocparams.sasoc_cookie_life =
5076 					sp->assocparams.sasoc_cookie_life;
5077 		assocparams.sasoc_number_peer_destinations =
5078 					sp->assocparams.
5079 					sasoc_number_peer_destinations;
5080 	}
5081 
5082 	if (put_user(len, optlen))
5083 		return -EFAULT;
5084 
5085 	if (copy_to_user(optval, &assocparams, len))
5086 		return -EFAULT;
5087 
5088 	return 0;
5089 }
5090 
5091 /*
5092  * 7.1.16 Set/clear IPv4 mapped addresses (SCTP_I_WANT_MAPPED_V4_ADDR)
5093  *
5094  * This socket option is a boolean flag which turns on or off mapped V4
5095  * addresses.  If this option is turned on and the socket is type
5096  * PF_INET6, then IPv4 addresses will be mapped to V6 representation.
5097  * If this option is turned off, then no mapping will be done of V4
5098  * addresses and a user will receive both PF_INET6 and PF_INET type
5099  * addresses on the socket.
5100  */
5101 static int sctp_getsockopt_mappedv4(struct sock *sk, int len,
5102 				    char __user *optval, int __user *optlen)
5103 {
5104 	int val;
5105 	struct sctp_sock *sp = sctp_sk(sk);
5106 
5107 	if (len < sizeof(int))
5108 		return -EINVAL;
5109 
5110 	len = sizeof(int);
5111 	val = sp->v4mapped;
5112 	if (put_user(len, optlen))
5113 		return -EFAULT;
5114 	if (copy_to_user(optval, &val, len))
5115 		return -EFAULT;
5116 
5117 	return 0;
5118 }
5119 
5120 /*
5121  * 7.1.29.  Set or Get the default context (SCTP_CONTEXT)
5122  * (chapter and verse is quoted at sctp_setsockopt_context())
5123  */
5124 static int sctp_getsockopt_context(struct sock *sk, int len,
5125 				   char __user *optval, int __user *optlen)
5126 {
5127 	struct sctp_assoc_value params;
5128 	struct sctp_sock *sp;
5129 	struct sctp_association *asoc;
5130 
5131 	if (len < sizeof(struct sctp_assoc_value))
5132 		return -EINVAL;
5133 
5134 	len = sizeof(struct sctp_assoc_value);
5135 
5136 	if (copy_from_user(&params, optval, len))
5137 		return -EFAULT;
5138 
5139 	sp = sctp_sk(sk);
5140 
5141 	if (params.assoc_id != 0) {
5142 		asoc = sctp_id2assoc(sk, params.assoc_id);
5143 		if (!asoc)
5144 			return -EINVAL;
5145 		params.assoc_value = asoc->default_rcv_context;
5146 	} else {
5147 		params.assoc_value = sp->default_rcv_context;
5148 	}
5149 
5150 	if (put_user(len, optlen))
5151 		return -EFAULT;
5152 	if (copy_to_user(optval, &params, len))
5153 		return -EFAULT;
5154 
5155 	return 0;
5156 }
5157 
5158 /*
5159  * 8.1.16.  Get or Set the Maximum Fragmentation Size (SCTP_MAXSEG)
5160  * This option will get or set the maximum size to put in any outgoing
5161  * SCTP DATA chunk.  If a message is larger than this size it will be
5162  * fragmented by SCTP into the specified size.  Note that the underlying
5163  * SCTP implementation may fragment into smaller sized chunks when the
5164  * PMTU of the underlying association is smaller than the value set by
5165  * the user.  The default value for this option is '0' which indicates
5166  * the user is NOT limiting fragmentation and only the PMTU will effect
5167  * SCTP's choice of DATA chunk size.  Note also that values set larger
5168  * than the maximum size of an IP datagram will effectively let SCTP
5169  * control fragmentation (i.e. the same as setting this option to 0).
5170  *
5171  * The following structure is used to access and modify this parameter:
5172  *
5173  * struct sctp_assoc_value {
5174  *   sctp_assoc_t assoc_id;
5175  *   uint32_t assoc_value;
5176  * };
5177  *
5178  * assoc_id:  This parameter is ignored for one-to-one style sockets.
5179  *    For one-to-many style sockets this parameter indicates which
5180  *    association the user is performing an action upon.  Note that if
5181  *    this field's value is zero then the endpoints default value is
5182  *    changed (effecting future associations only).
5183  * assoc_value:  This parameter specifies the maximum size in bytes.
5184  */
5185 static int sctp_getsockopt_maxseg(struct sock *sk, int len,
5186 				  char __user *optval, int __user *optlen)
5187 {
5188 	struct sctp_assoc_value params;
5189 	struct sctp_association *asoc;
5190 
5191 	if (len == sizeof(int)) {
5192 		pr_warn("Use of int in maxseg socket option deprecated\n");
5193 		pr_warn("Use struct sctp_assoc_value instead\n");
5194 		params.assoc_id = 0;
5195 	} else if (len >= sizeof(struct sctp_assoc_value)) {
5196 		len = sizeof(struct sctp_assoc_value);
5197 		if (copy_from_user(&params, optval, sizeof(params)))
5198 			return -EFAULT;
5199 	} else
5200 		return -EINVAL;
5201 
5202 	asoc = sctp_id2assoc(sk, params.assoc_id);
5203 	if (!asoc && params.assoc_id && sctp_style(sk, UDP))
5204 		return -EINVAL;
5205 
5206 	if (asoc)
5207 		params.assoc_value = asoc->frag_point;
5208 	else
5209 		params.assoc_value = sctp_sk(sk)->user_frag;
5210 
5211 	if (put_user(len, optlen))
5212 		return -EFAULT;
5213 	if (len == sizeof(int)) {
5214 		if (copy_to_user(optval, &params.assoc_value, len))
5215 			return -EFAULT;
5216 	} else {
5217 		if (copy_to_user(optval, &params, len))
5218 			return -EFAULT;
5219 	}
5220 
5221 	return 0;
5222 }
5223 
5224 /*
5225  * 7.1.24.  Get or set fragmented interleave (SCTP_FRAGMENT_INTERLEAVE)
5226  * (chapter and verse is quoted at sctp_setsockopt_fragment_interleave())
5227  */
5228 static int sctp_getsockopt_fragment_interleave(struct sock *sk, int len,
5229 					       char __user *optval, int __user *optlen)
5230 {
5231 	int val;
5232 
5233 	if (len < sizeof(int))
5234 		return -EINVAL;
5235 
5236 	len = sizeof(int);
5237 
5238 	val = sctp_sk(sk)->frag_interleave;
5239 	if (put_user(len, optlen))
5240 		return -EFAULT;
5241 	if (copy_to_user(optval, &val, len))
5242 		return -EFAULT;
5243 
5244 	return 0;
5245 }
5246 
5247 /*
5248  * 7.1.25.  Set or Get the sctp partial delivery point
5249  * (chapter and verse is quoted at sctp_setsockopt_partial_delivery_point())
5250  */
5251 static int sctp_getsockopt_partial_delivery_point(struct sock *sk, int len,
5252 						  char __user *optval,
5253 						  int __user *optlen)
5254 {
5255 	u32 val;
5256 
5257 	if (len < sizeof(u32))
5258 		return -EINVAL;
5259 
5260 	len = sizeof(u32);
5261 
5262 	val = sctp_sk(sk)->pd_point;
5263 	if (put_user(len, optlen))
5264 		return -EFAULT;
5265 	if (copy_to_user(optval, &val, len))
5266 		return -EFAULT;
5267 
5268 	return 0;
5269 }
5270 
5271 /*
5272  * 7.1.28.  Set or Get the maximum burst (SCTP_MAX_BURST)
5273  * (chapter and verse is quoted at sctp_setsockopt_maxburst())
5274  */
5275 static int sctp_getsockopt_maxburst(struct sock *sk, int len,
5276 				    char __user *optval,
5277 				    int __user *optlen)
5278 {
5279 	struct sctp_assoc_value params;
5280 	struct sctp_sock *sp;
5281 	struct sctp_association *asoc;
5282 
5283 	if (len == sizeof(int)) {
5284 		pr_warn("Use of int in max_burst socket option deprecated\n");
5285 		pr_warn("Use struct sctp_assoc_value instead\n");
5286 		params.assoc_id = 0;
5287 	} else if (len >= sizeof(struct sctp_assoc_value)) {
5288 		len = sizeof(struct sctp_assoc_value);
5289 		if (copy_from_user(&params, optval, len))
5290 			return -EFAULT;
5291 	} else
5292 		return -EINVAL;
5293 
5294 	sp = sctp_sk(sk);
5295 
5296 	if (params.assoc_id != 0) {
5297 		asoc = sctp_id2assoc(sk, params.assoc_id);
5298 		if (!asoc)
5299 			return -EINVAL;
5300 		params.assoc_value = asoc->max_burst;
5301 	} else
5302 		params.assoc_value = sp->max_burst;
5303 
5304 	if (len == sizeof(int)) {
5305 		if (copy_to_user(optval, &params.assoc_value, len))
5306 			return -EFAULT;
5307 	} else {
5308 		if (copy_to_user(optval, &params, len))
5309 			return -EFAULT;
5310 	}
5311 
5312 	return 0;
5313 
5314 }
5315 
5316 static int sctp_getsockopt_hmac_ident(struct sock *sk, int len,
5317 				    char __user *optval, int __user *optlen)
5318 {
5319 	struct net *net = sock_net(sk);
5320 	struct sctp_hmacalgo  __user *p = (void __user *)optval;
5321 	struct sctp_hmac_algo_param *hmacs;
5322 	__u16 data_len = 0;
5323 	u32 num_idents;
5324 
5325 	if (!net->sctp.auth_enable)
5326 		return -EACCES;
5327 
5328 	hmacs = sctp_sk(sk)->ep->auth_hmacs_list;
5329 	data_len = ntohs(hmacs->param_hdr.length) - sizeof(sctp_paramhdr_t);
5330 
5331 	if (len < sizeof(struct sctp_hmacalgo) + data_len)
5332 		return -EINVAL;
5333 
5334 	len = sizeof(struct sctp_hmacalgo) + data_len;
5335 	num_idents = data_len / sizeof(u16);
5336 
5337 	if (put_user(len, optlen))
5338 		return -EFAULT;
5339 	if (put_user(num_idents, &p->shmac_num_idents))
5340 		return -EFAULT;
5341 	if (copy_to_user(p->shmac_idents, hmacs->hmac_ids, data_len))
5342 		return -EFAULT;
5343 	return 0;
5344 }
5345 
5346 static int sctp_getsockopt_active_key(struct sock *sk, int len,
5347 				    char __user *optval, int __user *optlen)
5348 {
5349 	struct net *net = sock_net(sk);
5350 	struct sctp_authkeyid val;
5351 	struct sctp_association *asoc;
5352 
5353 	if (!net->sctp.auth_enable)
5354 		return -EACCES;
5355 
5356 	if (len < sizeof(struct sctp_authkeyid))
5357 		return -EINVAL;
5358 	if (copy_from_user(&val, optval, sizeof(struct sctp_authkeyid)))
5359 		return -EFAULT;
5360 
5361 	asoc = sctp_id2assoc(sk, val.scact_assoc_id);
5362 	if (!asoc && val.scact_assoc_id && sctp_style(sk, UDP))
5363 		return -EINVAL;
5364 
5365 	if (asoc)
5366 		val.scact_keynumber = asoc->active_key_id;
5367 	else
5368 		val.scact_keynumber = sctp_sk(sk)->ep->active_key_id;
5369 
5370 	len = sizeof(struct sctp_authkeyid);
5371 	if (put_user(len, optlen))
5372 		return -EFAULT;
5373 	if (copy_to_user(optval, &val, len))
5374 		return -EFAULT;
5375 
5376 	return 0;
5377 }
5378 
5379 static int sctp_getsockopt_peer_auth_chunks(struct sock *sk, int len,
5380 				    char __user *optval, int __user *optlen)
5381 {
5382 	struct net *net = sock_net(sk);
5383 	struct sctp_authchunks __user *p = (void __user *)optval;
5384 	struct sctp_authchunks val;
5385 	struct sctp_association *asoc;
5386 	struct sctp_chunks_param *ch;
5387 	u32    num_chunks = 0;
5388 	char __user *to;
5389 
5390 	if (!net->sctp.auth_enable)
5391 		return -EACCES;
5392 
5393 	if (len < sizeof(struct sctp_authchunks))
5394 		return -EINVAL;
5395 
5396 	if (copy_from_user(&val, optval, sizeof(struct sctp_authchunks)))
5397 		return -EFAULT;
5398 
5399 	to = p->gauth_chunks;
5400 	asoc = sctp_id2assoc(sk, val.gauth_assoc_id);
5401 	if (!asoc)
5402 		return -EINVAL;
5403 
5404 	ch = asoc->peer.peer_chunks;
5405 	if (!ch)
5406 		goto num;
5407 
5408 	/* See if the user provided enough room for all the data */
5409 	num_chunks = ntohs(ch->param_hdr.length) - sizeof(sctp_paramhdr_t);
5410 	if (len < num_chunks)
5411 		return -EINVAL;
5412 
5413 	if (copy_to_user(to, ch->chunks, num_chunks))
5414 		return -EFAULT;
5415 num:
5416 	len = sizeof(struct sctp_authchunks) + num_chunks;
5417 	if (put_user(len, optlen)) return -EFAULT;
5418 	if (put_user(num_chunks, &p->gauth_number_of_chunks))
5419 		return -EFAULT;
5420 	return 0;
5421 }
5422 
5423 static int sctp_getsockopt_local_auth_chunks(struct sock *sk, int len,
5424 				    char __user *optval, int __user *optlen)
5425 {
5426 	struct net *net = sock_net(sk);
5427 	struct sctp_authchunks __user *p = (void __user *)optval;
5428 	struct sctp_authchunks val;
5429 	struct sctp_association *asoc;
5430 	struct sctp_chunks_param *ch;
5431 	u32    num_chunks = 0;
5432 	char __user *to;
5433 
5434 	if (!net->sctp.auth_enable)
5435 		return -EACCES;
5436 
5437 	if (len < sizeof(struct sctp_authchunks))
5438 		return -EINVAL;
5439 
5440 	if (copy_from_user(&val, optval, sizeof(struct sctp_authchunks)))
5441 		return -EFAULT;
5442 
5443 	to = p->gauth_chunks;
5444 	asoc = sctp_id2assoc(sk, val.gauth_assoc_id);
5445 	if (!asoc && val.gauth_assoc_id && sctp_style(sk, UDP))
5446 		return -EINVAL;
5447 
5448 	if (asoc)
5449 		ch = (struct sctp_chunks_param*)asoc->c.auth_chunks;
5450 	else
5451 		ch = sctp_sk(sk)->ep->auth_chunk_list;
5452 
5453 	if (!ch)
5454 		goto num;
5455 
5456 	num_chunks = ntohs(ch->param_hdr.length) - sizeof(sctp_paramhdr_t);
5457 	if (len < sizeof(struct sctp_authchunks) + num_chunks)
5458 		return -EINVAL;
5459 
5460 	if (copy_to_user(to, ch->chunks, num_chunks))
5461 		return -EFAULT;
5462 num:
5463 	len = sizeof(struct sctp_authchunks) + num_chunks;
5464 	if (put_user(len, optlen))
5465 		return -EFAULT;
5466 	if (put_user(num_chunks, &p->gauth_number_of_chunks))
5467 		return -EFAULT;
5468 
5469 	return 0;
5470 }
5471 
5472 /*
5473  * 8.2.5.  Get the Current Number of Associations (SCTP_GET_ASSOC_NUMBER)
5474  * This option gets the current number of associations that are attached
5475  * to a one-to-many style socket.  The option value is an uint32_t.
5476  */
5477 static int sctp_getsockopt_assoc_number(struct sock *sk, int len,
5478 				    char __user *optval, int __user *optlen)
5479 {
5480 	struct sctp_sock *sp = sctp_sk(sk);
5481 	struct sctp_association *asoc;
5482 	u32 val = 0;
5483 
5484 	if (sctp_style(sk, TCP))
5485 		return -EOPNOTSUPP;
5486 
5487 	if (len < sizeof(u32))
5488 		return -EINVAL;
5489 
5490 	len = sizeof(u32);
5491 
5492 	list_for_each_entry(asoc, &(sp->ep->asocs), asocs) {
5493 		val++;
5494 	}
5495 
5496 	if (put_user(len, optlen))
5497 		return -EFAULT;
5498 	if (copy_to_user(optval, &val, len))
5499 		return -EFAULT;
5500 
5501 	return 0;
5502 }
5503 
5504 /*
5505  * 8.1.23 SCTP_AUTO_ASCONF
5506  * See the corresponding setsockopt entry as description
5507  */
5508 static int sctp_getsockopt_auto_asconf(struct sock *sk, int len,
5509 				   char __user *optval, int __user *optlen)
5510 {
5511 	int val = 0;
5512 
5513 	if (len < sizeof(int))
5514 		return -EINVAL;
5515 
5516 	len = sizeof(int);
5517 	if (sctp_sk(sk)->do_auto_asconf && sctp_is_ep_boundall(sk))
5518 		val = 1;
5519 	if (put_user(len, optlen))
5520 		return -EFAULT;
5521 	if (copy_to_user(optval, &val, len))
5522 		return -EFAULT;
5523 	return 0;
5524 }
5525 
5526 /*
5527  * 8.2.6. Get the Current Identifiers of Associations
5528  *        (SCTP_GET_ASSOC_ID_LIST)
5529  *
5530  * This option gets the current list of SCTP association identifiers of
5531  * the SCTP associations handled by a one-to-many style socket.
5532  */
5533 static int sctp_getsockopt_assoc_ids(struct sock *sk, int len,
5534 				    char __user *optval, int __user *optlen)
5535 {
5536 	struct sctp_sock *sp = sctp_sk(sk);
5537 	struct sctp_association *asoc;
5538 	struct sctp_assoc_ids *ids;
5539 	u32 num = 0;
5540 
5541 	if (sctp_style(sk, TCP))
5542 		return -EOPNOTSUPP;
5543 
5544 	if (len < sizeof(struct sctp_assoc_ids))
5545 		return -EINVAL;
5546 
5547 	list_for_each_entry(asoc, &(sp->ep->asocs), asocs) {
5548 		num++;
5549 	}
5550 
5551 	if (len < sizeof(struct sctp_assoc_ids) + sizeof(sctp_assoc_t) * num)
5552 		return -EINVAL;
5553 
5554 	len = sizeof(struct sctp_assoc_ids) + sizeof(sctp_assoc_t) * num;
5555 
5556 	ids = kmalloc(len, GFP_KERNEL);
5557 	if (unlikely(!ids))
5558 		return -ENOMEM;
5559 
5560 	ids->gaids_number_of_ids = num;
5561 	num = 0;
5562 	list_for_each_entry(asoc, &(sp->ep->asocs), asocs) {
5563 		ids->gaids_assoc_id[num++] = asoc->assoc_id;
5564 	}
5565 
5566 	if (put_user(len, optlen) || copy_to_user(optval, ids, len)) {
5567 		kfree(ids);
5568 		return -EFAULT;
5569 	}
5570 
5571 	kfree(ids);
5572 	return 0;
5573 }
5574 
5575 /*
5576  * SCTP_PEER_ADDR_THLDS
5577  *
5578  * This option allows us to fetch the partially failed threshold for one or all
5579  * transports in an association.  See Section 6.1 of:
5580  * http://www.ietf.org/id/draft-nishida-tsvwg-sctp-failover-05.txt
5581  */
5582 static int sctp_getsockopt_paddr_thresholds(struct sock *sk,
5583 					    char __user *optval,
5584 					    int len,
5585 					    int __user *optlen)
5586 {
5587 	struct sctp_paddrthlds val;
5588 	struct sctp_transport *trans;
5589 	struct sctp_association *asoc;
5590 
5591 	if (len < sizeof(struct sctp_paddrthlds))
5592 		return -EINVAL;
5593 	len = sizeof(struct sctp_paddrthlds);
5594 	if (copy_from_user(&val, (struct sctp_paddrthlds __user *)optval, len))
5595 		return -EFAULT;
5596 
5597 	if (sctp_is_any(sk, (const union sctp_addr *)&val.spt_address)) {
5598 		asoc = sctp_id2assoc(sk, val.spt_assoc_id);
5599 		if (!asoc)
5600 			return -ENOENT;
5601 
5602 		val.spt_pathpfthld = asoc->pf_retrans;
5603 		val.spt_pathmaxrxt = asoc->pathmaxrxt;
5604 	} else {
5605 		trans = sctp_addr_id2transport(sk, &val.spt_address,
5606 					       val.spt_assoc_id);
5607 		if (!trans)
5608 			return -ENOENT;
5609 
5610 		val.spt_pathmaxrxt = trans->pathmaxrxt;
5611 		val.spt_pathpfthld = trans->pf_retrans;
5612 	}
5613 
5614 	if (put_user(len, optlen) || copy_to_user(optval, &val, len))
5615 		return -EFAULT;
5616 
5617 	return 0;
5618 }
5619 
5620 SCTP_STATIC int sctp_getsockopt(struct sock *sk, int level, int optname,
5621 				char __user *optval, int __user *optlen)
5622 {
5623 	int retval = 0;
5624 	int len;
5625 
5626 	SCTP_DEBUG_PRINTK("sctp_getsockopt(sk: %p... optname: %d)\n",
5627 			  sk, optname);
5628 
5629 	/* I can hardly begin to describe how wrong this is.  This is
5630 	 * so broken as to be worse than useless.  The API draft
5631 	 * REALLY is NOT helpful here...  I am not convinced that the
5632 	 * semantics of getsockopt() with a level OTHER THAN SOL_SCTP
5633 	 * are at all well-founded.
5634 	 */
5635 	if (level != SOL_SCTP) {
5636 		struct sctp_af *af = sctp_sk(sk)->pf->af;
5637 
5638 		retval = af->getsockopt(sk, level, optname, optval, optlen);
5639 		return retval;
5640 	}
5641 
5642 	if (get_user(len, optlen))
5643 		return -EFAULT;
5644 
5645 	sctp_lock_sock(sk);
5646 
5647 	switch (optname) {
5648 	case SCTP_STATUS:
5649 		retval = sctp_getsockopt_sctp_status(sk, len, optval, optlen);
5650 		break;
5651 	case SCTP_DISABLE_FRAGMENTS:
5652 		retval = sctp_getsockopt_disable_fragments(sk, len, optval,
5653 							   optlen);
5654 		break;
5655 	case SCTP_EVENTS:
5656 		retval = sctp_getsockopt_events(sk, len, optval, optlen);
5657 		break;
5658 	case SCTP_AUTOCLOSE:
5659 		retval = sctp_getsockopt_autoclose(sk, len, optval, optlen);
5660 		break;
5661 	case SCTP_SOCKOPT_PEELOFF:
5662 		retval = sctp_getsockopt_peeloff(sk, len, optval, optlen);
5663 		break;
5664 	case SCTP_PEER_ADDR_PARAMS:
5665 		retval = sctp_getsockopt_peer_addr_params(sk, len, optval,
5666 							  optlen);
5667 		break;
5668 	case SCTP_DELAYED_SACK:
5669 		retval = sctp_getsockopt_delayed_ack(sk, len, optval,
5670 							  optlen);
5671 		break;
5672 	case SCTP_INITMSG:
5673 		retval = sctp_getsockopt_initmsg(sk, len, optval, optlen);
5674 		break;
5675 	case SCTP_GET_PEER_ADDRS:
5676 		retval = sctp_getsockopt_peer_addrs(sk, len, optval,
5677 						    optlen);
5678 		break;
5679 	case SCTP_GET_LOCAL_ADDRS:
5680 		retval = sctp_getsockopt_local_addrs(sk, len, optval,
5681 						     optlen);
5682 		break;
5683 	case SCTP_SOCKOPT_CONNECTX3:
5684 		retval = sctp_getsockopt_connectx3(sk, len, optval, optlen);
5685 		break;
5686 	case SCTP_DEFAULT_SEND_PARAM:
5687 		retval = sctp_getsockopt_default_send_param(sk, len,
5688 							    optval, optlen);
5689 		break;
5690 	case SCTP_PRIMARY_ADDR:
5691 		retval = sctp_getsockopt_primary_addr(sk, len, optval, optlen);
5692 		break;
5693 	case SCTP_NODELAY:
5694 		retval = sctp_getsockopt_nodelay(sk, len, optval, optlen);
5695 		break;
5696 	case SCTP_RTOINFO:
5697 		retval = sctp_getsockopt_rtoinfo(sk, len, optval, optlen);
5698 		break;
5699 	case SCTP_ASSOCINFO:
5700 		retval = sctp_getsockopt_associnfo(sk, len, optval, optlen);
5701 		break;
5702 	case SCTP_I_WANT_MAPPED_V4_ADDR:
5703 		retval = sctp_getsockopt_mappedv4(sk, len, optval, optlen);
5704 		break;
5705 	case SCTP_MAXSEG:
5706 		retval = sctp_getsockopt_maxseg(sk, len, optval, optlen);
5707 		break;
5708 	case SCTP_GET_PEER_ADDR_INFO:
5709 		retval = sctp_getsockopt_peer_addr_info(sk, len, optval,
5710 							optlen);
5711 		break;
5712 	case SCTP_ADAPTATION_LAYER:
5713 		retval = sctp_getsockopt_adaptation_layer(sk, len, optval,
5714 							optlen);
5715 		break;
5716 	case SCTP_CONTEXT:
5717 		retval = sctp_getsockopt_context(sk, len, optval, optlen);
5718 		break;
5719 	case SCTP_FRAGMENT_INTERLEAVE:
5720 		retval = sctp_getsockopt_fragment_interleave(sk, len, optval,
5721 							     optlen);
5722 		break;
5723 	case SCTP_PARTIAL_DELIVERY_POINT:
5724 		retval = sctp_getsockopt_partial_delivery_point(sk, len, optval,
5725 								optlen);
5726 		break;
5727 	case SCTP_MAX_BURST:
5728 		retval = sctp_getsockopt_maxburst(sk, len, optval, optlen);
5729 		break;
5730 	case SCTP_AUTH_KEY:
5731 	case SCTP_AUTH_CHUNK:
5732 	case SCTP_AUTH_DELETE_KEY:
5733 		retval = -EOPNOTSUPP;
5734 		break;
5735 	case SCTP_HMAC_IDENT:
5736 		retval = sctp_getsockopt_hmac_ident(sk, len, optval, optlen);
5737 		break;
5738 	case SCTP_AUTH_ACTIVE_KEY:
5739 		retval = sctp_getsockopt_active_key(sk, len, optval, optlen);
5740 		break;
5741 	case SCTP_PEER_AUTH_CHUNKS:
5742 		retval = sctp_getsockopt_peer_auth_chunks(sk, len, optval,
5743 							optlen);
5744 		break;
5745 	case SCTP_LOCAL_AUTH_CHUNKS:
5746 		retval = sctp_getsockopt_local_auth_chunks(sk, len, optval,
5747 							optlen);
5748 		break;
5749 	case SCTP_GET_ASSOC_NUMBER:
5750 		retval = sctp_getsockopt_assoc_number(sk, len, optval, optlen);
5751 		break;
5752 	case SCTP_GET_ASSOC_ID_LIST:
5753 		retval = sctp_getsockopt_assoc_ids(sk, len, optval, optlen);
5754 		break;
5755 	case SCTP_AUTO_ASCONF:
5756 		retval = sctp_getsockopt_auto_asconf(sk, len, optval, optlen);
5757 		break;
5758 	case SCTP_PEER_ADDR_THLDS:
5759 		retval = sctp_getsockopt_paddr_thresholds(sk, optval, len, optlen);
5760 		break;
5761 	default:
5762 		retval = -ENOPROTOOPT;
5763 		break;
5764 	}
5765 
5766 	sctp_release_sock(sk);
5767 	return retval;
5768 }
5769 
5770 static void sctp_hash(struct sock *sk)
5771 {
5772 	/* STUB */
5773 }
5774 
5775 static void sctp_unhash(struct sock *sk)
5776 {
5777 	/* STUB */
5778 }
5779 
5780 /* Check if port is acceptable.  Possibly find first available port.
5781  *
5782  * The port hash table (contained in the 'global' SCTP protocol storage
5783  * returned by struct sctp_protocol *sctp_get_protocol()). The hash
5784  * table is an array of 4096 lists (sctp_bind_hashbucket). Each
5785  * list (the list number is the port number hashed out, so as you
5786  * would expect from a hash function, all the ports in a given list have
5787  * such a number that hashes out to the same list number; you were
5788  * expecting that, right?); so each list has a set of ports, with a
5789  * link to the socket (struct sock) that uses it, the port number and
5790  * a fastreuse flag (FIXME: NPI ipg).
5791  */
5792 static struct sctp_bind_bucket *sctp_bucket_create(
5793 	struct sctp_bind_hashbucket *head, struct net *, unsigned short snum);
5794 
5795 static long sctp_get_port_local(struct sock *sk, union sctp_addr *addr)
5796 {
5797 	struct sctp_bind_hashbucket *head; /* hash list */
5798 	struct sctp_bind_bucket *pp; /* hash list port iterator */
5799 	struct hlist_node *node;
5800 	unsigned short snum;
5801 	int ret;
5802 
5803 	snum = ntohs(addr->v4.sin_port);
5804 
5805 	SCTP_DEBUG_PRINTK("sctp_get_port() begins, snum=%d\n", snum);
5806 	sctp_local_bh_disable();
5807 
5808 	if (snum == 0) {
5809 		/* Search for an available port. */
5810 		int low, high, remaining, index;
5811 		unsigned int rover;
5812 
5813 		inet_get_local_port_range(&low, &high);
5814 		remaining = (high - low) + 1;
5815 		rover = net_random() % remaining + low;
5816 
5817 		do {
5818 			rover++;
5819 			if ((rover < low) || (rover > high))
5820 				rover = low;
5821 			if (inet_is_reserved_local_port(rover))
5822 				continue;
5823 			index = sctp_phashfn(sock_net(sk), rover);
5824 			head = &sctp_port_hashtable[index];
5825 			sctp_spin_lock(&head->lock);
5826 			sctp_for_each_hentry(pp, node, &head->chain)
5827 				if ((pp->port == rover) &&
5828 				    net_eq(sock_net(sk), pp->net))
5829 					goto next;
5830 			break;
5831 		next:
5832 			sctp_spin_unlock(&head->lock);
5833 		} while (--remaining > 0);
5834 
5835 		/* Exhausted local port range during search? */
5836 		ret = 1;
5837 		if (remaining <= 0)
5838 			goto fail;
5839 
5840 		/* OK, here is the one we will use.  HEAD (the port
5841 		 * hash table list entry) is non-NULL and we hold it's
5842 		 * mutex.
5843 		 */
5844 		snum = rover;
5845 	} else {
5846 		/* We are given an specific port number; we verify
5847 		 * that it is not being used. If it is used, we will
5848 		 * exahust the search in the hash list corresponding
5849 		 * to the port number (snum) - we detect that with the
5850 		 * port iterator, pp being NULL.
5851 		 */
5852 		head = &sctp_port_hashtable[sctp_phashfn(sock_net(sk), snum)];
5853 		sctp_spin_lock(&head->lock);
5854 		sctp_for_each_hentry(pp, node, &head->chain) {
5855 			if ((pp->port == snum) && net_eq(pp->net, sock_net(sk)))
5856 				goto pp_found;
5857 		}
5858 	}
5859 	pp = NULL;
5860 	goto pp_not_found;
5861 pp_found:
5862 	if (!hlist_empty(&pp->owner)) {
5863 		/* We had a port hash table hit - there is an
5864 		 * available port (pp != NULL) and it is being
5865 		 * used by other socket (pp->owner not empty); that other
5866 		 * socket is going to be sk2.
5867 		 */
5868 		int reuse = sk->sk_reuse;
5869 		struct sock *sk2;
5870 
5871 		SCTP_DEBUG_PRINTK("sctp_get_port() found a possible match\n");
5872 		if (pp->fastreuse && sk->sk_reuse &&
5873 			sk->sk_state != SCTP_SS_LISTENING)
5874 			goto success;
5875 
5876 		/* Run through the list of sockets bound to the port
5877 		 * (pp->port) [via the pointers bind_next and
5878 		 * bind_pprev in the struct sock *sk2 (pp->sk)]. On each one,
5879 		 * we get the endpoint they describe and run through
5880 		 * the endpoint's list of IP (v4 or v6) addresses,
5881 		 * comparing each of the addresses with the address of
5882 		 * the socket sk. If we find a match, then that means
5883 		 * that this port/socket (sk) combination are already
5884 		 * in an endpoint.
5885 		 */
5886 		sk_for_each_bound(sk2, node, &pp->owner) {
5887 			struct sctp_endpoint *ep2;
5888 			ep2 = sctp_sk(sk2)->ep;
5889 
5890 			if (sk == sk2 ||
5891 			    (reuse && sk2->sk_reuse &&
5892 			     sk2->sk_state != SCTP_SS_LISTENING))
5893 				continue;
5894 
5895 			if (sctp_bind_addr_conflict(&ep2->base.bind_addr, addr,
5896 						 sctp_sk(sk2), sctp_sk(sk))) {
5897 				ret = (long)sk2;
5898 				goto fail_unlock;
5899 			}
5900 		}
5901 		SCTP_DEBUG_PRINTK("sctp_get_port(): Found a match\n");
5902 	}
5903 pp_not_found:
5904 	/* If there was a hash table miss, create a new port.  */
5905 	ret = 1;
5906 	if (!pp && !(pp = sctp_bucket_create(head, sock_net(sk), snum)))
5907 		goto fail_unlock;
5908 
5909 	/* In either case (hit or miss), make sure fastreuse is 1 only
5910 	 * if sk->sk_reuse is too (that is, if the caller requested
5911 	 * SO_REUSEADDR on this socket -sk-).
5912 	 */
5913 	if (hlist_empty(&pp->owner)) {
5914 		if (sk->sk_reuse && sk->sk_state != SCTP_SS_LISTENING)
5915 			pp->fastreuse = 1;
5916 		else
5917 			pp->fastreuse = 0;
5918 	} else if (pp->fastreuse &&
5919 		(!sk->sk_reuse || sk->sk_state == SCTP_SS_LISTENING))
5920 		pp->fastreuse = 0;
5921 
5922 	/* We are set, so fill up all the data in the hash table
5923 	 * entry, tie the socket list information with the rest of the
5924 	 * sockets FIXME: Blurry, NPI (ipg).
5925 	 */
5926 success:
5927 	if (!sctp_sk(sk)->bind_hash) {
5928 		inet_sk(sk)->inet_num = snum;
5929 		sk_add_bind_node(sk, &pp->owner);
5930 		sctp_sk(sk)->bind_hash = pp;
5931 	}
5932 	ret = 0;
5933 
5934 fail_unlock:
5935 	sctp_spin_unlock(&head->lock);
5936 
5937 fail:
5938 	sctp_local_bh_enable();
5939 	return ret;
5940 }
5941 
5942 /* Assign a 'snum' port to the socket.  If snum == 0, an ephemeral
5943  * port is requested.
5944  */
5945 static int sctp_get_port(struct sock *sk, unsigned short snum)
5946 {
5947 	long ret;
5948 	union sctp_addr addr;
5949 	struct sctp_af *af = sctp_sk(sk)->pf->af;
5950 
5951 	/* Set up a dummy address struct from the sk. */
5952 	af->from_sk(&addr, sk);
5953 	addr.v4.sin_port = htons(snum);
5954 
5955 	/* Note: sk->sk_num gets filled in if ephemeral port request. */
5956 	ret = sctp_get_port_local(sk, &addr);
5957 
5958 	return ret ? 1 : 0;
5959 }
5960 
5961 /*
5962  *  Move a socket to LISTENING state.
5963  */
5964 SCTP_STATIC int sctp_listen_start(struct sock *sk, int backlog)
5965 {
5966 	struct sctp_sock *sp = sctp_sk(sk);
5967 	struct sctp_endpoint *ep = sp->ep;
5968 	struct crypto_hash *tfm = NULL;
5969 
5970 	/* Allocate HMAC for generating cookie. */
5971 	if (!sctp_sk(sk)->hmac && sctp_hmac_alg) {
5972 		tfm = crypto_alloc_hash(sctp_hmac_alg, 0, CRYPTO_ALG_ASYNC);
5973 		if (IS_ERR(tfm)) {
5974 			net_info_ratelimited("failed to load transform for %s: %ld\n",
5975 					     sctp_hmac_alg, PTR_ERR(tfm));
5976 			return -ENOSYS;
5977 		}
5978 		sctp_sk(sk)->hmac = tfm;
5979 	}
5980 
5981 	/*
5982 	 * If a bind() or sctp_bindx() is not called prior to a listen()
5983 	 * call that allows new associations to be accepted, the system
5984 	 * picks an ephemeral port and will choose an address set equivalent
5985 	 * to binding with a wildcard address.
5986 	 *
5987 	 * This is not currently spelled out in the SCTP sockets
5988 	 * extensions draft, but follows the practice as seen in TCP
5989 	 * sockets.
5990 	 *
5991 	 */
5992 	sk->sk_state = SCTP_SS_LISTENING;
5993 	if (!ep->base.bind_addr.port) {
5994 		if (sctp_autobind(sk))
5995 			return -EAGAIN;
5996 	} else {
5997 		if (sctp_get_port(sk, inet_sk(sk)->inet_num)) {
5998 			sk->sk_state = SCTP_SS_CLOSED;
5999 			return -EADDRINUSE;
6000 		}
6001 	}
6002 
6003 	sk->sk_max_ack_backlog = backlog;
6004 	sctp_hash_endpoint(ep);
6005 	return 0;
6006 }
6007 
6008 /*
6009  * 4.1.3 / 5.1.3 listen()
6010  *
6011  *   By default, new associations are not accepted for UDP style sockets.
6012  *   An application uses listen() to mark a socket as being able to
6013  *   accept new associations.
6014  *
6015  *   On TCP style sockets, applications use listen() to ready the SCTP
6016  *   endpoint for accepting inbound associations.
6017  *
6018  *   On both types of endpoints a backlog of '0' disables listening.
6019  *
6020  *  Move a socket to LISTENING state.
6021  */
6022 int sctp_inet_listen(struct socket *sock, int backlog)
6023 {
6024 	struct sock *sk = sock->sk;
6025 	struct sctp_endpoint *ep = sctp_sk(sk)->ep;
6026 	int err = -EINVAL;
6027 
6028 	if (unlikely(backlog < 0))
6029 		return err;
6030 
6031 	sctp_lock_sock(sk);
6032 
6033 	/* Peeled-off sockets are not allowed to listen().  */
6034 	if (sctp_style(sk, UDP_HIGH_BANDWIDTH))
6035 		goto out;
6036 
6037 	if (sock->state != SS_UNCONNECTED)
6038 		goto out;
6039 
6040 	/* If backlog is zero, disable listening. */
6041 	if (!backlog) {
6042 		if (sctp_sstate(sk, CLOSED))
6043 			goto out;
6044 
6045 		err = 0;
6046 		sctp_unhash_endpoint(ep);
6047 		sk->sk_state = SCTP_SS_CLOSED;
6048 		if (sk->sk_reuse)
6049 			sctp_sk(sk)->bind_hash->fastreuse = 1;
6050 		goto out;
6051 	}
6052 
6053 	/* If we are already listening, just update the backlog */
6054 	if (sctp_sstate(sk, LISTENING))
6055 		sk->sk_max_ack_backlog = backlog;
6056 	else {
6057 		err = sctp_listen_start(sk, backlog);
6058 		if (err)
6059 			goto out;
6060 	}
6061 
6062 	err = 0;
6063 out:
6064 	sctp_release_sock(sk);
6065 	return err;
6066 }
6067 
6068 /*
6069  * This function is done by modeling the current datagram_poll() and the
6070  * tcp_poll().  Note that, based on these implementations, we don't
6071  * lock the socket in this function, even though it seems that,
6072  * ideally, locking or some other mechanisms can be used to ensure
6073  * the integrity of the counters (sndbuf and wmem_alloc) used
6074  * in this place.  We assume that we don't need locks either until proven
6075  * otherwise.
6076  *
6077  * Another thing to note is that we include the Async I/O support
6078  * here, again, by modeling the current TCP/UDP code.  We don't have
6079  * a good way to test with it yet.
6080  */
6081 unsigned int sctp_poll(struct file *file, struct socket *sock, poll_table *wait)
6082 {
6083 	struct sock *sk = sock->sk;
6084 	struct sctp_sock *sp = sctp_sk(sk);
6085 	unsigned int mask;
6086 
6087 	poll_wait(file, sk_sleep(sk), wait);
6088 
6089 	/* A TCP-style listening socket becomes readable when the accept queue
6090 	 * is not empty.
6091 	 */
6092 	if (sctp_style(sk, TCP) && sctp_sstate(sk, LISTENING))
6093 		return (!list_empty(&sp->ep->asocs)) ?
6094 			(POLLIN | POLLRDNORM) : 0;
6095 
6096 	mask = 0;
6097 
6098 	/* Is there any exceptional events?  */
6099 	if (sk->sk_err || !skb_queue_empty(&sk->sk_error_queue))
6100 		mask |= POLLERR;
6101 	if (sk->sk_shutdown & RCV_SHUTDOWN)
6102 		mask |= POLLRDHUP | POLLIN | POLLRDNORM;
6103 	if (sk->sk_shutdown == SHUTDOWN_MASK)
6104 		mask |= POLLHUP;
6105 
6106 	/* Is it readable?  Reconsider this code with TCP-style support.  */
6107 	if (!skb_queue_empty(&sk->sk_receive_queue))
6108 		mask |= POLLIN | POLLRDNORM;
6109 
6110 	/* The association is either gone or not ready.  */
6111 	if (!sctp_style(sk, UDP) && sctp_sstate(sk, CLOSED))
6112 		return mask;
6113 
6114 	/* Is it writable?  */
6115 	if (sctp_writeable(sk)) {
6116 		mask |= POLLOUT | POLLWRNORM;
6117 	} else {
6118 		set_bit(SOCK_ASYNC_NOSPACE, &sk->sk_socket->flags);
6119 		/*
6120 		 * Since the socket is not locked, the buffer
6121 		 * might be made available after the writeable check and
6122 		 * before the bit is set.  This could cause a lost I/O
6123 		 * signal.  tcp_poll() has a race breaker for this race
6124 		 * condition.  Based on their implementation, we put
6125 		 * in the following code to cover it as well.
6126 		 */
6127 		if (sctp_writeable(sk))
6128 			mask |= POLLOUT | POLLWRNORM;
6129 	}
6130 	return mask;
6131 }
6132 
6133 /********************************************************************
6134  * 2nd Level Abstractions
6135  ********************************************************************/
6136 
6137 static struct sctp_bind_bucket *sctp_bucket_create(
6138 	struct sctp_bind_hashbucket *head, struct net *net, unsigned short snum)
6139 {
6140 	struct sctp_bind_bucket *pp;
6141 
6142 	pp = kmem_cache_alloc(sctp_bucket_cachep, GFP_ATOMIC);
6143 	if (pp) {
6144 		SCTP_DBG_OBJCNT_INC(bind_bucket);
6145 		pp->port = snum;
6146 		pp->fastreuse = 0;
6147 		INIT_HLIST_HEAD(&pp->owner);
6148 		pp->net = net;
6149 		hlist_add_head(&pp->node, &head->chain);
6150 	}
6151 	return pp;
6152 }
6153 
6154 /* Caller must hold hashbucket lock for this tb with local BH disabled */
6155 static void sctp_bucket_destroy(struct sctp_bind_bucket *pp)
6156 {
6157 	if (pp && hlist_empty(&pp->owner)) {
6158 		__hlist_del(&pp->node);
6159 		kmem_cache_free(sctp_bucket_cachep, pp);
6160 		SCTP_DBG_OBJCNT_DEC(bind_bucket);
6161 	}
6162 }
6163 
6164 /* Release this socket's reference to a local port.  */
6165 static inline void __sctp_put_port(struct sock *sk)
6166 {
6167 	struct sctp_bind_hashbucket *head =
6168 		&sctp_port_hashtable[sctp_phashfn(sock_net(sk),
6169 						  inet_sk(sk)->inet_num)];
6170 	struct sctp_bind_bucket *pp;
6171 
6172 	sctp_spin_lock(&head->lock);
6173 	pp = sctp_sk(sk)->bind_hash;
6174 	__sk_del_bind_node(sk);
6175 	sctp_sk(sk)->bind_hash = NULL;
6176 	inet_sk(sk)->inet_num = 0;
6177 	sctp_bucket_destroy(pp);
6178 	sctp_spin_unlock(&head->lock);
6179 }
6180 
6181 void sctp_put_port(struct sock *sk)
6182 {
6183 	sctp_local_bh_disable();
6184 	__sctp_put_port(sk);
6185 	sctp_local_bh_enable();
6186 }
6187 
6188 /*
6189  * The system picks an ephemeral port and choose an address set equivalent
6190  * to binding with a wildcard address.
6191  * One of those addresses will be the primary address for the association.
6192  * This automatically enables the multihoming capability of SCTP.
6193  */
6194 static int sctp_autobind(struct sock *sk)
6195 {
6196 	union sctp_addr autoaddr;
6197 	struct sctp_af *af;
6198 	__be16 port;
6199 
6200 	/* Initialize a local sockaddr structure to INADDR_ANY. */
6201 	af = sctp_sk(sk)->pf->af;
6202 
6203 	port = htons(inet_sk(sk)->inet_num);
6204 	af->inaddr_any(&autoaddr, port);
6205 
6206 	return sctp_do_bind(sk, &autoaddr, af->sockaddr_len);
6207 }
6208 
6209 /* Parse out IPPROTO_SCTP CMSG headers.  Perform only minimal validation.
6210  *
6211  * From RFC 2292
6212  * 4.2 The cmsghdr Structure *
6213  *
6214  * When ancillary data is sent or received, any number of ancillary data
6215  * objects can be specified by the msg_control and msg_controllen members of
6216  * the msghdr structure, because each object is preceded by
6217  * a cmsghdr structure defining the object's length (the cmsg_len member).
6218  * Historically Berkeley-derived implementations have passed only one object
6219  * at a time, but this API allows multiple objects to be
6220  * passed in a single call to sendmsg() or recvmsg(). The following example
6221  * shows two ancillary data objects in a control buffer.
6222  *
6223  *   |<--------------------------- msg_controllen -------------------------->|
6224  *   |                                                                       |
6225  *
6226  *   |<----- ancillary data object ----->|<----- ancillary data object ----->|
6227  *
6228  *   |<---------- CMSG_SPACE() --------->|<---------- CMSG_SPACE() --------->|
6229  *   |                                   |                                   |
6230  *
6231  *   |<---------- cmsg_len ---------->|  |<--------- cmsg_len ----------->|  |
6232  *
6233  *   |<--------- CMSG_LEN() --------->|  |<-------- CMSG_LEN() ---------->|  |
6234  *   |                                |  |                                |  |
6235  *
6236  *   +-----+-----+-----+--+-----------+--+-----+-----+-----+--+-----------+--+
6237  *   |cmsg_|cmsg_|cmsg_|XX|           |XX|cmsg_|cmsg_|cmsg_|XX|           |XX|
6238  *
6239  *   |len  |level|type |XX|cmsg_data[]|XX|len  |level|type |XX|cmsg_data[]|XX|
6240  *
6241  *   +-----+-----+-----+--+-----------+--+-----+-----+-----+--+-----------+--+
6242  *    ^
6243  *    |
6244  *
6245  * msg_control
6246  * points here
6247  */
6248 SCTP_STATIC int sctp_msghdr_parse(const struct msghdr *msg,
6249 				  sctp_cmsgs_t *cmsgs)
6250 {
6251 	struct cmsghdr *cmsg;
6252 	struct msghdr *my_msg = (struct msghdr *)msg;
6253 
6254 	for (cmsg = CMSG_FIRSTHDR(msg);
6255 	     cmsg != NULL;
6256 	     cmsg = CMSG_NXTHDR(my_msg, cmsg)) {
6257 		if (!CMSG_OK(my_msg, cmsg))
6258 			return -EINVAL;
6259 
6260 		/* Should we parse this header or ignore?  */
6261 		if (cmsg->cmsg_level != IPPROTO_SCTP)
6262 			continue;
6263 
6264 		/* Strictly check lengths following example in SCM code.  */
6265 		switch (cmsg->cmsg_type) {
6266 		case SCTP_INIT:
6267 			/* SCTP Socket API Extension
6268 			 * 5.2.1 SCTP Initiation Structure (SCTP_INIT)
6269 			 *
6270 			 * This cmsghdr structure provides information for
6271 			 * initializing new SCTP associations with sendmsg().
6272 			 * The SCTP_INITMSG socket option uses this same data
6273 			 * structure.  This structure is not used for
6274 			 * recvmsg().
6275 			 *
6276 			 * cmsg_level    cmsg_type      cmsg_data[]
6277 			 * ------------  ------------   ----------------------
6278 			 * IPPROTO_SCTP  SCTP_INIT      struct sctp_initmsg
6279 			 */
6280 			if (cmsg->cmsg_len !=
6281 			    CMSG_LEN(sizeof(struct sctp_initmsg)))
6282 				return -EINVAL;
6283 			cmsgs->init = (struct sctp_initmsg *)CMSG_DATA(cmsg);
6284 			break;
6285 
6286 		case SCTP_SNDRCV:
6287 			/* SCTP Socket API Extension
6288 			 * 5.2.2 SCTP Header Information Structure(SCTP_SNDRCV)
6289 			 *
6290 			 * This cmsghdr structure specifies SCTP options for
6291 			 * sendmsg() and describes SCTP header information
6292 			 * about a received message through recvmsg().
6293 			 *
6294 			 * cmsg_level    cmsg_type      cmsg_data[]
6295 			 * ------------  ------------   ----------------------
6296 			 * IPPROTO_SCTP  SCTP_SNDRCV    struct sctp_sndrcvinfo
6297 			 */
6298 			if (cmsg->cmsg_len !=
6299 			    CMSG_LEN(sizeof(struct sctp_sndrcvinfo)))
6300 				return -EINVAL;
6301 
6302 			cmsgs->info =
6303 				(struct sctp_sndrcvinfo *)CMSG_DATA(cmsg);
6304 
6305 			/* Minimally, validate the sinfo_flags. */
6306 			if (cmsgs->info->sinfo_flags &
6307 			    ~(SCTP_UNORDERED | SCTP_ADDR_OVER |
6308 			      SCTP_ABORT | SCTP_EOF))
6309 				return -EINVAL;
6310 			break;
6311 
6312 		default:
6313 			return -EINVAL;
6314 		}
6315 	}
6316 	return 0;
6317 }
6318 
6319 /*
6320  * Wait for a packet..
6321  * Note: This function is the same function as in core/datagram.c
6322  * with a few modifications to make lksctp work.
6323  */
6324 static int sctp_wait_for_packet(struct sock * sk, int *err, long *timeo_p)
6325 {
6326 	int error;
6327 	DEFINE_WAIT(wait);
6328 
6329 	prepare_to_wait_exclusive(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
6330 
6331 	/* Socket errors? */
6332 	error = sock_error(sk);
6333 	if (error)
6334 		goto out;
6335 
6336 	if (!skb_queue_empty(&sk->sk_receive_queue))
6337 		goto ready;
6338 
6339 	/* Socket shut down?  */
6340 	if (sk->sk_shutdown & RCV_SHUTDOWN)
6341 		goto out;
6342 
6343 	/* Sequenced packets can come disconnected.  If so we report the
6344 	 * problem.
6345 	 */
6346 	error = -ENOTCONN;
6347 
6348 	/* Is there a good reason to think that we may receive some data?  */
6349 	if (list_empty(&sctp_sk(sk)->ep->asocs) && !sctp_sstate(sk, LISTENING))
6350 		goto out;
6351 
6352 	/* Handle signals.  */
6353 	if (signal_pending(current))
6354 		goto interrupted;
6355 
6356 	/* Let another process have a go.  Since we are going to sleep
6357 	 * anyway.  Note: This may cause odd behaviors if the message
6358 	 * does not fit in the user's buffer, but this seems to be the
6359 	 * only way to honor MSG_DONTWAIT realistically.
6360 	 */
6361 	sctp_release_sock(sk);
6362 	*timeo_p = schedule_timeout(*timeo_p);
6363 	sctp_lock_sock(sk);
6364 
6365 ready:
6366 	finish_wait(sk_sleep(sk), &wait);
6367 	return 0;
6368 
6369 interrupted:
6370 	error = sock_intr_errno(*timeo_p);
6371 
6372 out:
6373 	finish_wait(sk_sleep(sk), &wait);
6374 	*err = error;
6375 	return error;
6376 }
6377 
6378 /* Receive a datagram.
6379  * Note: This is pretty much the same routine as in core/datagram.c
6380  * with a few changes to make lksctp work.
6381  */
6382 static struct sk_buff *sctp_skb_recv_datagram(struct sock *sk, int flags,
6383 					      int noblock, int *err)
6384 {
6385 	int error;
6386 	struct sk_buff *skb;
6387 	long timeo;
6388 
6389 	timeo = sock_rcvtimeo(sk, noblock);
6390 
6391 	SCTP_DEBUG_PRINTK("Timeout: timeo: %ld, MAX: %ld.\n",
6392 			  timeo, MAX_SCHEDULE_TIMEOUT);
6393 
6394 	do {
6395 		/* Again only user level code calls this function,
6396 		 * so nothing interrupt level
6397 		 * will suddenly eat the receive_queue.
6398 		 *
6399 		 *  Look at current nfs client by the way...
6400 		 *  However, this function was correct in any case. 8)
6401 		 */
6402 		if (flags & MSG_PEEK) {
6403 			spin_lock_bh(&sk->sk_receive_queue.lock);
6404 			skb = skb_peek(&sk->sk_receive_queue);
6405 			if (skb)
6406 				atomic_inc(&skb->users);
6407 			spin_unlock_bh(&sk->sk_receive_queue.lock);
6408 		} else {
6409 			skb = skb_dequeue(&sk->sk_receive_queue);
6410 		}
6411 
6412 		if (skb)
6413 			return skb;
6414 
6415 		/* Caller is allowed not to check sk->sk_err before calling. */
6416 		error = sock_error(sk);
6417 		if (error)
6418 			goto no_packet;
6419 
6420 		if (sk->sk_shutdown & RCV_SHUTDOWN)
6421 			break;
6422 
6423 		/* User doesn't want to wait.  */
6424 		error = -EAGAIN;
6425 		if (!timeo)
6426 			goto no_packet;
6427 	} while (sctp_wait_for_packet(sk, err, &timeo) == 0);
6428 
6429 	return NULL;
6430 
6431 no_packet:
6432 	*err = error;
6433 	return NULL;
6434 }
6435 
6436 /* If sndbuf has changed, wake up per association sndbuf waiters.  */
6437 static void __sctp_write_space(struct sctp_association *asoc)
6438 {
6439 	struct sock *sk = asoc->base.sk;
6440 	struct socket *sock = sk->sk_socket;
6441 
6442 	if ((sctp_wspace(asoc) > 0) && sock) {
6443 		if (waitqueue_active(&asoc->wait))
6444 			wake_up_interruptible(&asoc->wait);
6445 
6446 		if (sctp_writeable(sk)) {
6447 			wait_queue_head_t *wq = sk_sleep(sk);
6448 
6449 			if (wq && waitqueue_active(wq))
6450 				wake_up_interruptible(wq);
6451 
6452 			/* Note that we try to include the Async I/O support
6453 			 * here by modeling from the current TCP/UDP code.
6454 			 * We have not tested with it yet.
6455 			 */
6456 			if (!(sk->sk_shutdown & SEND_SHUTDOWN))
6457 				sock_wake_async(sock,
6458 						SOCK_WAKE_SPACE, POLL_OUT);
6459 		}
6460 	}
6461 }
6462 
6463 /* Do accounting for the sndbuf space.
6464  * Decrement the used sndbuf space of the corresponding association by the
6465  * data size which was just transmitted(freed).
6466  */
6467 static void sctp_wfree(struct sk_buff *skb)
6468 {
6469 	struct sctp_association *asoc;
6470 	struct sctp_chunk *chunk;
6471 	struct sock *sk;
6472 
6473 	/* Get the saved chunk pointer.  */
6474 	chunk = *((struct sctp_chunk **)(skb->cb));
6475 	asoc = chunk->asoc;
6476 	sk = asoc->base.sk;
6477 	asoc->sndbuf_used -= SCTP_DATA_SNDSIZE(chunk) +
6478 				sizeof(struct sk_buff) +
6479 				sizeof(struct sctp_chunk);
6480 
6481 	atomic_sub(sizeof(struct sctp_chunk), &sk->sk_wmem_alloc);
6482 
6483 	/*
6484 	 * This undoes what is done via sctp_set_owner_w and sk_mem_charge
6485 	 */
6486 	sk->sk_wmem_queued   -= skb->truesize;
6487 	sk_mem_uncharge(sk, skb->truesize);
6488 
6489 	sock_wfree(skb);
6490 	__sctp_write_space(asoc);
6491 
6492 	sctp_association_put(asoc);
6493 }
6494 
6495 /* Do accounting for the receive space on the socket.
6496  * Accounting for the association is done in ulpevent.c
6497  * We set this as a destructor for the cloned data skbs so that
6498  * accounting is done at the correct time.
6499  */
6500 void sctp_sock_rfree(struct sk_buff *skb)
6501 {
6502 	struct sock *sk = skb->sk;
6503 	struct sctp_ulpevent *event = sctp_skb2event(skb);
6504 
6505 	atomic_sub(event->rmem_len, &sk->sk_rmem_alloc);
6506 
6507 	/*
6508 	 * Mimic the behavior of sock_rfree
6509 	 */
6510 	sk_mem_uncharge(sk, event->rmem_len);
6511 }
6512 
6513 
6514 /* Helper function to wait for space in the sndbuf.  */
6515 static int sctp_wait_for_sndbuf(struct sctp_association *asoc, long *timeo_p,
6516 				size_t msg_len)
6517 {
6518 	struct sock *sk = asoc->base.sk;
6519 	int err = 0;
6520 	long current_timeo = *timeo_p;
6521 	DEFINE_WAIT(wait);
6522 
6523 	SCTP_DEBUG_PRINTK("wait_for_sndbuf: asoc=%p, timeo=%ld, msg_len=%zu\n",
6524 			  asoc, (long)(*timeo_p), msg_len);
6525 
6526 	/* Increment the association's refcnt.  */
6527 	sctp_association_hold(asoc);
6528 
6529 	/* Wait on the association specific sndbuf space. */
6530 	for (;;) {
6531 		prepare_to_wait_exclusive(&asoc->wait, &wait,
6532 					  TASK_INTERRUPTIBLE);
6533 		if (!*timeo_p)
6534 			goto do_nonblock;
6535 		if (sk->sk_err || asoc->state >= SCTP_STATE_SHUTDOWN_PENDING ||
6536 		    asoc->base.dead)
6537 			goto do_error;
6538 		if (signal_pending(current))
6539 			goto do_interrupted;
6540 		if (msg_len <= sctp_wspace(asoc))
6541 			break;
6542 
6543 		/* Let another process have a go.  Since we are going
6544 		 * to sleep anyway.
6545 		 */
6546 		sctp_release_sock(sk);
6547 		current_timeo = schedule_timeout(current_timeo);
6548 		BUG_ON(sk != asoc->base.sk);
6549 		sctp_lock_sock(sk);
6550 
6551 		*timeo_p = current_timeo;
6552 	}
6553 
6554 out:
6555 	finish_wait(&asoc->wait, &wait);
6556 
6557 	/* Release the association's refcnt.  */
6558 	sctp_association_put(asoc);
6559 
6560 	return err;
6561 
6562 do_error:
6563 	err = -EPIPE;
6564 	goto out;
6565 
6566 do_interrupted:
6567 	err = sock_intr_errno(*timeo_p);
6568 	goto out;
6569 
6570 do_nonblock:
6571 	err = -EAGAIN;
6572 	goto out;
6573 }
6574 
6575 void sctp_data_ready(struct sock *sk, int len)
6576 {
6577 	struct socket_wq *wq;
6578 
6579 	rcu_read_lock();
6580 	wq = rcu_dereference(sk->sk_wq);
6581 	if (wq_has_sleeper(wq))
6582 		wake_up_interruptible_sync_poll(&wq->wait, POLLIN |
6583 						POLLRDNORM | POLLRDBAND);
6584 	sk_wake_async(sk, SOCK_WAKE_WAITD, POLL_IN);
6585 	rcu_read_unlock();
6586 }
6587 
6588 /* If socket sndbuf has changed, wake up all per association waiters.  */
6589 void sctp_write_space(struct sock *sk)
6590 {
6591 	struct sctp_association *asoc;
6592 
6593 	/* Wake up the tasks in each wait queue.  */
6594 	list_for_each_entry(asoc, &((sctp_sk(sk))->ep->asocs), asocs) {
6595 		__sctp_write_space(asoc);
6596 	}
6597 }
6598 
6599 /* Is there any sndbuf space available on the socket?
6600  *
6601  * Note that sk_wmem_alloc is the sum of the send buffers on all of the
6602  * associations on the same socket.  For a UDP-style socket with
6603  * multiple associations, it is possible for it to be "unwriteable"
6604  * prematurely.  I assume that this is acceptable because
6605  * a premature "unwriteable" is better than an accidental "writeable" which
6606  * would cause an unwanted block under certain circumstances.  For the 1-1
6607  * UDP-style sockets or TCP-style sockets, this code should work.
6608  *  - Daisy
6609  */
6610 static int sctp_writeable(struct sock *sk)
6611 {
6612 	int amt = 0;
6613 
6614 	amt = sk->sk_sndbuf - sk_wmem_alloc_get(sk);
6615 	if (amt < 0)
6616 		amt = 0;
6617 	return amt;
6618 }
6619 
6620 /* Wait for an association to go into ESTABLISHED state. If timeout is 0,
6621  * returns immediately with EINPROGRESS.
6622  */
6623 static int sctp_wait_for_connect(struct sctp_association *asoc, long *timeo_p)
6624 {
6625 	struct sock *sk = asoc->base.sk;
6626 	int err = 0;
6627 	long current_timeo = *timeo_p;
6628 	DEFINE_WAIT(wait);
6629 
6630 	SCTP_DEBUG_PRINTK("%s: asoc=%p, timeo=%ld\n", __func__, asoc,
6631 			  (long)(*timeo_p));
6632 
6633 	/* Increment the association's refcnt.  */
6634 	sctp_association_hold(asoc);
6635 
6636 	for (;;) {
6637 		prepare_to_wait_exclusive(&asoc->wait, &wait,
6638 					  TASK_INTERRUPTIBLE);
6639 		if (!*timeo_p)
6640 			goto do_nonblock;
6641 		if (sk->sk_shutdown & RCV_SHUTDOWN)
6642 			break;
6643 		if (sk->sk_err || asoc->state >= SCTP_STATE_SHUTDOWN_PENDING ||
6644 		    asoc->base.dead)
6645 			goto do_error;
6646 		if (signal_pending(current))
6647 			goto do_interrupted;
6648 
6649 		if (sctp_state(asoc, ESTABLISHED))
6650 			break;
6651 
6652 		/* Let another process have a go.  Since we are going
6653 		 * to sleep anyway.
6654 		 */
6655 		sctp_release_sock(sk);
6656 		current_timeo = schedule_timeout(current_timeo);
6657 		sctp_lock_sock(sk);
6658 
6659 		*timeo_p = current_timeo;
6660 	}
6661 
6662 out:
6663 	finish_wait(&asoc->wait, &wait);
6664 
6665 	/* Release the association's refcnt.  */
6666 	sctp_association_put(asoc);
6667 
6668 	return err;
6669 
6670 do_error:
6671 	if (asoc->init_err_counter + 1 > asoc->max_init_attempts)
6672 		err = -ETIMEDOUT;
6673 	else
6674 		err = -ECONNREFUSED;
6675 	goto out;
6676 
6677 do_interrupted:
6678 	err = sock_intr_errno(*timeo_p);
6679 	goto out;
6680 
6681 do_nonblock:
6682 	err = -EINPROGRESS;
6683 	goto out;
6684 }
6685 
6686 static int sctp_wait_for_accept(struct sock *sk, long timeo)
6687 {
6688 	struct sctp_endpoint *ep;
6689 	int err = 0;
6690 	DEFINE_WAIT(wait);
6691 
6692 	ep = sctp_sk(sk)->ep;
6693 
6694 
6695 	for (;;) {
6696 		prepare_to_wait_exclusive(sk_sleep(sk), &wait,
6697 					  TASK_INTERRUPTIBLE);
6698 
6699 		if (list_empty(&ep->asocs)) {
6700 			sctp_release_sock(sk);
6701 			timeo = schedule_timeout(timeo);
6702 			sctp_lock_sock(sk);
6703 		}
6704 
6705 		err = -EINVAL;
6706 		if (!sctp_sstate(sk, LISTENING))
6707 			break;
6708 
6709 		err = 0;
6710 		if (!list_empty(&ep->asocs))
6711 			break;
6712 
6713 		err = sock_intr_errno(timeo);
6714 		if (signal_pending(current))
6715 			break;
6716 
6717 		err = -EAGAIN;
6718 		if (!timeo)
6719 			break;
6720 	}
6721 
6722 	finish_wait(sk_sleep(sk), &wait);
6723 
6724 	return err;
6725 }
6726 
6727 static void sctp_wait_for_close(struct sock *sk, long timeout)
6728 {
6729 	DEFINE_WAIT(wait);
6730 
6731 	do {
6732 		prepare_to_wait(sk_sleep(sk), &wait, TASK_INTERRUPTIBLE);
6733 		if (list_empty(&sctp_sk(sk)->ep->asocs))
6734 			break;
6735 		sctp_release_sock(sk);
6736 		timeout = schedule_timeout(timeout);
6737 		sctp_lock_sock(sk);
6738 	} while (!signal_pending(current) && timeout);
6739 
6740 	finish_wait(sk_sleep(sk), &wait);
6741 }
6742 
6743 static void sctp_skb_set_owner_r_frag(struct sk_buff *skb, struct sock *sk)
6744 {
6745 	struct sk_buff *frag;
6746 
6747 	if (!skb->data_len)
6748 		goto done;
6749 
6750 	/* Don't forget the fragments. */
6751 	skb_walk_frags(skb, frag)
6752 		sctp_skb_set_owner_r_frag(frag, sk);
6753 
6754 done:
6755 	sctp_skb_set_owner_r(skb, sk);
6756 }
6757 
6758 void sctp_copy_sock(struct sock *newsk, struct sock *sk,
6759 		    struct sctp_association *asoc)
6760 {
6761 	struct inet_sock *inet = inet_sk(sk);
6762 	struct inet_sock *newinet;
6763 
6764 	newsk->sk_type = sk->sk_type;
6765 	newsk->sk_bound_dev_if = sk->sk_bound_dev_if;
6766 	newsk->sk_flags = sk->sk_flags;
6767 	newsk->sk_no_check = sk->sk_no_check;
6768 	newsk->sk_reuse = sk->sk_reuse;
6769 
6770 	newsk->sk_shutdown = sk->sk_shutdown;
6771 	newsk->sk_destruct = inet_sock_destruct;
6772 	newsk->sk_family = sk->sk_family;
6773 	newsk->sk_protocol = IPPROTO_SCTP;
6774 	newsk->sk_backlog_rcv = sk->sk_prot->backlog_rcv;
6775 	newsk->sk_sndbuf = sk->sk_sndbuf;
6776 	newsk->sk_rcvbuf = sk->sk_rcvbuf;
6777 	newsk->sk_lingertime = sk->sk_lingertime;
6778 	newsk->sk_rcvtimeo = sk->sk_rcvtimeo;
6779 	newsk->sk_sndtimeo = sk->sk_sndtimeo;
6780 
6781 	newinet = inet_sk(newsk);
6782 
6783 	/* Initialize sk's sport, dport, rcv_saddr and daddr for
6784 	 * getsockname() and getpeername()
6785 	 */
6786 	newinet->inet_sport = inet->inet_sport;
6787 	newinet->inet_saddr = inet->inet_saddr;
6788 	newinet->inet_rcv_saddr = inet->inet_rcv_saddr;
6789 	newinet->inet_dport = htons(asoc->peer.port);
6790 	newinet->pmtudisc = inet->pmtudisc;
6791 	newinet->inet_id = asoc->next_tsn ^ jiffies;
6792 
6793 	newinet->uc_ttl = inet->uc_ttl;
6794 	newinet->mc_loop = 1;
6795 	newinet->mc_ttl = 1;
6796 	newinet->mc_index = 0;
6797 	newinet->mc_list = NULL;
6798 }
6799 
6800 /* Populate the fields of the newsk from the oldsk and migrate the assoc
6801  * and its messages to the newsk.
6802  */
6803 static void sctp_sock_migrate(struct sock *oldsk, struct sock *newsk,
6804 			      struct sctp_association *assoc,
6805 			      sctp_socket_type_t type)
6806 {
6807 	struct sctp_sock *oldsp = sctp_sk(oldsk);
6808 	struct sctp_sock *newsp = sctp_sk(newsk);
6809 	struct sctp_bind_bucket *pp; /* hash list port iterator */
6810 	struct sctp_endpoint *newep = newsp->ep;
6811 	struct sk_buff *skb, *tmp;
6812 	struct sctp_ulpevent *event;
6813 	struct sctp_bind_hashbucket *head;
6814 	struct list_head tmplist;
6815 
6816 	/* Migrate socket buffer sizes and all the socket level options to the
6817 	 * new socket.
6818 	 */
6819 	newsk->sk_sndbuf = oldsk->sk_sndbuf;
6820 	newsk->sk_rcvbuf = oldsk->sk_rcvbuf;
6821 	/* Brute force copy old sctp opt. */
6822 	if (oldsp->do_auto_asconf) {
6823 		memcpy(&tmplist, &newsp->auto_asconf_list, sizeof(tmplist));
6824 		inet_sk_copy_descendant(newsk, oldsk);
6825 		memcpy(&newsp->auto_asconf_list, &tmplist, sizeof(tmplist));
6826 	} else
6827 		inet_sk_copy_descendant(newsk, oldsk);
6828 
6829 	/* Restore the ep value that was overwritten with the above structure
6830 	 * copy.
6831 	 */
6832 	newsp->ep = newep;
6833 	newsp->hmac = NULL;
6834 
6835 	/* Hook this new socket in to the bind_hash list. */
6836 	head = &sctp_port_hashtable[sctp_phashfn(sock_net(oldsk),
6837 						 inet_sk(oldsk)->inet_num)];
6838 	sctp_local_bh_disable();
6839 	sctp_spin_lock(&head->lock);
6840 	pp = sctp_sk(oldsk)->bind_hash;
6841 	sk_add_bind_node(newsk, &pp->owner);
6842 	sctp_sk(newsk)->bind_hash = pp;
6843 	inet_sk(newsk)->inet_num = inet_sk(oldsk)->inet_num;
6844 	sctp_spin_unlock(&head->lock);
6845 	sctp_local_bh_enable();
6846 
6847 	/* Copy the bind_addr list from the original endpoint to the new
6848 	 * endpoint so that we can handle restarts properly
6849 	 */
6850 	sctp_bind_addr_dup(&newsp->ep->base.bind_addr,
6851 				&oldsp->ep->base.bind_addr, GFP_KERNEL);
6852 
6853 	/* Move any messages in the old socket's receive queue that are for the
6854 	 * peeled off association to the new socket's receive queue.
6855 	 */
6856 	sctp_skb_for_each(skb, &oldsk->sk_receive_queue, tmp) {
6857 		event = sctp_skb2event(skb);
6858 		if (event->asoc == assoc) {
6859 			__skb_unlink(skb, &oldsk->sk_receive_queue);
6860 			__skb_queue_tail(&newsk->sk_receive_queue, skb);
6861 			sctp_skb_set_owner_r_frag(skb, newsk);
6862 		}
6863 	}
6864 
6865 	/* Clean up any messages pending delivery due to partial
6866 	 * delivery.   Three cases:
6867 	 * 1) No partial deliver;  no work.
6868 	 * 2) Peeling off partial delivery; keep pd_lobby in new pd_lobby.
6869 	 * 3) Peeling off non-partial delivery; move pd_lobby to receive_queue.
6870 	 */
6871 	skb_queue_head_init(&newsp->pd_lobby);
6872 	atomic_set(&sctp_sk(newsk)->pd_mode, assoc->ulpq.pd_mode);
6873 
6874 	if (atomic_read(&sctp_sk(oldsk)->pd_mode)) {
6875 		struct sk_buff_head *queue;
6876 
6877 		/* Decide which queue to move pd_lobby skbs to. */
6878 		if (assoc->ulpq.pd_mode) {
6879 			queue = &newsp->pd_lobby;
6880 		} else
6881 			queue = &newsk->sk_receive_queue;
6882 
6883 		/* Walk through the pd_lobby, looking for skbs that
6884 		 * need moved to the new socket.
6885 		 */
6886 		sctp_skb_for_each(skb, &oldsp->pd_lobby, tmp) {
6887 			event = sctp_skb2event(skb);
6888 			if (event->asoc == assoc) {
6889 				__skb_unlink(skb, &oldsp->pd_lobby);
6890 				__skb_queue_tail(queue, skb);
6891 				sctp_skb_set_owner_r_frag(skb, newsk);
6892 			}
6893 		}
6894 
6895 		/* Clear up any skbs waiting for the partial
6896 		 * delivery to finish.
6897 		 */
6898 		if (assoc->ulpq.pd_mode)
6899 			sctp_clear_pd(oldsk, NULL);
6900 
6901 	}
6902 
6903 	sctp_skb_for_each(skb, &assoc->ulpq.reasm, tmp)
6904 		sctp_skb_set_owner_r_frag(skb, newsk);
6905 
6906 	sctp_skb_for_each(skb, &assoc->ulpq.lobby, tmp)
6907 		sctp_skb_set_owner_r_frag(skb, newsk);
6908 
6909 	/* Set the type of socket to indicate that it is peeled off from the
6910 	 * original UDP-style socket or created with the accept() call on a
6911 	 * TCP-style socket..
6912 	 */
6913 	newsp->type = type;
6914 
6915 	/* Mark the new socket "in-use" by the user so that any packets
6916 	 * that may arrive on the association after we've moved it are
6917 	 * queued to the backlog.  This prevents a potential race between
6918 	 * backlog processing on the old socket and new-packet processing
6919 	 * on the new socket.
6920 	 *
6921 	 * The caller has just allocated newsk so we can guarantee that other
6922 	 * paths won't try to lock it and then oldsk.
6923 	 */
6924 	lock_sock_nested(newsk, SINGLE_DEPTH_NESTING);
6925 	sctp_assoc_migrate(assoc, newsk);
6926 
6927 	/* If the association on the newsk is already closed before accept()
6928 	 * is called, set RCV_SHUTDOWN flag.
6929 	 */
6930 	if (sctp_state(assoc, CLOSED) && sctp_style(newsk, TCP))
6931 		newsk->sk_shutdown |= RCV_SHUTDOWN;
6932 
6933 	newsk->sk_state = SCTP_SS_ESTABLISHED;
6934 	sctp_release_sock(newsk);
6935 }
6936 
6937 
6938 /* This proto struct describes the ULP interface for SCTP.  */
6939 struct proto sctp_prot = {
6940 	.name        =	"SCTP",
6941 	.owner       =	THIS_MODULE,
6942 	.close       =	sctp_close,
6943 	.connect     =	sctp_connect,
6944 	.disconnect  =	sctp_disconnect,
6945 	.accept      =	sctp_accept,
6946 	.ioctl       =	sctp_ioctl,
6947 	.init        =	sctp_init_sock,
6948 	.destroy     =	sctp_destroy_sock,
6949 	.shutdown    =	sctp_shutdown,
6950 	.setsockopt  =	sctp_setsockopt,
6951 	.getsockopt  =	sctp_getsockopt,
6952 	.sendmsg     =	sctp_sendmsg,
6953 	.recvmsg     =	sctp_recvmsg,
6954 	.bind        =	sctp_bind,
6955 	.backlog_rcv =	sctp_backlog_rcv,
6956 	.hash        =	sctp_hash,
6957 	.unhash      =	sctp_unhash,
6958 	.get_port    =	sctp_get_port,
6959 	.obj_size    =  sizeof(struct sctp_sock),
6960 	.sysctl_mem  =  sysctl_sctp_mem,
6961 	.sysctl_rmem =  sysctl_sctp_rmem,
6962 	.sysctl_wmem =  sysctl_sctp_wmem,
6963 	.memory_pressure = &sctp_memory_pressure,
6964 	.enter_memory_pressure = sctp_enter_memory_pressure,
6965 	.memory_allocated = &sctp_memory_allocated,
6966 	.sockets_allocated = &sctp_sockets_allocated,
6967 };
6968 
6969 #if IS_ENABLED(CONFIG_IPV6)
6970 
6971 struct proto sctpv6_prot = {
6972 	.name		= "SCTPv6",
6973 	.owner		= THIS_MODULE,
6974 	.close		= sctp_close,
6975 	.connect	= sctp_connect,
6976 	.disconnect	= sctp_disconnect,
6977 	.accept		= sctp_accept,
6978 	.ioctl		= sctp_ioctl,
6979 	.init		= sctp_init_sock,
6980 	.destroy	= sctp_destroy_sock,
6981 	.shutdown	= sctp_shutdown,
6982 	.setsockopt	= sctp_setsockopt,
6983 	.getsockopt	= sctp_getsockopt,
6984 	.sendmsg	= sctp_sendmsg,
6985 	.recvmsg	= sctp_recvmsg,
6986 	.bind		= sctp_bind,
6987 	.backlog_rcv	= sctp_backlog_rcv,
6988 	.hash		= sctp_hash,
6989 	.unhash		= sctp_unhash,
6990 	.get_port	= sctp_get_port,
6991 	.obj_size	= sizeof(struct sctp6_sock),
6992 	.sysctl_mem	= sysctl_sctp_mem,
6993 	.sysctl_rmem	= sysctl_sctp_rmem,
6994 	.sysctl_wmem	= sysctl_sctp_wmem,
6995 	.memory_pressure = &sctp_memory_pressure,
6996 	.enter_memory_pressure = sctp_enter_memory_pressure,
6997 	.memory_allocated = &sctp_memory_allocated,
6998 	.sockets_allocated = &sctp_sockets_allocated,
6999 };
7000 #endif /* IS_ENABLED(CONFIG_IPV6) */
7001