xref: /linux/net/sctp/output.c (revision db6d8d5fdf9537641c76ba7f32e02b4bcc600972)
1 /* SCTP kernel implementation
2  * (C) Copyright IBM Corp. 2001, 2004
3  * Copyright (c) 1999-2000 Cisco, Inc.
4  * Copyright (c) 1999-2001 Motorola, Inc.
5  *
6  * This file is part of the SCTP kernel implementation
7  *
8  * These functions handle output processing.
9  *
10  * This SCTP implementation is free software;
11  * you can redistribute it and/or modify it under the terms of
12  * the GNU General Public License as published by
13  * the Free Software Foundation; either version 2, or (at your option)
14  * any later version.
15  *
16  * This SCTP implementation is distributed in the hope that it
17  * will be useful, but WITHOUT ANY WARRANTY; without even the implied
18  *                 ************************
19  * warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
20  * See the GNU General Public License for more details.
21  *
22  * You should have received a copy of the GNU General Public License
23  * along with GNU CC; see the file COPYING.  If not, see
24  * <http://www.gnu.org/licenses/>.
25  *
26  * Please send any bug reports or fixes you make to the
27  * email address(es):
28  *    lksctp developers <linux-sctp@vger.kernel.org>
29  *
30  * Written or modified by:
31  *    La Monte H.P. Yarroll <piggy@acm.org>
32  *    Karl Knutson          <karl@athena.chicago.il.us>
33  *    Jon Grimm             <jgrimm@austin.ibm.com>
34  *    Sridhar Samudrala     <sri@us.ibm.com>
35  */
36 
37 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
38 
39 #include <linux/types.h>
40 #include <linux/kernel.h>
41 #include <linux/wait.h>
42 #include <linux/time.h>
43 #include <linux/ip.h>
44 #include <linux/ipv6.h>
45 #include <linux/init.h>
46 #include <linux/slab.h>
47 #include <net/inet_ecn.h>
48 #include <net/ip.h>
49 #include <net/icmp.h>
50 #include <net/net_namespace.h>
51 
52 #include <linux/socket.h> /* for sa_family_t */
53 #include <net/sock.h>
54 
55 #include <net/sctp/sctp.h>
56 #include <net/sctp/sm.h>
57 #include <net/sctp/checksum.h>
58 
/* Forward declarations for private helpers.
 *
 * These static functions are defined further down in this file but are
 * called by code that appears before their definitions (the bundling
 * helpers and sctp_packet_append_chunk()), hence the prototypes here.
 */
static sctp_xmit_t __sctp_packet_append_chunk(struct sctp_packet *packet,
					      struct sctp_chunk *chunk);
static sctp_xmit_t sctp_packet_can_append_data(struct sctp_packet *packet,
					   struct sctp_chunk *chunk);
static void sctp_packet_append_data(struct sctp_packet *packet,
					   struct sctp_chunk *chunk);
static sctp_xmit_t sctp_packet_will_fit(struct sctp_packet *packet,
					struct sctp_chunk *chunk,
					u16 chunk_len);
69 
70 static void sctp_packet_reset(struct sctp_packet *packet)
71 {
72 	packet->size = packet->overhead;
73 	packet->has_cookie_echo = 0;
74 	packet->has_sack = 0;
75 	packet->has_data = 0;
76 	packet->has_auth = 0;
77 	packet->ipfragok = 0;
78 	packet->auth = NULL;
79 }
80 
81 /* Config a packet.
82  * This appears to be a followup set of initializations.
83  */
84 struct sctp_packet *sctp_packet_config(struct sctp_packet *packet,
85 				       __u32 vtag, int ecn_capable)
86 {
87 	struct sctp_transport *tp = packet->transport;
88 	struct sctp_association *asoc = tp->asoc;
89 
90 	pr_debug("%s: packet:%p vtag:0x%x\n", __func__, packet, vtag);
91 
92 	packet->vtag = vtag;
93 
94 	if (asoc && tp->dst) {
95 		struct sock *sk = asoc->base.sk;
96 
97 		rcu_read_lock();
98 		if (__sk_dst_get(sk) != tp->dst) {
99 			dst_hold(tp->dst);
100 			sk_setup_caps(sk, tp->dst);
101 		}
102 
103 		if (sk_can_gso(sk)) {
104 			struct net_device *dev = tp->dst->dev;
105 
106 			packet->max_size = dev->gso_max_size;
107 		} else {
108 			packet->max_size = asoc->pathmtu;
109 		}
110 		rcu_read_unlock();
111 
112 	} else {
113 		packet->max_size = tp->pathmtu;
114 	}
115 
116 	if (ecn_capable && sctp_packet_empty(packet)) {
117 		struct sctp_chunk *chunk;
118 
119 		/* If there a is a prepend chunk stick it on the list before
120 		 * any other chunks get appended.
121 		 */
122 		chunk = sctp_get_ecne_prepend(asoc);
123 		if (chunk)
124 			sctp_packet_append_chunk(packet, chunk);
125 	}
126 
127 	return packet;
128 }
129 
130 /* Initialize the packet structure. */
131 struct sctp_packet *sctp_packet_init(struct sctp_packet *packet,
132 				     struct sctp_transport *transport,
133 				     __u16 sport, __u16 dport)
134 {
135 	struct sctp_association *asoc = transport->asoc;
136 	size_t overhead;
137 
138 	pr_debug("%s: packet:%p transport:%p\n", __func__, packet, transport);
139 
140 	packet->transport = transport;
141 	packet->source_port = sport;
142 	packet->destination_port = dport;
143 	INIT_LIST_HEAD(&packet->chunk_list);
144 	if (asoc) {
145 		struct sctp_sock *sp = sctp_sk(asoc->base.sk);
146 		overhead = sp->pf->af->net_header_len;
147 	} else {
148 		overhead = sizeof(struct ipv6hdr);
149 	}
150 	overhead += sizeof(struct sctphdr);
151 	packet->overhead = overhead;
152 	sctp_packet_reset(packet);
153 	packet->vtag = 0;
154 
155 	return packet;
156 }
157 
158 /* Free a packet.  */
159 void sctp_packet_free(struct sctp_packet *packet)
160 {
161 	struct sctp_chunk *chunk, *tmp;
162 
163 	pr_debug("%s: packet:%p\n", __func__, packet);
164 
165 	list_for_each_entry_safe(chunk, tmp, &packet->chunk_list, list) {
166 		list_del_init(&chunk->list);
167 		sctp_chunk_free(chunk);
168 	}
169 }
170 
171 /* This routine tries to append the chunk to the offered packet. If adding
172  * the chunk causes the packet to exceed the path MTU and COOKIE_ECHO chunk
173  * is not present in the packet, it transmits the input packet.
174  * Data can be bundled with a packet containing a COOKIE_ECHO chunk as long
175  * as it can fit in the packet, but any more data that does not fit in this
176  * packet can be sent only after receiving the COOKIE_ACK.
177  */
178 sctp_xmit_t sctp_packet_transmit_chunk(struct sctp_packet *packet,
179 				       struct sctp_chunk *chunk,
180 				       int one_packet, gfp_t gfp)
181 {
182 	sctp_xmit_t retval;
183 
184 	pr_debug("%s: packet:%p size:%Zu chunk:%p size:%d\n", __func__,
185 		 packet, packet->size, chunk, chunk->skb ? chunk->skb->len : -1);
186 
187 	switch ((retval = (sctp_packet_append_chunk(packet, chunk)))) {
188 	case SCTP_XMIT_PMTU_FULL:
189 		if (!packet->has_cookie_echo) {
190 			int error = 0;
191 
192 			error = sctp_packet_transmit(packet, gfp);
193 			if (error < 0)
194 				chunk->skb->sk->sk_err = -error;
195 
196 			/* If we have an empty packet, then we can NOT ever
197 			 * return PMTU_FULL.
198 			 */
199 			if (!one_packet)
200 				retval = sctp_packet_append_chunk(packet,
201 								  chunk);
202 		}
203 		break;
204 
205 	case SCTP_XMIT_RWND_FULL:
206 	case SCTP_XMIT_OK:
207 	case SCTP_XMIT_DELAY:
208 		break;
209 	}
210 
211 	return retval;
212 }
213 
214 /* Try to bundle an auth chunk into the packet. */
215 static sctp_xmit_t sctp_packet_bundle_auth(struct sctp_packet *pkt,
216 					   struct sctp_chunk *chunk)
217 {
218 	struct sctp_association *asoc = pkt->transport->asoc;
219 	struct sctp_chunk *auth;
220 	sctp_xmit_t retval = SCTP_XMIT_OK;
221 
222 	/* if we don't have an association, we can't do authentication */
223 	if (!asoc)
224 		return retval;
225 
226 	/* See if this is an auth chunk we are bundling or if
227 	 * auth is already bundled.
228 	 */
229 	if (chunk->chunk_hdr->type == SCTP_CID_AUTH || pkt->has_auth)
230 		return retval;
231 
232 	/* if the peer did not request this chunk to be authenticated,
233 	 * don't do it
234 	 */
235 	if (!chunk->auth)
236 		return retval;
237 
238 	auth = sctp_make_auth(asoc);
239 	if (!auth)
240 		return retval;
241 
242 	retval = __sctp_packet_append_chunk(pkt, auth);
243 
244 	if (retval != SCTP_XMIT_OK)
245 		sctp_chunk_free(auth);
246 
247 	return retval;
248 }
249 
250 /* Try to bundle a SACK with the packet. */
251 static sctp_xmit_t sctp_packet_bundle_sack(struct sctp_packet *pkt,
252 					   struct sctp_chunk *chunk)
253 {
254 	sctp_xmit_t retval = SCTP_XMIT_OK;
255 
256 	/* If sending DATA and haven't aleady bundled a SACK, try to
257 	 * bundle one in to the packet.
258 	 */
259 	if (sctp_chunk_is_data(chunk) && !pkt->has_sack &&
260 	    !pkt->has_cookie_echo) {
261 		struct sctp_association *asoc;
262 		struct timer_list *timer;
263 		asoc = pkt->transport->asoc;
264 		timer = &asoc->timers[SCTP_EVENT_TIMEOUT_SACK];
265 
266 		/* If the SACK timer is running, we have a pending SACK */
267 		if (timer_pending(timer)) {
268 			struct sctp_chunk *sack;
269 
270 			if (pkt->transport->sack_generation !=
271 			    pkt->transport->asoc->peer.sack_generation)
272 				return retval;
273 
274 			asoc->a_rwnd = asoc->rwnd;
275 			sack = sctp_make_sack(asoc);
276 			if (sack) {
277 				retval = __sctp_packet_append_chunk(pkt, sack);
278 				if (retval != SCTP_XMIT_OK) {
279 					sctp_chunk_free(sack);
280 					goto out;
281 				}
282 				asoc->peer.sack_needed = 0;
283 				if (del_timer(timer))
284 					sctp_association_put(asoc);
285 			}
286 		}
287 	}
288 out:
289 	return retval;
290 }
291 
292 
293 /* Append a chunk to the offered packet reporting back any inability to do
294  * so.
295  */
296 static sctp_xmit_t __sctp_packet_append_chunk(struct sctp_packet *packet,
297 					      struct sctp_chunk *chunk)
298 {
299 	sctp_xmit_t retval = SCTP_XMIT_OK;
300 	__u16 chunk_len = SCTP_PAD4(ntohs(chunk->chunk_hdr->length));
301 
302 	/* Check to see if this chunk will fit into the packet */
303 	retval = sctp_packet_will_fit(packet, chunk, chunk_len);
304 	if (retval != SCTP_XMIT_OK)
305 		goto finish;
306 
307 	/* We believe that this chunk is OK to add to the packet */
308 	switch (chunk->chunk_hdr->type) {
309 	case SCTP_CID_DATA:
310 		/* Account for the data being in the packet */
311 		sctp_packet_append_data(packet, chunk);
312 		/* Disallow SACK bundling after DATA. */
313 		packet->has_sack = 1;
314 		/* Disallow AUTH bundling after DATA */
315 		packet->has_auth = 1;
316 		/* Let it be knows that packet has DATA in it */
317 		packet->has_data = 1;
318 		/* timestamp the chunk for rtx purposes */
319 		chunk->sent_at = jiffies;
320 		/* Mainly used for prsctp RTX policy */
321 		chunk->sent_count++;
322 		break;
323 	case SCTP_CID_COOKIE_ECHO:
324 		packet->has_cookie_echo = 1;
325 		break;
326 
327 	case SCTP_CID_SACK:
328 		packet->has_sack = 1;
329 		if (chunk->asoc)
330 			chunk->asoc->stats.osacks++;
331 		break;
332 
333 	case SCTP_CID_AUTH:
334 		packet->has_auth = 1;
335 		packet->auth = chunk;
336 		break;
337 	}
338 
339 	/* It is OK to send this chunk.  */
340 	list_add_tail(&chunk->list, &packet->chunk_list);
341 	packet->size += chunk_len;
342 	chunk->transport = packet->transport;
343 finish:
344 	return retval;
345 }
346 
347 /* Append a chunk to the offered packet reporting back any inability to do
348  * so.
349  */
350 sctp_xmit_t sctp_packet_append_chunk(struct sctp_packet *packet,
351 				     struct sctp_chunk *chunk)
352 {
353 	sctp_xmit_t retval = SCTP_XMIT_OK;
354 
355 	pr_debug("%s: packet:%p chunk:%p\n", __func__, packet, chunk);
356 
357 	/* Data chunks are special.  Before seeing what else we can
358 	 * bundle into this packet, check to see if we are allowed to
359 	 * send this DATA.
360 	 */
361 	if (sctp_chunk_is_data(chunk)) {
362 		retval = sctp_packet_can_append_data(packet, chunk);
363 		if (retval != SCTP_XMIT_OK)
364 			goto finish;
365 	}
366 
367 	/* Try to bundle AUTH chunk */
368 	retval = sctp_packet_bundle_auth(packet, chunk);
369 	if (retval != SCTP_XMIT_OK)
370 		goto finish;
371 
372 	/* Try to bundle SACK chunk */
373 	retval = sctp_packet_bundle_sack(packet, chunk);
374 	if (retval != SCTP_XMIT_OK)
375 		goto finish;
376 
377 	retval = __sctp_packet_append_chunk(packet, chunk);
378 
379 finish:
380 	return retval;
381 }
382 
383 static void sctp_packet_release_owner(struct sk_buff *skb)
384 {
385 	sk_free(skb->sk);
386 }
387 
388 static void sctp_packet_set_owner_w(struct sk_buff *skb, struct sock *sk)
389 {
390 	skb_orphan(skb);
391 	skb->sk = sk;
392 	skb->destructor = sctp_packet_release_owner;
393 
394 	/*
395 	 * The data chunks have already been accounted for in sctp_sendmsg(),
396 	 * therefore only reserve a single byte to keep socket around until
397 	 * the packet has been transmitted.
398 	 */
399 	atomic_inc(&sk->sk_wmem_alloc);
400 }
401 
402 /* All packets are sent to the network through this function from
403  * sctp_outq_tail().
404  *
405  * The return value is a normal kernel error return value.
406  */
407 int sctp_packet_transmit(struct sctp_packet *packet, gfp_t gfp)
408 {
409 	struct sctp_transport *tp = packet->transport;
410 	struct sctp_association *asoc = tp->asoc;
411 	struct sctphdr *sh;
412 	struct sk_buff *nskb = NULL, *head = NULL;
413 	struct sctp_chunk *chunk, *tmp;
414 	struct sock *sk;
415 	int err = 0;
416 	int padding;		/* How much padding do we need?  */
417 	int pkt_size;
418 	__u8 has_data = 0;
419 	int gso = 0;
420 	int pktcount = 0;
421 	struct dst_entry *dst;
422 	unsigned char *auth = NULL;	/* pointer to auth in skb data */
423 
424 	pr_debug("%s: packet:%p\n", __func__, packet);
425 
426 	/* Do NOT generate a chunkless packet. */
427 	if (list_empty(&packet->chunk_list))
428 		return err;
429 
430 	/* Set up convenience variables... */
431 	chunk = list_entry(packet->chunk_list.next, struct sctp_chunk, list);
432 	sk = chunk->skb->sk;
433 
434 	/* Allocate the head skb, or main one if not in GSO */
435 	if (packet->size > tp->pathmtu && !packet->ipfragok) {
436 		if (sk_can_gso(sk)) {
437 			gso = 1;
438 			pkt_size = packet->overhead;
439 		} else {
440 			/* If this happens, we trash this packet and try
441 			 * to build a new one, hopefully correct this
442 			 * time. Application may notice this error.
443 			 */
444 			pr_err_once("Trying to GSO but underlying device doesn't support it.");
445 			goto err;
446 		}
447 	} else {
448 		pkt_size = packet->size;
449 	}
450 	head = alloc_skb(pkt_size + MAX_HEADER, gfp);
451 	if (!head)
452 		goto err;
453 	if (gso) {
454 		NAPI_GRO_CB(head)->last = head;
455 		skb_shinfo(head)->gso_type = sk->sk_gso_type;
456 	}
457 
458 	/* Make sure the outbound skb has enough header room reserved. */
459 	skb_reserve(head, packet->overhead + MAX_HEADER);
460 
461 	/* Set the owning socket so that we know where to get the
462 	 * destination IP address.
463 	 */
464 	sctp_packet_set_owner_w(head, sk);
465 
466 	if (!sctp_transport_dst_check(tp)) {
467 		sctp_transport_route(tp, NULL, sctp_sk(sk));
468 		if (asoc && (asoc->param_flags & SPP_PMTUD_ENABLE)) {
469 			sctp_assoc_sync_pmtu(sk, asoc);
470 		}
471 	}
472 	dst = dst_clone(tp->dst);
473 	if (!dst) {
474 		if (asoc)
475 			IP_INC_STATS(sock_net(asoc->base.sk),
476 				     IPSTATS_MIB_OUTNOROUTES);
477 		goto nodst;
478 	}
479 	skb_dst_set(head, dst);
480 
481 	/* Build the SCTP header.  */
482 	sh = (struct sctphdr *)skb_push(head, sizeof(struct sctphdr));
483 	skb_reset_transport_header(head);
484 	sh->source = htons(packet->source_port);
485 	sh->dest   = htons(packet->destination_port);
486 
487 	/* From 6.8 Adler-32 Checksum Calculation:
488 	 * After the packet is constructed (containing the SCTP common
489 	 * header and one or more control or DATA chunks), the
490 	 * transmitter shall:
491 	 *
492 	 * 1) Fill in the proper Verification Tag in the SCTP common
493 	 *    header and initialize the checksum field to 0's.
494 	 */
495 	sh->vtag     = htonl(packet->vtag);
496 	sh->checksum = 0;
497 
498 	pr_debug("***sctp_transmit_packet***\n");
499 
500 	do {
501 		/* Set up convenience variables... */
502 		chunk = list_entry(packet->chunk_list.next, struct sctp_chunk, list);
503 		pktcount++;
504 
505 		/* Calculate packet size, so it fits in PMTU. Leave
506 		 * other chunks for the next packets.
507 		 */
508 		if (gso) {
509 			pkt_size = packet->overhead;
510 			list_for_each_entry(chunk, &packet->chunk_list, list) {
511 				int padded = SCTP_PAD4(chunk->skb->len);
512 
513 				if (pkt_size + padded > tp->pathmtu)
514 					break;
515 				pkt_size += padded;
516 			}
517 
518 			/* Allocate a new skb. */
519 			nskb = alloc_skb(pkt_size + MAX_HEADER, gfp);
520 			if (!nskb)
521 				goto nomem;
522 
523 			/* Make sure the outbound skb has enough header
524 			 * room reserved.
525 			 */
526 			skb_reserve(nskb, packet->overhead + MAX_HEADER);
527 		} else {
528 			nskb = head;
529 		}
530 
531 		/**
532 		 * 3.2  Chunk Field Descriptions
533 		 *
534 		 * The total length of a chunk (including Type, Length and
535 		 * Value fields) MUST be a multiple of 4 bytes.  If the length
536 		 * of the chunk is not a multiple of 4 bytes, the sender MUST
537 		 * pad the chunk with all zero bytes and this padding is not
538 		 * included in the chunk length field.  The sender should
539 		 * never pad with more than 3 bytes.
540 		 *
541 		 * [This whole comment explains SCTP_PAD4() below.]
542 		 */
543 
544 		pkt_size -= packet->overhead;
545 		list_for_each_entry_safe(chunk, tmp, &packet->chunk_list, list) {
546 			list_del_init(&chunk->list);
547 			if (sctp_chunk_is_data(chunk)) {
548 				/* 6.3.1 C4) When data is in flight and when allowed
549 				 * by rule C5, a new RTT measurement MUST be made each
550 				 * round trip.  Furthermore, new RTT measurements
551 				 * SHOULD be made no more than once per round-trip
552 				 * for a given destination transport address.
553 				 */
554 
555 				if (!chunk->resent && !tp->rto_pending) {
556 					chunk->rtt_in_progress = 1;
557 					tp->rto_pending = 1;
558 				}
559 
560 				has_data = 1;
561 			}
562 
563 			padding = SCTP_PAD4(chunk->skb->len) - chunk->skb->len;
564 			if (padding)
565 				memset(skb_put(chunk->skb, padding), 0, padding);
566 
567 			/* if this is the auth chunk that we are adding,
568 			 * store pointer where it will be added and put
569 			 * the auth into the packet.
570 			 */
571 			if (chunk == packet->auth)
572 				auth = skb_tail_pointer(nskb);
573 
574 			memcpy(skb_put(nskb, chunk->skb->len),
575 			       chunk->skb->data, chunk->skb->len);
576 
577 			pr_debug("*** Chunk:%p[%s] %s 0x%x, length:%d, chunk->skb->len:%d, rtt_in_progress:%d\n",
578 				 chunk,
579 				 sctp_cname(SCTP_ST_CHUNK(chunk->chunk_hdr->type)),
580 				 chunk->has_tsn ? "TSN" : "No TSN",
581 				 chunk->has_tsn ? ntohl(chunk->subh.data_hdr->tsn) : 0,
582 				 ntohs(chunk->chunk_hdr->length), chunk->skb->len,
583 				 chunk->rtt_in_progress);
584 
585 			/* If this is a control chunk, this is our last
586 			 * reference. Free data chunks after they've been
587 			 * acknowledged or have failed.
588 			 * Re-queue auth chunks if needed.
589 			 */
590 			pkt_size -= SCTP_PAD4(chunk->skb->len);
591 
592 			if (!sctp_chunk_is_data(chunk) && chunk != packet->auth)
593 				sctp_chunk_free(chunk);
594 
595 			if (!pkt_size)
596 				break;
597 		}
598 
599 		/* SCTP-AUTH, Section 6.2
600 		 *    The sender MUST calculate the MAC as described in RFC2104 [2]
601 		 *    using the hash function H as described by the MAC Identifier and
602 		 *    the shared association key K based on the endpoint pair shared key
603 		 *    described by the shared key identifier.  The 'data' used for the
604 		 *    computation of the AUTH-chunk is given by the AUTH chunk with its
605 		 *    HMAC field set to zero (as shown in Figure 6) followed by all
606 		 *    chunks that are placed after the AUTH chunk in the SCTP packet.
607 		 */
608 		if (auth)
609 			sctp_auth_calculate_hmac(asoc, nskb,
610 						 (struct sctp_auth_chunk *)auth,
611 						 gfp);
612 
613 		if (packet->auth) {
614 			if (!list_empty(&packet->chunk_list)) {
615 				/* We will generate more packets, so re-queue
616 				 * auth chunk.
617 				 */
618 				list_add(&packet->auth->list,
619 					 &packet->chunk_list);
620 			} else {
621 				sctp_chunk_free(packet->auth);
622 				packet->auth = NULL;
623 			}
624 		}
625 
626 		if (!gso)
627 			break;
628 
629 		if (skb_gro_receive(&head, nskb)) {
630 			kfree_skb(nskb);
631 			goto nomem;
632 		}
633 		nskb = NULL;
634 		if (WARN_ON_ONCE(skb_shinfo(head)->gso_segs >=
635 				 sk->sk_gso_max_segs))
636 			goto nomem;
637 	} while (!list_empty(&packet->chunk_list));
638 
639 	/* 2) Calculate the Adler-32 checksum of the whole packet,
640 	 *    including the SCTP common header and all the
641 	 *    chunks.
642 	 *
643 	 * Note: Adler-32 is no longer applicable, as has been replaced
644 	 * by CRC32-C as described in <draft-ietf-tsvwg-sctpcsum-02.txt>.
645 	 *
646 	 * If it's a GSO packet, it's postponed to sctp_skb_segment.
647 	 */
648 	if (!sctp_checksum_disable || gso) {
649 		if (!gso && (!(dst->dev->features & NETIF_F_SCTP_CRC) ||
650 			     dst_xfrm(dst) || packet->ipfragok)) {
651 			sh->checksum = sctp_compute_cksum(head, 0);
652 		} else {
653 			/* no need to seed pseudo checksum for SCTP */
654 			head->ip_summed = CHECKSUM_PARTIAL;
655 			head->csum_start = skb_transport_header(head) - head->head;
656 			head->csum_offset = offsetof(struct sctphdr, checksum);
657 		}
658 	}
659 
660 	/* IP layer ECN support
661 	 * From RFC 2481
662 	 *  "The ECN-Capable Transport (ECT) bit would be set by the
663 	 *   data sender to indicate that the end-points of the
664 	 *   transport protocol are ECN-capable."
665 	 *
666 	 * Now setting the ECT bit all the time, as it should not cause
667 	 * any problems protocol-wise even if our peer ignores it.
668 	 *
669 	 * Note: The works for IPv6 layer checks this bit too later
670 	 * in transmission.  See IP6_ECN_flow_xmit().
671 	 */
672 	tp->af_specific->ecn_capable(sk);
673 
674 	/* Set up the IP options.  */
675 	/* BUG: not implemented
676 	 * For v4 this all lives somewhere in sk->sk_opt...
677 	 */
678 
679 	/* Dump that on IP!  */
680 	if (asoc) {
681 		asoc->stats.opackets += pktcount;
682 		if (asoc->peer.last_sent_to != tp)
683 			/* Considering the multiple CPU scenario, this is a
684 			 * "correcter" place for last_sent_to.  --xguo
685 			 */
686 			asoc->peer.last_sent_to = tp;
687 	}
688 
689 	if (has_data) {
690 		struct timer_list *timer;
691 		unsigned long timeout;
692 
693 		/* Restart the AUTOCLOSE timer when sending data. */
694 		if (sctp_state(asoc, ESTABLISHED) &&
695 		    asoc->timeouts[SCTP_EVENT_TIMEOUT_AUTOCLOSE]) {
696 			timer = &asoc->timers[SCTP_EVENT_TIMEOUT_AUTOCLOSE];
697 			timeout = asoc->timeouts[SCTP_EVENT_TIMEOUT_AUTOCLOSE];
698 
699 			if (!mod_timer(timer, jiffies + timeout))
700 				sctp_association_hold(asoc);
701 		}
702 	}
703 
704 	pr_debug("***sctp_transmit_packet*** skb->len:%d\n", head->len);
705 
706 	if (gso) {
707 		/* Cleanup our debris for IP stacks */
708 		memset(head->cb, 0, max(sizeof(struct inet_skb_parm),
709 					sizeof(struct inet6_skb_parm)));
710 
711 		skb_shinfo(head)->gso_segs = pktcount;
712 		skb_shinfo(head)->gso_size = GSO_BY_FRAGS;
713 
714 		/* We have to refresh this in case we are xmiting to
715 		 * more than one transport at a time
716 		 */
717 		rcu_read_lock();
718 		if (__sk_dst_get(sk) != tp->dst) {
719 			dst_hold(tp->dst);
720 			sk_setup_caps(sk, tp->dst);
721 		}
722 		rcu_read_unlock();
723 	}
724 	head->ignore_df = packet->ipfragok;
725 	tp->af_specific->sctp_xmit(head, tp);
726 	goto out;
727 
728 nomem:
729 	if (packet->auth && list_empty(&packet->auth->list))
730 		sctp_chunk_free(packet->auth);
731 
732 nodst:
733 	/* FIXME: Returning the 'err' will effect all the associations
734 	 * associated with a socket, although only one of the paths of the
735 	 * association is unreachable.
736 	 * The real failure of a transport or association can be passed on
737 	 * to the user via notifications. So setting this error may not be
738 	 * required.
739 	 */
740 	 /* err = -EHOSTUNREACH; */
741 	kfree_skb(head);
742 
743 err:
744 	list_for_each_entry_safe(chunk, tmp, &packet->chunk_list, list) {
745 		list_del_init(&chunk->list);
746 		if (!sctp_chunk_is_data(chunk))
747 			sctp_chunk_free(chunk);
748 	}
749 
750 out:
751 	sctp_packet_reset(packet);
752 	return err;
753 }
754 
755 /********************************************************************
756  * 2nd Level Abstractions
757  ********************************************************************/
758 
759 /* This private function check to see if a chunk can be added */
760 static sctp_xmit_t sctp_packet_can_append_data(struct sctp_packet *packet,
761 					   struct sctp_chunk *chunk)
762 {
763 	size_t datasize, rwnd, inflight, flight_size;
764 	struct sctp_transport *transport = packet->transport;
765 	struct sctp_association *asoc = transport->asoc;
766 	struct sctp_outq *q = &asoc->outqueue;
767 
768 	/* RFC 2960 6.1  Transmission of DATA Chunks
769 	 *
770 	 * A) At any given time, the data sender MUST NOT transmit new data to
771 	 * any destination transport address if its peer's rwnd indicates
772 	 * that the peer has no buffer space (i.e. rwnd is 0, see Section
773 	 * 6.2.1).  However, regardless of the value of rwnd (including if it
774 	 * is 0), the data sender can always have one DATA chunk in flight to
775 	 * the receiver if allowed by cwnd (see rule B below).  This rule
776 	 * allows the sender to probe for a change in rwnd that the sender
777 	 * missed due to the SACK having been lost in transit from the data
778 	 * receiver to the data sender.
779 	 */
780 
781 	rwnd = asoc->peer.rwnd;
782 	inflight = q->outstanding_bytes;
783 	flight_size = transport->flight_size;
784 
785 	datasize = sctp_data_size(chunk);
786 
787 	if (datasize > rwnd && inflight > 0)
788 		/* We have (at least) one data chunk in flight,
789 		 * so we can't fall back to rule 6.1 B).
790 		 */
791 		return SCTP_XMIT_RWND_FULL;
792 
793 	/* RFC 2960 6.1  Transmission of DATA Chunks
794 	 *
795 	 * B) At any given time, the sender MUST NOT transmit new data
796 	 * to a given transport address if it has cwnd or more bytes
797 	 * of data outstanding to that transport address.
798 	 */
799 	/* RFC 7.2.4 & the Implementers Guide 2.8.
800 	 *
801 	 * 3) ...
802 	 *    When a Fast Retransmit is being performed the sender SHOULD
803 	 *    ignore the value of cwnd and SHOULD NOT delay retransmission.
804 	 */
805 	if (chunk->fast_retransmit != SCTP_NEED_FRTX &&
806 	    flight_size >= transport->cwnd)
807 		return SCTP_XMIT_RWND_FULL;
808 
809 	/* Nagle's algorithm to solve small-packet problem:
810 	 * Inhibit the sending of new chunks when new outgoing data arrives
811 	 * if any previously transmitted data on the connection remains
812 	 * unacknowledged.
813 	 */
814 
815 	if (sctp_sk(asoc->base.sk)->nodelay)
816 		/* Nagle disabled */
817 		return SCTP_XMIT_OK;
818 
819 	if (!sctp_packet_empty(packet))
820 		/* Append to packet */
821 		return SCTP_XMIT_OK;
822 
823 	if (inflight == 0)
824 		/* Nothing unacked */
825 		return SCTP_XMIT_OK;
826 
827 	if (!sctp_state(asoc, ESTABLISHED))
828 		return SCTP_XMIT_OK;
829 
830 	/* Check whether this chunk and all the rest of pending data will fit
831 	 * or delay in hopes of bundling a full sized packet.
832 	 */
833 	if (chunk->skb->len + q->out_qlen >
834 		transport->pathmtu - packet->overhead - sizeof(sctp_data_chunk_t) - 4)
835 		/* Enough data queued to fill a packet */
836 		return SCTP_XMIT_OK;
837 
838 	/* Don't delay large message writes that may have been fragmented */
839 	if (!chunk->msg->can_delay)
840 		return SCTP_XMIT_OK;
841 
842 	/* Defer until all data acked or packet full */
843 	return SCTP_XMIT_DELAY;
844 }
845 
846 /* This private function does management things when adding DATA chunk */
847 static void sctp_packet_append_data(struct sctp_packet *packet,
848 				struct sctp_chunk *chunk)
849 {
850 	struct sctp_transport *transport = packet->transport;
851 	size_t datasize = sctp_data_size(chunk);
852 	struct sctp_association *asoc = transport->asoc;
853 	u32 rwnd = asoc->peer.rwnd;
854 
855 	/* Keep track of how many bytes are in flight over this transport. */
856 	transport->flight_size += datasize;
857 
858 	/* Keep track of how many bytes are in flight to the receiver. */
859 	asoc->outqueue.outstanding_bytes += datasize;
860 
861 	/* Update our view of the receiver's rwnd. */
862 	if (datasize < rwnd)
863 		rwnd -= datasize;
864 	else
865 		rwnd = 0;
866 
867 	asoc->peer.rwnd = rwnd;
868 	/* Has been accepted for transmission. */
869 	if (!asoc->peer.prsctp_capable)
870 		chunk->msg->can_abandon = 0;
871 	sctp_chunk_assign_tsn(chunk);
872 	sctp_chunk_assign_ssn(chunk);
873 }
874 
875 static sctp_xmit_t sctp_packet_will_fit(struct sctp_packet *packet,
876 					struct sctp_chunk *chunk,
877 					u16 chunk_len)
878 {
879 	size_t psize, pmtu, maxsize;
880 	sctp_xmit_t retval = SCTP_XMIT_OK;
881 
882 	psize = packet->size;
883 	if (packet->transport->asoc)
884 		pmtu = packet->transport->asoc->pathmtu;
885 	else
886 		pmtu = packet->transport->pathmtu;
887 
888 	/* Decide if we need to fragment or resubmit later. */
889 	if (psize + chunk_len > pmtu) {
890 		/* It's OK to fragment at IP level if any one of the following
891 		 * is true:
892 		 *	1. The packet is empty (meaning this chunk is greater
893 		 *	   the MTU)
894 		 *	2. The packet doesn't have any data in it yet and data
895 		 *	   requires authentication.
896 		 */
897 		if (sctp_packet_empty(packet) ||
898 		    (!packet->has_data && chunk->auth)) {
899 			/* We no longer do re-fragmentation.
900 			 * Just fragment at the IP layer, if we
901 			 * actually hit this condition
902 			 */
903 			packet->ipfragok = 1;
904 			goto out;
905 		}
906 
907 		/* Similarly, if this chunk was built before a PMTU
908 		 * reduction, we have to fragment it at IP level now. So
909 		 * if the packet already contains something, we need to
910 		 * flush.
911 		 */
912 		maxsize = pmtu - packet->overhead;
913 		if (packet->auth)
914 			maxsize -= SCTP_PAD4(packet->auth->skb->len);
915 		if (chunk_len > maxsize)
916 			retval = SCTP_XMIT_PMTU_FULL;
917 
918 		/* It is also okay to fragment if the chunk we are
919 		 * adding is a control chunk, but only if current packet
920 		 * is not a GSO one otherwise it causes fragmentation of
921 		 * a large frame. So in this case we allow the
922 		 * fragmentation by forcing it to be in a new packet.
923 		 */
924 		if (!sctp_chunk_is_data(chunk) && packet->has_data)
925 			retval = SCTP_XMIT_PMTU_FULL;
926 
927 		if (psize + chunk_len > packet->max_size)
928 			/* Hit GSO/PMTU limit, gotta flush */
929 			retval = SCTP_XMIT_PMTU_FULL;
930 
931 		if (!packet->transport->burst_limited &&
932 		    psize + chunk_len > (packet->transport->cwnd >> 1))
933 			/* Do not allow a single GSO packet to use more
934 			 * than half of cwnd.
935 			 */
936 			retval = SCTP_XMIT_PMTU_FULL;
937 
938 		if (packet->transport->burst_limited &&
939 		    psize + chunk_len > (packet->transport->burst_limited >> 1))
940 			/* Do not allow a single GSO packet to use more
941 			 * than half of original cwnd.
942 			 */
943 			retval = SCTP_XMIT_PMTU_FULL;
944 		/* Otherwise it will fit in the GSO packet */
945 	}
946 
947 out:
948 	return retval;
949 }
950