1 /* Copyright (c) 2018, Mellanox Technologies All rights reserved. 2 * 3 * This software is available to you under a choice of one of two 4 * licenses. You may choose to be licensed under the terms of the GNU 5 * General Public License (GPL) Version 2, available from the file 6 * COPYING in the main directory of this source tree, or the 7 * OpenIB.org BSD license below: 8 * 9 * Redistribution and use in source and binary forms, with or 10 * without modification, are permitted provided that the following 11 * conditions are met: 12 * 13 * - Redistributions of source code must retain the above 14 * copyright notice, this list of conditions and the following 15 * disclaimer. 16 * 17 * - Redistributions in binary form must reproduce the above 18 * copyright notice, this list of conditions and the following 19 * disclaimer in the documentation and/or other materials 20 * provided with the distribution. 21 * 22 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 23 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 24 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 25 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS 26 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN 27 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN 28 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 29 * SOFTWARE. 30 */ 31 32 #include <crypto/aead.h> 33 #include <linux/highmem.h> 34 #include <linux/module.h> 35 #include <linux/netdevice.h> 36 #include <net/dst.h> 37 #include <net/inet_connection_sock.h> 38 #include <net/tcp.h> 39 #include <net/tls.h> 40 41 /* device_offload_lock is used to synchronize tls_dev_add 42 * against NETDEV_DOWN notifications. 43 */ 44 static DECLARE_RWSEM(device_offload_lock); 45 46 static void tls_device_gc_task(struct work_struct *work); 47 48 static DECLARE_WORK(tls_device_gc_work, tls_device_gc_task); 49 static LIST_HEAD(tls_device_gc_list); 50 static LIST_HEAD(tls_device_list); 51 static DEFINE_SPINLOCK(tls_device_lock); 52 53 static void tls_device_free_ctx(struct tls_context *ctx) 54 { 55 if (ctx->tx_conf == TLS_HW) { 56 kfree(tls_offload_ctx_tx(ctx)); 57 kfree(ctx->tx.rec_seq); 58 kfree(ctx->tx.iv); 59 } 60 61 if (ctx->rx_conf == TLS_HW) 62 kfree(tls_offload_ctx_rx(ctx)); 63 64 kfree(ctx); 65 } 66 67 static void tls_device_gc_task(struct work_struct *work) 68 { 69 struct tls_context *ctx, *tmp; 70 unsigned long flags; 71 LIST_HEAD(gc_list); 72 73 spin_lock_irqsave(&tls_device_lock, flags); 74 list_splice_init(&tls_device_gc_list, &gc_list); 75 spin_unlock_irqrestore(&tls_device_lock, flags); 76 77 list_for_each_entry_safe(ctx, tmp, &gc_list, list) { 78 struct net_device *netdev = ctx->netdev; 79 80 if (netdev && ctx->tx_conf == TLS_HW) { 81 netdev->tlsdev_ops->tls_dev_del(netdev, ctx, 82 TLS_OFFLOAD_CTX_DIR_TX); 83 dev_put(netdev); 84 ctx->netdev = NULL; 85 } 86 87 list_del(&ctx->list); 88 tls_device_free_ctx(ctx); 89 } 90 } 91 92 static void tls_device_attach(struct tls_context *ctx, struct sock *sk, 93 struct net_device *netdev) 94 { 95 if (sk->sk_destruct != tls_device_sk_destruct) { 96 refcount_set(&ctx->refcount, 1); 97 dev_hold(netdev); 98 ctx->netdev = netdev; 99 spin_lock_irq(&tls_device_lock); 100 list_add_tail(&ctx->list, &tls_device_list); 101 spin_unlock_irq(&tls_device_lock); 102 103 ctx->sk_destruct = sk->sk_destruct; 104 sk->sk_destruct = tls_device_sk_destruct; 105 } 106 } 107 108 static void tls_device_queue_ctx_destruction(struct tls_context *ctx) 109 { 110 unsigned long flags; 111 112 spin_lock_irqsave(&tls_device_lock, flags); 113 list_move_tail(&ctx->list, &tls_device_gc_list); 114 115 /* schedule_work inside the spinlock 116 * to make sure tls_device_down waits for that work. 117 */ 118 schedule_work(&tls_device_gc_work); 119 120 spin_unlock_irqrestore(&tls_device_lock, flags); 121 } 122 123 /* We assume that the socket is already connected */ 124 static struct net_device *get_netdev_for_sock(struct sock *sk) 125 { 126 struct dst_entry *dst = sk_dst_get(sk); 127 struct net_device *netdev = NULL; 128 129 if (likely(dst)) { 130 netdev = dst->dev; 131 dev_hold(netdev); 132 } 133 134 dst_release(dst); 135 136 return netdev; 137 } 138 139 static void destroy_record(struct tls_record_info *record) 140 { 141 int nr_frags = record->num_frags; 142 skb_frag_t *frag; 143 144 while (nr_frags-- > 0) { 145 frag = &record->frags[nr_frags]; 146 __skb_frag_unref(frag); 147 } 148 kfree(record); 149 } 150 151 static void delete_all_records(struct tls_offload_context_tx *offload_ctx) 152 { 153 struct tls_record_info *info, *temp; 154 155 list_for_each_entry_safe(info, temp, &offload_ctx->records_list, list) { 156 list_del(&info->list); 157 destroy_record(info); 158 } 159 160 offload_ctx->retransmit_hint = NULL; 161 } 162 163 static void tls_icsk_clean_acked(struct sock *sk, u32 acked_seq) 164 { 165 struct tls_context *tls_ctx = tls_get_ctx(sk); 166 struct tls_record_info *info, *temp; 167 struct tls_offload_context_tx *ctx; 168 u64 deleted_records = 0; 169 unsigned long flags; 170 171 if (!tls_ctx) 172 return; 173 174 ctx = tls_offload_ctx_tx(tls_ctx); 175 176 spin_lock_irqsave(&ctx->lock, flags); 177 info = ctx->retransmit_hint; 178 if (info && !before(acked_seq, info->end_seq)) { 179 ctx->retransmit_hint = NULL; 180 list_del(&info->list); 181 destroy_record(info); 182 deleted_records++; 183 } 184 185 list_for_each_entry_safe(info, temp, &ctx->records_list, list) { 186 if (before(acked_seq, info->end_seq)) 187 break; 188 list_del(&info->list); 189 190 destroy_record(info); 191 deleted_records++; 192 } 193 194 ctx->unacked_record_sn += deleted_records; 195 spin_unlock_irqrestore(&ctx->lock, flags); 196 } 197 198 /* At this point, there should be no references on this 199 * socket and no in-flight SKBs associated with this 200 * socket, so it is safe to free all the resources. 201 */ 202 void tls_device_sk_destruct(struct sock *sk) 203 { 204 struct tls_context *tls_ctx = tls_get_ctx(sk); 205 struct tls_offload_context_tx *ctx = tls_offload_ctx_tx(tls_ctx); 206 207 tls_ctx->sk_destruct(sk); 208 209 if (tls_ctx->tx_conf == TLS_HW) { 210 if (ctx->open_record) 211 destroy_record(ctx->open_record); 212 delete_all_records(ctx); 213 crypto_free_aead(ctx->aead_send); 214 clean_acked_data_disable(inet_csk(sk)); 215 } 216 217 if (refcount_dec_and_test(&tls_ctx->refcount)) 218 tls_device_queue_ctx_destruction(tls_ctx); 219 } 220 EXPORT_SYMBOL(tls_device_sk_destruct); 221 222 void tls_device_free_resources_tx(struct sock *sk) 223 { 224 struct tls_context *tls_ctx = tls_get_ctx(sk); 225 226 tls_free_partial_record(sk, tls_ctx); 227 } 228 229 static void tls_append_frag(struct tls_record_info *record, 230 struct page_frag *pfrag, 231 int size) 232 { 233 skb_frag_t *frag; 234 235 frag = &record->frags[record->num_frags - 1]; 236 if (frag->page.p == pfrag->page && 237 frag->page_offset + frag->size == pfrag->offset) { 238 frag->size += size; 239 } else { 240 ++frag; 241 frag->page.p = pfrag->page; 242 frag->page_offset = pfrag->offset; 243 frag->size = size; 244 ++record->num_frags; 245 get_page(pfrag->page); 246 } 247 248 pfrag->offset += size; 249 record->len += size; 250 } 251 252 static int tls_push_record(struct sock *sk, 253 struct tls_context *ctx, 254 struct tls_offload_context_tx *offload_ctx, 255 struct tls_record_info *record, 256 struct page_frag *pfrag, 257 int flags, 258 unsigned char record_type) 259 { 260 struct tls_prot_info *prot = &ctx->prot_info; 261 struct tcp_sock *tp = tcp_sk(sk); 262 struct page_frag dummy_tag_frag; 263 skb_frag_t *frag; 264 int i; 265 266 /* fill prepend */ 267 frag = &record->frags[0]; 268 tls_fill_prepend(ctx, 269 skb_frag_address(frag), 270 record->len - prot->prepend_size, 271 record_type, 272 ctx->crypto_send.info.version); 273 274 /* HW doesn't care about the data in the tag, because it fills it. */ 275 dummy_tag_frag.page = skb_frag_page(frag); 276 dummy_tag_frag.offset = 0; 277 278 tls_append_frag(record, &dummy_tag_frag, prot->tag_size); 279 record->end_seq = tp->write_seq + record->len; 280 spin_lock_irq(&offload_ctx->lock); 281 list_add_tail(&record->list, &offload_ctx->records_list); 282 spin_unlock_irq(&offload_ctx->lock); 283 offload_ctx->open_record = NULL; 284 tls_advance_record_sn(sk, &ctx->tx, ctx->crypto_send.info.version); 285 286 for (i = 0; i < record->num_frags; i++) { 287 frag = &record->frags[i]; 288 sg_unmark_end(&offload_ctx->sg_tx_data[i]); 289 sg_set_page(&offload_ctx->sg_tx_data[i], skb_frag_page(frag), 290 frag->size, frag->page_offset); 291 sk_mem_charge(sk, frag->size); 292 get_page(skb_frag_page(frag)); 293 } 294 sg_mark_end(&offload_ctx->sg_tx_data[record->num_frags - 1]); 295 296 /* all ready, send */ 297 return tls_push_sg(sk, ctx, offload_ctx->sg_tx_data, 0, flags); 298 } 299 300 static int tls_create_new_record(struct tls_offload_context_tx *offload_ctx, 301 struct page_frag *pfrag, 302 size_t prepend_size) 303 { 304 struct tls_record_info *record; 305 skb_frag_t *frag; 306 307 record = kmalloc(sizeof(*record), GFP_KERNEL); 308 if (!record) 309 return -ENOMEM; 310 311 frag = &record->frags[0]; 312 __skb_frag_set_page(frag, pfrag->page); 313 frag->page_offset = pfrag->offset; 314 skb_frag_size_set(frag, prepend_size); 315 316 get_page(pfrag->page); 317 pfrag->offset += prepend_size; 318 319 record->num_frags = 1; 320 record->len = prepend_size; 321 offload_ctx->open_record = record; 322 return 0; 323 } 324 325 static int tls_do_allocation(struct sock *sk, 326 struct tls_offload_context_tx *offload_ctx, 327 struct page_frag *pfrag, 328 size_t prepend_size) 329 { 330 int ret; 331 332 if (!offload_ctx->open_record) { 333 if (unlikely(!skb_page_frag_refill(prepend_size, pfrag, 334 sk->sk_allocation))) { 335 sk->sk_prot->enter_memory_pressure(sk); 336 sk_stream_moderate_sndbuf(sk); 337 return -ENOMEM; 338 } 339 340 ret = tls_create_new_record(offload_ctx, pfrag, prepend_size); 341 if (ret) 342 return ret; 343 344 if (pfrag->size > pfrag->offset) 345 return 0; 346 } 347 348 if (!sk_page_frag_refill(sk, pfrag)) 349 return -ENOMEM; 350 351 return 0; 352 } 353 354 static int tls_push_data(struct sock *sk, 355 struct iov_iter *msg_iter, 356 size_t size, int flags, 357 unsigned char record_type) 358 { 359 struct tls_context *tls_ctx = tls_get_ctx(sk); 360 struct tls_prot_info *prot = &tls_ctx->prot_info; 361 struct tls_offload_context_tx *ctx = tls_offload_ctx_tx(tls_ctx); 362 int tls_push_record_flags = flags | MSG_SENDPAGE_NOTLAST; 363 int more = flags & (MSG_SENDPAGE_NOTLAST | MSG_MORE); 364 struct tls_record_info *record = ctx->open_record; 365 struct page_frag *pfrag; 366 size_t orig_size = size; 367 u32 max_open_record_len; 368 int copy, rc = 0; 369 bool done = false; 370 long timeo; 371 372 if (flags & 373 ~(MSG_MORE | MSG_DONTWAIT | MSG_NOSIGNAL | MSG_SENDPAGE_NOTLAST)) 374 return -ENOTSUPP; 375 376 if (sk->sk_err) 377 return -sk->sk_err; 378 379 timeo = sock_sndtimeo(sk, flags & MSG_DONTWAIT); 380 if (tls_is_partially_sent_record(tls_ctx)) { 381 rc = tls_push_partial_record(sk, tls_ctx, flags); 382 if (rc < 0) 383 return rc; 384 } 385 386 pfrag = sk_page_frag(sk); 387 388 /* TLS_HEADER_SIZE is not counted as part of the TLS record, and 389 * we need to leave room for an authentication tag. 390 */ 391 max_open_record_len = TLS_MAX_PAYLOAD_SIZE + 392 prot->prepend_size; 393 do { 394 rc = tls_do_allocation(sk, ctx, pfrag, 395 prot->prepend_size); 396 if (rc) { 397 rc = sk_stream_wait_memory(sk, &timeo); 398 if (!rc) 399 continue; 400 401 record = ctx->open_record; 402 if (!record) 403 break; 404 handle_error: 405 if (record_type != TLS_RECORD_TYPE_DATA) { 406 /* avoid sending partial 407 * record with type != 408 * application_data 409 */ 410 size = orig_size; 411 destroy_record(record); 412 ctx->open_record = NULL; 413 } else if (record->len > prot->prepend_size) { 414 goto last_record; 415 } 416 417 break; 418 } 419 420 record = ctx->open_record; 421 copy = min_t(size_t, size, (pfrag->size - pfrag->offset)); 422 copy = min_t(size_t, copy, (max_open_record_len - record->len)); 423 424 if (copy_from_iter_nocache(page_address(pfrag->page) + 425 pfrag->offset, 426 copy, msg_iter) != copy) { 427 rc = -EFAULT; 428 goto handle_error; 429 } 430 tls_append_frag(record, pfrag, copy); 431 432 size -= copy; 433 if (!size) { 434 last_record: 435 tls_push_record_flags = flags; 436 if (more) { 437 tls_ctx->pending_open_record_frags = 438 !!record->num_frags; 439 break; 440 } 441 442 done = true; 443 } 444 445 if (done || record->len >= max_open_record_len || 446 (record->num_frags >= MAX_SKB_FRAGS - 1)) { 447 rc = tls_push_record(sk, 448 tls_ctx, 449 ctx, 450 record, 451 pfrag, 452 tls_push_record_flags, 453 record_type); 454 if (rc < 0) 455 break; 456 } 457 } while (!done); 458 459 if (orig_size - size > 0) 460 rc = orig_size - size; 461 462 return rc; 463 } 464 465 int tls_device_sendmsg(struct sock *sk, struct msghdr *msg, size_t size) 466 { 467 unsigned char record_type = TLS_RECORD_TYPE_DATA; 468 int rc; 469 470 lock_sock(sk); 471 472 if (unlikely(msg->msg_controllen)) { 473 rc = tls_proccess_cmsg(sk, msg, &record_type); 474 if (rc) 475 goto out; 476 } 477 478 rc = tls_push_data(sk, &msg->msg_iter, size, 479 msg->msg_flags, record_type); 480 481 out: 482 release_sock(sk); 483 return rc; 484 } 485 486 int tls_device_sendpage(struct sock *sk, struct page *page, 487 int offset, size_t size, int flags) 488 { 489 struct iov_iter msg_iter; 490 char *kaddr = kmap(page); 491 struct kvec iov; 492 int rc; 493 494 if (flags & MSG_SENDPAGE_NOTLAST) 495 flags |= MSG_MORE; 496 497 lock_sock(sk); 498 499 if (flags & MSG_OOB) { 500 rc = -ENOTSUPP; 501 goto out; 502 } 503 504 iov.iov_base = kaddr + offset; 505 iov.iov_len = size; 506 iov_iter_kvec(&msg_iter, WRITE, &iov, 1, size); 507 rc = tls_push_data(sk, &msg_iter, size, 508 flags, TLS_RECORD_TYPE_DATA); 509 kunmap(page); 510 511 out: 512 release_sock(sk); 513 return rc; 514 } 515 516 struct tls_record_info *tls_get_record(struct tls_offload_context_tx *context, 517 u32 seq, u64 *p_record_sn) 518 { 519 u64 record_sn = context->hint_record_sn; 520 struct tls_record_info *info; 521 522 info = context->retransmit_hint; 523 if (!info || 524 before(seq, info->end_seq - info->len)) { 525 /* if retransmit_hint is irrelevant start 526 * from the beggining of the list 527 */ 528 info = list_first_entry(&context->records_list, 529 struct tls_record_info, list); 530 record_sn = context->unacked_record_sn; 531 } 532 533 list_for_each_entry_from(info, &context->records_list, list) { 534 if (before(seq, info->end_seq)) { 535 if (!context->retransmit_hint || 536 after(info->end_seq, 537 context->retransmit_hint->end_seq)) { 538 context->hint_record_sn = record_sn; 539 context->retransmit_hint = info; 540 } 541 *p_record_sn = record_sn; 542 return info; 543 } 544 record_sn++; 545 } 546 547 return NULL; 548 } 549 EXPORT_SYMBOL(tls_get_record); 550 551 static int tls_device_push_pending_record(struct sock *sk, int flags) 552 { 553 struct iov_iter msg_iter; 554 555 iov_iter_kvec(&msg_iter, WRITE, NULL, 0, 0); 556 return tls_push_data(sk, &msg_iter, 0, flags, TLS_RECORD_TYPE_DATA); 557 } 558 559 void tls_device_write_space(struct sock *sk, struct tls_context *ctx) 560 { 561 int rc = 0; 562 563 if (!sk->sk_write_pending && tls_is_partially_sent_record(ctx)) { 564 gfp_t sk_allocation = sk->sk_allocation; 565 566 sk->sk_allocation = GFP_ATOMIC; 567 rc = tls_push_partial_record(sk, ctx, 568 MSG_DONTWAIT | MSG_NOSIGNAL); 569 sk->sk_allocation = sk_allocation; 570 } 571 } 572 573 void handle_device_resync(struct sock *sk, u32 seq, u64 rcd_sn) 574 { 575 struct tls_context *tls_ctx = tls_get_ctx(sk); 576 struct net_device *netdev = tls_ctx->netdev; 577 struct tls_offload_context_rx *rx_ctx; 578 u32 is_req_pending; 579 s64 resync_req; 580 u32 req_seq; 581 582 if (tls_ctx->rx_conf != TLS_HW) 583 return; 584 585 rx_ctx = tls_offload_ctx_rx(tls_ctx); 586 resync_req = atomic64_read(&rx_ctx->resync_req); 587 req_seq = ntohl(resync_req >> 32) - ((u32)TLS_HEADER_SIZE - 1); 588 is_req_pending = resync_req; 589 590 if (unlikely(is_req_pending) && req_seq == seq && 591 atomic64_try_cmpxchg(&rx_ctx->resync_req, &resync_req, 0)) 592 netdev->tlsdev_ops->tls_dev_resync_rx(netdev, sk, 593 seq + TLS_HEADER_SIZE - 1, 594 rcd_sn); 595 } 596 597 static int tls_device_reencrypt(struct sock *sk, struct sk_buff *skb) 598 { 599 struct strp_msg *rxm = strp_msg(skb); 600 int err = 0, offset = rxm->offset, copy, nsg, data_len, pos; 601 struct sk_buff *skb_iter, *unused; 602 struct scatterlist sg[1]; 603 char *orig_buf, *buf; 604 605 orig_buf = kmalloc(rxm->full_len + TLS_HEADER_SIZE + 606 TLS_CIPHER_AES_GCM_128_IV_SIZE, sk->sk_allocation); 607 if (!orig_buf) 608 return -ENOMEM; 609 buf = orig_buf; 610 611 nsg = skb_cow_data(skb, 0, &unused); 612 if (unlikely(nsg < 0)) { 613 err = nsg; 614 goto free_buf; 615 } 616 617 sg_init_table(sg, 1); 618 sg_set_buf(&sg[0], buf, 619 rxm->full_len + TLS_HEADER_SIZE + 620 TLS_CIPHER_AES_GCM_128_IV_SIZE); 621 skb_copy_bits(skb, offset, buf, 622 TLS_HEADER_SIZE + TLS_CIPHER_AES_GCM_128_IV_SIZE); 623 624 /* We are interested only in the decrypted data not the auth */ 625 err = decrypt_skb(sk, skb, sg); 626 if (err != -EBADMSG) 627 goto free_buf; 628 else 629 err = 0; 630 631 data_len = rxm->full_len - TLS_CIPHER_AES_GCM_128_TAG_SIZE; 632 633 if (skb_pagelen(skb) > offset) { 634 copy = min_t(int, skb_pagelen(skb) - offset, data_len); 635 636 if (skb->decrypted) 637 skb_store_bits(skb, offset, buf, copy); 638 639 offset += copy; 640 buf += copy; 641 } 642 643 pos = skb_pagelen(skb); 644 skb_walk_frags(skb, skb_iter) { 645 int frag_pos; 646 647 /* Practically all frags must belong to msg if reencrypt 648 * is needed with current strparser and coalescing logic, 649 * but strparser may "get optimized", so let's be safe. 650 */ 651 if (pos + skb_iter->len <= offset) 652 goto done_with_frag; 653 if (pos >= data_len + rxm->offset) 654 break; 655 656 frag_pos = offset - pos; 657 copy = min_t(int, skb_iter->len - frag_pos, 658 data_len + rxm->offset - offset); 659 660 if (skb_iter->decrypted) 661 skb_store_bits(skb_iter, frag_pos, buf, copy); 662 663 offset += copy; 664 buf += copy; 665 done_with_frag: 666 pos += skb_iter->len; 667 } 668 669 free_buf: 670 kfree(orig_buf); 671 return err; 672 } 673 674 int tls_device_decrypted(struct sock *sk, struct sk_buff *skb) 675 { 676 struct tls_context *tls_ctx = tls_get_ctx(sk); 677 struct tls_offload_context_rx *ctx = tls_offload_ctx_rx(tls_ctx); 678 int is_decrypted = skb->decrypted; 679 int is_encrypted = !is_decrypted; 680 struct sk_buff *skb_iter; 681 682 /* Skip if it is already decrypted */ 683 if (ctx->sw.decrypted) 684 return 0; 685 686 /* Check if all the data is decrypted already */ 687 skb_walk_frags(skb, skb_iter) { 688 is_decrypted &= skb_iter->decrypted; 689 is_encrypted &= !skb_iter->decrypted; 690 } 691 692 ctx->sw.decrypted |= is_decrypted; 693 694 /* Return immedeatly if the record is either entirely plaintext or 695 * entirely ciphertext. Otherwise handle reencrypt partially decrypted 696 * record. 697 */ 698 return (is_encrypted || is_decrypted) ? 0 : 699 tls_device_reencrypt(sk, skb); 700 } 701 702 int tls_set_device_offload(struct sock *sk, struct tls_context *ctx) 703 { 704 u16 nonce_size, tag_size, iv_size, rec_seq_size; 705 struct tls_context *tls_ctx = tls_get_ctx(sk); 706 struct tls_prot_info *prot = &tls_ctx->prot_info; 707 struct tls_record_info *start_marker_record; 708 struct tls_offload_context_tx *offload_ctx; 709 struct tls_crypto_info *crypto_info; 710 struct net_device *netdev; 711 char *iv, *rec_seq; 712 struct sk_buff *skb; 713 int rc = -EINVAL; 714 __be64 rcd_sn; 715 716 if (!ctx) 717 goto out; 718 719 if (ctx->priv_ctx_tx) { 720 rc = -EEXIST; 721 goto out; 722 } 723 724 start_marker_record = kmalloc(sizeof(*start_marker_record), GFP_KERNEL); 725 if (!start_marker_record) { 726 rc = -ENOMEM; 727 goto out; 728 } 729 730 offload_ctx = kzalloc(TLS_OFFLOAD_CONTEXT_SIZE_TX, GFP_KERNEL); 731 if (!offload_ctx) { 732 rc = -ENOMEM; 733 goto free_marker_record; 734 } 735 736 crypto_info = &ctx->crypto_send.info; 737 switch (crypto_info->cipher_type) { 738 case TLS_CIPHER_AES_GCM_128: 739 nonce_size = TLS_CIPHER_AES_GCM_128_IV_SIZE; 740 tag_size = TLS_CIPHER_AES_GCM_128_TAG_SIZE; 741 iv_size = TLS_CIPHER_AES_GCM_128_IV_SIZE; 742 iv = ((struct tls12_crypto_info_aes_gcm_128 *)crypto_info)->iv; 743 rec_seq_size = TLS_CIPHER_AES_GCM_128_REC_SEQ_SIZE; 744 rec_seq = 745 ((struct tls12_crypto_info_aes_gcm_128 *)crypto_info)->rec_seq; 746 break; 747 default: 748 rc = -EINVAL; 749 goto free_offload_ctx; 750 } 751 752 prot->prepend_size = TLS_HEADER_SIZE + nonce_size; 753 prot->tag_size = tag_size; 754 prot->overhead_size = prot->prepend_size + prot->tag_size; 755 prot->iv_size = iv_size; 756 ctx->tx.iv = kmalloc(iv_size + TLS_CIPHER_AES_GCM_128_SALT_SIZE, 757 GFP_KERNEL); 758 if (!ctx->tx.iv) { 759 rc = -ENOMEM; 760 goto free_offload_ctx; 761 } 762 763 memcpy(ctx->tx.iv + TLS_CIPHER_AES_GCM_128_SALT_SIZE, iv, iv_size); 764 765 prot->rec_seq_size = rec_seq_size; 766 ctx->tx.rec_seq = kmemdup(rec_seq, rec_seq_size, GFP_KERNEL); 767 if (!ctx->tx.rec_seq) { 768 rc = -ENOMEM; 769 goto free_iv; 770 } 771 772 rc = tls_sw_fallback_init(sk, offload_ctx, crypto_info); 773 if (rc) 774 goto free_rec_seq; 775 776 /* start at rec_seq - 1 to account for the start marker record */ 777 memcpy(&rcd_sn, ctx->tx.rec_seq, sizeof(rcd_sn)); 778 offload_ctx->unacked_record_sn = be64_to_cpu(rcd_sn) - 1; 779 780 start_marker_record->end_seq = tcp_sk(sk)->write_seq; 781 start_marker_record->len = 0; 782 start_marker_record->num_frags = 0; 783 784 INIT_LIST_HEAD(&offload_ctx->records_list); 785 list_add_tail(&start_marker_record->list, &offload_ctx->records_list); 786 spin_lock_init(&offload_ctx->lock); 787 sg_init_table(offload_ctx->sg_tx_data, 788 ARRAY_SIZE(offload_ctx->sg_tx_data)); 789 790 clean_acked_data_enable(inet_csk(sk), &tls_icsk_clean_acked); 791 ctx->push_pending_record = tls_device_push_pending_record; 792 793 /* TLS offload is greatly simplified if we don't send 794 * SKBs where only part of the payload needs to be encrypted. 795 * So mark the last skb in the write queue as end of record. 796 */ 797 skb = tcp_write_queue_tail(sk); 798 if (skb) 799 TCP_SKB_CB(skb)->eor = 1; 800 801 /* We support starting offload on multiple sockets 802 * concurrently, so we only need a read lock here. 803 * This lock must precede get_netdev_for_sock to prevent races between 804 * NETDEV_DOWN and setsockopt. 805 */ 806 down_read(&device_offload_lock); 807 netdev = get_netdev_for_sock(sk); 808 if (!netdev) { 809 pr_err_ratelimited("%s: netdev not found\n", __func__); 810 rc = -EINVAL; 811 goto release_lock; 812 } 813 814 if (!(netdev->features & NETIF_F_HW_TLS_TX)) { 815 rc = -ENOTSUPP; 816 goto release_netdev; 817 } 818 819 /* Avoid offloading if the device is down 820 * We don't want to offload new flows after 821 * the NETDEV_DOWN event 822 */ 823 if (!(netdev->flags & IFF_UP)) { 824 rc = -EINVAL; 825 goto release_netdev; 826 } 827 828 ctx->priv_ctx_tx = offload_ctx; 829 rc = netdev->tlsdev_ops->tls_dev_add(netdev, sk, TLS_OFFLOAD_CTX_DIR_TX, 830 &ctx->crypto_send.info, 831 tcp_sk(sk)->write_seq); 832 if (rc) 833 goto release_netdev; 834 835 tls_device_attach(ctx, sk, netdev); 836 837 /* following this assignment tls_is_sk_tx_device_offloaded 838 * will return true and the context might be accessed 839 * by the netdev's xmit function. 840 */ 841 smp_store_release(&sk->sk_validate_xmit_skb, tls_validate_xmit_skb); 842 dev_put(netdev); 843 up_read(&device_offload_lock); 844 goto out; 845 846 release_netdev: 847 dev_put(netdev); 848 release_lock: 849 up_read(&device_offload_lock); 850 clean_acked_data_disable(inet_csk(sk)); 851 crypto_free_aead(offload_ctx->aead_send); 852 free_rec_seq: 853 kfree(ctx->tx.rec_seq); 854 free_iv: 855 kfree(ctx->tx.iv); 856 free_offload_ctx: 857 kfree(offload_ctx); 858 ctx->priv_ctx_tx = NULL; 859 free_marker_record: 860 kfree(start_marker_record); 861 out: 862 return rc; 863 } 864 865 int tls_set_device_offload_rx(struct sock *sk, struct tls_context *ctx) 866 { 867 struct tls_offload_context_rx *context; 868 struct net_device *netdev; 869 int rc = 0; 870 871 /* We support starting offload on multiple sockets 872 * concurrently, so we only need a read lock here. 873 * This lock must precede get_netdev_for_sock to prevent races between 874 * NETDEV_DOWN and setsockopt. 875 */ 876 down_read(&device_offload_lock); 877 netdev = get_netdev_for_sock(sk); 878 if (!netdev) { 879 pr_err_ratelimited("%s: netdev not found\n", __func__); 880 rc = -EINVAL; 881 goto release_lock; 882 } 883 884 if (!(netdev->features & NETIF_F_HW_TLS_RX)) { 885 pr_err_ratelimited("%s: netdev %s with no TLS offload\n", 886 __func__, netdev->name); 887 rc = -ENOTSUPP; 888 goto release_netdev; 889 } 890 891 /* Avoid offloading if the device is down 892 * We don't want to offload new flows after 893 * the NETDEV_DOWN event 894 */ 895 if (!(netdev->flags & IFF_UP)) { 896 rc = -EINVAL; 897 goto release_netdev; 898 } 899 900 context = kzalloc(TLS_OFFLOAD_CONTEXT_SIZE_RX, GFP_KERNEL); 901 if (!context) { 902 rc = -ENOMEM; 903 goto release_netdev; 904 } 905 906 ctx->priv_ctx_rx = context; 907 rc = tls_set_sw_offload(sk, ctx, 0); 908 if (rc) 909 goto release_ctx; 910 911 rc = netdev->tlsdev_ops->tls_dev_add(netdev, sk, TLS_OFFLOAD_CTX_DIR_RX, 912 &ctx->crypto_recv.info, 913 tcp_sk(sk)->copied_seq); 914 if (rc) { 915 pr_err_ratelimited("%s: The netdev has refused to offload this socket\n", 916 __func__); 917 goto free_sw_resources; 918 } 919 920 tls_device_attach(ctx, sk, netdev); 921 goto release_netdev; 922 923 free_sw_resources: 924 up_read(&device_offload_lock); 925 tls_sw_free_resources_rx(sk); 926 down_read(&device_offload_lock); 927 release_ctx: 928 ctx->priv_ctx_rx = NULL; 929 release_netdev: 930 dev_put(netdev); 931 release_lock: 932 up_read(&device_offload_lock); 933 return rc; 934 } 935 936 void tls_device_offload_cleanup_rx(struct sock *sk) 937 { 938 struct tls_context *tls_ctx = tls_get_ctx(sk); 939 struct net_device *netdev; 940 941 down_read(&device_offload_lock); 942 netdev = tls_ctx->netdev; 943 if (!netdev) 944 goto out; 945 946 if (!(netdev->features & NETIF_F_HW_TLS_RX)) { 947 pr_err_ratelimited("%s: device is missing NETIF_F_HW_TLS_RX cap\n", 948 __func__); 949 goto out; 950 } 951 952 netdev->tlsdev_ops->tls_dev_del(netdev, tls_ctx, 953 TLS_OFFLOAD_CTX_DIR_RX); 954 955 if (tls_ctx->tx_conf != TLS_HW) { 956 dev_put(netdev); 957 tls_ctx->netdev = NULL; 958 } 959 out: 960 up_read(&device_offload_lock); 961 tls_sw_release_resources_rx(sk); 962 } 963 964 static int tls_device_down(struct net_device *netdev) 965 { 966 struct tls_context *ctx, *tmp; 967 unsigned long flags; 968 LIST_HEAD(list); 969 970 /* Request a write lock to block new offload attempts */ 971 down_write(&device_offload_lock); 972 973 spin_lock_irqsave(&tls_device_lock, flags); 974 list_for_each_entry_safe(ctx, tmp, &tls_device_list, list) { 975 if (ctx->netdev != netdev || 976 !refcount_inc_not_zero(&ctx->refcount)) 977 continue; 978 979 list_move(&ctx->list, &list); 980 } 981 spin_unlock_irqrestore(&tls_device_lock, flags); 982 983 list_for_each_entry_safe(ctx, tmp, &list, list) { 984 if (ctx->tx_conf == TLS_HW) 985 netdev->tlsdev_ops->tls_dev_del(netdev, ctx, 986 TLS_OFFLOAD_CTX_DIR_TX); 987 if (ctx->rx_conf == TLS_HW) 988 netdev->tlsdev_ops->tls_dev_del(netdev, ctx, 989 TLS_OFFLOAD_CTX_DIR_RX); 990 ctx->netdev = NULL; 991 dev_put(netdev); 992 list_del_init(&ctx->list); 993 994 if (refcount_dec_and_test(&ctx->refcount)) 995 tls_device_free_ctx(ctx); 996 } 997 998 up_write(&device_offload_lock); 999 1000 flush_work(&tls_device_gc_work); 1001 1002 return NOTIFY_DONE; 1003 } 1004 1005 static int tls_dev_event(struct notifier_block *this, unsigned long event, 1006 void *ptr) 1007 { 1008 struct net_device *dev = netdev_notifier_info_to_dev(ptr); 1009 1010 if (!(dev->features & (NETIF_F_HW_TLS_RX | NETIF_F_HW_TLS_TX))) 1011 return NOTIFY_DONE; 1012 1013 switch (event) { 1014 case NETDEV_REGISTER: 1015 case NETDEV_FEAT_CHANGE: 1016 if ((dev->features & NETIF_F_HW_TLS_RX) && 1017 !dev->tlsdev_ops->tls_dev_resync_rx) 1018 return NOTIFY_BAD; 1019 1020 if (dev->tlsdev_ops && 1021 dev->tlsdev_ops->tls_dev_add && 1022 dev->tlsdev_ops->tls_dev_del) 1023 return NOTIFY_DONE; 1024 else 1025 return NOTIFY_BAD; 1026 case NETDEV_DOWN: 1027 return tls_device_down(dev); 1028 } 1029 return NOTIFY_DONE; 1030 } 1031 1032 static struct notifier_block tls_dev_notifier = { 1033 .notifier_call = tls_dev_event, 1034 }; 1035 1036 void __init tls_device_init(void) 1037 { 1038 register_netdevice_notifier(&tls_dev_notifier); 1039 } 1040 1041 void __exit tls_device_cleanup(void) 1042 { 1043 unregister_netdevice_notifier(&tls_dev_notifier); 1044 flush_work(&tls_device_gc_work); 1045 } 1046