1 // SPDX-License-Identifier: GPL-2.0-only 2 /* Copyright (C) 2023 Intel Corporation */ 3 4 #include "idpf.h" 5 #include "idpf_virtchnl.h" 6 7 /** 8 * idpf_buf_lifo_push - push a buffer pointer onto stack 9 * @stack: pointer to stack struct 10 * @buf: pointer to buf to push 11 * 12 * Returns 0 on success, negative on failure 13 **/ 14 static int idpf_buf_lifo_push(struct idpf_buf_lifo *stack, 15 struct idpf_tx_stash *buf) 16 { 17 if (unlikely(stack->top == stack->size)) 18 return -ENOSPC; 19 20 stack->bufs[stack->top++] = buf; 21 22 return 0; 23 } 24 25 /** 26 * idpf_buf_lifo_pop - pop a buffer pointer from stack 27 * @stack: pointer to stack struct 28 **/ 29 static struct idpf_tx_stash *idpf_buf_lifo_pop(struct idpf_buf_lifo *stack) 30 { 31 if (unlikely(!stack->top)) 32 return NULL; 33 34 return stack->bufs[--stack->top]; 35 } 36 37 /** 38 * idpf_tx_timeout - Respond to a Tx Hang 39 * @netdev: network interface device structure 40 * @txqueue: TX queue 41 */ 42 void idpf_tx_timeout(struct net_device *netdev, unsigned int txqueue) 43 { 44 struct idpf_adapter *adapter = idpf_netdev_to_adapter(netdev); 45 46 adapter->tx_timeout_count++; 47 48 netdev_err(netdev, "Detected Tx timeout: Count %d, Queue %d\n", 49 adapter->tx_timeout_count, txqueue); 50 if (!idpf_is_reset_in_prog(adapter)) { 51 set_bit(IDPF_HR_FUNC_RESET, adapter->flags); 52 queue_delayed_work(adapter->vc_event_wq, 53 &adapter->vc_event_task, 54 msecs_to_jiffies(10)); 55 } 56 } 57 58 /** 59 * idpf_tx_buf_rel - Release a Tx buffer 60 * @tx_q: the queue that owns the buffer 61 * @tx_buf: the buffer to free 62 */ 63 static void idpf_tx_buf_rel(struct idpf_queue *tx_q, struct idpf_tx_buf *tx_buf) 64 { 65 if (tx_buf->skb) { 66 if (dma_unmap_len(tx_buf, len)) 67 dma_unmap_single(tx_q->dev, 68 dma_unmap_addr(tx_buf, dma), 69 dma_unmap_len(tx_buf, len), 70 DMA_TO_DEVICE); 71 dev_kfree_skb_any(tx_buf->skb); 72 } else if (dma_unmap_len(tx_buf, len)) { 73 dma_unmap_page(tx_q->dev, 74 dma_unmap_addr(tx_buf, dma), 75 dma_unmap_len(tx_buf, len), 76 DMA_TO_DEVICE); 77 } 78 79 tx_buf->next_to_watch = NULL; 80 tx_buf->skb = NULL; 81 tx_buf->compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; 82 dma_unmap_len_set(tx_buf, len, 0); 83 } 84 85 /** 86 * idpf_tx_buf_rel_all - Free any empty Tx buffers 87 * @txq: queue to be cleaned 88 */ 89 static void idpf_tx_buf_rel_all(struct idpf_queue *txq) 90 { 91 u16 i; 92 93 /* Buffers already cleared, nothing to do */ 94 if (!txq->tx_buf) 95 return; 96 97 /* Free all the Tx buffer sk_buffs */ 98 for (i = 0; i < txq->desc_count; i++) 99 idpf_tx_buf_rel(txq, &txq->tx_buf[i]); 100 101 kfree(txq->tx_buf); 102 txq->tx_buf = NULL; 103 104 if (!txq->buf_stack.bufs) 105 return; 106 107 for (i = 0; i < txq->buf_stack.size; i++) 108 kfree(txq->buf_stack.bufs[i]); 109 110 kfree(txq->buf_stack.bufs); 111 txq->buf_stack.bufs = NULL; 112 } 113 114 /** 115 * idpf_tx_desc_rel - Free Tx resources per queue 116 * @txq: Tx descriptor ring for a specific queue 117 * @bufq: buffer q or completion q 118 * 119 * Free all transmit software resources 120 */ 121 static void idpf_tx_desc_rel(struct idpf_queue *txq, bool bufq) 122 { 123 if (bufq) 124 idpf_tx_buf_rel_all(txq); 125 126 if (!txq->desc_ring) 127 return; 128 129 dmam_free_coherent(txq->dev, txq->size, txq->desc_ring, txq->dma); 130 txq->desc_ring = NULL; 131 txq->next_to_alloc = 0; 132 txq->next_to_use = 0; 133 txq->next_to_clean = 0; 134 } 135 136 /** 137 * idpf_tx_desc_rel_all - Free Tx Resources for All Queues 138 * @vport: virtual port structure 139 * 140 * Free all transmit software resources 141 */ 142 static void idpf_tx_desc_rel_all(struct idpf_vport *vport) 143 { 144 int i, j; 145 146 if (!vport->txq_grps) 147 return; 148 149 for (i = 0; i < vport->num_txq_grp; i++) { 150 struct idpf_txq_group *txq_grp = &vport->txq_grps[i]; 151 152 for (j = 0; j < txq_grp->num_txq; j++) 153 idpf_tx_desc_rel(txq_grp->txqs[j], true); 154 155 if (idpf_is_queue_model_split(vport->txq_model)) 156 idpf_tx_desc_rel(txq_grp->complq, false); 157 } 158 } 159 160 /** 161 * idpf_tx_buf_alloc_all - Allocate memory for all buffer resources 162 * @tx_q: queue for which the buffers are allocated 163 * 164 * Returns 0 on success, negative on failure 165 */ 166 static int idpf_tx_buf_alloc_all(struct idpf_queue *tx_q) 167 { 168 int buf_size; 169 int i; 170 171 /* Allocate book keeping buffers only. Buffers to be supplied to HW 172 * are allocated by kernel network stack and received as part of skb 173 */ 174 buf_size = sizeof(struct idpf_tx_buf) * tx_q->desc_count; 175 tx_q->tx_buf = kzalloc(buf_size, GFP_KERNEL); 176 if (!tx_q->tx_buf) 177 return -ENOMEM; 178 179 /* Initialize tx_bufs with invalid completion tags */ 180 for (i = 0; i < tx_q->desc_count; i++) 181 tx_q->tx_buf[i].compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; 182 183 /* Initialize tx buf stack for out-of-order completions if 184 * flow scheduling offload is enabled 185 */ 186 tx_q->buf_stack.bufs = 187 kcalloc(tx_q->desc_count, sizeof(struct idpf_tx_stash *), 188 GFP_KERNEL); 189 if (!tx_q->buf_stack.bufs) 190 return -ENOMEM; 191 192 tx_q->buf_stack.size = tx_q->desc_count; 193 tx_q->buf_stack.top = tx_q->desc_count; 194 195 for (i = 0; i < tx_q->desc_count; i++) { 196 tx_q->buf_stack.bufs[i] = kzalloc(sizeof(*tx_q->buf_stack.bufs[i]), 197 GFP_KERNEL); 198 if (!tx_q->buf_stack.bufs[i]) 199 return -ENOMEM; 200 } 201 202 return 0; 203 } 204 205 /** 206 * idpf_tx_desc_alloc - Allocate the Tx descriptors 207 * @tx_q: the tx ring to set up 208 * @bufq: buffer or completion queue 209 * 210 * Returns 0 on success, negative on failure 211 */ 212 static int idpf_tx_desc_alloc(struct idpf_queue *tx_q, bool bufq) 213 { 214 struct device *dev = tx_q->dev; 215 u32 desc_sz; 216 int err; 217 218 if (bufq) { 219 err = idpf_tx_buf_alloc_all(tx_q); 220 if (err) 221 goto err_alloc; 222 223 desc_sz = sizeof(struct idpf_base_tx_desc); 224 } else { 225 desc_sz = sizeof(struct idpf_splitq_tx_compl_desc); 226 } 227 228 tx_q->size = tx_q->desc_count * desc_sz; 229 230 /* Allocate descriptors also round up to nearest 4K */ 231 tx_q->size = ALIGN(tx_q->size, 4096); 232 tx_q->desc_ring = dmam_alloc_coherent(dev, tx_q->size, &tx_q->dma, 233 GFP_KERNEL); 234 if (!tx_q->desc_ring) { 235 dev_err(dev, "Unable to allocate memory for the Tx descriptor ring, size=%d\n", 236 tx_q->size); 237 err = -ENOMEM; 238 goto err_alloc; 239 } 240 241 tx_q->next_to_alloc = 0; 242 tx_q->next_to_use = 0; 243 tx_q->next_to_clean = 0; 244 set_bit(__IDPF_Q_GEN_CHK, tx_q->flags); 245 246 return 0; 247 248 err_alloc: 249 idpf_tx_desc_rel(tx_q, bufq); 250 251 return err; 252 } 253 254 /** 255 * idpf_tx_desc_alloc_all - allocate all queues Tx resources 256 * @vport: virtual port private structure 257 * 258 * Returns 0 on success, negative on failure 259 */ 260 static int idpf_tx_desc_alloc_all(struct idpf_vport *vport) 261 { 262 struct device *dev = &vport->adapter->pdev->dev; 263 int err = 0; 264 int i, j; 265 266 /* Setup buffer queues. In single queue model buffer queues and 267 * completion queues will be same 268 */ 269 for (i = 0; i < vport->num_txq_grp; i++) { 270 for (j = 0; j < vport->txq_grps[i].num_txq; j++) { 271 struct idpf_queue *txq = vport->txq_grps[i].txqs[j]; 272 u8 gen_bits = 0; 273 u16 bufidx_mask; 274 275 err = idpf_tx_desc_alloc(txq, true); 276 if (err) { 277 dev_err(dev, "Allocation for Tx Queue %u failed\n", 278 i); 279 goto err_out; 280 } 281 282 if (!idpf_is_queue_model_split(vport->txq_model)) 283 continue; 284 285 txq->compl_tag_cur_gen = 0; 286 287 /* Determine the number of bits in the bufid 288 * mask and add one to get the start of the 289 * generation bits 290 */ 291 bufidx_mask = txq->desc_count - 1; 292 while (bufidx_mask >> 1) { 293 txq->compl_tag_gen_s++; 294 bufidx_mask = bufidx_mask >> 1; 295 } 296 txq->compl_tag_gen_s++; 297 298 gen_bits = IDPF_TX_SPLITQ_COMPL_TAG_WIDTH - 299 txq->compl_tag_gen_s; 300 txq->compl_tag_gen_max = GETMAXVAL(gen_bits); 301 302 /* Set bufid mask based on location of first 303 * gen bit; it cannot simply be the descriptor 304 * ring size-1 since we can have size values 305 * where not all of those bits are set. 306 */ 307 txq->compl_tag_bufid_m = 308 GETMAXVAL(txq->compl_tag_gen_s); 309 } 310 311 if (!idpf_is_queue_model_split(vport->txq_model)) 312 continue; 313 314 /* Setup completion queues */ 315 err = idpf_tx_desc_alloc(vport->txq_grps[i].complq, false); 316 if (err) { 317 dev_err(dev, "Allocation for Tx Completion Queue %u failed\n", 318 i); 319 goto err_out; 320 } 321 } 322 323 err_out: 324 if (err) 325 idpf_tx_desc_rel_all(vport); 326 327 return err; 328 } 329 330 /** 331 * idpf_rx_page_rel - Release an rx buffer page 332 * @rxq: the queue that owns the buffer 333 * @rx_buf: the buffer to free 334 */ 335 static void idpf_rx_page_rel(struct idpf_queue *rxq, struct idpf_rx_buf *rx_buf) 336 { 337 if (unlikely(!rx_buf->page)) 338 return; 339 340 page_pool_put_full_page(rxq->pp, rx_buf->page, false); 341 342 rx_buf->page = NULL; 343 rx_buf->page_offset = 0; 344 } 345 346 /** 347 * idpf_rx_hdr_buf_rel_all - Release header buffer memory 348 * @rxq: queue to use 349 */ 350 static void idpf_rx_hdr_buf_rel_all(struct idpf_queue *rxq) 351 { 352 struct idpf_adapter *adapter = rxq->vport->adapter; 353 354 dma_free_coherent(&adapter->pdev->dev, 355 rxq->desc_count * IDPF_HDR_BUF_SIZE, 356 rxq->rx_buf.hdr_buf_va, 357 rxq->rx_buf.hdr_buf_pa); 358 rxq->rx_buf.hdr_buf_va = NULL; 359 } 360 361 /** 362 * idpf_rx_buf_rel_all - Free all Rx buffer resources for a queue 363 * @rxq: queue to be cleaned 364 */ 365 static void idpf_rx_buf_rel_all(struct idpf_queue *rxq) 366 { 367 u16 i; 368 369 /* queue already cleared, nothing to do */ 370 if (!rxq->rx_buf.buf) 371 return; 372 373 /* Free all the bufs allocated and given to hw on Rx queue */ 374 for (i = 0; i < rxq->desc_count; i++) 375 idpf_rx_page_rel(rxq, &rxq->rx_buf.buf[i]); 376 377 if (rxq->rx_hsplit_en) 378 idpf_rx_hdr_buf_rel_all(rxq); 379 380 page_pool_destroy(rxq->pp); 381 rxq->pp = NULL; 382 383 kfree(rxq->rx_buf.buf); 384 rxq->rx_buf.buf = NULL; 385 } 386 387 /** 388 * idpf_rx_desc_rel - Free a specific Rx q resources 389 * @rxq: queue to clean the resources from 390 * @bufq: buffer q or completion q 391 * @q_model: single or split q model 392 * 393 * Free a specific rx queue resources 394 */ 395 static void idpf_rx_desc_rel(struct idpf_queue *rxq, bool bufq, s32 q_model) 396 { 397 if (!rxq) 398 return; 399 400 if (rxq->skb) { 401 dev_kfree_skb_any(rxq->skb); 402 rxq->skb = NULL; 403 } 404 405 if (bufq || !idpf_is_queue_model_split(q_model)) 406 idpf_rx_buf_rel_all(rxq); 407 408 rxq->next_to_alloc = 0; 409 rxq->next_to_clean = 0; 410 rxq->next_to_use = 0; 411 if (!rxq->desc_ring) 412 return; 413 414 dmam_free_coherent(rxq->dev, rxq->size, rxq->desc_ring, rxq->dma); 415 rxq->desc_ring = NULL; 416 } 417 418 /** 419 * idpf_rx_desc_rel_all - Free Rx Resources for All Queues 420 * @vport: virtual port structure 421 * 422 * Free all rx queues resources 423 */ 424 static void idpf_rx_desc_rel_all(struct idpf_vport *vport) 425 { 426 struct idpf_rxq_group *rx_qgrp; 427 u16 num_rxq; 428 int i, j; 429 430 if (!vport->rxq_grps) 431 return; 432 433 for (i = 0; i < vport->num_rxq_grp; i++) { 434 rx_qgrp = &vport->rxq_grps[i]; 435 436 if (!idpf_is_queue_model_split(vport->rxq_model)) { 437 for (j = 0; j < rx_qgrp->singleq.num_rxq; j++) 438 idpf_rx_desc_rel(rx_qgrp->singleq.rxqs[j], 439 false, vport->rxq_model); 440 continue; 441 } 442 443 num_rxq = rx_qgrp->splitq.num_rxq_sets; 444 for (j = 0; j < num_rxq; j++) 445 idpf_rx_desc_rel(&rx_qgrp->splitq.rxq_sets[j]->rxq, 446 false, vport->rxq_model); 447 448 if (!rx_qgrp->splitq.bufq_sets) 449 continue; 450 451 for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { 452 struct idpf_bufq_set *bufq_set = 453 &rx_qgrp->splitq.bufq_sets[j]; 454 455 idpf_rx_desc_rel(&bufq_set->bufq, true, 456 vport->rxq_model); 457 } 458 } 459 } 460 461 /** 462 * idpf_rx_buf_hw_update - Store the new tail and head values 463 * @rxq: queue to bump 464 * @val: new head index 465 */ 466 void idpf_rx_buf_hw_update(struct idpf_queue *rxq, u32 val) 467 { 468 rxq->next_to_use = val; 469 470 if (unlikely(!rxq->tail)) 471 return; 472 473 /* writel has an implicit memory barrier */ 474 writel(val, rxq->tail); 475 } 476 477 /** 478 * idpf_rx_hdr_buf_alloc_all - Allocate memory for header buffers 479 * @rxq: ring to use 480 * 481 * Returns 0 on success, negative on failure. 482 */ 483 static int idpf_rx_hdr_buf_alloc_all(struct idpf_queue *rxq) 484 { 485 struct idpf_adapter *adapter = rxq->vport->adapter; 486 487 rxq->rx_buf.hdr_buf_va = 488 dma_alloc_coherent(&adapter->pdev->dev, 489 IDPF_HDR_BUF_SIZE * rxq->desc_count, 490 &rxq->rx_buf.hdr_buf_pa, 491 GFP_KERNEL); 492 if (!rxq->rx_buf.hdr_buf_va) 493 return -ENOMEM; 494 495 return 0; 496 } 497 498 /** 499 * idpf_rx_post_buf_refill - Post buffer id to refill queue 500 * @refillq: refill queue to post to 501 * @buf_id: buffer id to post 502 */ 503 static void idpf_rx_post_buf_refill(struct idpf_sw_queue *refillq, u16 buf_id) 504 { 505 u16 nta = refillq->next_to_alloc; 506 507 /* store the buffer ID and the SW maintained GEN bit to the refillq */ 508 refillq->ring[nta] = 509 FIELD_PREP(IDPF_RX_BI_BUFID_M, buf_id) | 510 FIELD_PREP(IDPF_RX_BI_GEN_M, 511 test_bit(__IDPF_Q_GEN_CHK, refillq->flags)); 512 513 if (unlikely(++nta == refillq->desc_count)) { 514 nta = 0; 515 change_bit(__IDPF_Q_GEN_CHK, refillq->flags); 516 } 517 refillq->next_to_alloc = nta; 518 } 519 520 /** 521 * idpf_rx_post_buf_desc - Post buffer to bufq descriptor ring 522 * @bufq: buffer queue to post to 523 * @buf_id: buffer id to post 524 * 525 * Returns false if buffer could not be allocated, true otherwise. 526 */ 527 static bool idpf_rx_post_buf_desc(struct idpf_queue *bufq, u16 buf_id) 528 { 529 struct virtchnl2_splitq_rx_buf_desc *splitq_rx_desc = NULL; 530 u16 nta = bufq->next_to_alloc; 531 struct idpf_rx_buf *buf; 532 dma_addr_t addr; 533 534 splitq_rx_desc = IDPF_SPLITQ_RX_BUF_DESC(bufq, nta); 535 buf = &bufq->rx_buf.buf[buf_id]; 536 537 if (bufq->rx_hsplit_en) { 538 splitq_rx_desc->hdr_addr = 539 cpu_to_le64(bufq->rx_buf.hdr_buf_pa + 540 (u32)buf_id * IDPF_HDR_BUF_SIZE); 541 } 542 543 addr = idpf_alloc_page(bufq->pp, buf, bufq->rx_buf_size); 544 if (unlikely(addr == DMA_MAPPING_ERROR)) 545 return false; 546 547 splitq_rx_desc->pkt_addr = cpu_to_le64(addr); 548 splitq_rx_desc->qword0.buf_id = cpu_to_le16(buf_id); 549 550 nta++; 551 if (unlikely(nta == bufq->desc_count)) 552 nta = 0; 553 bufq->next_to_alloc = nta; 554 555 return true; 556 } 557 558 /** 559 * idpf_rx_post_init_bufs - Post initial buffers to bufq 560 * @bufq: buffer queue to post working set to 561 * @working_set: number of buffers to put in working set 562 * 563 * Returns true if @working_set bufs were posted successfully, false otherwise. 564 */ 565 static bool idpf_rx_post_init_bufs(struct idpf_queue *bufq, u16 working_set) 566 { 567 int i; 568 569 for (i = 0; i < working_set; i++) { 570 if (!idpf_rx_post_buf_desc(bufq, i)) 571 return false; 572 } 573 574 idpf_rx_buf_hw_update(bufq, 575 bufq->next_to_alloc & ~(bufq->rx_buf_stride - 1)); 576 577 return true; 578 } 579 580 /** 581 * idpf_rx_create_page_pool - Create a page pool 582 * @rxbufq: RX queue to create page pool for 583 * 584 * Returns &page_pool on success, casted -errno on failure 585 */ 586 static struct page_pool *idpf_rx_create_page_pool(struct idpf_queue *rxbufq) 587 { 588 struct page_pool_params pp = { 589 .flags = PP_FLAG_DMA_MAP | PP_FLAG_DMA_SYNC_DEV, 590 .order = 0, 591 .pool_size = rxbufq->desc_count, 592 .nid = NUMA_NO_NODE, 593 .dev = rxbufq->vport->netdev->dev.parent, 594 .max_len = PAGE_SIZE, 595 .dma_dir = DMA_FROM_DEVICE, 596 .offset = 0, 597 }; 598 599 return page_pool_create(&pp); 600 } 601 602 /** 603 * idpf_rx_buf_alloc_all - Allocate memory for all buffer resources 604 * @rxbufq: queue for which the buffers are allocated; equivalent to 605 * rxq when operating in singleq mode 606 * 607 * Returns 0 on success, negative on failure 608 */ 609 static int idpf_rx_buf_alloc_all(struct idpf_queue *rxbufq) 610 { 611 int err = 0; 612 613 /* Allocate book keeping buffers */ 614 rxbufq->rx_buf.buf = kcalloc(rxbufq->desc_count, 615 sizeof(struct idpf_rx_buf), GFP_KERNEL); 616 if (!rxbufq->rx_buf.buf) { 617 err = -ENOMEM; 618 goto rx_buf_alloc_all_out; 619 } 620 621 if (rxbufq->rx_hsplit_en) { 622 err = idpf_rx_hdr_buf_alloc_all(rxbufq); 623 if (err) 624 goto rx_buf_alloc_all_out; 625 } 626 627 /* Allocate buffers to be given to HW. */ 628 if (idpf_is_queue_model_split(rxbufq->vport->rxq_model)) { 629 int working_set = IDPF_RX_BUFQ_WORKING_SET(rxbufq); 630 631 if (!idpf_rx_post_init_bufs(rxbufq, working_set)) 632 err = -ENOMEM; 633 } else { 634 if (idpf_rx_singleq_buf_hw_alloc_all(rxbufq, 635 rxbufq->desc_count - 1)) 636 err = -ENOMEM; 637 } 638 639 rx_buf_alloc_all_out: 640 if (err) 641 idpf_rx_buf_rel_all(rxbufq); 642 643 return err; 644 } 645 646 /** 647 * idpf_rx_bufs_init - Initialize page pool, allocate rx bufs, and post to HW 648 * @rxbufq: RX queue to create page pool for 649 * 650 * Returns 0 on success, negative on failure 651 */ 652 static int idpf_rx_bufs_init(struct idpf_queue *rxbufq) 653 { 654 struct page_pool *pool; 655 656 pool = idpf_rx_create_page_pool(rxbufq); 657 if (IS_ERR(pool)) 658 return PTR_ERR(pool); 659 660 rxbufq->pp = pool; 661 662 return idpf_rx_buf_alloc_all(rxbufq); 663 } 664 665 /** 666 * idpf_rx_bufs_init_all - Initialize all RX bufs 667 * @vport: virtual port struct 668 * 669 * Returns 0 on success, negative on failure 670 */ 671 int idpf_rx_bufs_init_all(struct idpf_vport *vport) 672 { 673 struct idpf_rxq_group *rx_qgrp; 674 struct idpf_queue *q; 675 int i, j, err; 676 677 for (i = 0; i < vport->num_rxq_grp; i++) { 678 rx_qgrp = &vport->rxq_grps[i]; 679 680 /* Allocate bufs for the rxq itself in singleq */ 681 if (!idpf_is_queue_model_split(vport->rxq_model)) { 682 int num_rxq = rx_qgrp->singleq.num_rxq; 683 684 for (j = 0; j < num_rxq; j++) { 685 q = rx_qgrp->singleq.rxqs[j]; 686 err = idpf_rx_bufs_init(q); 687 if (err) 688 return err; 689 } 690 691 continue; 692 } 693 694 /* Otherwise, allocate bufs for the buffer queues */ 695 for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { 696 q = &rx_qgrp->splitq.bufq_sets[j].bufq; 697 err = idpf_rx_bufs_init(q); 698 if (err) 699 return err; 700 } 701 } 702 703 return 0; 704 } 705 706 /** 707 * idpf_rx_desc_alloc - Allocate queue Rx resources 708 * @rxq: Rx queue for which the resources are setup 709 * @bufq: buffer or completion queue 710 * @q_model: single or split queue model 711 * 712 * Returns 0 on success, negative on failure 713 */ 714 static int idpf_rx_desc_alloc(struct idpf_queue *rxq, bool bufq, s32 q_model) 715 { 716 struct device *dev = rxq->dev; 717 718 if (bufq) 719 rxq->size = rxq->desc_count * 720 sizeof(struct virtchnl2_splitq_rx_buf_desc); 721 else 722 rxq->size = rxq->desc_count * 723 sizeof(union virtchnl2_rx_desc); 724 725 /* Allocate descriptors and also round up to nearest 4K */ 726 rxq->size = ALIGN(rxq->size, 4096); 727 rxq->desc_ring = dmam_alloc_coherent(dev, rxq->size, 728 &rxq->dma, GFP_KERNEL); 729 if (!rxq->desc_ring) { 730 dev_err(dev, "Unable to allocate memory for the Rx descriptor ring, size=%d\n", 731 rxq->size); 732 return -ENOMEM; 733 } 734 735 rxq->next_to_alloc = 0; 736 rxq->next_to_clean = 0; 737 rxq->next_to_use = 0; 738 set_bit(__IDPF_Q_GEN_CHK, rxq->flags); 739 740 return 0; 741 } 742 743 /** 744 * idpf_rx_desc_alloc_all - allocate all RX queues resources 745 * @vport: virtual port structure 746 * 747 * Returns 0 on success, negative on failure 748 */ 749 static int idpf_rx_desc_alloc_all(struct idpf_vport *vport) 750 { 751 struct device *dev = &vport->adapter->pdev->dev; 752 struct idpf_rxq_group *rx_qgrp; 753 struct idpf_queue *q; 754 int i, j, err; 755 u16 num_rxq; 756 757 for (i = 0; i < vport->num_rxq_grp; i++) { 758 rx_qgrp = &vport->rxq_grps[i]; 759 if (idpf_is_queue_model_split(vport->rxq_model)) 760 num_rxq = rx_qgrp->splitq.num_rxq_sets; 761 else 762 num_rxq = rx_qgrp->singleq.num_rxq; 763 764 for (j = 0; j < num_rxq; j++) { 765 if (idpf_is_queue_model_split(vport->rxq_model)) 766 q = &rx_qgrp->splitq.rxq_sets[j]->rxq; 767 else 768 q = rx_qgrp->singleq.rxqs[j]; 769 err = idpf_rx_desc_alloc(q, false, vport->rxq_model); 770 if (err) { 771 dev_err(dev, "Memory allocation for Rx Queue %u failed\n", 772 i); 773 goto err_out; 774 } 775 } 776 777 if (!idpf_is_queue_model_split(vport->rxq_model)) 778 continue; 779 780 for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { 781 q = &rx_qgrp->splitq.bufq_sets[j].bufq; 782 err = idpf_rx_desc_alloc(q, true, vport->rxq_model); 783 if (err) { 784 dev_err(dev, "Memory allocation for Rx Buffer Queue %u failed\n", 785 i); 786 goto err_out; 787 } 788 } 789 } 790 791 return 0; 792 793 err_out: 794 idpf_rx_desc_rel_all(vport); 795 796 return err; 797 } 798 799 /** 800 * idpf_txq_group_rel - Release all resources for txq groups 801 * @vport: vport to release txq groups on 802 */ 803 static void idpf_txq_group_rel(struct idpf_vport *vport) 804 { 805 int i, j; 806 807 if (!vport->txq_grps) 808 return; 809 810 for (i = 0; i < vport->num_txq_grp; i++) { 811 struct idpf_txq_group *txq_grp = &vport->txq_grps[i]; 812 813 for (j = 0; j < txq_grp->num_txq; j++) { 814 kfree(txq_grp->txqs[j]); 815 txq_grp->txqs[j] = NULL; 816 } 817 kfree(txq_grp->complq); 818 txq_grp->complq = NULL; 819 } 820 kfree(vport->txq_grps); 821 vport->txq_grps = NULL; 822 } 823 824 /** 825 * idpf_rxq_sw_queue_rel - Release software queue resources 826 * @rx_qgrp: rx queue group with software queues 827 */ 828 static void idpf_rxq_sw_queue_rel(struct idpf_rxq_group *rx_qgrp) 829 { 830 int i, j; 831 832 for (i = 0; i < rx_qgrp->vport->num_bufqs_per_qgrp; i++) { 833 struct idpf_bufq_set *bufq_set = &rx_qgrp->splitq.bufq_sets[i]; 834 835 for (j = 0; j < bufq_set->num_refillqs; j++) { 836 kfree(bufq_set->refillqs[j].ring); 837 bufq_set->refillqs[j].ring = NULL; 838 } 839 kfree(bufq_set->refillqs); 840 bufq_set->refillqs = NULL; 841 } 842 } 843 844 /** 845 * idpf_rxq_group_rel - Release all resources for rxq groups 846 * @vport: vport to release rxq groups on 847 */ 848 static void idpf_rxq_group_rel(struct idpf_vport *vport) 849 { 850 int i; 851 852 if (!vport->rxq_grps) 853 return; 854 855 for (i = 0; i < vport->num_rxq_grp; i++) { 856 struct idpf_rxq_group *rx_qgrp = &vport->rxq_grps[i]; 857 u16 num_rxq; 858 int j; 859 860 if (idpf_is_queue_model_split(vport->rxq_model)) { 861 num_rxq = rx_qgrp->splitq.num_rxq_sets; 862 for (j = 0; j < num_rxq; j++) { 863 kfree(rx_qgrp->splitq.rxq_sets[j]); 864 rx_qgrp->splitq.rxq_sets[j] = NULL; 865 } 866 867 idpf_rxq_sw_queue_rel(rx_qgrp); 868 kfree(rx_qgrp->splitq.bufq_sets); 869 rx_qgrp->splitq.bufq_sets = NULL; 870 } else { 871 num_rxq = rx_qgrp->singleq.num_rxq; 872 for (j = 0; j < num_rxq; j++) { 873 kfree(rx_qgrp->singleq.rxqs[j]); 874 rx_qgrp->singleq.rxqs[j] = NULL; 875 } 876 } 877 } 878 kfree(vport->rxq_grps); 879 vport->rxq_grps = NULL; 880 } 881 882 /** 883 * idpf_vport_queue_grp_rel_all - Release all queue groups 884 * @vport: vport to release queue groups for 885 */ 886 static void idpf_vport_queue_grp_rel_all(struct idpf_vport *vport) 887 { 888 idpf_txq_group_rel(vport); 889 idpf_rxq_group_rel(vport); 890 } 891 892 /** 893 * idpf_vport_queues_rel - Free memory for all queues 894 * @vport: virtual port 895 * 896 * Free the memory allocated for queues associated to a vport 897 */ 898 void idpf_vport_queues_rel(struct idpf_vport *vport) 899 { 900 idpf_tx_desc_rel_all(vport); 901 idpf_rx_desc_rel_all(vport); 902 idpf_vport_queue_grp_rel_all(vport); 903 904 kfree(vport->txqs); 905 vport->txqs = NULL; 906 } 907 908 /** 909 * idpf_vport_init_fast_path_txqs - Initialize fast path txq array 910 * @vport: vport to init txqs on 911 * 912 * We get a queue index from skb->queue_mapping and we need a fast way to 913 * dereference the queue from queue groups. This allows us to quickly pull a 914 * txq based on a queue index. 915 * 916 * Returns 0 on success, negative on failure 917 */ 918 static int idpf_vport_init_fast_path_txqs(struct idpf_vport *vport) 919 { 920 int i, j, k = 0; 921 922 vport->txqs = kcalloc(vport->num_txq, sizeof(struct idpf_queue *), 923 GFP_KERNEL); 924 925 if (!vport->txqs) 926 return -ENOMEM; 927 928 for (i = 0; i < vport->num_txq_grp; i++) { 929 struct idpf_txq_group *tx_grp = &vport->txq_grps[i]; 930 931 for (j = 0; j < tx_grp->num_txq; j++, k++) { 932 vport->txqs[k] = tx_grp->txqs[j]; 933 vport->txqs[k]->idx = k; 934 } 935 } 936 937 return 0; 938 } 939 940 /** 941 * idpf_vport_init_num_qs - Initialize number of queues 942 * @vport: vport to initialize queues 943 * @vport_msg: data to be filled into vport 944 */ 945 void idpf_vport_init_num_qs(struct idpf_vport *vport, 946 struct virtchnl2_create_vport *vport_msg) 947 { 948 struct idpf_vport_user_config_data *config_data; 949 u16 idx = vport->idx; 950 951 config_data = &vport->adapter->vport_config[idx]->user_config; 952 vport->num_txq = le16_to_cpu(vport_msg->num_tx_q); 953 vport->num_rxq = le16_to_cpu(vport_msg->num_rx_q); 954 /* number of txqs and rxqs in config data will be zeros only in the 955 * driver load path and we dont update them there after 956 */ 957 if (!config_data->num_req_tx_qs && !config_data->num_req_rx_qs) { 958 config_data->num_req_tx_qs = le16_to_cpu(vport_msg->num_tx_q); 959 config_data->num_req_rx_qs = le16_to_cpu(vport_msg->num_rx_q); 960 } 961 962 if (idpf_is_queue_model_split(vport->txq_model)) 963 vport->num_complq = le16_to_cpu(vport_msg->num_tx_complq); 964 if (idpf_is_queue_model_split(vport->rxq_model)) 965 vport->num_bufq = le16_to_cpu(vport_msg->num_rx_bufq); 966 967 /* Adjust number of buffer queues per Rx queue group. */ 968 if (!idpf_is_queue_model_split(vport->rxq_model)) { 969 vport->num_bufqs_per_qgrp = 0; 970 vport->bufq_size[0] = IDPF_RX_BUF_2048; 971 972 return; 973 } 974 975 vport->num_bufqs_per_qgrp = IDPF_MAX_BUFQS_PER_RXQ_GRP; 976 /* Bufq[0] default buffer size is 4K 977 * Bufq[1] default buffer size is 2K 978 */ 979 vport->bufq_size[0] = IDPF_RX_BUF_4096; 980 vport->bufq_size[1] = IDPF_RX_BUF_2048; 981 } 982 983 /** 984 * idpf_vport_calc_num_q_desc - Calculate number of queue groups 985 * @vport: vport to calculate q groups for 986 */ 987 void idpf_vport_calc_num_q_desc(struct idpf_vport *vport) 988 { 989 struct idpf_vport_user_config_data *config_data; 990 int num_bufqs = vport->num_bufqs_per_qgrp; 991 u32 num_req_txq_desc, num_req_rxq_desc; 992 u16 idx = vport->idx; 993 int i; 994 995 config_data = &vport->adapter->vport_config[idx]->user_config; 996 num_req_txq_desc = config_data->num_req_txq_desc; 997 num_req_rxq_desc = config_data->num_req_rxq_desc; 998 999 vport->complq_desc_count = 0; 1000 if (num_req_txq_desc) { 1001 vport->txq_desc_count = num_req_txq_desc; 1002 if (idpf_is_queue_model_split(vport->txq_model)) { 1003 vport->complq_desc_count = num_req_txq_desc; 1004 if (vport->complq_desc_count < IDPF_MIN_TXQ_COMPLQ_DESC) 1005 vport->complq_desc_count = 1006 IDPF_MIN_TXQ_COMPLQ_DESC; 1007 } 1008 } else { 1009 vport->txq_desc_count = IDPF_DFLT_TX_Q_DESC_COUNT; 1010 if (idpf_is_queue_model_split(vport->txq_model)) 1011 vport->complq_desc_count = 1012 IDPF_DFLT_TX_COMPLQ_DESC_COUNT; 1013 } 1014 1015 if (num_req_rxq_desc) 1016 vport->rxq_desc_count = num_req_rxq_desc; 1017 else 1018 vport->rxq_desc_count = IDPF_DFLT_RX_Q_DESC_COUNT; 1019 1020 for (i = 0; i < num_bufqs; i++) { 1021 if (!vport->bufq_desc_count[i]) 1022 vport->bufq_desc_count[i] = 1023 IDPF_RX_BUFQ_DESC_COUNT(vport->rxq_desc_count, 1024 num_bufqs); 1025 } 1026 } 1027 1028 /** 1029 * idpf_vport_calc_total_qs - Calculate total number of queues 1030 * @adapter: private data struct 1031 * @vport_idx: vport idx to retrieve vport pointer 1032 * @vport_msg: message to fill with data 1033 * @max_q: vport max queue info 1034 * 1035 * Return 0 on success, error value on failure. 1036 */ 1037 int idpf_vport_calc_total_qs(struct idpf_adapter *adapter, u16 vport_idx, 1038 struct virtchnl2_create_vport *vport_msg, 1039 struct idpf_vport_max_q *max_q) 1040 { 1041 int dflt_splitq_txq_grps = 0, dflt_singleq_txqs = 0; 1042 int dflt_splitq_rxq_grps = 0, dflt_singleq_rxqs = 0; 1043 u16 num_req_tx_qs = 0, num_req_rx_qs = 0; 1044 struct idpf_vport_config *vport_config; 1045 u16 num_txq_grps, num_rxq_grps; 1046 u32 num_qs; 1047 1048 vport_config = adapter->vport_config[vport_idx]; 1049 if (vport_config) { 1050 num_req_tx_qs = vport_config->user_config.num_req_tx_qs; 1051 num_req_rx_qs = vport_config->user_config.num_req_rx_qs; 1052 } else { 1053 int num_cpus; 1054 1055 /* Restrict num of queues to cpus online as a default 1056 * configuration to give best performance. User can always 1057 * override to a max number of queues via ethtool. 1058 */ 1059 num_cpus = num_online_cpus(); 1060 1061 dflt_splitq_txq_grps = min_t(int, max_q->max_txq, num_cpus); 1062 dflt_singleq_txqs = min_t(int, max_q->max_txq, num_cpus); 1063 dflt_splitq_rxq_grps = min_t(int, max_q->max_rxq, num_cpus); 1064 dflt_singleq_rxqs = min_t(int, max_q->max_rxq, num_cpus); 1065 } 1066 1067 if (idpf_is_queue_model_split(le16_to_cpu(vport_msg->txq_model))) { 1068 num_txq_grps = num_req_tx_qs ? num_req_tx_qs : dflt_splitq_txq_grps; 1069 vport_msg->num_tx_complq = cpu_to_le16(num_txq_grps * 1070 IDPF_COMPLQ_PER_GROUP); 1071 vport_msg->num_tx_q = cpu_to_le16(num_txq_grps * 1072 IDPF_DFLT_SPLITQ_TXQ_PER_GROUP); 1073 } else { 1074 num_txq_grps = IDPF_DFLT_SINGLEQ_TX_Q_GROUPS; 1075 num_qs = num_txq_grps * (num_req_tx_qs ? num_req_tx_qs : 1076 dflt_singleq_txqs); 1077 vport_msg->num_tx_q = cpu_to_le16(num_qs); 1078 vport_msg->num_tx_complq = 0; 1079 } 1080 if (idpf_is_queue_model_split(le16_to_cpu(vport_msg->rxq_model))) { 1081 num_rxq_grps = num_req_rx_qs ? num_req_rx_qs : dflt_splitq_rxq_grps; 1082 vport_msg->num_rx_bufq = cpu_to_le16(num_rxq_grps * 1083 IDPF_MAX_BUFQS_PER_RXQ_GRP); 1084 vport_msg->num_rx_q = cpu_to_le16(num_rxq_grps * 1085 IDPF_DFLT_SPLITQ_RXQ_PER_GROUP); 1086 } else { 1087 num_rxq_grps = IDPF_DFLT_SINGLEQ_RX_Q_GROUPS; 1088 num_qs = num_rxq_grps * (num_req_rx_qs ? num_req_rx_qs : 1089 dflt_singleq_rxqs); 1090 vport_msg->num_rx_q = cpu_to_le16(num_qs); 1091 vport_msg->num_rx_bufq = 0; 1092 } 1093 1094 return 0; 1095 } 1096 1097 /** 1098 * idpf_vport_calc_num_q_groups - Calculate number of queue groups 1099 * @vport: vport to calculate q groups for 1100 */ 1101 void idpf_vport_calc_num_q_groups(struct idpf_vport *vport) 1102 { 1103 if (idpf_is_queue_model_split(vport->txq_model)) 1104 vport->num_txq_grp = vport->num_txq; 1105 else 1106 vport->num_txq_grp = IDPF_DFLT_SINGLEQ_TX_Q_GROUPS; 1107 1108 if (idpf_is_queue_model_split(vport->rxq_model)) 1109 vport->num_rxq_grp = vport->num_rxq; 1110 else 1111 vport->num_rxq_grp = IDPF_DFLT_SINGLEQ_RX_Q_GROUPS; 1112 } 1113 1114 /** 1115 * idpf_vport_calc_numq_per_grp - Calculate number of queues per group 1116 * @vport: vport to calculate queues for 1117 * @num_txq: return parameter for number of TX queues 1118 * @num_rxq: return parameter for number of RX queues 1119 */ 1120 static void idpf_vport_calc_numq_per_grp(struct idpf_vport *vport, 1121 u16 *num_txq, u16 *num_rxq) 1122 { 1123 if (idpf_is_queue_model_split(vport->txq_model)) 1124 *num_txq = IDPF_DFLT_SPLITQ_TXQ_PER_GROUP; 1125 else 1126 *num_txq = vport->num_txq; 1127 1128 if (idpf_is_queue_model_split(vport->rxq_model)) 1129 *num_rxq = IDPF_DFLT_SPLITQ_RXQ_PER_GROUP; 1130 else 1131 *num_rxq = vport->num_rxq; 1132 } 1133 1134 /** 1135 * idpf_rxq_set_descids - set the descids supported by this queue 1136 * @vport: virtual port data structure 1137 * @q: rx queue for which descids are set 1138 * 1139 */ 1140 static void idpf_rxq_set_descids(struct idpf_vport *vport, struct idpf_queue *q) 1141 { 1142 if (vport->rxq_model == VIRTCHNL2_QUEUE_MODEL_SPLIT) { 1143 q->rxdids = VIRTCHNL2_RXDID_2_FLEX_SPLITQ_M; 1144 } else { 1145 if (vport->base_rxd) 1146 q->rxdids = VIRTCHNL2_RXDID_1_32B_BASE_M; 1147 else 1148 q->rxdids = VIRTCHNL2_RXDID_2_FLEX_SQ_NIC_M; 1149 } 1150 } 1151 1152 /** 1153 * idpf_txq_group_alloc - Allocate all txq group resources 1154 * @vport: vport to allocate txq groups for 1155 * @num_txq: number of txqs to allocate for each group 1156 * 1157 * Returns 0 on success, negative on failure 1158 */ 1159 static int idpf_txq_group_alloc(struct idpf_vport *vport, u16 num_txq) 1160 { 1161 bool flow_sch_en; 1162 int err, i; 1163 1164 vport->txq_grps = kcalloc(vport->num_txq_grp, 1165 sizeof(*vport->txq_grps), GFP_KERNEL); 1166 if (!vport->txq_grps) 1167 return -ENOMEM; 1168 1169 flow_sch_en = !idpf_is_cap_ena(vport->adapter, IDPF_OTHER_CAPS, 1170 VIRTCHNL2_CAP_SPLITQ_QSCHED); 1171 1172 for (i = 0; i < vport->num_txq_grp; i++) { 1173 struct idpf_txq_group *tx_qgrp = &vport->txq_grps[i]; 1174 struct idpf_adapter *adapter = vport->adapter; 1175 int j; 1176 1177 tx_qgrp->vport = vport; 1178 tx_qgrp->num_txq = num_txq; 1179 1180 for (j = 0; j < tx_qgrp->num_txq; j++) { 1181 tx_qgrp->txqs[j] = kzalloc(sizeof(*tx_qgrp->txqs[j]), 1182 GFP_KERNEL); 1183 if (!tx_qgrp->txqs[j]) { 1184 err = -ENOMEM; 1185 goto err_alloc; 1186 } 1187 } 1188 1189 for (j = 0; j < tx_qgrp->num_txq; j++) { 1190 struct idpf_queue *q = tx_qgrp->txqs[j]; 1191 1192 q->dev = &adapter->pdev->dev; 1193 q->desc_count = vport->txq_desc_count; 1194 q->tx_max_bufs = idpf_get_max_tx_bufs(adapter); 1195 q->tx_min_pkt_len = idpf_get_min_tx_pkt_len(adapter); 1196 q->vport = vport; 1197 q->txq_grp = tx_qgrp; 1198 hash_init(q->sched_buf_hash); 1199 1200 if (flow_sch_en) 1201 set_bit(__IDPF_Q_FLOW_SCH_EN, q->flags); 1202 } 1203 1204 if (!idpf_is_queue_model_split(vport->txq_model)) 1205 continue; 1206 1207 tx_qgrp->complq = kcalloc(IDPF_COMPLQ_PER_GROUP, 1208 sizeof(*tx_qgrp->complq), 1209 GFP_KERNEL); 1210 if (!tx_qgrp->complq) { 1211 err = -ENOMEM; 1212 goto err_alloc; 1213 } 1214 1215 tx_qgrp->complq->dev = &adapter->pdev->dev; 1216 tx_qgrp->complq->desc_count = vport->complq_desc_count; 1217 tx_qgrp->complq->vport = vport; 1218 tx_qgrp->complq->txq_grp = tx_qgrp; 1219 1220 if (flow_sch_en) 1221 __set_bit(__IDPF_Q_FLOW_SCH_EN, tx_qgrp->complq->flags); 1222 } 1223 1224 return 0; 1225 1226 err_alloc: 1227 idpf_txq_group_rel(vport); 1228 1229 return err; 1230 } 1231 1232 /** 1233 * idpf_rxq_group_alloc - Allocate all rxq group resources 1234 * @vport: vport to allocate rxq groups for 1235 * @num_rxq: number of rxqs to allocate for each group 1236 * 1237 * Returns 0 on success, negative on failure 1238 */ 1239 static int idpf_rxq_group_alloc(struct idpf_vport *vport, u16 num_rxq) 1240 { 1241 struct idpf_adapter *adapter = vport->adapter; 1242 struct idpf_queue *q; 1243 int i, k, err = 0; 1244 bool hs; 1245 1246 vport->rxq_grps = kcalloc(vport->num_rxq_grp, 1247 sizeof(struct idpf_rxq_group), GFP_KERNEL); 1248 if (!vport->rxq_grps) 1249 return -ENOMEM; 1250 1251 hs = idpf_vport_get_hsplit(vport) == ETHTOOL_TCP_DATA_SPLIT_ENABLED; 1252 1253 for (i = 0; i < vport->num_rxq_grp; i++) { 1254 struct idpf_rxq_group *rx_qgrp = &vport->rxq_grps[i]; 1255 int j; 1256 1257 rx_qgrp->vport = vport; 1258 if (!idpf_is_queue_model_split(vport->rxq_model)) { 1259 rx_qgrp->singleq.num_rxq = num_rxq; 1260 for (j = 0; j < num_rxq; j++) { 1261 rx_qgrp->singleq.rxqs[j] = 1262 kzalloc(sizeof(*rx_qgrp->singleq.rxqs[j]), 1263 GFP_KERNEL); 1264 if (!rx_qgrp->singleq.rxqs[j]) { 1265 err = -ENOMEM; 1266 goto err_alloc; 1267 } 1268 } 1269 goto skip_splitq_rx_init; 1270 } 1271 rx_qgrp->splitq.num_rxq_sets = num_rxq; 1272 1273 for (j = 0; j < num_rxq; j++) { 1274 rx_qgrp->splitq.rxq_sets[j] = 1275 kzalloc(sizeof(struct idpf_rxq_set), 1276 GFP_KERNEL); 1277 if (!rx_qgrp->splitq.rxq_sets[j]) { 1278 err = -ENOMEM; 1279 goto err_alloc; 1280 } 1281 } 1282 1283 rx_qgrp->splitq.bufq_sets = kcalloc(vport->num_bufqs_per_qgrp, 1284 sizeof(struct idpf_bufq_set), 1285 GFP_KERNEL); 1286 if (!rx_qgrp->splitq.bufq_sets) { 1287 err = -ENOMEM; 1288 goto err_alloc; 1289 } 1290 1291 for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { 1292 struct idpf_bufq_set *bufq_set = 1293 &rx_qgrp->splitq.bufq_sets[j]; 1294 int swq_size = sizeof(struct idpf_sw_queue); 1295 1296 q = &rx_qgrp->splitq.bufq_sets[j].bufq; 1297 q->dev = &adapter->pdev->dev; 1298 q->desc_count = vport->bufq_desc_count[j]; 1299 q->vport = vport; 1300 q->rxq_grp = rx_qgrp; 1301 q->idx = j; 1302 q->rx_buf_size = vport->bufq_size[j]; 1303 q->rx_buffer_low_watermark = IDPF_LOW_WATERMARK; 1304 q->rx_buf_stride = IDPF_RX_BUF_STRIDE; 1305 1306 if (hs) { 1307 q->rx_hsplit_en = true; 1308 q->rx_hbuf_size = IDPF_HDR_BUF_SIZE; 1309 } 1310 1311 bufq_set->num_refillqs = num_rxq; 1312 bufq_set->refillqs = kcalloc(num_rxq, swq_size, 1313 GFP_KERNEL); 1314 if (!bufq_set->refillqs) { 1315 err = -ENOMEM; 1316 goto err_alloc; 1317 } 1318 for (k = 0; k < bufq_set->num_refillqs; k++) { 1319 struct idpf_sw_queue *refillq = 1320 &bufq_set->refillqs[k]; 1321 1322 refillq->dev = &vport->adapter->pdev->dev; 1323 refillq->desc_count = 1324 vport->bufq_desc_count[j]; 1325 set_bit(__IDPF_Q_GEN_CHK, refillq->flags); 1326 set_bit(__IDPF_RFLQ_GEN_CHK, refillq->flags); 1327 refillq->ring = kcalloc(refillq->desc_count, 1328 sizeof(u16), 1329 GFP_KERNEL); 1330 if (!refillq->ring) { 1331 err = -ENOMEM; 1332 goto err_alloc; 1333 } 1334 } 1335 } 1336 1337 skip_splitq_rx_init: 1338 for (j = 0; j < num_rxq; j++) { 1339 if (!idpf_is_queue_model_split(vport->rxq_model)) { 1340 q = rx_qgrp->singleq.rxqs[j]; 1341 goto setup_rxq; 1342 } 1343 q = &rx_qgrp->splitq.rxq_sets[j]->rxq; 1344 rx_qgrp->splitq.rxq_sets[j]->refillq0 = 1345 &rx_qgrp->splitq.bufq_sets[0].refillqs[j]; 1346 if (vport->num_bufqs_per_qgrp > IDPF_SINGLE_BUFQ_PER_RXQ_GRP) 1347 rx_qgrp->splitq.rxq_sets[j]->refillq1 = 1348 &rx_qgrp->splitq.bufq_sets[1].refillqs[j]; 1349 1350 if (hs) { 1351 q->rx_hsplit_en = true; 1352 q->rx_hbuf_size = IDPF_HDR_BUF_SIZE; 1353 } 1354 1355 setup_rxq: 1356 q->dev = &adapter->pdev->dev; 1357 q->desc_count = vport->rxq_desc_count; 1358 q->vport = vport; 1359 q->rxq_grp = rx_qgrp; 1360 q->idx = (i * num_rxq) + j; 1361 /* In splitq mode, RXQ buffer size should be 1362 * set to that of the first buffer queue 1363 * associated with this RXQ 1364 */ 1365 q->rx_buf_size = vport->bufq_size[0]; 1366 q->rx_buffer_low_watermark = IDPF_LOW_WATERMARK; 1367 q->rx_max_pkt_size = vport->netdev->mtu + 1368 IDPF_PACKET_HDR_PAD; 1369 idpf_rxq_set_descids(vport, q); 1370 } 1371 } 1372 1373 err_alloc: 1374 if (err) 1375 idpf_rxq_group_rel(vport); 1376 1377 return err; 1378 } 1379 1380 /** 1381 * idpf_vport_queue_grp_alloc_all - Allocate all queue groups/resources 1382 * @vport: vport with qgrps to allocate 1383 * 1384 * Returns 0 on success, negative on failure 1385 */ 1386 static int idpf_vport_queue_grp_alloc_all(struct idpf_vport *vport) 1387 { 1388 u16 num_txq, num_rxq; 1389 int err; 1390 1391 idpf_vport_calc_numq_per_grp(vport, &num_txq, &num_rxq); 1392 1393 err = idpf_txq_group_alloc(vport, num_txq); 1394 if (err) 1395 goto err_out; 1396 1397 err = idpf_rxq_group_alloc(vport, num_rxq); 1398 if (err) 1399 goto err_out; 1400 1401 return 0; 1402 1403 err_out: 1404 idpf_vport_queue_grp_rel_all(vport); 1405 1406 return err; 1407 } 1408 1409 /** 1410 * idpf_vport_queues_alloc - Allocate memory for all queues 1411 * @vport: virtual port 1412 * 1413 * Allocate memory for queues associated with a vport. Returns 0 on success, 1414 * negative on failure. 1415 */ 1416 int idpf_vport_queues_alloc(struct idpf_vport *vport) 1417 { 1418 int err; 1419 1420 err = idpf_vport_queue_grp_alloc_all(vport); 1421 if (err) 1422 goto err_out; 1423 1424 err = idpf_tx_desc_alloc_all(vport); 1425 if (err) 1426 goto err_out; 1427 1428 err = idpf_rx_desc_alloc_all(vport); 1429 if (err) 1430 goto err_out; 1431 1432 err = idpf_vport_init_fast_path_txqs(vport); 1433 if (err) 1434 goto err_out; 1435 1436 return 0; 1437 1438 err_out: 1439 idpf_vport_queues_rel(vport); 1440 1441 return err; 1442 } 1443 1444 /** 1445 * idpf_tx_handle_sw_marker - Handle queue marker packet 1446 * @tx_q: tx queue to handle software marker 1447 */ 1448 static void idpf_tx_handle_sw_marker(struct idpf_queue *tx_q) 1449 { 1450 struct idpf_vport *vport = tx_q->vport; 1451 int i; 1452 1453 clear_bit(__IDPF_Q_SW_MARKER, tx_q->flags); 1454 /* Hardware must write marker packets to all queues associated with 1455 * completion queues. So check if all queues received marker packets 1456 */ 1457 for (i = 0; i < vport->num_txq; i++) 1458 /* If we're still waiting on any other TXQ marker completions, 1459 * just return now since we cannot wake up the marker_wq yet. 1460 */ 1461 if (test_bit(__IDPF_Q_SW_MARKER, vport->txqs[i]->flags)) 1462 return; 1463 1464 /* Drain complete */ 1465 set_bit(IDPF_VPORT_SW_MARKER, vport->flags); 1466 wake_up(&vport->sw_marker_wq); 1467 } 1468 1469 /** 1470 * idpf_tx_splitq_clean_hdr - Clean TX buffer resources for header portion of 1471 * packet 1472 * @tx_q: tx queue to clean buffer from 1473 * @tx_buf: buffer to be cleaned 1474 * @cleaned: pointer to stats struct to track cleaned packets/bytes 1475 * @napi_budget: Used to determine if we are in netpoll 1476 */ 1477 static void idpf_tx_splitq_clean_hdr(struct idpf_queue *tx_q, 1478 struct idpf_tx_buf *tx_buf, 1479 struct idpf_cleaned_stats *cleaned, 1480 int napi_budget) 1481 { 1482 napi_consume_skb(tx_buf->skb, napi_budget); 1483 1484 if (dma_unmap_len(tx_buf, len)) { 1485 dma_unmap_single(tx_q->dev, 1486 dma_unmap_addr(tx_buf, dma), 1487 dma_unmap_len(tx_buf, len), 1488 DMA_TO_DEVICE); 1489 1490 dma_unmap_len_set(tx_buf, len, 0); 1491 } 1492 1493 /* clear tx_buf data */ 1494 tx_buf->skb = NULL; 1495 1496 cleaned->bytes += tx_buf->bytecount; 1497 cleaned->packets += tx_buf->gso_segs; 1498 } 1499 1500 /** 1501 * idpf_tx_clean_stashed_bufs - clean bufs that were stored for 1502 * out of order completions 1503 * @txq: queue to clean 1504 * @compl_tag: completion tag of packet to clean (from completion descriptor) 1505 * @cleaned: pointer to stats struct to track cleaned packets/bytes 1506 * @budget: Used to determine if we are in netpoll 1507 */ 1508 static void idpf_tx_clean_stashed_bufs(struct idpf_queue *txq, u16 compl_tag, 1509 struct idpf_cleaned_stats *cleaned, 1510 int budget) 1511 { 1512 struct idpf_tx_stash *stash; 1513 struct hlist_node *tmp_buf; 1514 1515 /* Buffer completion */ 1516 hash_for_each_possible_safe(txq->sched_buf_hash, stash, tmp_buf, 1517 hlist, compl_tag) { 1518 if (unlikely(stash->buf.compl_tag != (int)compl_tag)) 1519 continue; 1520 1521 if (stash->buf.skb) { 1522 idpf_tx_splitq_clean_hdr(txq, &stash->buf, cleaned, 1523 budget); 1524 } else if (dma_unmap_len(&stash->buf, len)) { 1525 dma_unmap_page(txq->dev, 1526 dma_unmap_addr(&stash->buf, dma), 1527 dma_unmap_len(&stash->buf, len), 1528 DMA_TO_DEVICE); 1529 dma_unmap_len_set(&stash->buf, len, 0); 1530 } 1531 1532 /* Push shadow buf back onto stack */ 1533 idpf_buf_lifo_push(&txq->buf_stack, stash); 1534 1535 hash_del(&stash->hlist); 1536 } 1537 } 1538 1539 /** 1540 * idpf_stash_flow_sch_buffers - store buffer parameters info to be freed at a 1541 * later time (only relevant for flow scheduling mode) 1542 * @txq: Tx queue to clean 1543 * @tx_buf: buffer to store 1544 */ 1545 static int idpf_stash_flow_sch_buffers(struct idpf_queue *txq, 1546 struct idpf_tx_buf *tx_buf) 1547 { 1548 struct idpf_tx_stash *stash; 1549 1550 if (unlikely(!dma_unmap_addr(tx_buf, dma) && 1551 !dma_unmap_len(tx_buf, len))) 1552 return 0; 1553 1554 stash = idpf_buf_lifo_pop(&txq->buf_stack); 1555 if (unlikely(!stash)) { 1556 net_err_ratelimited("%s: No out-of-order TX buffers left!\n", 1557 txq->vport->netdev->name); 1558 1559 return -ENOMEM; 1560 } 1561 1562 /* Store buffer params in shadow buffer */ 1563 stash->buf.skb = tx_buf->skb; 1564 stash->buf.bytecount = tx_buf->bytecount; 1565 stash->buf.gso_segs = tx_buf->gso_segs; 1566 dma_unmap_addr_set(&stash->buf, dma, dma_unmap_addr(tx_buf, dma)); 1567 dma_unmap_len_set(&stash->buf, len, dma_unmap_len(tx_buf, len)); 1568 stash->buf.compl_tag = tx_buf->compl_tag; 1569 1570 /* Add buffer to buf_hash table to be freed later */ 1571 hash_add(txq->sched_buf_hash, &stash->hlist, stash->buf.compl_tag); 1572 1573 memset(tx_buf, 0, sizeof(struct idpf_tx_buf)); 1574 1575 /* Reinitialize buf_id portion of tag */ 1576 tx_buf->compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; 1577 1578 return 0; 1579 } 1580 1581 #define idpf_tx_splitq_clean_bump_ntc(txq, ntc, desc, buf) \ 1582 do { \ 1583 (ntc)++; \ 1584 if (unlikely(!(ntc))) { \ 1585 ntc -= (txq)->desc_count; \ 1586 buf = (txq)->tx_buf; \ 1587 desc = IDPF_FLEX_TX_DESC(txq, 0); \ 1588 } else { \ 1589 (buf)++; \ 1590 (desc)++; \ 1591 } \ 1592 } while (0) 1593 1594 /** 1595 * idpf_tx_splitq_clean - Reclaim resources from buffer queue 1596 * @tx_q: Tx queue to clean 1597 * @end: queue index until which it should be cleaned 1598 * @napi_budget: Used to determine if we are in netpoll 1599 * @cleaned: pointer to stats struct to track cleaned packets/bytes 1600 * @descs_only: true if queue is using flow-based scheduling and should 1601 * not clean buffers at this time 1602 * 1603 * Cleans the queue descriptor ring. If the queue is using queue-based 1604 * scheduling, the buffers will be cleaned as well. If the queue is using 1605 * flow-based scheduling, only the descriptors are cleaned at this time. 1606 * Separate packet completion events will be reported on the completion queue, 1607 * and the buffers will be cleaned separately. The stats are not updated from 1608 * this function when using flow-based scheduling. 1609 */ 1610 static void idpf_tx_splitq_clean(struct idpf_queue *tx_q, u16 end, 1611 int napi_budget, 1612 struct idpf_cleaned_stats *cleaned, 1613 bool descs_only) 1614 { 1615 union idpf_tx_flex_desc *next_pending_desc = NULL; 1616 union idpf_tx_flex_desc *tx_desc; 1617 s16 ntc = tx_q->next_to_clean; 1618 struct idpf_tx_buf *tx_buf; 1619 1620 tx_desc = IDPF_FLEX_TX_DESC(tx_q, ntc); 1621 next_pending_desc = IDPF_FLEX_TX_DESC(tx_q, end); 1622 tx_buf = &tx_q->tx_buf[ntc]; 1623 ntc -= tx_q->desc_count; 1624 1625 while (tx_desc != next_pending_desc) { 1626 union idpf_tx_flex_desc *eop_desc; 1627 1628 /* If this entry in the ring was used as a context descriptor, 1629 * it's corresponding entry in the buffer ring will have an 1630 * invalid completion tag since no buffer was used. We can 1631 * skip this descriptor since there is no buffer to clean. 1632 */ 1633 if (unlikely(tx_buf->compl_tag == IDPF_SPLITQ_TX_INVAL_COMPL_TAG)) 1634 goto fetch_next_txq_desc; 1635 1636 eop_desc = (union idpf_tx_flex_desc *)tx_buf->next_to_watch; 1637 1638 /* clear next_to_watch to prevent false hangs */ 1639 tx_buf->next_to_watch = NULL; 1640 1641 if (descs_only) { 1642 if (idpf_stash_flow_sch_buffers(tx_q, tx_buf)) 1643 goto tx_splitq_clean_out; 1644 1645 while (tx_desc != eop_desc) { 1646 idpf_tx_splitq_clean_bump_ntc(tx_q, ntc, 1647 tx_desc, tx_buf); 1648 1649 if (dma_unmap_len(tx_buf, len)) { 1650 if (idpf_stash_flow_sch_buffers(tx_q, 1651 tx_buf)) 1652 goto tx_splitq_clean_out; 1653 } 1654 } 1655 } else { 1656 idpf_tx_splitq_clean_hdr(tx_q, tx_buf, cleaned, 1657 napi_budget); 1658 1659 /* unmap remaining buffers */ 1660 while (tx_desc != eop_desc) { 1661 idpf_tx_splitq_clean_bump_ntc(tx_q, ntc, 1662 tx_desc, tx_buf); 1663 1664 /* unmap any remaining paged data */ 1665 if (dma_unmap_len(tx_buf, len)) { 1666 dma_unmap_page(tx_q->dev, 1667 dma_unmap_addr(tx_buf, dma), 1668 dma_unmap_len(tx_buf, len), 1669 DMA_TO_DEVICE); 1670 dma_unmap_len_set(tx_buf, len, 0); 1671 } 1672 } 1673 } 1674 1675 fetch_next_txq_desc: 1676 idpf_tx_splitq_clean_bump_ntc(tx_q, ntc, tx_desc, tx_buf); 1677 } 1678 1679 tx_splitq_clean_out: 1680 ntc += tx_q->desc_count; 1681 tx_q->next_to_clean = ntc; 1682 } 1683 1684 #define idpf_tx_clean_buf_ring_bump_ntc(txq, ntc, buf) \ 1685 do { \ 1686 (buf)++; \ 1687 (ntc)++; \ 1688 if (unlikely((ntc) == (txq)->desc_count)) { \ 1689 buf = (txq)->tx_buf; \ 1690 ntc = 0; \ 1691 } \ 1692 } while (0) 1693 1694 /** 1695 * idpf_tx_clean_buf_ring - clean flow scheduling TX queue buffers 1696 * @txq: queue to clean 1697 * @compl_tag: completion tag of packet to clean (from completion descriptor) 1698 * @cleaned: pointer to stats struct to track cleaned packets/bytes 1699 * @budget: Used to determine if we are in netpoll 1700 * 1701 * Cleans all buffers associated with the input completion tag either from the 1702 * TX buffer ring or from the hash table if the buffers were previously 1703 * stashed. Returns the byte/segment count for the cleaned packet associated 1704 * this completion tag. 1705 */ 1706 static bool idpf_tx_clean_buf_ring(struct idpf_queue *txq, u16 compl_tag, 1707 struct idpf_cleaned_stats *cleaned, 1708 int budget) 1709 { 1710 u16 idx = compl_tag & txq->compl_tag_bufid_m; 1711 struct idpf_tx_buf *tx_buf = NULL; 1712 u16 ntc = txq->next_to_clean; 1713 u16 num_descs_cleaned = 0; 1714 u16 orig_idx = idx; 1715 1716 tx_buf = &txq->tx_buf[idx]; 1717 1718 while (tx_buf->compl_tag == (int)compl_tag) { 1719 if (tx_buf->skb) { 1720 idpf_tx_splitq_clean_hdr(txq, tx_buf, cleaned, budget); 1721 } else if (dma_unmap_len(tx_buf, len)) { 1722 dma_unmap_page(txq->dev, 1723 dma_unmap_addr(tx_buf, dma), 1724 dma_unmap_len(tx_buf, len), 1725 DMA_TO_DEVICE); 1726 dma_unmap_len_set(tx_buf, len, 0); 1727 } 1728 1729 memset(tx_buf, 0, sizeof(struct idpf_tx_buf)); 1730 tx_buf->compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; 1731 1732 num_descs_cleaned++; 1733 idpf_tx_clean_buf_ring_bump_ntc(txq, idx, tx_buf); 1734 } 1735 1736 /* If we didn't clean anything on the ring for this completion, there's 1737 * nothing more to do. 1738 */ 1739 if (unlikely(!num_descs_cleaned)) 1740 return false; 1741 1742 /* Otherwise, if we did clean a packet on the ring directly, it's safe 1743 * to assume that the descriptors starting from the original 1744 * next_to_clean up until the previously cleaned packet can be reused. 1745 * Therefore, we will go back in the ring and stash any buffers still 1746 * in the ring into the hash table to be cleaned later. 1747 */ 1748 tx_buf = &txq->tx_buf[ntc]; 1749 while (tx_buf != &txq->tx_buf[orig_idx]) { 1750 idpf_stash_flow_sch_buffers(txq, tx_buf); 1751 idpf_tx_clean_buf_ring_bump_ntc(txq, ntc, tx_buf); 1752 } 1753 1754 /* Finally, update next_to_clean to reflect the work that was just done 1755 * on the ring, if any. If the packet was only cleaned from the hash 1756 * table, the ring will not be impacted, therefore we should not touch 1757 * next_to_clean. The updated idx is used here 1758 */ 1759 txq->next_to_clean = idx; 1760 1761 return true; 1762 } 1763 1764 /** 1765 * idpf_tx_handle_rs_completion - clean a single packet and all of its buffers 1766 * whether on the buffer ring or in the hash table 1767 * @txq: Tx ring to clean 1768 * @desc: pointer to completion queue descriptor to extract completion 1769 * information from 1770 * @cleaned: pointer to stats struct to track cleaned packets/bytes 1771 * @budget: Used to determine if we are in netpoll 1772 * 1773 * Returns bytes/packets cleaned 1774 */ 1775 static void idpf_tx_handle_rs_completion(struct idpf_queue *txq, 1776 struct idpf_splitq_tx_compl_desc *desc, 1777 struct idpf_cleaned_stats *cleaned, 1778 int budget) 1779 { 1780 u16 compl_tag; 1781 1782 if (!test_bit(__IDPF_Q_FLOW_SCH_EN, txq->flags)) { 1783 u16 head = le16_to_cpu(desc->q_head_compl_tag.q_head); 1784 1785 return idpf_tx_splitq_clean(txq, head, budget, cleaned, false); 1786 } 1787 1788 compl_tag = le16_to_cpu(desc->q_head_compl_tag.compl_tag); 1789 1790 /* If we didn't clean anything on the ring, this packet must be 1791 * in the hash table. Go clean it there. 1792 */ 1793 if (!idpf_tx_clean_buf_ring(txq, compl_tag, cleaned, budget)) 1794 idpf_tx_clean_stashed_bufs(txq, compl_tag, cleaned, budget); 1795 } 1796 1797 /** 1798 * idpf_tx_clean_complq - Reclaim resources on completion queue 1799 * @complq: Tx ring to clean 1800 * @budget: Used to determine if we are in netpoll 1801 * @cleaned: returns number of packets cleaned 1802 * 1803 * Returns true if there's any budget left (e.g. the clean is finished) 1804 */ 1805 static bool idpf_tx_clean_complq(struct idpf_queue *complq, int budget, 1806 int *cleaned) 1807 { 1808 struct idpf_splitq_tx_compl_desc *tx_desc; 1809 struct idpf_vport *vport = complq->vport; 1810 s16 ntc = complq->next_to_clean; 1811 struct idpf_netdev_priv *np; 1812 unsigned int complq_budget; 1813 bool complq_ok = true; 1814 int i; 1815 1816 complq_budget = vport->compln_clean_budget; 1817 tx_desc = IDPF_SPLITQ_TX_COMPLQ_DESC(complq, ntc); 1818 ntc -= complq->desc_count; 1819 1820 do { 1821 struct idpf_cleaned_stats cleaned_stats = { }; 1822 struct idpf_queue *tx_q; 1823 int rel_tx_qid; 1824 u16 hw_head; 1825 u8 ctype; /* completion type */ 1826 u16 gen; 1827 1828 /* if the descriptor isn't done, no work yet to do */ 1829 gen = le16_get_bits(tx_desc->qid_comptype_gen, 1830 IDPF_TXD_COMPLQ_GEN_M); 1831 if (test_bit(__IDPF_Q_GEN_CHK, complq->flags) != gen) 1832 break; 1833 1834 /* Find necessary info of TX queue to clean buffers */ 1835 rel_tx_qid = le16_get_bits(tx_desc->qid_comptype_gen, 1836 IDPF_TXD_COMPLQ_QID_M); 1837 if (rel_tx_qid >= complq->txq_grp->num_txq || 1838 !complq->txq_grp->txqs[rel_tx_qid]) { 1839 dev_err(&complq->vport->adapter->pdev->dev, 1840 "TxQ not found\n"); 1841 goto fetch_next_desc; 1842 } 1843 tx_q = complq->txq_grp->txqs[rel_tx_qid]; 1844 1845 /* Determine completion type */ 1846 ctype = le16_get_bits(tx_desc->qid_comptype_gen, 1847 IDPF_TXD_COMPLQ_COMPL_TYPE_M); 1848 switch (ctype) { 1849 case IDPF_TXD_COMPLT_RE: 1850 hw_head = le16_to_cpu(tx_desc->q_head_compl_tag.q_head); 1851 1852 idpf_tx_splitq_clean(tx_q, hw_head, budget, 1853 &cleaned_stats, true); 1854 break; 1855 case IDPF_TXD_COMPLT_RS: 1856 idpf_tx_handle_rs_completion(tx_q, tx_desc, 1857 &cleaned_stats, budget); 1858 break; 1859 case IDPF_TXD_COMPLT_SW_MARKER: 1860 idpf_tx_handle_sw_marker(tx_q); 1861 break; 1862 default: 1863 dev_err(&tx_q->vport->adapter->pdev->dev, 1864 "Unknown TX completion type: %d\n", 1865 ctype); 1866 goto fetch_next_desc; 1867 } 1868 1869 u64_stats_update_begin(&tx_q->stats_sync); 1870 u64_stats_add(&tx_q->q_stats.tx.packets, cleaned_stats.packets); 1871 u64_stats_add(&tx_q->q_stats.tx.bytes, cleaned_stats.bytes); 1872 tx_q->cleaned_pkts += cleaned_stats.packets; 1873 tx_q->cleaned_bytes += cleaned_stats.bytes; 1874 complq->num_completions++; 1875 u64_stats_update_end(&tx_q->stats_sync); 1876 1877 fetch_next_desc: 1878 tx_desc++; 1879 ntc++; 1880 if (unlikely(!ntc)) { 1881 ntc -= complq->desc_count; 1882 tx_desc = IDPF_SPLITQ_TX_COMPLQ_DESC(complq, 0); 1883 change_bit(__IDPF_Q_GEN_CHK, complq->flags); 1884 } 1885 1886 prefetch(tx_desc); 1887 1888 /* update budget accounting */ 1889 complq_budget--; 1890 } while (likely(complq_budget)); 1891 1892 /* Store the state of the complq to be used later in deciding if a 1893 * TXQ can be started again 1894 */ 1895 if (unlikely(IDPF_TX_COMPLQ_PENDING(complq->txq_grp) > 1896 IDPF_TX_COMPLQ_OVERFLOW_THRESH(complq))) 1897 complq_ok = false; 1898 1899 np = netdev_priv(complq->vport->netdev); 1900 for (i = 0; i < complq->txq_grp->num_txq; ++i) { 1901 struct idpf_queue *tx_q = complq->txq_grp->txqs[i]; 1902 struct netdev_queue *nq; 1903 bool dont_wake; 1904 1905 /* We didn't clean anything on this queue, move along */ 1906 if (!tx_q->cleaned_bytes) 1907 continue; 1908 1909 *cleaned += tx_q->cleaned_pkts; 1910 1911 /* Update BQL */ 1912 nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); 1913 1914 dont_wake = !complq_ok || IDPF_TX_BUF_RSV_LOW(tx_q) || 1915 np->state != __IDPF_VPORT_UP || 1916 !netif_carrier_ok(tx_q->vport->netdev); 1917 /* Check if the TXQ needs to and can be restarted */ 1918 __netif_txq_completed_wake(nq, tx_q->cleaned_pkts, tx_q->cleaned_bytes, 1919 IDPF_DESC_UNUSED(tx_q), IDPF_TX_WAKE_THRESH, 1920 dont_wake); 1921 1922 /* Reset cleaned stats for the next time this queue is 1923 * cleaned 1924 */ 1925 tx_q->cleaned_bytes = 0; 1926 tx_q->cleaned_pkts = 0; 1927 } 1928 1929 ntc += complq->desc_count; 1930 complq->next_to_clean = ntc; 1931 1932 return !!complq_budget; 1933 } 1934 1935 /** 1936 * idpf_tx_splitq_build_ctb - populate command tag and size for queue 1937 * based scheduling descriptors 1938 * @desc: descriptor to populate 1939 * @params: pointer to tx params struct 1940 * @td_cmd: command to be filled in desc 1941 * @size: size of buffer 1942 */ 1943 void idpf_tx_splitq_build_ctb(union idpf_tx_flex_desc *desc, 1944 struct idpf_tx_splitq_params *params, 1945 u16 td_cmd, u16 size) 1946 { 1947 desc->q.qw1.cmd_dtype = 1948 le16_encode_bits(params->dtype, IDPF_FLEX_TXD_QW1_DTYPE_M); 1949 desc->q.qw1.cmd_dtype |= 1950 le16_encode_bits(td_cmd, IDPF_FLEX_TXD_QW1_CMD_M); 1951 desc->q.qw1.buf_size = cpu_to_le16(size); 1952 desc->q.qw1.l2tags.l2tag1 = cpu_to_le16(params->td_tag); 1953 } 1954 1955 /** 1956 * idpf_tx_splitq_build_flow_desc - populate command tag and size for flow 1957 * scheduling descriptors 1958 * @desc: descriptor to populate 1959 * @params: pointer to tx params struct 1960 * @td_cmd: command to be filled in desc 1961 * @size: size of buffer 1962 */ 1963 void idpf_tx_splitq_build_flow_desc(union idpf_tx_flex_desc *desc, 1964 struct idpf_tx_splitq_params *params, 1965 u16 td_cmd, u16 size) 1966 { 1967 desc->flow.qw1.cmd_dtype = (u16)params->dtype | td_cmd; 1968 desc->flow.qw1.rxr_bufsize = cpu_to_le16((u16)size); 1969 desc->flow.qw1.compl_tag = cpu_to_le16(params->compl_tag); 1970 } 1971 1972 /** 1973 * idpf_tx_maybe_stop_common - 1st level check for common Tx stop conditions 1974 * @tx_q: the queue to be checked 1975 * @size: number of descriptors we want to assure is available 1976 * 1977 * Returns 0 if stop is not needed 1978 */ 1979 int idpf_tx_maybe_stop_common(struct idpf_queue *tx_q, unsigned int size) 1980 { 1981 struct netdev_queue *nq; 1982 1983 if (likely(IDPF_DESC_UNUSED(tx_q) >= size)) 1984 return 0; 1985 1986 u64_stats_update_begin(&tx_q->stats_sync); 1987 u64_stats_inc(&tx_q->q_stats.tx.q_busy); 1988 u64_stats_update_end(&tx_q->stats_sync); 1989 1990 nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); 1991 1992 return netif_txq_maybe_stop(nq, IDPF_DESC_UNUSED(tx_q), size, size); 1993 } 1994 1995 /** 1996 * idpf_tx_maybe_stop_splitq - 1st level check for Tx splitq stop conditions 1997 * @tx_q: the queue to be checked 1998 * @descs_needed: number of descriptors required for this packet 1999 * 2000 * Returns 0 if stop is not needed 2001 */ 2002 static int idpf_tx_maybe_stop_splitq(struct idpf_queue *tx_q, 2003 unsigned int descs_needed) 2004 { 2005 if (idpf_tx_maybe_stop_common(tx_q, descs_needed)) 2006 goto splitq_stop; 2007 2008 /* If there are too many outstanding completions expected on the 2009 * completion queue, stop the TX queue to give the device some time to 2010 * catch up 2011 */ 2012 if (unlikely(IDPF_TX_COMPLQ_PENDING(tx_q->txq_grp) > 2013 IDPF_TX_COMPLQ_OVERFLOW_THRESH(tx_q->txq_grp->complq))) 2014 goto splitq_stop; 2015 2016 /* Also check for available book keeping buffers; if we are low, stop 2017 * the queue to wait for more completions 2018 */ 2019 if (unlikely(IDPF_TX_BUF_RSV_LOW(tx_q))) 2020 goto splitq_stop; 2021 2022 return 0; 2023 2024 splitq_stop: 2025 u64_stats_update_begin(&tx_q->stats_sync); 2026 u64_stats_inc(&tx_q->q_stats.tx.q_busy); 2027 u64_stats_update_end(&tx_q->stats_sync); 2028 netif_stop_subqueue(tx_q->vport->netdev, tx_q->idx); 2029 2030 return -EBUSY; 2031 } 2032 2033 /** 2034 * idpf_tx_buf_hw_update - Store the new tail value 2035 * @tx_q: queue to bump 2036 * @val: new tail index 2037 * @xmit_more: more skb's pending 2038 * 2039 * The naming here is special in that 'hw' signals that this function is about 2040 * to do a register write to update our queue status. We know this can only 2041 * mean tail here as HW should be owning head for TX. 2042 */ 2043 void idpf_tx_buf_hw_update(struct idpf_queue *tx_q, u32 val, 2044 bool xmit_more) 2045 { 2046 struct netdev_queue *nq; 2047 2048 nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); 2049 tx_q->next_to_use = val; 2050 2051 idpf_tx_maybe_stop_common(tx_q, IDPF_TX_DESC_NEEDED); 2052 2053 /* Force memory writes to complete before letting h/w 2054 * know there are new descriptors to fetch. (Only 2055 * applicable for weak-ordered memory model archs, 2056 * such as IA-64). 2057 */ 2058 wmb(); 2059 2060 /* notify HW of packet */ 2061 if (netif_xmit_stopped(nq) || !xmit_more) 2062 writel(val, tx_q->tail); 2063 } 2064 2065 /** 2066 * idpf_tx_desc_count_required - calculate number of Tx descriptors needed 2067 * @txq: queue to send buffer on 2068 * @skb: send buffer 2069 * 2070 * Returns number of data descriptors needed for this skb. 2071 */ 2072 unsigned int idpf_tx_desc_count_required(struct idpf_queue *txq, 2073 struct sk_buff *skb) 2074 { 2075 const struct skb_shared_info *shinfo; 2076 unsigned int count = 0, i; 2077 2078 count += !!skb_headlen(skb); 2079 2080 if (!skb_is_nonlinear(skb)) 2081 return count; 2082 2083 shinfo = skb_shinfo(skb); 2084 for (i = 0; i < shinfo->nr_frags; i++) { 2085 unsigned int size; 2086 2087 size = skb_frag_size(&shinfo->frags[i]); 2088 2089 /* We only need to use the idpf_size_to_txd_count check if the 2090 * fragment is going to span multiple descriptors, 2091 * i.e. size >= 16K. 2092 */ 2093 if (size >= SZ_16K) 2094 count += idpf_size_to_txd_count(size); 2095 else 2096 count++; 2097 } 2098 2099 if (idpf_chk_linearize(skb, txq->tx_max_bufs, count)) { 2100 if (__skb_linearize(skb)) 2101 return 0; 2102 2103 count = idpf_size_to_txd_count(skb->len); 2104 u64_stats_update_begin(&txq->stats_sync); 2105 u64_stats_inc(&txq->q_stats.tx.linearize); 2106 u64_stats_update_end(&txq->stats_sync); 2107 } 2108 2109 return count; 2110 } 2111 2112 /** 2113 * idpf_tx_dma_map_error - handle TX DMA map errors 2114 * @txq: queue to send buffer on 2115 * @skb: send buffer 2116 * @first: original first buffer info buffer for packet 2117 * @idx: starting point on ring to unwind 2118 */ 2119 void idpf_tx_dma_map_error(struct idpf_queue *txq, struct sk_buff *skb, 2120 struct idpf_tx_buf *first, u16 idx) 2121 { 2122 u64_stats_update_begin(&txq->stats_sync); 2123 u64_stats_inc(&txq->q_stats.tx.dma_map_errs); 2124 u64_stats_update_end(&txq->stats_sync); 2125 2126 /* clear dma mappings for failed tx_buf map */ 2127 for (;;) { 2128 struct idpf_tx_buf *tx_buf; 2129 2130 tx_buf = &txq->tx_buf[idx]; 2131 idpf_tx_buf_rel(txq, tx_buf); 2132 if (tx_buf == first) 2133 break; 2134 if (idx == 0) 2135 idx = txq->desc_count; 2136 idx--; 2137 } 2138 2139 if (skb_is_gso(skb)) { 2140 union idpf_tx_flex_desc *tx_desc; 2141 2142 /* If we failed a DMA mapping for a TSO packet, we will have 2143 * used one additional descriptor for a context 2144 * descriptor. Reset that here. 2145 */ 2146 tx_desc = IDPF_FLEX_TX_DESC(txq, idx); 2147 memset(tx_desc, 0, sizeof(struct idpf_flex_tx_ctx_desc)); 2148 if (idx == 0) 2149 idx = txq->desc_count; 2150 idx--; 2151 } 2152 2153 /* Update tail in case netdev_xmit_more was previously true */ 2154 idpf_tx_buf_hw_update(txq, idx, false); 2155 } 2156 2157 /** 2158 * idpf_tx_splitq_bump_ntu - adjust NTU and generation 2159 * @txq: the tx ring to wrap 2160 * @ntu: ring index to bump 2161 */ 2162 static unsigned int idpf_tx_splitq_bump_ntu(struct idpf_queue *txq, u16 ntu) 2163 { 2164 ntu++; 2165 2166 if (ntu == txq->desc_count) { 2167 ntu = 0; 2168 txq->compl_tag_cur_gen = IDPF_TX_ADJ_COMPL_TAG_GEN(txq); 2169 } 2170 2171 return ntu; 2172 } 2173 2174 /** 2175 * idpf_tx_splitq_map - Build the Tx flex descriptor 2176 * @tx_q: queue to send buffer on 2177 * @params: pointer to splitq params struct 2178 * @first: first buffer info buffer to use 2179 * 2180 * This function loops over the skb data pointed to by *first 2181 * and gets a physical address for each memory location and programs 2182 * it and the length into the transmit flex descriptor. 2183 */ 2184 static void idpf_tx_splitq_map(struct idpf_queue *tx_q, 2185 struct idpf_tx_splitq_params *params, 2186 struct idpf_tx_buf *first) 2187 { 2188 union idpf_tx_flex_desc *tx_desc; 2189 unsigned int data_len, size; 2190 struct idpf_tx_buf *tx_buf; 2191 u16 i = tx_q->next_to_use; 2192 struct netdev_queue *nq; 2193 struct sk_buff *skb; 2194 skb_frag_t *frag; 2195 u16 td_cmd = 0; 2196 dma_addr_t dma; 2197 2198 skb = first->skb; 2199 2200 td_cmd = params->offload.td_cmd; 2201 2202 data_len = skb->data_len; 2203 size = skb_headlen(skb); 2204 2205 tx_desc = IDPF_FLEX_TX_DESC(tx_q, i); 2206 2207 dma = dma_map_single(tx_q->dev, skb->data, size, DMA_TO_DEVICE); 2208 2209 tx_buf = first; 2210 2211 params->compl_tag = 2212 (tx_q->compl_tag_cur_gen << tx_q->compl_tag_gen_s) | i; 2213 2214 for (frag = &skb_shinfo(skb)->frags[0];; frag++) { 2215 unsigned int max_data = IDPF_TX_MAX_DESC_DATA_ALIGNED; 2216 2217 if (dma_mapping_error(tx_q->dev, dma)) 2218 return idpf_tx_dma_map_error(tx_q, skb, first, i); 2219 2220 tx_buf->compl_tag = params->compl_tag; 2221 2222 /* record length, and DMA address */ 2223 dma_unmap_len_set(tx_buf, len, size); 2224 dma_unmap_addr_set(tx_buf, dma, dma); 2225 2226 /* buf_addr is in same location for both desc types */ 2227 tx_desc->q.buf_addr = cpu_to_le64(dma); 2228 2229 /* The stack can send us fragments that are too large for a 2230 * single descriptor i.e. frag size > 16K-1. We will need to 2231 * split the fragment across multiple descriptors in this case. 2232 * To adhere to HW alignment restrictions, the fragment needs 2233 * to be split such that the first chunk ends on a 4K boundary 2234 * and all subsequent chunks start on a 4K boundary. We still 2235 * want to send as much data as possible though, so our 2236 * intermediate descriptor chunk size will be 12K. 2237 * 2238 * For example, consider a 32K fragment mapped to DMA addr 2600. 2239 * ------------------------------------------------------------ 2240 * | frag_size = 32K | 2241 * ------------------------------------------------------------ 2242 * |2600 |16384 |28672 2243 * 2244 * 3 descriptors will be used for this fragment. The HW expects 2245 * the descriptors to contain the following: 2246 * ------------------------------------------------------------ 2247 * | size = 13784 | size = 12K | size = 6696 | 2248 * | dma = 2600 | dma = 16384 | dma = 28672 | 2249 * ------------------------------------------------------------ 2250 * 2251 * We need to first adjust the max_data for the first chunk so 2252 * that it ends on a 4K boundary. By negating the value of the 2253 * DMA address and taking only the low order bits, we're 2254 * effectively calculating 2255 * 4K - (DMA addr lower order bits) = 2256 * bytes to next boundary. 2257 * 2258 * Add that to our base aligned max_data (12K) and we have 2259 * our first chunk size. In the example above, 2260 * 13784 = 12K + (4096-2600) 2261 * 2262 * After guaranteeing the first chunk ends on a 4K boundary, we 2263 * will give the intermediate descriptors 12K chunks and 2264 * whatever is left to the final descriptor. This ensures that 2265 * all descriptors used for the remaining chunks of the 2266 * fragment start on a 4K boundary and we use as few 2267 * descriptors as possible. 2268 */ 2269 max_data += -dma & (IDPF_TX_MAX_READ_REQ_SIZE - 1); 2270 while (unlikely(size > IDPF_TX_MAX_DESC_DATA)) { 2271 idpf_tx_splitq_build_desc(tx_desc, params, td_cmd, 2272 max_data); 2273 2274 tx_desc++; 2275 i++; 2276 2277 if (i == tx_q->desc_count) { 2278 tx_desc = IDPF_FLEX_TX_DESC(tx_q, 0); 2279 i = 0; 2280 tx_q->compl_tag_cur_gen = 2281 IDPF_TX_ADJ_COMPL_TAG_GEN(tx_q); 2282 } 2283 2284 /* Since this packet has a buffer that is going to span 2285 * multiple descriptors, it's going to leave holes in 2286 * to the TX buffer ring. To ensure these holes do not 2287 * cause issues in the cleaning routines, we will clear 2288 * them of any stale data and assign them the same 2289 * completion tag as the current packet. Then when the 2290 * packet is being cleaned, the cleaning routines will 2291 * simply pass over these holes and finish cleaning the 2292 * rest of the packet. 2293 */ 2294 memset(&tx_q->tx_buf[i], 0, sizeof(struct idpf_tx_buf)); 2295 tx_q->tx_buf[i].compl_tag = params->compl_tag; 2296 2297 /* Adjust the DMA offset and the remaining size of the 2298 * fragment. On the first iteration of this loop, 2299 * max_data will be >= 12K and <= 16K-1. On any 2300 * subsequent iteration of this loop, max_data will 2301 * always be 12K. 2302 */ 2303 dma += max_data; 2304 size -= max_data; 2305 2306 /* Reset max_data since remaining chunks will be 12K 2307 * at most 2308 */ 2309 max_data = IDPF_TX_MAX_DESC_DATA_ALIGNED; 2310 2311 /* buf_addr is in same location for both desc types */ 2312 tx_desc->q.buf_addr = cpu_to_le64(dma); 2313 } 2314 2315 if (!data_len) 2316 break; 2317 2318 idpf_tx_splitq_build_desc(tx_desc, params, td_cmd, size); 2319 tx_desc++; 2320 i++; 2321 2322 if (i == tx_q->desc_count) { 2323 tx_desc = IDPF_FLEX_TX_DESC(tx_q, 0); 2324 i = 0; 2325 tx_q->compl_tag_cur_gen = IDPF_TX_ADJ_COMPL_TAG_GEN(tx_q); 2326 } 2327 2328 size = skb_frag_size(frag); 2329 data_len -= size; 2330 2331 dma = skb_frag_dma_map(tx_q->dev, frag, 0, size, 2332 DMA_TO_DEVICE); 2333 2334 tx_buf = &tx_q->tx_buf[i]; 2335 } 2336 2337 /* record SW timestamp if HW timestamp is not available */ 2338 skb_tx_timestamp(skb); 2339 2340 /* write last descriptor with RS and EOP bits */ 2341 td_cmd |= params->eop_cmd; 2342 idpf_tx_splitq_build_desc(tx_desc, params, td_cmd, size); 2343 i = idpf_tx_splitq_bump_ntu(tx_q, i); 2344 2345 /* set next_to_watch value indicating a packet is present */ 2346 first->next_to_watch = tx_desc; 2347 2348 tx_q->txq_grp->num_completions_pending++; 2349 2350 /* record bytecount for BQL */ 2351 nq = netdev_get_tx_queue(tx_q->vport->netdev, tx_q->idx); 2352 netdev_tx_sent_queue(nq, first->bytecount); 2353 2354 idpf_tx_buf_hw_update(tx_q, i, netdev_xmit_more()); 2355 } 2356 2357 /** 2358 * idpf_tso - computes mss and TSO length to prepare for TSO 2359 * @skb: pointer to skb 2360 * @off: pointer to struct that holds offload parameters 2361 * 2362 * Returns error (negative) if TSO was requested but cannot be applied to the 2363 * given skb, 0 if TSO does not apply to the given skb, or 1 otherwise. 2364 */ 2365 int idpf_tso(struct sk_buff *skb, struct idpf_tx_offload_params *off) 2366 { 2367 const struct skb_shared_info *shinfo; 2368 union { 2369 struct iphdr *v4; 2370 struct ipv6hdr *v6; 2371 unsigned char *hdr; 2372 } ip; 2373 union { 2374 struct tcphdr *tcp; 2375 struct udphdr *udp; 2376 unsigned char *hdr; 2377 } l4; 2378 u32 paylen, l4_start; 2379 int err; 2380 2381 if (!skb_is_gso(skb)) 2382 return 0; 2383 2384 err = skb_cow_head(skb, 0); 2385 if (err < 0) 2386 return err; 2387 2388 shinfo = skb_shinfo(skb); 2389 2390 ip.hdr = skb_network_header(skb); 2391 l4.hdr = skb_transport_header(skb); 2392 2393 /* initialize outer IP header fields */ 2394 if (ip.v4->version == 4) { 2395 ip.v4->tot_len = 0; 2396 ip.v4->check = 0; 2397 } else if (ip.v6->version == 6) { 2398 ip.v6->payload_len = 0; 2399 } 2400 2401 l4_start = skb_transport_offset(skb); 2402 2403 /* remove payload length from checksum */ 2404 paylen = skb->len - l4_start; 2405 2406 switch (shinfo->gso_type & ~SKB_GSO_DODGY) { 2407 case SKB_GSO_TCPV4: 2408 case SKB_GSO_TCPV6: 2409 csum_replace_by_diff(&l4.tcp->check, 2410 (__force __wsum)htonl(paylen)); 2411 off->tso_hdr_len = __tcp_hdrlen(l4.tcp) + l4_start; 2412 break; 2413 case SKB_GSO_UDP_L4: 2414 csum_replace_by_diff(&l4.udp->check, 2415 (__force __wsum)htonl(paylen)); 2416 /* compute length of segmentation header */ 2417 off->tso_hdr_len = sizeof(struct udphdr) + l4_start; 2418 l4.udp->len = htons(shinfo->gso_size + sizeof(struct udphdr)); 2419 break; 2420 default: 2421 return -EINVAL; 2422 } 2423 2424 off->tso_len = skb->len - off->tso_hdr_len; 2425 off->mss = shinfo->gso_size; 2426 off->tso_segs = shinfo->gso_segs; 2427 2428 off->tx_flags |= IDPF_TX_FLAGS_TSO; 2429 2430 return 1; 2431 } 2432 2433 /** 2434 * __idpf_chk_linearize - Check skb is not using too many buffers 2435 * @skb: send buffer 2436 * @max_bufs: maximum number of buffers 2437 * 2438 * For TSO we need to count the TSO header and segment payload separately. As 2439 * such we need to check cases where we have max_bufs-1 fragments or more as we 2440 * can potentially require max_bufs+1 DMA transactions, 1 for the TSO header, 1 2441 * for the segment payload in the first descriptor, and another max_buf-1 for 2442 * the fragments. 2443 */ 2444 static bool __idpf_chk_linearize(struct sk_buff *skb, unsigned int max_bufs) 2445 { 2446 const struct skb_shared_info *shinfo = skb_shinfo(skb); 2447 const skb_frag_t *frag, *stale; 2448 int nr_frags, sum; 2449 2450 /* no need to check if number of frags is less than max_bufs - 1 */ 2451 nr_frags = shinfo->nr_frags; 2452 if (nr_frags < (max_bufs - 1)) 2453 return false; 2454 2455 /* We need to walk through the list and validate that each group 2456 * of max_bufs-2 fragments totals at least gso_size. 2457 */ 2458 nr_frags -= max_bufs - 2; 2459 frag = &shinfo->frags[0]; 2460 2461 /* Initialize size to the negative value of gso_size minus 1. We use 2462 * this as the worst case scenario in which the frag ahead of us only 2463 * provides one byte which is why we are limited to max_bufs-2 2464 * descriptors for a single transmit as the header and previous 2465 * fragment are already consuming 2 descriptors. 2466 */ 2467 sum = 1 - shinfo->gso_size; 2468 2469 /* Add size of frags 0 through 4 to create our initial sum */ 2470 sum += skb_frag_size(frag++); 2471 sum += skb_frag_size(frag++); 2472 sum += skb_frag_size(frag++); 2473 sum += skb_frag_size(frag++); 2474 sum += skb_frag_size(frag++); 2475 2476 /* Walk through fragments adding latest fragment, testing it, and 2477 * then removing stale fragments from the sum. 2478 */ 2479 for (stale = &shinfo->frags[0];; stale++) { 2480 int stale_size = skb_frag_size(stale); 2481 2482 sum += skb_frag_size(frag++); 2483 2484 /* The stale fragment may present us with a smaller 2485 * descriptor than the actual fragment size. To account 2486 * for that we need to remove all the data on the front and 2487 * figure out what the remainder would be in the last 2488 * descriptor associated with the fragment. 2489 */ 2490 if (stale_size > IDPF_TX_MAX_DESC_DATA) { 2491 int align_pad = -(skb_frag_off(stale)) & 2492 (IDPF_TX_MAX_READ_REQ_SIZE - 1); 2493 2494 sum -= align_pad; 2495 stale_size -= align_pad; 2496 2497 do { 2498 sum -= IDPF_TX_MAX_DESC_DATA_ALIGNED; 2499 stale_size -= IDPF_TX_MAX_DESC_DATA_ALIGNED; 2500 } while (stale_size > IDPF_TX_MAX_DESC_DATA); 2501 } 2502 2503 /* if sum is negative we failed to make sufficient progress */ 2504 if (sum < 0) 2505 return true; 2506 2507 if (!nr_frags--) 2508 break; 2509 2510 sum -= stale_size; 2511 } 2512 2513 return false; 2514 } 2515 2516 /** 2517 * idpf_chk_linearize - Check if skb exceeds max descriptors per packet 2518 * @skb: send buffer 2519 * @max_bufs: maximum scatter gather buffers for single packet 2520 * @count: number of buffers this packet needs 2521 * 2522 * Make sure we don't exceed maximum scatter gather buffers for a single 2523 * packet. We have to do some special checking around the boundary (max_bufs-1) 2524 * if TSO is on since we need count the TSO header and payload separately. 2525 * E.g.: a packet with 7 fragments can require 9 DMA transactions; 1 for TSO 2526 * header, 1 for segment payload, and then 7 for the fragments. 2527 */ 2528 bool idpf_chk_linearize(struct sk_buff *skb, unsigned int max_bufs, 2529 unsigned int count) 2530 { 2531 if (likely(count < max_bufs)) 2532 return false; 2533 if (skb_is_gso(skb)) 2534 return __idpf_chk_linearize(skb, max_bufs); 2535 2536 return count > max_bufs; 2537 } 2538 2539 /** 2540 * idpf_tx_splitq_get_ctx_desc - grab next desc and update buffer ring 2541 * @txq: queue to put context descriptor on 2542 * 2543 * Since the TX buffer rings mimics the descriptor ring, update the tx buffer 2544 * ring entry to reflect that this index is a context descriptor 2545 */ 2546 static struct idpf_flex_tx_ctx_desc * 2547 idpf_tx_splitq_get_ctx_desc(struct idpf_queue *txq) 2548 { 2549 struct idpf_flex_tx_ctx_desc *desc; 2550 int i = txq->next_to_use; 2551 2552 memset(&txq->tx_buf[i], 0, sizeof(struct idpf_tx_buf)); 2553 txq->tx_buf[i].compl_tag = IDPF_SPLITQ_TX_INVAL_COMPL_TAG; 2554 2555 /* grab the next descriptor */ 2556 desc = IDPF_FLEX_TX_CTX_DESC(txq, i); 2557 txq->next_to_use = idpf_tx_splitq_bump_ntu(txq, i); 2558 2559 return desc; 2560 } 2561 2562 /** 2563 * idpf_tx_drop_skb - free the SKB and bump tail if necessary 2564 * @tx_q: queue to send buffer on 2565 * @skb: pointer to skb 2566 */ 2567 netdev_tx_t idpf_tx_drop_skb(struct idpf_queue *tx_q, struct sk_buff *skb) 2568 { 2569 u64_stats_update_begin(&tx_q->stats_sync); 2570 u64_stats_inc(&tx_q->q_stats.tx.skb_drops); 2571 u64_stats_update_end(&tx_q->stats_sync); 2572 2573 idpf_tx_buf_hw_update(tx_q, tx_q->next_to_use, false); 2574 2575 dev_kfree_skb(skb); 2576 2577 return NETDEV_TX_OK; 2578 } 2579 2580 /** 2581 * idpf_tx_splitq_frame - Sends buffer on Tx ring using flex descriptors 2582 * @skb: send buffer 2583 * @tx_q: queue to send buffer on 2584 * 2585 * Returns NETDEV_TX_OK if sent, else an error code 2586 */ 2587 static netdev_tx_t idpf_tx_splitq_frame(struct sk_buff *skb, 2588 struct idpf_queue *tx_q) 2589 { 2590 struct idpf_tx_splitq_params tx_params = { }; 2591 struct idpf_tx_buf *first; 2592 unsigned int count; 2593 int tso; 2594 2595 count = idpf_tx_desc_count_required(tx_q, skb); 2596 if (unlikely(!count)) 2597 return idpf_tx_drop_skb(tx_q, skb); 2598 2599 tso = idpf_tso(skb, &tx_params.offload); 2600 if (unlikely(tso < 0)) 2601 return idpf_tx_drop_skb(tx_q, skb); 2602 2603 /* Check for splitq specific TX resources */ 2604 count += (IDPF_TX_DESCS_PER_CACHE_LINE + tso); 2605 if (idpf_tx_maybe_stop_splitq(tx_q, count)) { 2606 idpf_tx_buf_hw_update(tx_q, tx_q->next_to_use, false); 2607 2608 return NETDEV_TX_BUSY; 2609 } 2610 2611 if (tso) { 2612 /* If tso is needed, set up context desc */ 2613 struct idpf_flex_tx_ctx_desc *ctx_desc = 2614 idpf_tx_splitq_get_ctx_desc(tx_q); 2615 2616 ctx_desc->tso.qw1.cmd_dtype = 2617 cpu_to_le16(IDPF_TX_DESC_DTYPE_FLEX_TSO_CTX | 2618 IDPF_TX_FLEX_CTX_DESC_CMD_TSO); 2619 ctx_desc->tso.qw0.flex_tlen = 2620 cpu_to_le32(tx_params.offload.tso_len & 2621 IDPF_TXD_FLEX_CTX_TLEN_M); 2622 ctx_desc->tso.qw0.mss_rt = 2623 cpu_to_le16(tx_params.offload.mss & 2624 IDPF_TXD_FLEX_CTX_MSS_RT_M); 2625 ctx_desc->tso.qw0.hdr_len = tx_params.offload.tso_hdr_len; 2626 2627 u64_stats_update_begin(&tx_q->stats_sync); 2628 u64_stats_inc(&tx_q->q_stats.tx.lso_pkts); 2629 u64_stats_update_end(&tx_q->stats_sync); 2630 } 2631 2632 /* record the location of the first descriptor for this packet */ 2633 first = &tx_q->tx_buf[tx_q->next_to_use]; 2634 first->skb = skb; 2635 2636 if (tso) { 2637 first->gso_segs = tx_params.offload.tso_segs; 2638 first->bytecount = skb->len + 2639 ((first->gso_segs - 1) * tx_params.offload.tso_hdr_len); 2640 } else { 2641 first->gso_segs = 1; 2642 first->bytecount = max_t(unsigned int, skb->len, ETH_ZLEN); 2643 } 2644 2645 if (test_bit(__IDPF_Q_FLOW_SCH_EN, tx_q->flags)) { 2646 tx_params.dtype = IDPF_TX_DESC_DTYPE_FLEX_FLOW_SCHE; 2647 tx_params.eop_cmd = IDPF_TXD_FLEX_FLOW_CMD_EOP; 2648 /* Set the RE bit to catch any packets that may have not been 2649 * stashed during RS completion cleaning. MIN_GAP is set to 2650 * MIN_RING size to ensure it will be set at least once each 2651 * time around the ring. 2652 */ 2653 if (!(tx_q->next_to_use % IDPF_TX_SPLITQ_RE_MIN_GAP)) { 2654 tx_params.eop_cmd |= IDPF_TXD_FLEX_FLOW_CMD_RE; 2655 tx_q->txq_grp->num_completions_pending++; 2656 } 2657 2658 if (skb->ip_summed == CHECKSUM_PARTIAL) 2659 tx_params.offload.td_cmd |= IDPF_TXD_FLEX_FLOW_CMD_CS_EN; 2660 2661 } else { 2662 tx_params.dtype = IDPF_TX_DESC_DTYPE_FLEX_L2TAG1_L2TAG2; 2663 tx_params.eop_cmd = IDPF_TXD_LAST_DESC_CMD; 2664 2665 if (skb->ip_summed == CHECKSUM_PARTIAL) 2666 tx_params.offload.td_cmd |= IDPF_TX_FLEX_DESC_CMD_CS_EN; 2667 } 2668 2669 idpf_tx_splitq_map(tx_q, &tx_params, first); 2670 2671 return NETDEV_TX_OK; 2672 } 2673 2674 /** 2675 * idpf_tx_splitq_start - Selects the right Tx queue to send buffer 2676 * @skb: send buffer 2677 * @netdev: network interface device structure 2678 * 2679 * Returns NETDEV_TX_OK if sent, else an error code 2680 */ 2681 netdev_tx_t idpf_tx_splitq_start(struct sk_buff *skb, 2682 struct net_device *netdev) 2683 { 2684 struct idpf_vport *vport = idpf_netdev_to_vport(netdev); 2685 struct idpf_queue *tx_q; 2686 2687 if (unlikely(skb_get_queue_mapping(skb) >= vport->num_txq)) { 2688 dev_kfree_skb_any(skb); 2689 2690 return NETDEV_TX_OK; 2691 } 2692 2693 tx_q = vport->txqs[skb_get_queue_mapping(skb)]; 2694 2695 /* hardware can't handle really short frames, hardware padding works 2696 * beyond this point 2697 */ 2698 if (skb_put_padto(skb, tx_q->tx_min_pkt_len)) { 2699 idpf_tx_buf_hw_update(tx_q, tx_q->next_to_use, false); 2700 2701 return NETDEV_TX_OK; 2702 } 2703 2704 return idpf_tx_splitq_frame(skb, tx_q); 2705 } 2706 2707 /** 2708 * idpf_ptype_to_htype - get a hash type 2709 * @decoded: Decoded Rx packet type related fields 2710 * 2711 * Returns appropriate hash type (such as PKT_HASH_TYPE_L2/L3/L4) to be used by 2712 * skb_set_hash based on PTYPE as parsed by HW Rx pipeline and is part of 2713 * Rx desc. 2714 */ 2715 enum pkt_hash_types idpf_ptype_to_htype(const struct idpf_rx_ptype_decoded *decoded) 2716 { 2717 if (!decoded->known) 2718 return PKT_HASH_TYPE_NONE; 2719 if (decoded->payload_layer == IDPF_RX_PTYPE_PAYLOAD_LAYER_PAY2 && 2720 decoded->inner_prot) 2721 return PKT_HASH_TYPE_L4; 2722 if (decoded->payload_layer == IDPF_RX_PTYPE_PAYLOAD_LAYER_PAY2 && 2723 decoded->outer_ip) 2724 return PKT_HASH_TYPE_L3; 2725 if (decoded->outer_ip == IDPF_RX_PTYPE_OUTER_L2) 2726 return PKT_HASH_TYPE_L2; 2727 2728 return PKT_HASH_TYPE_NONE; 2729 } 2730 2731 /** 2732 * idpf_rx_hash - set the hash value in the skb 2733 * @rxq: Rx descriptor ring packet is being transacted on 2734 * @skb: pointer to current skb being populated 2735 * @rx_desc: Receive descriptor 2736 * @decoded: Decoded Rx packet type related fields 2737 */ 2738 static void idpf_rx_hash(struct idpf_queue *rxq, struct sk_buff *skb, 2739 struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc, 2740 struct idpf_rx_ptype_decoded *decoded) 2741 { 2742 u32 hash; 2743 2744 if (unlikely(!idpf_is_feature_ena(rxq->vport, NETIF_F_RXHASH))) 2745 return; 2746 2747 hash = le16_to_cpu(rx_desc->hash1) | 2748 (rx_desc->ff2_mirrid_hash2.hash2 << 16) | 2749 (rx_desc->hash3 << 24); 2750 2751 skb_set_hash(skb, hash, idpf_ptype_to_htype(decoded)); 2752 } 2753 2754 /** 2755 * idpf_rx_csum - Indicate in skb if checksum is good 2756 * @rxq: Rx descriptor ring packet is being transacted on 2757 * @skb: pointer to current skb being populated 2758 * @csum_bits: checksum fields extracted from the descriptor 2759 * @decoded: Decoded Rx packet type related fields 2760 * 2761 * skb->protocol must be set before this function is called 2762 */ 2763 static void idpf_rx_csum(struct idpf_queue *rxq, struct sk_buff *skb, 2764 struct idpf_rx_csum_decoded *csum_bits, 2765 struct idpf_rx_ptype_decoded *decoded) 2766 { 2767 bool ipv4, ipv6; 2768 2769 /* check if Rx checksum is enabled */ 2770 if (unlikely(!idpf_is_feature_ena(rxq->vport, NETIF_F_RXCSUM))) 2771 return; 2772 2773 /* check if HW has decoded the packet and checksum */ 2774 if (!(csum_bits->l3l4p)) 2775 return; 2776 2777 ipv4 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV4); 2778 ipv6 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV6); 2779 2780 if (ipv4 && (csum_bits->ipe || csum_bits->eipe)) 2781 goto checksum_fail; 2782 2783 if (ipv6 && csum_bits->ipv6exadd) 2784 return; 2785 2786 /* check for L4 errors and handle packets that were not able to be 2787 * checksummed 2788 */ 2789 if (csum_bits->l4e) 2790 goto checksum_fail; 2791 2792 /* Only report checksum unnecessary for ICMP, TCP, UDP, or SCTP */ 2793 switch (decoded->inner_prot) { 2794 case IDPF_RX_PTYPE_INNER_PROT_ICMP: 2795 case IDPF_RX_PTYPE_INNER_PROT_TCP: 2796 case IDPF_RX_PTYPE_INNER_PROT_UDP: 2797 if (!csum_bits->raw_csum_inv) { 2798 u16 csum = csum_bits->raw_csum; 2799 2800 skb->csum = csum_unfold((__force __sum16)~swab16(csum)); 2801 skb->ip_summed = CHECKSUM_COMPLETE; 2802 } else { 2803 skb->ip_summed = CHECKSUM_UNNECESSARY; 2804 } 2805 break; 2806 case IDPF_RX_PTYPE_INNER_PROT_SCTP: 2807 skb->ip_summed = CHECKSUM_UNNECESSARY; 2808 break; 2809 default: 2810 break; 2811 } 2812 2813 return; 2814 2815 checksum_fail: 2816 u64_stats_update_begin(&rxq->stats_sync); 2817 u64_stats_inc(&rxq->q_stats.rx.hw_csum_err); 2818 u64_stats_update_end(&rxq->stats_sync); 2819 } 2820 2821 /** 2822 * idpf_rx_splitq_extract_csum_bits - Extract checksum bits from descriptor 2823 * @rx_desc: receive descriptor 2824 * @csum: structure to extract checksum fields 2825 * 2826 **/ 2827 static void idpf_rx_splitq_extract_csum_bits(struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc, 2828 struct idpf_rx_csum_decoded *csum) 2829 { 2830 u8 qword0, qword1; 2831 2832 qword0 = rx_desc->status_err0_qw0; 2833 qword1 = rx_desc->status_err0_qw1; 2834 2835 csum->ipe = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_XSUM_IPE_M, 2836 qword1); 2837 csum->eipe = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_XSUM_EIPE_M, 2838 qword1); 2839 csum->l4e = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_XSUM_L4E_M, 2840 qword1); 2841 csum->l3l4p = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_L3L4P_M, 2842 qword1); 2843 csum->ipv6exadd = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_IPV6EXADD_M, 2844 qword0); 2845 csum->raw_csum_inv = 2846 le16_get_bits(rx_desc->ptype_err_fflags0, 2847 VIRTCHNL2_RX_FLEX_DESC_ADV_RAW_CSUM_INV_M); 2848 csum->raw_csum = le16_to_cpu(rx_desc->misc.raw_cs); 2849 } 2850 2851 /** 2852 * idpf_rx_rsc - Set the RSC fields in the skb 2853 * @rxq : Rx descriptor ring packet is being transacted on 2854 * @skb : pointer to current skb being populated 2855 * @rx_desc: Receive descriptor 2856 * @decoded: Decoded Rx packet type related fields 2857 * 2858 * Return 0 on success and error code on failure 2859 * 2860 * Populate the skb fields with the total number of RSC segments, RSC payload 2861 * length and packet type. 2862 */ 2863 static int idpf_rx_rsc(struct idpf_queue *rxq, struct sk_buff *skb, 2864 struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc, 2865 struct idpf_rx_ptype_decoded *decoded) 2866 { 2867 u16 rsc_segments, rsc_seg_len; 2868 bool ipv4, ipv6; 2869 int len; 2870 2871 if (unlikely(!decoded->outer_ip)) 2872 return -EINVAL; 2873 2874 rsc_seg_len = le16_to_cpu(rx_desc->misc.rscseglen); 2875 if (unlikely(!rsc_seg_len)) 2876 return -EINVAL; 2877 2878 ipv4 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV4); 2879 ipv6 = IDPF_RX_PTYPE_TO_IPV(decoded, IDPF_RX_PTYPE_OUTER_IPV6); 2880 2881 if (unlikely(!(ipv4 ^ ipv6))) 2882 return -EINVAL; 2883 2884 rsc_segments = DIV_ROUND_UP(skb->data_len, rsc_seg_len); 2885 if (unlikely(rsc_segments == 1)) 2886 return 0; 2887 2888 NAPI_GRO_CB(skb)->count = rsc_segments; 2889 skb_shinfo(skb)->gso_size = rsc_seg_len; 2890 2891 skb_reset_network_header(skb); 2892 len = skb->len - skb_transport_offset(skb); 2893 2894 if (ipv4) { 2895 struct iphdr *ipv4h = ip_hdr(skb); 2896 2897 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV4; 2898 2899 /* Reset and set transport header offset in skb */ 2900 skb_set_transport_header(skb, sizeof(struct iphdr)); 2901 2902 /* Compute the TCP pseudo header checksum*/ 2903 tcp_hdr(skb)->check = 2904 ~tcp_v4_check(len, ipv4h->saddr, ipv4h->daddr, 0); 2905 } else { 2906 struct ipv6hdr *ipv6h = ipv6_hdr(skb); 2907 2908 skb_shinfo(skb)->gso_type = SKB_GSO_TCPV6; 2909 skb_set_transport_header(skb, sizeof(struct ipv6hdr)); 2910 tcp_hdr(skb)->check = 2911 ~tcp_v6_check(len, &ipv6h->saddr, &ipv6h->daddr, 0); 2912 } 2913 2914 tcp_gro_complete(skb); 2915 2916 u64_stats_update_begin(&rxq->stats_sync); 2917 u64_stats_inc(&rxq->q_stats.rx.rsc_pkts); 2918 u64_stats_update_end(&rxq->stats_sync); 2919 2920 return 0; 2921 } 2922 2923 /** 2924 * idpf_rx_process_skb_fields - Populate skb header fields from Rx descriptor 2925 * @rxq: Rx descriptor ring packet is being transacted on 2926 * @skb: pointer to current skb being populated 2927 * @rx_desc: Receive descriptor 2928 * 2929 * This function checks the ring, descriptor, and packet information in 2930 * order to populate the hash, checksum, protocol, and 2931 * other fields within the skb. 2932 */ 2933 static int idpf_rx_process_skb_fields(struct idpf_queue *rxq, 2934 struct sk_buff *skb, 2935 struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc) 2936 { 2937 struct idpf_rx_csum_decoded csum_bits = { }; 2938 struct idpf_rx_ptype_decoded decoded; 2939 u16 rx_ptype; 2940 2941 rx_ptype = le16_get_bits(rx_desc->ptype_err_fflags0, 2942 VIRTCHNL2_RX_FLEX_DESC_ADV_PTYPE_M); 2943 2944 decoded = rxq->vport->rx_ptype_lkup[rx_ptype]; 2945 /* If we don't know the ptype we can't do anything else with it. Just 2946 * pass it up the stack as-is. 2947 */ 2948 if (!decoded.known) 2949 return 0; 2950 2951 /* process RSS/hash */ 2952 idpf_rx_hash(rxq, skb, rx_desc, &decoded); 2953 2954 skb->protocol = eth_type_trans(skb, rxq->vport->netdev); 2955 2956 if (le16_get_bits(rx_desc->hdrlen_flags, 2957 VIRTCHNL2_RX_FLEX_DESC_ADV_RSC_M)) 2958 return idpf_rx_rsc(rxq, skb, rx_desc, &decoded); 2959 2960 idpf_rx_splitq_extract_csum_bits(rx_desc, &csum_bits); 2961 idpf_rx_csum(rxq, skb, &csum_bits, &decoded); 2962 2963 return 0; 2964 } 2965 2966 /** 2967 * idpf_rx_add_frag - Add contents of Rx buffer to sk_buff as a frag 2968 * @rx_buf: buffer containing page to add 2969 * @skb: sk_buff to place the data into 2970 * @size: packet length from rx_desc 2971 * 2972 * This function will add the data contained in rx_buf->page to the skb. 2973 * It will just attach the page as a frag to the skb. 2974 * The function will then update the page offset. 2975 */ 2976 void idpf_rx_add_frag(struct idpf_rx_buf *rx_buf, struct sk_buff *skb, 2977 unsigned int size) 2978 { 2979 skb_add_rx_frag(skb, skb_shinfo(skb)->nr_frags, rx_buf->page, 2980 rx_buf->page_offset, size, rx_buf->truesize); 2981 2982 rx_buf->page = NULL; 2983 } 2984 2985 /** 2986 * idpf_rx_construct_skb - Allocate skb and populate it 2987 * @rxq: Rx descriptor queue 2988 * @rx_buf: Rx buffer to pull data from 2989 * @size: the length of the packet 2990 * 2991 * This function allocates an skb. It then populates it with the page 2992 * data from the current receive descriptor, taking care to set up the 2993 * skb correctly. 2994 */ 2995 struct sk_buff *idpf_rx_construct_skb(struct idpf_queue *rxq, 2996 struct idpf_rx_buf *rx_buf, 2997 unsigned int size) 2998 { 2999 unsigned int headlen; 3000 struct sk_buff *skb; 3001 void *va; 3002 3003 va = page_address(rx_buf->page) + rx_buf->page_offset; 3004 3005 /* prefetch first cache line of first page */ 3006 net_prefetch(va); 3007 /* allocate a skb to store the frags */ 3008 skb = __napi_alloc_skb(&rxq->q_vector->napi, IDPF_RX_HDR_SIZE, 3009 GFP_ATOMIC); 3010 if (unlikely(!skb)) { 3011 idpf_rx_put_page(rx_buf); 3012 3013 return NULL; 3014 } 3015 3016 skb_record_rx_queue(skb, rxq->idx); 3017 skb_mark_for_recycle(skb); 3018 3019 /* Determine available headroom for copy */ 3020 headlen = size; 3021 if (headlen > IDPF_RX_HDR_SIZE) 3022 headlen = eth_get_headlen(skb->dev, va, IDPF_RX_HDR_SIZE); 3023 3024 /* align pull length to size of long to optimize memcpy performance */ 3025 memcpy(__skb_put(skb, headlen), va, ALIGN(headlen, sizeof(long))); 3026 3027 /* if we exhaust the linear part then add what is left as a frag */ 3028 size -= headlen; 3029 if (!size) { 3030 idpf_rx_put_page(rx_buf); 3031 3032 return skb; 3033 } 3034 3035 skb_add_rx_frag(skb, 0, rx_buf->page, rx_buf->page_offset + headlen, 3036 size, rx_buf->truesize); 3037 3038 /* Since we're giving the page to the stack, clear our reference to it. 3039 * We'll get a new one during buffer posting. 3040 */ 3041 rx_buf->page = NULL; 3042 3043 return skb; 3044 } 3045 3046 /** 3047 * idpf_rx_hdr_construct_skb - Allocate skb and populate it from header buffer 3048 * @rxq: Rx descriptor queue 3049 * @va: Rx buffer to pull data from 3050 * @size: the length of the packet 3051 * 3052 * This function allocates an skb. It then populates it with the page data from 3053 * the current receive descriptor, taking care to set up the skb correctly. 3054 * This specifically uses a header buffer to start building the skb. 3055 */ 3056 static struct sk_buff *idpf_rx_hdr_construct_skb(struct idpf_queue *rxq, 3057 const void *va, 3058 unsigned int size) 3059 { 3060 struct sk_buff *skb; 3061 3062 /* allocate a skb to store the frags */ 3063 skb = __napi_alloc_skb(&rxq->q_vector->napi, size, GFP_ATOMIC); 3064 if (unlikely(!skb)) 3065 return NULL; 3066 3067 skb_record_rx_queue(skb, rxq->idx); 3068 3069 memcpy(__skb_put(skb, size), va, ALIGN(size, sizeof(long))); 3070 3071 /* More than likely, a payload fragment, which will use a page from 3072 * page_pool will be added to the SKB so mark it for recycle 3073 * preemptively. And if not, it's inconsequential. 3074 */ 3075 skb_mark_for_recycle(skb); 3076 3077 return skb; 3078 } 3079 3080 /** 3081 * idpf_rx_splitq_test_staterr - tests bits in Rx descriptor 3082 * status and error fields 3083 * @stat_err_field: field from descriptor to test bits in 3084 * @stat_err_bits: value to mask 3085 * 3086 */ 3087 static bool idpf_rx_splitq_test_staterr(const u8 stat_err_field, 3088 const u8 stat_err_bits) 3089 { 3090 return !!(stat_err_field & stat_err_bits); 3091 } 3092 3093 /** 3094 * idpf_rx_splitq_is_eop - process handling of EOP buffers 3095 * @rx_desc: Rx descriptor for current buffer 3096 * 3097 * If the buffer is an EOP buffer, this function exits returning true, 3098 * otherwise return false indicating that this is in fact a non-EOP buffer. 3099 */ 3100 static bool idpf_rx_splitq_is_eop(struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc) 3101 { 3102 /* if we are the last buffer then there is nothing else to do */ 3103 return likely(idpf_rx_splitq_test_staterr(rx_desc->status_err0_qw1, 3104 IDPF_RXD_EOF_SPLITQ)); 3105 } 3106 3107 /** 3108 * idpf_rx_splitq_clean - Clean completed descriptors from Rx queue 3109 * @rxq: Rx descriptor queue to retrieve receive buffer queue 3110 * @budget: Total limit on number of packets to process 3111 * 3112 * This function provides a "bounce buffer" approach to Rx interrupt 3113 * processing. The advantage to this is that on systems that have 3114 * expensive overhead for IOMMU access this provides a means of avoiding 3115 * it by maintaining the mapping of the page to the system. 3116 * 3117 * Returns amount of work completed 3118 */ 3119 static int idpf_rx_splitq_clean(struct idpf_queue *rxq, int budget) 3120 { 3121 int total_rx_bytes = 0, total_rx_pkts = 0; 3122 struct idpf_queue *rx_bufq = NULL; 3123 struct sk_buff *skb = rxq->skb; 3124 u16 ntc = rxq->next_to_clean; 3125 3126 /* Process Rx packets bounded by budget */ 3127 while (likely(total_rx_pkts < budget)) { 3128 struct virtchnl2_rx_flex_desc_adv_nic_3 *rx_desc; 3129 struct idpf_sw_queue *refillq = NULL; 3130 struct idpf_rxq_set *rxq_set = NULL; 3131 struct idpf_rx_buf *rx_buf = NULL; 3132 union virtchnl2_rx_desc *desc; 3133 unsigned int pkt_len = 0; 3134 unsigned int hdr_len = 0; 3135 u16 gen_id, buf_id = 0; 3136 /* Header buffer overflow only valid for header split */ 3137 bool hbo = false; 3138 int bufq_id; 3139 u8 rxdid; 3140 3141 /* get the Rx desc from Rx queue based on 'next_to_clean' */ 3142 desc = IDPF_RX_DESC(rxq, ntc); 3143 rx_desc = (struct virtchnl2_rx_flex_desc_adv_nic_3 *)desc; 3144 3145 /* This memory barrier is needed to keep us from reading 3146 * any other fields out of the rx_desc 3147 */ 3148 dma_rmb(); 3149 3150 /* if the descriptor isn't done, no work yet to do */ 3151 gen_id = le16_get_bits(rx_desc->pktlen_gen_bufq_id, 3152 VIRTCHNL2_RX_FLEX_DESC_ADV_GEN_M); 3153 3154 if (test_bit(__IDPF_Q_GEN_CHK, rxq->flags) != gen_id) 3155 break; 3156 3157 rxdid = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_RXDID_M, 3158 rx_desc->rxdid_ucast); 3159 if (rxdid != VIRTCHNL2_RXDID_2_FLEX_SPLITQ) { 3160 IDPF_RX_BUMP_NTC(rxq, ntc); 3161 u64_stats_update_begin(&rxq->stats_sync); 3162 u64_stats_inc(&rxq->q_stats.rx.bad_descs); 3163 u64_stats_update_end(&rxq->stats_sync); 3164 continue; 3165 } 3166 3167 pkt_len = le16_get_bits(rx_desc->pktlen_gen_bufq_id, 3168 VIRTCHNL2_RX_FLEX_DESC_ADV_LEN_PBUF_M); 3169 3170 hbo = FIELD_GET(VIRTCHNL2_RX_FLEX_DESC_ADV_STATUS0_HBO_M, 3171 rx_desc->status_err0_qw1); 3172 3173 if (unlikely(hbo)) { 3174 /* If a header buffer overflow, occurs, i.e. header is 3175 * too large to fit in the header split buffer, HW will 3176 * put the entire packet, including headers, in the 3177 * data/payload buffer. 3178 */ 3179 u64_stats_update_begin(&rxq->stats_sync); 3180 u64_stats_inc(&rxq->q_stats.rx.hsplit_buf_ovf); 3181 u64_stats_update_end(&rxq->stats_sync); 3182 goto bypass_hsplit; 3183 } 3184 3185 hdr_len = le16_get_bits(rx_desc->hdrlen_flags, 3186 VIRTCHNL2_RX_FLEX_DESC_ADV_LEN_HDR_M); 3187 3188 bypass_hsplit: 3189 bufq_id = le16_get_bits(rx_desc->pktlen_gen_bufq_id, 3190 VIRTCHNL2_RX_FLEX_DESC_ADV_BUFQ_ID_M); 3191 3192 rxq_set = container_of(rxq, struct idpf_rxq_set, rxq); 3193 if (!bufq_id) 3194 refillq = rxq_set->refillq0; 3195 else 3196 refillq = rxq_set->refillq1; 3197 3198 /* retrieve buffer from the rxq */ 3199 rx_bufq = &rxq->rxq_grp->splitq.bufq_sets[bufq_id].bufq; 3200 3201 buf_id = le16_to_cpu(rx_desc->buf_id); 3202 3203 rx_buf = &rx_bufq->rx_buf.buf[buf_id]; 3204 3205 if (hdr_len) { 3206 const void *va = (u8 *)rx_bufq->rx_buf.hdr_buf_va + 3207 (u32)buf_id * IDPF_HDR_BUF_SIZE; 3208 3209 skb = idpf_rx_hdr_construct_skb(rxq, va, hdr_len); 3210 u64_stats_update_begin(&rxq->stats_sync); 3211 u64_stats_inc(&rxq->q_stats.rx.hsplit_pkts); 3212 u64_stats_update_end(&rxq->stats_sync); 3213 } 3214 3215 if (pkt_len) { 3216 idpf_rx_sync_for_cpu(rx_buf, pkt_len); 3217 if (skb) 3218 idpf_rx_add_frag(rx_buf, skb, pkt_len); 3219 else 3220 skb = idpf_rx_construct_skb(rxq, rx_buf, 3221 pkt_len); 3222 } else { 3223 idpf_rx_put_page(rx_buf); 3224 } 3225 3226 /* exit if we failed to retrieve a buffer */ 3227 if (!skb) 3228 break; 3229 3230 idpf_rx_post_buf_refill(refillq, buf_id); 3231 3232 IDPF_RX_BUMP_NTC(rxq, ntc); 3233 /* skip if it is non EOP desc */ 3234 if (!idpf_rx_splitq_is_eop(rx_desc)) 3235 continue; 3236 3237 /* pad skb if needed (to make valid ethernet frame) */ 3238 if (eth_skb_pad(skb)) { 3239 skb = NULL; 3240 continue; 3241 } 3242 3243 /* probably a little skewed due to removing CRC */ 3244 total_rx_bytes += skb->len; 3245 3246 /* protocol */ 3247 if (unlikely(idpf_rx_process_skb_fields(rxq, skb, rx_desc))) { 3248 dev_kfree_skb_any(skb); 3249 skb = NULL; 3250 continue; 3251 } 3252 3253 /* send completed skb up the stack */ 3254 napi_gro_receive(&rxq->q_vector->napi, skb); 3255 skb = NULL; 3256 3257 /* update budget accounting */ 3258 total_rx_pkts++; 3259 } 3260 3261 rxq->next_to_clean = ntc; 3262 3263 rxq->skb = skb; 3264 u64_stats_update_begin(&rxq->stats_sync); 3265 u64_stats_add(&rxq->q_stats.rx.packets, total_rx_pkts); 3266 u64_stats_add(&rxq->q_stats.rx.bytes, total_rx_bytes); 3267 u64_stats_update_end(&rxq->stats_sync); 3268 3269 /* guarantee a trip back through this routine if there was a failure */ 3270 return total_rx_pkts; 3271 } 3272 3273 /** 3274 * idpf_rx_update_bufq_desc - Update buffer queue descriptor 3275 * @bufq: Pointer to the buffer queue 3276 * @refill_desc: SW Refill queue descriptor containing buffer ID 3277 * @buf_desc: Buffer queue descriptor 3278 * 3279 * Return 0 on success and negative on failure. 3280 */ 3281 static int idpf_rx_update_bufq_desc(struct idpf_queue *bufq, u16 refill_desc, 3282 struct virtchnl2_splitq_rx_buf_desc *buf_desc) 3283 { 3284 struct idpf_rx_buf *buf; 3285 dma_addr_t addr; 3286 u16 buf_id; 3287 3288 buf_id = FIELD_GET(IDPF_RX_BI_BUFID_M, refill_desc); 3289 3290 buf = &bufq->rx_buf.buf[buf_id]; 3291 3292 addr = idpf_alloc_page(bufq->pp, buf, bufq->rx_buf_size); 3293 if (unlikely(addr == DMA_MAPPING_ERROR)) 3294 return -ENOMEM; 3295 3296 buf_desc->pkt_addr = cpu_to_le64(addr); 3297 buf_desc->qword0.buf_id = cpu_to_le16(buf_id); 3298 3299 if (!bufq->rx_hsplit_en) 3300 return 0; 3301 3302 buf_desc->hdr_addr = cpu_to_le64(bufq->rx_buf.hdr_buf_pa + 3303 (u32)buf_id * IDPF_HDR_BUF_SIZE); 3304 3305 return 0; 3306 } 3307 3308 /** 3309 * idpf_rx_clean_refillq - Clean refill queue buffers 3310 * @bufq: buffer queue to post buffers back to 3311 * @refillq: refill queue to clean 3312 * 3313 * This function takes care of the buffer refill management 3314 */ 3315 static void idpf_rx_clean_refillq(struct idpf_queue *bufq, 3316 struct idpf_sw_queue *refillq) 3317 { 3318 struct virtchnl2_splitq_rx_buf_desc *buf_desc; 3319 u16 bufq_nta = bufq->next_to_alloc; 3320 u16 ntc = refillq->next_to_clean; 3321 int cleaned = 0; 3322 u16 gen; 3323 3324 buf_desc = IDPF_SPLITQ_RX_BUF_DESC(bufq, bufq_nta); 3325 3326 /* make sure we stop at ring wrap in the unlikely case ring is full */ 3327 while (likely(cleaned < refillq->desc_count)) { 3328 u16 refill_desc = IDPF_SPLITQ_RX_BI_DESC(refillq, ntc); 3329 bool failure; 3330 3331 gen = FIELD_GET(IDPF_RX_BI_GEN_M, refill_desc); 3332 if (test_bit(__IDPF_RFLQ_GEN_CHK, refillq->flags) != gen) 3333 break; 3334 3335 failure = idpf_rx_update_bufq_desc(bufq, refill_desc, 3336 buf_desc); 3337 if (failure) 3338 break; 3339 3340 if (unlikely(++ntc == refillq->desc_count)) { 3341 change_bit(__IDPF_RFLQ_GEN_CHK, refillq->flags); 3342 ntc = 0; 3343 } 3344 3345 if (unlikely(++bufq_nta == bufq->desc_count)) { 3346 buf_desc = IDPF_SPLITQ_RX_BUF_DESC(bufq, 0); 3347 bufq_nta = 0; 3348 } else { 3349 buf_desc++; 3350 } 3351 3352 cleaned++; 3353 } 3354 3355 if (!cleaned) 3356 return; 3357 3358 /* We want to limit how many transactions on the bus we trigger with 3359 * tail writes so we only do it in strides. It's also important we 3360 * align the write to a multiple of 8 as required by HW. 3361 */ 3362 if (((bufq->next_to_use <= bufq_nta ? 0 : bufq->desc_count) + 3363 bufq_nta - bufq->next_to_use) >= IDPF_RX_BUF_POST_STRIDE) 3364 idpf_rx_buf_hw_update(bufq, ALIGN_DOWN(bufq_nta, 3365 IDPF_RX_BUF_POST_STRIDE)); 3366 3367 /* update next to alloc since we have filled the ring */ 3368 refillq->next_to_clean = ntc; 3369 bufq->next_to_alloc = bufq_nta; 3370 } 3371 3372 /** 3373 * idpf_rx_clean_refillq_all - Clean all refill queues 3374 * @bufq: buffer queue with refill queues 3375 * 3376 * Iterates through all refill queues assigned to the buffer queue assigned to 3377 * this vector. Returns true if clean is complete within budget, false 3378 * otherwise. 3379 */ 3380 static void idpf_rx_clean_refillq_all(struct idpf_queue *bufq) 3381 { 3382 struct idpf_bufq_set *bufq_set; 3383 int i; 3384 3385 bufq_set = container_of(bufq, struct idpf_bufq_set, bufq); 3386 for (i = 0; i < bufq_set->num_refillqs; i++) 3387 idpf_rx_clean_refillq(bufq, &bufq_set->refillqs[i]); 3388 } 3389 3390 /** 3391 * idpf_vport_intr_clean_queues - MSIX mode Interrupt Handler 3392 * @irq: interrupt number 3393 * @data: pointer to a q_vector 3394 * 3395 */ 3396 static irqreturn_t idpf_vport_intr_clean_queues(int __always_unused irq, 3397 void *data) 3398 { 3399 struct idpf_q_vector *q_vector = (struct idpf_q_vector *)data; 3400 3401 q_vector->total_events++; 3402 napi_schedule(&q_vector->napi); 3403 3404 return IRQ_HANDLED; 3405 } 3406 3407 /** 3408 * idpf_vport_intr_napi_del_all - Unregister napi for all q_vectors in vport 3409 * @vport: virtual port structure 3410 * 3411 */ 3412 static void idpf_vport_intr_napi_del_all(struct idpf_vport *vport) 3413 { 3414 u16 v_idx; 3415 3416 for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) 3417 netif_napi_del(&vport->q_vectors[v_idx].napi); 3418 } 3419 3420 /** 3421 * idpf_vport_intr_napi_dis_all - Disable NAPI for all q_vectors in the vport 3422 * @vport: main vport structure 3423 */ 3424 static void idpf_vport_intr_napi_dis_all(struct idpf_vport *vport) 3425 { 3426 int v_idx; 3427 3428 for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) 3429 napi_disable(&vport->q_vectors[v_idx].napi); 3430 } 3431 3432 /** 3433 * idpf_vport_intr_rel - Free memory allocated for interrupt vectors 3434 * @vport: virtual port 3435 * 3436 * Free the memory allocated for interrupt vectors associated to a vport 3437 */ 3438 void idpf_vport_intr_rel(struct idpf_vport *vport) 3439 { 3440 int i, j, v_idx; 3441 3442 for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) { 3443 struct idpf_q_vector *q_vector = &vport->q_vectors[v_idx]; 3444 3445 kfree(q_vector->bufq); 3446 q_vector->bufq = NULL; 3447 kfree(q_vector->tx); 3448 q_vector->tx = NULL; 3449 kfree(q_vector->rx); 3450 q_vector->rx = NULL; 3451 } 3452 3453 /* Clean up the mapping of queues to vectors */ 3454 for (i = 0; i < vport->num_rxq_grp; i++) { 3455 struct idpf_rxq_group *rx_qgrp = &vport->rxq_grps[i]; 3456 3457 if (idpf_is_queue_model_split(vport->rxq_model)) 3458 for (j = 0; j < rx_qgrp->splitq.num_rxq_sets; j++) 3459 rx_qgrp->splitq.rxq_sets[j]->rxq.q_vector = NULL; 3460 else 3461 for (j = 0; j < rx_qgrp->singleq.num_rxq; j++) 3462 rx_qgrp->singleq.rxqs[j]->q_vector = NULL; 3463 } 3464 3465 if (idpf_is_queue_model_split(vport->txq_model)) 3466 for (i = 0; i < vport->num_txq_grp; i++) 3467 vport->txq_grps[i].complq->q_vector = NULL; 3468 else 3469 for (i = 0; i < vport->num_txq_grp; i++) 3470 for (j = 0; j < vport->txq_grps[i].num_txq; j++) 3471 vport->txq_grps[i].txqs[j]->q_vector = NULL; 3472 3473 kfree(vport->q_vectors); 3474 vport->q_vectors = NULL; 3475 } 3476 3477 /** 3478 * idpf_vport_intr_rel_irq - Free the IRQ association with the OS 3479 * @vport: main vport structure 3480 */ 3481 static void idpf_vport_intr_rel_irq(struct idpf_vport *vport) 3482 { 3483 struct idpf_adapter *adapter = vport->adapter; 3484 int vector; 3485 3486 for (vector = 0; vector < vport->num_q_vectors; vector++) { 3487 struct idpf_q_vector *q_vector = &vport->q_vectors[vector]; 3488 int irq_num, vidx; 3489 3490 /* free only the irqs that were actually requested */ 3491 if (!q_vector) 3492 continue; 3493 3494 vidx = vport->q_vector_idxs[vector]; 3495 irq_num = adapter->msix_entries[vidx].vector; 3496 3497 /* clear the affinity_mask in the IRQ descriptor */ 3498 irq_set_affinity_hint(irq_num, NULL); 3499 free_irq(irq_num, q_vector); 3500 } 3501 } 3502 3503 /** 3504 * idpf_vport_intr_dis_irq_all - Disable all interrupt 3505 * @vport: main vport structure 3506 */ 3507 static void idpf_vport_intr_dis_irq_all(struct idpf_vport *vport) 3508 { 3509 struct idpf_q_vector *q_vector = vport->q_vectors; 3510 int q_idx; 3511 3512 for (q_idx = 0; q_idx < vport->num_q_vectors; q_idx++) 3513 writel(0, q_vector[q_idx].intr_reg.dyn_ctl); 3514 } 3515 3516 /** 3517 * idpf_vport_intr_buildreg_itr - Enable default interrupt generation settings 3518 * @q_vector: pointer to q_vector 3519 * @type: itr index 3520 * @itr: itr value 3521 */ 3522 static u32 idpf_vport_intr_buildreg_itr(struct idpf_q_vector *q_vector, 3523 const int type, u16 itr) 3524 { 3525 u32 itr_val; 3526 3527 itr &= IDPF_ITR_MASK; 3528 /* Don't clear PBA because that can cause lost interrupts that 3529 * came in while we were cleaning/polling 3530 */ 3531 itr_val = q_vector->intr_reg.dyn_ctl_intena_m | 3532 (type << q_vector->intr_reg.dyn_ctl_itridx_s) | 3533 (itr << (q_vector->intr_reg.dyn_ctl_intrvl_s - 1)); 3534 3535 return itr_val; 3536 } 3537 3538 /** 3539 * idpf_update_dim_sample - Update dim sample with packets and bytes 3540 * @q_vector: the vector associated with the interrupt 3541 * @dim_sample: dim sample to update 3542 * @dim: dim instance structure 3543 * @packets: total packets 3544 * @bytes: total bytes 3545 * 3546 * Update the dim sample with the packets and bytes which are passed to this 3547 * function. Set the dim state appropriately if the dim settings gets stale. 3548 */ 3549 static void idpf_update_dim_sample(struct idpf_q_vector *q_vector, 3550 struct dim_sample *dim_sample, 3551 struct dim *dim, u64 packets, u64 bytes) 3552 { 3553 dim_update_sample(q_vector->total_events, packets, bytes, dim_sample); 3554 dim_sample->comp_ctr = 0; 3555 3556 /* if dim settings get stale, like when not updated for 1 second or 3557 * longer, force it to start again. This addresses the frequent case 3558 * of an idle queue being switched to by the scheduler. 3559 */ 3560 if (ktime_ms_delta(dim_sample->time, dim->start_sample.time) >= HZ) 3561 dim->state = DIM_START_MEASURE; 3562 } 3563 3564 /** 3565 * idpf_net_dim - Update net DIM algorithm 3566 * @q_vector: the vector associated with the interrupt 3567 * 3568 * Create a DIM sample and notify net_dim() so that it can possibly decide 3569 * a new ITR value based on incoming packets, bytes, and interrupts. 3570 * 3571 * This function is a no-op if the queue is not configured to dynamic ITR. 3572 */ 3573 static void idpf_net_dim(struct idpf_q_vector *q_vector) 3574 { 3575 struct dim_sample dim_sample = { }; 3576 u64 packets, bytes; 3577 u32 i; 3578 3579 if (!IDPF_ITR_IS_DYNAMIC(q_vector->tx_intr_mode)) 3580 goto check_rx_itr; 3581 3582 for (i = 0, packets = 0, bytes = 0; i < q_vector->num_txq; i++) { 3583 struct idpf_queue *txq = q_vector->tx[i]; 3584 unsigned int start; 3585 3586 do { 3587 start = u64_stats_fetch_begin(&txq->stats_sync); 3588 packets += u64_stats_read(&txq->q_stats.tx.packets); 3589 bytes += u64_stats_read(&txq->q_stats.tx.bytes); 3590 } while (u64_stats_fetch_retry(&txq->stats_sync, start)); 3591 } 3592 3593 idpf_update_dim_sample(q_vector, &dim_sample, &q_vector->tx_dim, 3594 packets, bytes); 3595 net_dim(&q_vector->tx_dim, dim_sample); 3596 3597 check_rx_itr: 3598 if (!IDPF_ITR_IS_DYNAMIC(q_vector->rx_intr_mode)) 3599 return; 3600 3601 for (i = 0, packets = 0, bytes = 0; i < q_vector->num_rxq; i++) { 3602 struct idpf_queue *rxq = q_vector->rx[i]; 3603 unsigned int start; 3604 3605 do { 3606 start = u64_stats_fetch_begin(&rxq->stats_sync); 3607 packets += u64_stats_read(&rxq->q_stats.rx.packets); 3608 bytes += u64_stats_read(&rxq->q_stats.rx.bytes); 3609 } while (u64_stats_fetch_retry(&rxq->stats_sync, start)); 3610 } 3611 3612 idpf_update_dim_sample(q_vector, &dim_sample, &q_vector->rx_dim, 3613 packets, bytes); 3614 net_dim(&q_vector->rx_dim, dim_sample); 3615 } 3616 3617 /** 3618 * idpf_vport_intr_update_itr_ena_irq - Update itr and re-enable MSIX interrupt 3619 * @q_vector: q_vector for which itr is being updated and interrupt enabled 3620 * 3621 * Update the net_dim() algorithm and re-enable the interrupt associated with 3622 * this vector. 3623 */ 3624 void idpf_vport_intr_update_itr_ena_irq(struct idpf_q_vector *q_vector) 3625 { 3626 u32 intval; 3627 3628 /* net_dim() updates ITR out-of-band using a work item */ 3629 idpf_net_dim(q_vector); 3630 3631 intval = idpf_vport_intr_buildreg_itr(q_vector, 3632 IDPF_NO_ITR_UPDATE_IDX, 0); 3633 3634 writel(intval, q_vector->intr_reg.dyn_ctl); 3635 } 3636 3637 /** 3638 * idpf_vport_intr_req_irq - get MSI-X vectors from the OS for the vport 3639 * @vport: main vport structure 3640 * @basename: name for the vector 3641 */ 3642 static int idpf_vport_intr_req_irq(struct idpf_vport *vport, char *basename) 3643 { 3644 struct idpf_adapter *adapter = vport->adapter; 3645 int vector, err, irq_num, vidx; 3646 const char *vec_name; 3647 3648 for (vector = 0; vector < vport->num_q_vectors; vector++) { 3649 struct idpf_q_vector *q_vector = &vport->q_vectors[vector]; 3650 3651 vidx = vport->q_vector_idxs[vector]; 3652 irq_num = adapter->msix_entries[vidx].vector; 3653 3654 if (q_vector->num_rxq && q_vector->num_txq) 3655 vec_name = "TxRx"; 3656 else if (q_vector->num_rxq) 3657 vec_name = "Rx"; 3658 else if (q_vector->num_txq) 3659 vec_name = "Tx"; 3660 else 3661 continue; 3662 3663 q_vector->name = kasprintf(GFP_KERNEL, "%s-%s-%d", 3664 basename, vec_name, vidx); 3665 3666 err = request_irq(irq_num, idpf_vport_intr_clean_queues, 0, 3667 q_vector->name, q_vector); 3668 if (err) { 3669 netdev_err(vport->netdev, 3670 "Request_irq failed, error: %d\n", err); 3671 goto free_q_irqs; 3672 } 3673 /* assign the mask for this irq */ 3674 irq_set_affinity_hint(irq_num, &q_vector->affinity_mask); 3675 } 3676 3677 return 0; 3678 3679 free_q_irqs: 3680 while (--vector >= 0) { 3681 vidx = vport->q_vector_idxs[vector]; 3682 irq_num = adapter->msix_entries[vidx].vector; 3683 free_irq(irq_num, &vport->q_vectors[vector]); 3684 } 3685 3686 return err; 3687 } 3688 3689 /** 3690 * idpf_vport_intr_write_itr - Write ITR value to the ITR register 3691 * @q_vector: q_vector structure 3692 * @itr: Interrupt throttling rate 3693 * @tx: Tx or Rx ITR 3694 */ 3695 void idpf_vport_intr_write_itr(struct idpf_q_vector *q_vector, u16 itr, bool tx) 3696 { 3697 struct idpf_intr_reg *intr_reg; 3698 3699 if (tx && !q_vector->tx) 3700 return; 3701 else if (!tx && !q_vector->rx) 3702 return; 3703 3704 intr_reg = &q_vector->intr_reg; 3705 writel(ITR_REG_ALIGN(itr) >> IDPF_ITR_GRAN_S, 3706 tx ? intr_reg->tx_itr : intr_reg->rx_itr); 3707 } 3708 3709 /** 3710 * idpf_vport_intr_ena_irq_all - Enable IRQ for the given vport 3711 * @vport: main vport structure 3712 */ 3713 static void idpf_vport_intr_ena_irq_all(struct idpf_vport *vport) 3714 { 3715 bool dynamic; 3716 int q_idx; 3717 u16 itr; 3718 3719 for (q_idx = 0; q_idx < vport->num_q_vectors; q_idx++) { 3720 struct idpf_q_vector *qv = &vport->q_vectors[q_idx]; 3721 3722 /* Set the initial ITR values */ 3723 if (qv->num_txq) { 3724 dynamic = IDPF_ITR_IS_DYNAMIC(qv->tx_intr_mode); 3725 itr = vport->tx_itr_profile[qv->tx_dim.profile_ix]; 3726 idpf_vport_intr_write_itr(qv, dynamic ? 3727 itr : qv->tx_itr_value, 3728 true); 3729 } 3730 3731 if (qv->num_rxq) { 3732 dynamic = IDPF_ITR_IS_DYNAMIC(qv->rx_intr_mode); 3733 itr = vport->rx_itr_profile[qv->rx_dim.profile_ix]; 3734 idpf_vport_intr_write_itr(qv, dynamic ? 3735 itr : qv->rx_itr_value, 3736 false); 3737 } 3738 3739 if (qv->num_txq || qv->num_rxq) 3740 idpf_vport_intr_update_itr_ena_irq(qv); 3741 } 3742 } 3743 3744 /** 3745 * idpf_vport_intr_deinit - Release all vector associations for the vport 3746 * @vport: main vport structure 3747 */ 3748 void idpf_vport_intr_deinit(struct idpf_vport *vport) 3749 { 3750 idpf_vport_intr_napi_dis_all(vport); 3751 idpf_vport_intr_napi_del_all(vport); 3752 idpf_vport_intr_dis_irq_all(vport); 3753 idpf_vport_intr_rel_irq(vport); 3754 } 3755 3756 /** 3757 * idpf_tx_dim_work - Call back from the stack 3758 * @work: work queue structure 3759 */ 3760 static void idpf_tx_dim_work(struct work_struct *work) 3761 { 3762 struct idpf_q_vector *q_vector; 3763 struct idpf_vport *vport; 3764 struct dim *dim; 3765 u16 itr; 3766 3767 dim = container_of(work, struct dim, work); 3768 q_vector = container_of(dim, struct idpf_q_vector, tx_dim); 3769 vport = q_vector->vport; 3770 3771 if (dim->profile_ix >= ARRAY_SIZE(vport->tx_itr_profile)) 3772 dim->profile_ix = ARRAY_SIZE(vport->tx_itr_profile) - 1; 3773 3774 /* look up the values in our local table */ 3775 itr = vport->tx_itr_profile[dim->profile_ix]; 3776 3777 idpf_vport_intr_write_itr(q_vector, itr, true); 3778 3779 dim->state = DIM_START_MEASURE; 3780 } 3781 3782 /** 3783 * idpf_rx_dim_work - Call back from the stack 3784 * @work: work queue structure 3785 */ 3786 static void idpf_rx_dim_work(struct work_struct *work) 3787 { 3788 struct idpf_q_vector *q_vector; 3789 struct idpf_vport *vport; 3790 struct dim *dim; 3791 u16 itr; 3792 3793 dim = container_of(work, struct dim, work); 3794 q_vector = container_of(dim, struct idpf_q_vector, rx_dim); 3795 vport = q_vector->vport; 3796 3797 if (dim->profile_ix >= ARRAY_SIZE(vport->rx_itr_profile)) 3798 dim->profile_ix = ARRAY_SIZE(vport->rx_itr_profile) - 1; 3799 3800 /* look up the values in our local table */ 3801 itr = vport->rx_itr_profile[dim->profile_ix]; 3802 3803 idpf_vport_intr_write_itr(q_vector, itr, false); 3804 3805 dim->state = DIM_START_MEASURE; 3806 } 3807 3808 /** 3809 * idpf_init_dim - Set up dynamic interrupt moderation 3810 * @qv: q_vector structure 3811 */ 3812 static void idpf_init_dim(struct idpf_q_vector *qv) 3813 { 3814 INIT_WORK(&qv->tx_dim.work, idpf_tx_dim_work); 3815 qv->tx_dim.mode = DIM_CQ_PERIOD_MODE_START_FROM_EQE; 3816 qv->tx_dim.profile_ix = IDPF_DIM_DEFAULT_PROFILE_IX; 3817 3818 INIT_WORK(&qv->rx_dim.work, idpf_rx_dim_work); 3819 qv->rx_dim.mode = DIM_CQ_PERIOD_MODE_START_FROM_EQE; 3820 qv->rx_dim.profile_ix = IDPF_DIM_DEFAULT_PROFILE_IX; 3821 } 3822 3823 /** 3824 * idpf_vport_intr_napi_ena_all - Enable NAPI for all q_vectors in the vport 3825 * @vport: main vport structure 3826 */ 3827 static void idpf_vport_intr_napi_ena_all(struct idpf_vport *vport) 3828 { 3829 int q_idx; 3830 3831 for (q_idx = 0; q_idx < vport->num_q_vectors; q_idx++) { 3832 struct idpf_q_vector *q_vector = &vport->q_vectors[q_idx]; 3833 3834 idpf_init_dim(q_vector); 3835 napi_enable(&q_vector->napi); 3836 } 3837 } 3838 3839 /** 3840 * idpf_tx_splitq_clean_all- Clean completion queues 3841 * @q_vec: queue vector 3842 * @budget: Used to determine if we are in netpoll 3843 * @cleaned: returns number of packets cleaned 3844 * 3845 * Returns false if clean is not complete else returns true 3846 */ 3847 static bool idpf_tx_splitq_clean_all(struct idpf_q_vector *q_vec, 3848 int budget, int *cleaned) 3849 { 3850 u16 num_txq = q_vec->num_txq; 3851 bool clean_complete = true; 3852 int i, budget_per_q; 3853 3854 if (unlikely(!num_txq)) 3855 return true; 3856 3857 budget_per_q = DIV_ROUND_UP(budget, num_txq); 3858 for (i = 0; i < num_txq; i++) 3859 clean_complete &= idpf_tx_clean_complq(q_vec->tx[i], 3860 budget_per_q, cleaned); 3861 3862 return clean_complete; 3863 } 3864 3865 /** 3866 * idpf_rx_splitq_clean_all- Clean completion queues 3867 * @q_vec: queue vector 3868 * @budget: Used to determine if we are in netpoll 3869 * @cleaned: returns number of packets cleaned 3870 * 3871 * Returns false if clean is not complete else returns true 3872 */ 3873 static bool idpf_rx_splitq_clean_all(struct idpf_q_vector *q_vec, int budget, 3874 int *cleaned) 3875 { 3876 u16 num_rxq = q_vec->num_rxq; 3877 bool clean_complete = true; 3878 int pkts_cleaned = 0; 3879 int i, budget_per_q; 3880 3881 /* We attempt to distribute budget to each Rx queue fairly, but don't 3882 * allow the budget to go below 1 because that would exit polling early. 3883 */ 3884 budget_per_q = num_rxq ? max(budget / num_rxq, 1) : 0; 3885 for (i = 0; i < num_rxq; i++) { 3886 struct idpf_queue *rxq = q_vec->rx[i]; 3887 int pkts_cleaned_per_q; 3888 3889 pkts_cleaned_per_q = idpf_rx_splitq_clean(rxq, budget_per_q); 3890 /* if we clean as many as budgeted, we must not be done */ 3891 if (pkts_cleaned_per_q >= budget_per_q) 3892 clean_complete = false; 3893 pkts_cleaned += pkts_cleaned_per_q; 3894 } 3895 *cleaned = pkts_cleaned; 3896 3897 for (i = 0; i < q_vec->num_bufq; i++) 3898 idpf_rx_clean_refillq_all(q_vec->bufq[i]); 3899 3900 return clean_complete; 3901 } 3902 3903 /** 3904 * idpf_vport_splitq_napi_poll - NAPI handler 3905 * @napi: struct from which you get q_vector 3906 * @budget: budget provided by stack 3907 */ 3908 static int idpf_vport_splitq_napi_poll(struct napi_struct *napi, int budget) 3909 { 3910 struct idpf_q_vector *q_vector = 3911 container_of(napi, struct idpf_q_vector, napi); 3912 bool clean_complete; 3913 int work_done = 0; 3914 3915 /* Handle case where we are called by netpoll with a budget of 0 */ 3916 if (unlikely(!budget)) { 3917 idpf_tx_splitq_clean_all(q_vector, budget, &work_done); 3918 3919 return 0; 3920 } 3921 3922 clean_complete = idpf_rx_splitq_clean_all(q_vector, budget, &work_done); 3923 clean_complete &= idpf_tx_splitq_clean_all(q_vector, budget, &work_done); 3924 3925 /* If work not completed, return budget and polling will return */ 3926 if (!clean_complete) 3927 return budget; 3928 3929 work_done = min_t(int, work_done, budget - 1); 3930 3931 /* Exit the polling mode, but don't re-enable interrupts if stack might 3932 * poll us due to busy-polling 3933 */ 3934 if (likely(napi_complete_done(napi, work_done))) 3935 idpf_vport_intr_update_itr_ena_irq(q_vector); 3936 3937 /* Switch to poll mode in the tear-down path after sending disable 3938 * queues virtchnl message, as the interrupts will be disabled after 3939 * that 3940 */ 3941 if (unlikely(q_vector->num_txq && test_bit(__IDPF_Q_POLL_MODE, 3942 q_vector->tx[0]->flags))) 3943 return budget; 3944 else 3945 return work_done; 3946 } 3947 3948 /** 3949 * idpf_vport_intr_map_vector_to_qs - Map vectors to queues 3950 * @vport: virtual port 3951 * 3952 * Mapping for vectors to queues 3953 */ 3954 static void idpf_vport_intr_map_vector_to_qs(struct idpf_vport *vport) 3955 { 3956 u16 num_txq_grp = vport->num_txq_grp; 3957 int i, j, qv_idx, bufq_vidx = 0; 3958 struct idpf_rxq_group *rx_qgrp; 3959 struct idpf_txq_group *tx_qgrp; 3960 struct idpf_queue *q, *bufq; 3961 u16 q_index; 3962 3963 for (i = 0, qv_idx = 0; i < vport->num_rxq_grp; i++) { 3964 u16 num_rxq; 3965 3966 rx_qgrp = &vport->rxq_grps[i]; 3967 if (idpf_is_queue_model_split(vport->rxq_model)) 3968 num_rxq = rx_qgrp->splitq.num_rxq_sets; 3969 else 3970 num_rxq = rx_qgrp->singleq.num_rxq; 3971 3972 for (j = 0; j < num_rxq; j++) { 3973 if (qv_idx >= vport->num_q_vectors) 3974 qv_idx = 0; 3975 3976 if (idpf_is_queue_model_split(vport->rxq_model)) 3977 q = &rx_qgrp->splitq.rxq_sets[j]->rxq; 3978 else 3979 q = rx_qgrp->singleq.rxqs[j]; 3980 q->q_vector = &vport->q_vectors[qv_idx]; 3981 q_index = q->q_vector->num_rxq; 3982 q->q_vector->rx[q_index] = q; 3983 q->q_vector->num_rxq++; 3984 qv_idx++; 3985 } 3986 3987 if (idpf_is_queue_model_split(vport->rxq_model)) { 3988 for (j = 0; j < vport->num_bufqs_per_qgrp; j++) { 3989 bufq = &rx_qgrp->splitq.bufq_sets[j].bufq; 3990 bufq->q_vector = &vport->q_vectors[bufq_vidx]; 3991 q_index = bufq->q_vector->num_bufq; 3992 bufq->q_vector->bufq[q_index] = bufq; 3993 bufq->q_vector->num_bufq++; 3994 } 3995 if (++bufq_vidx >= vport->num_q_vectors) 3996 bufq_vidx = 0; 3997 } 3998 } 3999 4000 for (i = 0, qv_idx = 0; i < num_txq_grp; i++) { 4001 u16 num_txq; 4002 4003 tx_qgrp = &vport->txq_grps[i]; 4004 num_txq = tx_qgrp->num_txq; 4005 4006 if (idpf_is_queue_model_split(vport->txq_model)) { 4007 if (qv_idx >= vport->num_q_vectors) 4008 qv_idx = 0; 4009 4010 q = tx_qgrp->complq; 4011 q->q_vector = &vport->q_vectors[qv_idx]; 4012 q_index = q->q_vector->num_txq; 4013 q->q_vector->tx[q_index] = q; 4014 q->q_vector->num_txq++; 4015 qv_idx++; 4016 } else { 4017 for (j = 0; j < num_txq; j++) { 4018 if (qv_idx >= vport->num_q_vectors) 4019 qv_idx = 0; 4020 4021 q = tx_qgrp->txqs[j]; 4022 q->q_vector = &vport->q_vectors[qv_idx]; 4023 q_index = q->q_vector->num_txq; 4024 q->q_vector->tx[q_index] = q; 4025 q->q_vector->num_txq++; 4026 4027 qv_idx++; 4028 } 4029 } 4030 } 4031 } 4032 4033 /** 4034 * idpf_vport_intr_init_vec_idx - Initialize the vector indexes 4035 * @vport: virtual port 4036 * 4037 * Initialize vector indexes with values returened over mailbox 4038 */ 4039 static int idpf_vport_intr_init_vec_idx(struct idpf_vport *vport) 4040 { 4041 struct idpf_adapter *adapter = vport->adapter; 4042 struct virtchnl2_alloc_vectors *ac; 4043 u16 *vecids, total_vecs; 4044 int i; 4045 4046 ac = adapter->req_vec_chunks; 4047 if (!ac) { 4048 for (i = 0; i < vport->num_q_vectors; i++) 4049 vport->q_vectors[i].v_idx = vport->q_vector_idxs[i]; 4050 4051 return 0; 4052 } 4053 4054 total_vecs = idpf_get_reserved_vecs(adapter); 4055 vecids = kcalloc(total_vecs, sizeof(u16), GFP_KERNEL); 4056 if (!vecids) 4057 return -ENOMEM; 4058 4059 idpf_get_vec_ids(adapter, vecids, total_vecs, &ac->vchunks); 4060 4061 for (i = 0; i < vport->num_q_vectors; i++) 4062 vport->q_vectors[i].v_idx = vecids[vport->q_vector_idxs[i]]; 4063 4064 kfree(vecids); 4065 4066 return 0; 4067 } 4068 4069 /** 4070 * idpf_vport_intr_napi_add_all- Register napi handler for all qvectors 4071 * @vport: virtual port structure 4072 */ 4073 static void idpf_vport_intr_napi_add_all(struct idpf_vport *vport) 4074 { 4075 int (*napi_poll)(struct napi_struct *napi, int budget); 4076 u16 v_idx; 4077 4078 if (idpf_is_queue_model_split(vport->txq_model)) 4079 napi_poll = idpf_vport_splitq_napi_poll; 4080 else 4081 napi_poll = idpf_vport_singleq_napi_poll; 4082 4083 for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) { 4084 struct idpf_q_vector *q_vector = &vport->q_vectors[v_idx]; 4085 4086 netif_napi_add(vport->netdev, &q_vector->napi, napi_poll); 4087 4088 /* only set affinity_mask if the CPU is online */ 4089 if (cpu_online(v_idx)) 4090 cpumask_set_cpu(v_idx, &q_vector->affinity_mask); 4091 } 4092 } 4093 4094 /** 4095 * idpf_vport_intr_alloc - Allocate memory for interrupt vectors 4096 * @vport: virtual port 4097 * 4098 * We allocate one q_vector per queue interrupt. If allocation fails we 4099 * return -ENOMEM. 4100 */ 4101 int idpf_vport_intr_alloc(struct idpf_vport *vport) 4102 { 4103 u16 txqs_per_vector, rxqs_per_vector, bufqs_per_vector; 4104 struct idpf_q_vector *q_vector; 4105 int v_idx, err; 4106 4107 vport->q_vectors = kcalloc(vport->num_q_vectors, 4108 sizeof(struct idpf_q_vector), GFP_KERNEL); 4109 if (!vport->q_vectors) 4110 return -ENOMEM; 4111 4112 txqs_per_vector = DIV_ROUND_UP(vport->num_txq, vport->num_q_vectors); 4113 rxqs_per_vector = DIV_ROUND_UP(vport->num_rxq, vport->num_q_vectors); 4114 bufqs_per_vector = vport->num_bufqs_per_qgrp * 4115 DIV_ROUND_UP(vport->num_rxq_grp, 4116 vport->num_q_vectors); 4117 4118 for (v_idx = 0; v_idx < vport->num_q_vectors; v_idx++) { 4119 q_vector = &vport->q_vectors[v_idx]; 4120 q_vector->vport = vport; 4121 4122 q_vector->tx_itr_value = IDPF_ITR_TX_DEF; 4123 q_vector->tx_intr_mode = IDPF_ITR_DYNAMIC; 4124 q_vector->tx_itr_idx = VIRTCHNL2_ITR_IDX_1; 4125 4126 q_vector->rx_itr_value = IDPF_ITR_RX_DEF; 4127 q_vector->rx_intr_mode = IDPF_ITR_DYNAMIC; 4128 q_vector->rx_itr_idx = VIRTCHNL2_ITR_IDX_0; 4129 4130 q_vector->tx = kcalloc(txqs_per_vector, 4131 sizeof(struct idpf_queue *), 4132 GFP_KERNEL); 4133 if (!q_vector->tx) { 4134 err = -ENOMEM; 4135 goto error; 4136 } 4137 4138 q_vector->rx = kcalloc(rxqs_per_vector, 4139 sizeof(struct idpf_queue *), 4140 GFP_KERNEL); 4141 if (!q_vector->rx) { 4142 err = -ENOMEM; 4143 goto error; 4144 } 4145 4146 if (!idpf_is_queue_model_split(vport->rxq_model)) 4147 continue; 4148 4149 q_vector->bufq = kcalloc(bufqs_per_vector, 4150 sizeof(struct idpf_queue *), 4151 GFP_KERNEL); 4152 if (!q_vector->bufq) { 4153 err = -ENOMEM; 4154 goto error; 4155 } 4156 } 4157 4158 return 0; 4159 4160 error: 4161 idpf_vport_intr_rel(vport); 4162 4163 return err; 4164 } 4165 4166 /** 4167 * idpf_vport_intr_init - Setup all vectors for the given vport 4168 * @vport: virtual port 4169 * 4170 * Returns 0 on success or negative on failure 4171 */ 4172 int idpf_vport_intr_init(struct idpf_vport *vport) 4173 { 4174 char *int_name; 4175 int err; 4176 4177 err = idpf_vport_intr_init_vec_idx(vport); 4178 if (err) 4179 return err; 4180 4181 idpf_vport_intr_map_vector_to_qs(vport); 4182 idpf_vport_intr_napi_add_all(vport); 4183 idpf_vport_intr_napi_ena_all(vport); 4184 4185 err = vport->adapter->dev_ops.reg_ops.intr_reg_init(vport); 4186 if (err) 4187 goto unroll_vectors_alloc; 4188 4189 int_name = kasprintf(GFP_KERNEL, "%s-%s", 4190 dev_driver_string(&vport->adapter->pdev->dev), 4191 vport->netdev->name); 4192 4193 err = idpf_vport_intr_req_irq(vport, int_name); 4194 if (err) 4195 goto unroll_vectors_alloc; 4196 4197 idpf_vport_intr_ena_irq_all(vport); 4198 4199 return 0; 4200 4201 unroll_vectors_alloc: 4202 idpf_vport_intr_napi_dis_all(vport); 4203 idpf_vport_intr_napi_del_all(vport); 4204 4205 return err; 4206 } 4207 4208 /** 4209 * idpf_config_rss - Send virtchnl messages to configure RSS 4210 * @vport: virtual port 4211 * 4212 * Return 0 on success, negative on failure 4213 */ 4214 int idpf_config_rss(struct idpf_vport *vport) 4215 { 4216 int err; 4217 4218 err = idpf_send_get_set_rss_key_msg(vport, false); 4219 if (err) 4220 return err; 4221 4222 return idpf_send_get_set_rss_lut_msg(vport, false); 4223 } 4224 4225 /** 4226 * idpf_fill_dflt_rss_lut - Fill the indirection table with the default values 4227 * @vport: virtual port structure 4228 */ 4229 static void idpf_fill_dflt_rss_lut(struct idpf_vport *vport) 4230 { 4231 struct idpf_adapter *adapter = vport->adapter; 4232 u16 num_active_rxq = vport->num_rxq; 4233 struct idpf_rss_data *rss_data; 4234 int i; 4235 4236 rss_data = &adapter->vport_config[vport->idx]->user_config.rss_data; 4237 4238 for (i = 0; i < rss_data->rss_lut_size; i++) { 4239 rss_data->rss_lut[i] = i % num_active_rxq; 4240 rss_data->cached_lut[i] = rss_data->rss_lut[i]; 4241 } 4242 } 4243 4244 /** 4245 * idpf_init_rss - Allocate and initialize RSS resources 4246 * @vport: virtual port 4247 * 4248 * Return 0 on success, negative on failure 4249 */ 4250 int idpf_init_rss(struct idpf_vport *vport) 4251 { 4252 struct idpf_adapter *adapter = vport->adapter; 4253 struct idpf_rss_data *rss_data; 4254 u32 lut_size; 4255 4256 rss_data = &adapter->vport_config[vport->idx]->user_config.rss_data; 4257 4258 lut_size = rss_data->rss_lut_size * sizeof(u32); 4259 rss_data->rss_lut = kzalloc(lut_size, GFP_KERNEL); 4260 if (!rss_data->rss_lut) 4261 return -ENOMEM; 4262 4263 rss_data->cached_lut = kzalloc(lut_size, GFP_KERNEL); 4264 if (!rss_data->cached_lut) { 4265 kfree(rss_data->rss_lut); 4266 rss_data->rss_lut = NULL; 4267 4268 return -ENOMEM; 4269 } 4270 4271 /* Fill the default RSS lut values */ 4272 idpf_fill_dflt_rss_lut(vport); 4273 4274 return idpf_config_rss(vport); 4275 } 4276 4277 /** 4278 * idpf_deinit_rss - Release RSS resources 4279 * @vport: virtual port 4280 */ 4281 void idpf_deinit_rss(struct idpf_vport *vport) 4282 { 4283 struct idpf_adapter *adapter = vport->adapter; 4284 struct idpf_rss_data *rss_data; 4285 4286 rss_data = &adapter->vport_config[vport->idx]->user_config.rss_data; 4287 kfree(rss_data->cached_lut); 4288 rss_data->cached_lut = NULL; 4289 kfree(rss_data->rss_lut); 4290 rss_data->rss_lut = NULL; 4291 } 4292