1 /********************************************************************** 2 * Author: Cavium, Inc. 3 * 4 * Contact: support@cavium.com 5 * Please include "LiquidIO" in the subject. 6 * 7 * Copyright (c) 2003-2016 Cavium, Inc. 8 * 9 * This file is free software; you can redistribute it and/or modify 10 * it under the terms of the GNU General Public License, Version 2, as 11 * published by the Free Software Foundation. 12 * 13 * This file is distributed in the hope that it will be useful, but 14 * AS-IS and WITHOUT ANY WARRANTY; without even the implied warranty 15 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, TITLE, or 16 * NONINFRINGEMENT. See the GNU General Public License for more 17 * details. 18 **********************************************************************/ 19 #include <linux/pci.h> 20 #include <linux/netdevice.h> 21 #include <linux/vmalloc.h> 22 #include "liquidio_common.h" 23 #include "octeon_droq.h" 24 #include "octeon_iq.h" 25 #include "response_manager.h" 26 #include "octeon_device.h" 27 #include "octeon_main.h" 28 #include "octeon_network.h" 29 #include "cn66xx_device.h" 30 #include "cn23xx_pf_device.h" 31 #include "cn23xx_vf_device.h" 32 33 struct iq_post_status { 34 int status; 35 int index; 36 }; 37 38 static void check_db_timeout(struct work_struct *work); 39 static void __check_db_timeout(struct octeon_device *oct, u64 iq_no); 40 41 static void (*reqtype_free_fn[MAX_OCTEON_DEVICES][REQTYPE_LAST + 1]) (void *); 42 43 /* Define this to return the request status comaptible to old code */ 44 /*#define OCTEON_USE_OLD_REQ_STATUS*/ 45 46 /* Return 0 on success, 1 on failure */ 47 int octeon_init_instr_queue(struct octeon_device *oct, 48 union oct_txpciq txpciq, 49 u32 num_descs) 50 { 51 struct octeon_instr_queue *iq; 52 struct octeon_iq_config *conf = NULL; 53 u32 iq_no = (u32)txpciq.s.q_no; 54 u32 q_size; 55 struct cavium_wq *db_wq; 56 int numa_node = dev_to_node(&oct->pci_dev->dev); 57 58 if (OCTEON_CN6XXX(oct)) 59 conf = &(CFG_GET_IQ_CFG(CHIP_CONF(oct, cn6xxx))); 60 else if (OCTEON_CN23XX_PF(oct)) 61 conf = &(CFG_GET_IQ_CFG(CHIP_CONF(oct, cn23xx_pf))); 62 else if (OCTEON_CN23XX_VF(oct)) 63 conf = &(CFG_GET_IQ_CFG(CHIP_CONF(oct, cn23xx_vf))); 64 65 if (!conf) { 66 dev_err(&oct->pci_dev->dev, "Unsupported Chip %x\n", 67 oct->chip_id); 68 return 1; 69 } 70 71 q_size = (u32)conf->instr_type * num_descs; 72 73 iq = oct->instr_queue[iq_no]; 74 75 iq->oct_dev = oct; 76 77 iq->base_addr = lio_dma_alloc(oct, q_size, &iq->base_addr_dma); 78 if (!iq->base_addr) { 79 dev_err(&oct->pci_dev->dev, "Cannot allocate memory for instr queue %d\n", 80 iq_no); 81 return 1; 82 } 83 84 iq->max_count = num_descs; 85 86 /* Initialize a list to holds requests that have been posted to Octeon 87 * but has yet to be fetched by octeon 88 */ 89 iq->request_list = vzalloc_node(array_size(num_descs, sizeof(*iq->request_list)), 90 numa_node); 91 if (!iq->request_list) 92 iq->request_list = vzalloc(array_size(num_descs, sizeof(*iq->request_list))); 93 if (!iq->request_list) { 94 lio_dma_free(oct, q_size, iq->base_addr, iq->base_addr_dma); 95 dev_err(&oct->pci_dev->dev, "Alloc failed for IQ[%d] nr free list\n", 96 iq_no); 97 return 1; 98 } 99 100 dev_dbg(&oct->pci_dev->dev, "IQ[%d]: base: %p basedma: %pad count: %d\n", 101 iq_no, iq->base_addr, &iq->base_addr_dma, iq->max_count); 102 103 iq->txpciq.u64 = txpciq.u64; 104 iq->fill_threshold = (u32)conf->db_min; 105 iq->fill_cnt = 0; 106 iq->host_write_index = 0; 107 iq->octeon_read_index = 0; 108 iq->flush_index = 0; 109 iq->last_db_time = 0; 110 iq->do_auto_flush = 1; 111 iq->db_timeout = (u32)conf->db_timeout; 112 atomic_set(&iq->instr_pending, 0); 113 iq->pkts_processed = 0; 114 115 /* Initialize the spinlock for this instruction queue */ 116 spin_lock_init(&iq->lock); 117 if (iq_no == 0) { 118 iq->allow_soft_cmds = true; 119 spin_lock_init(&iq->post_lock); 120 } else { 121 iq->allow_soft_cmds = false; 122 } 123 124 spin_lock_init(&iq->iq_flush_running_lock); 125 126 oct->io_qmask.iq |= BIT_ULL(iq_no); 127 128 /* Set the 32B/64B mode for each input queue */ 129 oct->io_qmask.iq64B |= ((conf->instr_type == 64) << iq_no); 130 iq->iqcmd_64B = (conf->instr_type == 64); 131 132 oct->fn_list.setup_iq_regs(oct, iq_no); 133 134 oct->check_db_wq[iq_no].wq = alloc_workqueue("check_iq_db", 135 WQ_MEM_RECLAIM, 136 0); 137 if (!oct->check_db_wq[iq_no].wq) { 138 vfree(iq->request_list); 139 iq->request_list = NULL; 140 lio_dma_free(oct, q_size, iq->base_addr, iq->base_addr_dma); 141 dev_err(&oct->pci_dev->dev, "check db wq create failed for iq %d\n", 142 iq_no); 143 return 1; 144 } 145 146 db_wq = &oct->check_db_wq[iq_no]; 147 148 INIT_DELAYED_WORK(&db_wq->wk.work, check_db_timeout); 149 db_wq->wk.ctxptr = oct; 150 db_wq->wk.ctxul = iq_no; 151 queue_delayed_work(db_wq->wq, &db_wq->wk.work, msecs_to_jiffies(1)); 152 153 return 0; 154 } 155 156 int octeon_delete_instr_queue(struct octeon_device *oct, u32 iq_no) 157 { 158 u64 desc_size = 0, q_size; 159 struct octeon_instr_queue *iq = oct->instr_queue[iq_no]; 160 161 cancel_delayed_work_sync(&oct->check_db_wq[iq_no].wk.work); 162 destroy_workqueue(oct->check_db_wq[iq_no].wq); 163 164 if (OCTEON_CN6XXX(oct)) 165 desc_size = 166 CFG_GET_IQ_INSTR_TYPE(CHIP_CONF(oct, cn6xxx)); 167 else if (OCTEON_CN23XX_PF(oct)) 168 desc_size = 169 CFG_GET_IQ_INSTR_TYPE(CHIP_CONF(oct, cn23xx_pf)); 170 else if (OCTEON_CN23XX_VF(oct)) 171 desc_size = 172 CFG_GET_IQ_INSTR_TYPE(CHIP_CONF(oct, cn23xx_vf)); 173 174 vfree(iq->request_list); 175 176 if (iq->base_addr) { 177 q_size = iq->max_count * desc_size; 178 lio_dma_free(oct, (u32)q_size, iq->base_addr, 179 iq->base_addr_dma); 180 oct->io_qmask.iq &= ~(1ULL << iq_no); 181 vfree(oct->instr_queue[iq_no]); 182 oct->instr_queue[iq_no] = NULL; 183 oct->num_iqs--; 184 return 0; 185 } 186 return 1; 187 } 188 EXPORT_SYMBOL_GPL(octeon_delete_instr_queue); 189 190 /* Return 0 on success, 1 on failure */ 191 int octeon_setup_iq(struct octeon_device *oct, 192 int ifidx, 193 int q_index, 194 union oct_txpciq txpciq, 195 u32 num_descs, 196 void *app_ctx) 197 { 198 u32 iq_no = (u32)txpciq.s.q_no; 199 int numa_node = dev_to_node(&oct->pci_dev->dev); 200 201 if (oct->instr_queue[iq_no]) { 202 dev_dbg(&oct->pci_dev->dev, "IQ is in use. Cannot create the IQ: %d again\n", 203 iq_no); 204 oct->instr_queue[iq_no]->txpciq.u64 = txpciq.u64; 205 oct->instr_queue[iq_no]->app_ctx = app_ctx; 206 return 0; 207 } 208 oct->instr_queue[iq_no] = 209 vzalloc_node(sizeof(struct octeon_instr_queue), numa_node); 210 if (!oct->instr_queue[iq_no]) 211 oct->instr_queue[iq_no] = 212 vzalloc(sizeof(struct octeon_instr_queue)); 213 if (!oct->instr_queue[iq_no]) 214 return 1; 215 216 217 oct->instr_queue[iq_no]->q_index = q_index; 218 oct->instr_queue[iq_no]->app_ctx = app_ctx; 219 oct->instr_queue[iq_no]->ifidx = ifidx; 220 221 if (octeon_init_instr_queue(oct, txpciq, num_descs)) { 222 vfree(oct->instr_queue[iq_no]); 223 oct->instr_queue[iq_no] = NULL; 224 return 1; 225 } 226 227 oct->num_iqs++; 228 if (oct->fn_list.enable_io_queues(oct)) { 229 octeon_delete_instr_queue(oct, iq_no); 230 return 1; 231 } 232 233 return 0; 234 } 235 236 int lio_wait_for_instr_fetch(struct octeon_device *oct) 237 { 238 int i, retry = 1000, pending, instr_cnt = 0; 239 240 do { 241 instr_cnt = 0; 242 243 for (i = 0; i < MAX_OCTEON_INSTR_QUEUES(oct); i++) { 244 if (!(oct->io_qmask.iq & BIT_ULL(i))) 245 continue; 246 pending = 247 atomic_read(&oct->instr_queue[i]->instr_pending); 248 if (pending) 249 __check_db_timeout(oct, i); 250 instr_cnt += pending; 251 } 252 253 if (instr_cnt == 0) 254 break; 255 256 schedule_timeout_uninterruptible(1); 257 258 } while (retry-- && instr_cnt); 259 260 return instr_cnt; 261 } 262 EXPORT_SYMBOL_GPL(lio_wait_for_instr_fetch); 263 264 static inline void 265 ring_doorbell(struct octeon_device *oct, struct octeon_instr_queue *iq) 266 { 267 if (atomic_read(&oct->status) == OCT_DEV_RUNNING) { 268 writel(iq->fill_cnt, iq->doorbell_reg); 269 /* make sure doorbell write goes through */ 270 iq->fill_cnt = 0; 271 iq->last_db_time = jiffies; 272 return; 273 } 274 } 275 276 void 277 octeon_ring_doorbell_locked(struct octeon_device *oct, u32 iq_no) 278 { 279 struct octeon_instr_queue *iq; 280 281 iq = oct->instr_queue[iq_no]; 282 spin_lock(&iq->post_lock); 283 if (iq->fill_cnt) 284 ring_doorbell(oct, iq); 285 spin_unlock(&iq->post_lock); 286 } 287 EXPORT_SYMBOL_GPL(octeon_ring_doorbell_locked); 288 289 static inline void __copy_cmd_into_iq(struct octeon_instr_queue *iq, 290 u8 *cmd) 291 { 292 u8 *iqptr, cmdsize; 293 294 cmdsize = ((iq->iqcmd_64B) ? 64 : 32); 295 iqptr = iq->base_addr + (cmdsize * iq->host_write_index); 296 297 memcpy(iqptr, cmd, cmdsize); 298 } 299 300 static inline struct iq_post_status 301 __post_command2(struct octeon_instr_queue *iq, u8 *cmd) 302 { 303 struct iq_post_status st; 304 305 st.status = IQ_SEND_OK; 306 307 /* This ensures that the read index does not wrap around to the same 308 * position if queue gets full before Octeon could fetch any instr. 309 */ 310 if (atomic_read(&iq->instr_pending) >= (s32)(iq->max_count - 1)) { 311 st.status = IQ_SEND_FAILED; 312 st.index = -1; 313 return st; 314 } 315 316 if (atomic_read(&iq->instr_pending) >= (s32)(iq->max_count - 2)) 317 st.status = IQ_SEND_STOP; 318 319 __copy_cmd_into_iq(iq, cmd); 320 321 /* "index" is returned, host_write_index is modified. */ 322 st.index = iq->host_write_index; 323 iq->host_write_index = incr_index(iq->host_write_index, 1, 324 iq->max_count); 325 iq->fill_cnt++; 326 327 /* Flush the command into memory. We need to be sure the data is in 328 * memory before indicating that the instruction is pending. 329 */ 330 wmb(); 331 332 atomic_inc(&iq->instr_pending); 333 334 return st; 335 } 336 337 int 338 octeon_register_reqtype_free_fn(struct octeon_device *oct, int reqtype, 339 void (*fn)(void *)) 340 { 341 if (reqtype > REQTYPE_LAST) { 342 dev_err(&oct->pci_dev->dev, "%s: Invalid reqtype: %d\n", 343 __func__, reqtype); 344 return -EINVAL; 345 } 346 347 reqtype_free_fn[oct->octeon_id][reqtype] = fn; 348 349 return 0; 350 } 351 EXPORT_SYMBOL_GPL(octeon_register_reqtype_free_fn); 352 353 static inline void 354 __add_to_request_list(struct octeon_instr_queue *iq, 355 int idx, void *buf, int reqtype) 356 { 357 iq->request_list[idx].buf = buf; 358 iq->request_list[idx].reqtype = reqtype; 359 } 360 361 /* Can only run in process context */ 362 int 363 lio_process_iq_request_list(struct octeon_device *oct, 364 struct octeon_instr_queue *iq, u32 napi_budget) 365 { 366 struct cavium_wq *cwq = &oct->dma_comp_wq; 367 int reqtype; 368 void *buf; 369 u32 old = iq->flush_index; 370 u32 inst_count = 0; 371 unsigned int pkts_compl = 0, bytes_compl = 0; 372 struct octeon_soft_command *sc; 373 unsigned long flags; 374 375 while (old != iq->octeon_read_index) { 376 reqtype = iq->request_list[old].reqtype; 377 buf = iq->request_list[old].buf; 378 379 if (reqtype == REQTYPE_NONE) 380 goto skip_this; 381 382 octeon_update_tx_completion_counters(buf, reqtype, &pkts_compl, 383 &bytes_compl); 384 385 switch (reqtype) { 386 case REQTYPE_NORESP_NET: 387 case REQTYPE_NORESP_NET_SG: 388 case REQTYPE_RESP_NET_SG: 389 reqtype_free_fn[oct->octeon_id][reqtype](buf); 390 break; 391 case REQTYPE_RESP_NET: 392 case REQTYPE_SOFT_COMMAND: 393 sc = buf; 394 /* We're expecting a response from Octeon. 395 * It's up to lio_process_ordered_list() to 396 * process sc. Add sc to the ordered soft 397 * command response list because we expect 398 * a response from Octeon. 399 */ 400 spin_lock_irqsave(&oct->response_list 401 [OCTEON_ORDERED_SC_LIST].lock, flags); 402 atomic_inc(&oct->response_list 403 [OCTEON_ORDERED_SC_LIST].pending_req_count); 404 list_add_tail(&sc->node, &oct->response_list 405 [OCTEON_ORDERED_SC_LIST].head); 406 spin_unlock_irqrestore(&oct->response_list 407 [OCTEON_ORDERED_SC_LIST].lock, 408 flags); 409 break; 410 default: 411 dev_err(&oct->pci_dev->dev, 412 "%s Unknown reqtype: %d buf: %p at idx %d\n", 413 __func__, reqtype, buf, old); 414 } 415 416 iq->request_list[old].buf = NULL; 417 iq->request_list[old].reqtype = 0; 418 419 skip_this: 420 inst_count++; 421 old = incr_index(old, 1, iq->max_count); 422 423 if ((napi_budget) && (inst_count >= napi_budget)) 424 break; 425 } 426 if (bytes_compl) 427 octeon_report_tx_completion_to_bql(iq->app_ctx, pkts_compl, 428 bytes_compl); 429 iq->flush_index = old; 430 431 if (atomic_read(&oct->response_list 432 [OCTEON_ORDERED_SC_LIST].pending_req_count)) 433 queue_work(cwq->wq, &cwq->wk.work.work); 434 435 return inst_count; 436 } 437 EXPORT_SYMBOL_GPL(lio_process_iq_request_list); 438 439 /* Can only be called from process context */ 440 int 441 octeon_flush_iq(struct octeon_device *oct, struct octeon_instr_queue *iq, 442 u32 napi_budget) 443 { 444 u32 inst_processed = 0; 445 u32 tot_inst_processed = 0; 446 int tx_done = 1; 447 448 if (!spin_trylock(&iq->iq_flush_running_lock)) 449 return tx_done; 450 451 spin_lock_bh(&iq->lock); 452 453 iq->octeon_read_index = oct->fn_list.update_iq_read_idx(iq); 454 455 do { 456 /* Process any outstanding IQ packets. */ 457 if (iq->flush_index == iq->octeon_read_index) 458 break; 459 460 if (napi_budget) 461 inst_processed = 462 lio_process_iq_request_list(oct, iq, 463 napi_budget - 464 tot_inst_processed); 465 else 466 inst_processed = 467 lio_process_iq_request_list(oct, iq, 0); 468 469 if (inst_processed) { 470 iq->pkts_processed += inst_processed; 471 atomic_sub(inst_processed, &iq->instr_pending); 472 iq->stats.instr_processed += inst_processed; 473 } 474 475 tot_inst_processed += inst_processed; 476 } while (tot_inst_processed < napi_budget); 477 478 if (napi_budget && (tot_inst_processed >= napi_budget)) 479 tx_done = 0; 480 481 iq->last_db_time = jiffies; 482 483 spin_unlock_bh(&iq->lock); 484 485 spin_unlock(&iq->iq_flush_running_lock); 486 487 return tx_done; 488 } 489 490 /* Process instruction queue after timeout. 491 * This routine gets called from a workqueue or when removing the module. 492 */ 493 static void __check_db_timeout(struct octeon_device *oct, u64 iq_no) 494 { 495 struct octeon_instr_queue *iq; 496 u64 next_time; 497 498 if (!oct) 499 return; 500 501 iq = oct->instr_queue[iq_no]; 502 if (!iq) 503 return; 504 505 /* return immediately, if no work pending */ 506 if (!atomic_read(&iq->instr_pending)) 507 return; 508 /* If jiffies - last_db_time < db_timeout do nothing */ 509 next_time = iq->last_db_time + iq->db_timeout; 510 if (!time_after(jiffies, (unsigned long)next_time)) 511 return; 512 iq->last_db_time = jiffies; 513 514 /* Flush the instruction queue */ 515 octeon_flush_iq(oct, iq, 0); 516 517 lio_enable_irq(NULL, iq); 518 } 519 520 /* Called by the Poll thread at regular intervals to check the instruction 521 * queue for commands to be posted and for commands that were fetched by Octeon. 522 */ 523 static void check_db_timeout(struct work_struct *work) 524 { 525 struct cavium_wk *wk = (struct cavium_wk *)work; 526 struct octeon_device *oct = (struct octeon_device *)wk->ctxptr; 527 u64 iq_no = wk->ctxul; 528 struct cavium_wq *db_wq = &oct->check_db_wq[iq_no]; 529 u32 delay = 10; 530 531 __check_db_timeout(oct, iq_no); 532 queue_delayed_work(db_wq->wq, &db_wq->wk.work, msecs_to_jiffies(delay)); 533 } 534 535 int 536 octeon_send_command(struct octeon_device *oct, u32 iq_no, 537 u32 force_db, void *cmd, void *buf, 538 u32 datasize, u32 reqtype) 539 { 540 int xmit_stopped; 541 struct iq_post_status st; 542 struct octeon_instr_queue *iq = oct->instr_queue[iq_no]; 543 544 /* Get the lock and prevent other tasks and tx interrupt handler from 545 * running. 546 */ 547 if (iq->allow_soft_cmds) 548 spin_lock_bh(&iq->post_lock); 549 550 st = __post_command2(iq, cmd); 551 552 if (st.status != IQ_SEND_FAILED) { 553 xmit_stopped = octeon_report_sent_bytes_to_bql(buf, reqtype); 554 __add_to_request_list(iq, st.index, buf, reqtype); 555 INCR_INSTRQUEUE_PKT_COUNT(oct, iq_no, bytes_sent, datasize); 556 INCR_INSTRQUEUE_PKT_COUNT(oct, iq_no, instr_posted, 1); 557 558 if (iq->fill_cnt >= MAX_OCTEON_FILL_COUNT || force_db || 559 xmit_stopped || st.status == IQ_SEND_STOP) 560 ring_doorbell(oct, iq); 561 } else { 562 INCR_INSTRQUEUE_PKT_COUNT(oct, iq_no, instr_dropped, 1); 563 } 564 565 if (iq->allow_soft_cmds) 566 spin_unlock_bh(&iq->post_lock); 567 568 /* This is only done here to expedite packets being flushed 569 * for cases where there are no IQ completion interrupts. 570 */ 571 572 return st.status; 573 } 574 EXPORT_SYMBOL_GPL(octeon_send_command); 575 576 void 577 octeon_prepare_soft_command(struct octeon_device *oct, 578 struct octeon_soft_command *sc, 579 u8 opcode, 580 u8 subcode, 581 u32 irh_ossp, 582 u64 ossp0, 583 u64 ossp1) 584 { 585 struct octeon_config *oct_cfg; 586 struct octeon_instr_ih2 *ih2; 587 struct octeon_instr_ih3 *ih3; 588 struct octeon_instr_pki_ih3 *pki_ih3; 589 struct octeon_instr_irh *irh; 590 struct octeon_instr_rdp *rdp; 591 592 WARN_ON(opcode > 15); 593 WARN_ON(subcode > 127); 594 595 oct_cfg = octeon_get_conf(oct); 596 597 if (OCTEON_CN23XX_PF(oct) || OCTEON_CN23XX_VF(oct)) { 598 ih3 = (struct octeon_instr_ih3 *)&sc->cmd.cmd3.ih3; 599 600 ih3->pkind = oct->instr_queue[sc->iq_no]->txpciq.s.pkind; 601 602 pki_ih3 = (struct octeon_instr_pki_ih3 *)&sc->cmd.cmd3.pki_ih3; 603 604 pki_ih3->w = 1; 605 pki_ih3->raw = 1; 606 pki_ih3->utag = 1; 607 pki_ih3->uqpg = 608 oct->instr_queue[sc->iq_no]->txpciq.s.use_qpg; 609 pki_ih3->utt = 1; 610 pki_ih3->tag = LIO_CONTROL; 611 pki_ih3->tagtype = ATOMIC_TAG; 612 pki_ih3->qpg = 613 oct->instr_queue[sc->iq_no]->txpciq.s.ctrl_qpg; 614 615 pki_ih3->pm = 0x7; 616 pki_ih3->sl = 8; 617 618 if (sc->datasize) 619 ih3->dlengsz = sc->datasize; 620 621 irh = (struct octeon_instr_irh *)&sc->cmd.cmd3.irh; 622 irh->opcode = opcode; 623 irh->subcode = subcode; 624 625 /* opcode/subcode specific parameters (ossp) */ 626 irh->ossp = irh_ossp; 627 sc->cmd.cmd3.ossp[0] = ossp0; 628 sc->cmd.cmd3.ossp[1] = ossp1; 629 630 if (sc->rdatasize) { 631 rdp = (struct octeon_instr_rdp *)&sc->cmd.cmd3.rdp; 632 rdp->pcie_port = oct->pcie_port; 633 rdp->rlen = sc->rdatasize; 634 635 irh->rflag = 1; 636 /*PKI IH3*/ 637 /* pki_ih3 irh+ossp[0]+ossp[1]+rdp+rptr = 48 bytes */ 638 ih3->fsz = LIO_SOFTCMDRESP_IH3; 639 } else { 640 irh->rflag = 0; 641 /*PKI IH3*/ 642 /* pki_h3 + irh + ossp[0] + ossp[1] = 32 bytes */ 643 ih3->fsz = LIO_PCICMD_O3; 644 } 645 646 } else { 647 ih2 = (struct octeon_instr_ih2 *)&sc->cmd.cmd2.ih2; 648 ih2->tagtype = ATOMIC_TAG; 649 ih2->tag = LIO_CONTROL; 650 ih2->raw = 1; 651 ih2->grp = CFG_GET_CTRL_Q_GRP(oct_cfg); 652 653 if (sc->datasize) { 654 ih2->dlengsz = sc->datasize; 655 ih2->rs = 1; 656 } 657 658 irh = (struct octeon_instr_irh *)&sc->cmd.cmd2.irh; 659 irh->opcode = opcode; 660 irh->subcode = subcode; 661 662 /* opcode/subcode specific parameters (ossp) */ 663 irh->ossp = irh_ossp; 664 sc->cmd.cmd2.ossp[0] = ossp0; 665 sc->cmd.cmd2.ossp[1] = ossp1; 666 667 if (sc->rdatasize) { 668 rdp = (struct octeon_instr_rdp *)&sc->cmd.cmd2.rdp; 669 rdp->pcie_port = oct->pcie_port; 670 rdp->rlen = sc->rdatasize; 671 672 irh->rflag = 1; 673 /* irh+ossp[0]+ossp[1]+rdp+rptr = 40 bytes */ 674 ih2->fsz = LIO_SOFTCMDRESP_IH2; 675 } else { 676 irh->rflag = 0; 677 /* irh + ossp[0] + ossp[1] = 24 bytes */ 678 ih2->fsz = LIO_PCICMD_O2; 679 } 680 } 681 } 682 EXPORT_SYMBOL_GPL(octeon_prepare_soft_command); 683 684 int octeon_send_soft_command(struct octeon_device *oct, 685 struct octeon_soft_command *sc) 686 { 687 struct octeon_instr_queue *iq; 688 struct octeon_instr_ih2 *ih2; 689 struct octeon_instr_ih3 *ih3; 690 struct octeon_instr_irh *irh; 691 u32 len; 692 693 iq = oct->instr_queue[sc->iq_no]; 694 if (!iq->allow_soft_cmds) { 695 dev_err(&oct->pci_dev->dev, "Soft commands are not allowed on Queue %d\n", 696 sc->iq_no); 697 INCR_INSTRQUEUE_PKT_COUNT(oct, sc->iq_no, instr_dropped, 1); 698 return IQ_SEND_FAILED; 699 } 700 701 if (OCTEON_CN23XX_PF(oct) || OCTEON_CN23XX_VF(oct)) { 702 ih3 = (struct octeon_instr_ih3 *)&sc->cmd.cmd3.ih3; 703 if (ih3->dlengsz) { 704 WARN_ON(!sc->dmadptr); 705 sc->cmd.cmd3.dptr = sc->dmadptr; 706 } 707 irh = (struct octeon_instr_irh *)&sc->cmd.cmd3.irh; 708 if (irh->rflag) { 709 WARN_ON(!sc->dmarptr); 710 WARN_ON(!sc->status_word); 711 *sc->status_word = COMPLETION_WORD_INIT; 712 sc->cmd.cmd3.rptr = sc->dmarptr; 713 } 714 len = (u32)ih3->dlengsz; 715 } else { 716 ih2 = (struct octeon_instr_ih2 *)&sc->cmd.cmd2.ih2; 717 if (ih2->dlengsz) { 718 WARN_ON(!sc->dmadptr); 719 sc->cmd.cmd2.dptr = sc->dmadptr; 720 } 721 irh = (struct octeon_instr_irh *)&sc->cmd.cmd2.irh; 722 if (irh->rflag) { 723 WARN_ON(!sc->dmarptr); 724 WARN_ON(!sc->status_word); 725 *sc->status_word = COMPLETION_WORD_INIT; 726 sc->cmd.cmd2.rptr = sc->dmarptr; 727 } 728 len = (u32)ih2->dlengsz; 729 } 730 731 sc->expiry_time = jiffies + msecs_to_jiffies(LIO_SC_MAX_TMO_MS); 732 733 return (octeon_send_command(oct, sc->iq_no, 1, &sc->cmd, sc, 734 len, REQTYPE_SOFT_COMMAND)); 735 } 736 EXPORT_SYMBOL_GPL(octeon_send_soft_command); 737 738 int octeon_setup_sc_buffer_pool(struct octeon_device *oct) 739 { 740 int i; 741 u64 dma_addr; 742 struct octeon_soft_command *sc; 743 744 INIT_LIST_HEAD(&oct->sc_buf_pool.head); 745 spin_lock_init(&oct->sc_buf_pool.lock); 746 atomic_set(&oct->sc_buf_pool.alloc_buf_count, 0); 747 748 for (i = 0; i < MAX_SOFT_COMMAND_BUFFERS; i++) { 749 sc = (struct octeon_soft_command *) 750 lio_dma_alloc(oct, 751 SOFT_COMMAND_BUFFER_SIZE, 752 (dma_addr_t *)&dma_addr); 753 if (!sc) { 754 octeon_free_sc_buffer_pool(oct); 755 return 1; 756 } 757 758 sc->dma_addr = dma_addr; 759 sc->size = SOFT_COMMAND_BUFFER_SIZE; 760 761 list_add_tail(&sc->node, &oct->sc_buf_pool.head); 762 } 763 764 return 0; 765 } 766 EXPORT_SYMBOL_GPL(octeon_setup_sc_buffer_pool); 767 768 int octeon_free_sc_done_list(struct octeon_device *oct) 769 { 770 struct octeon_response_list *done_sc_list, *zombie_sc_list; 771 struct octeon_soft_command *sc; 772 struct list_head *tmp, *tmp2; 773 spinlock_t *sc_lists_lock; /* lock for response_list */ 774 775 done_sc_list = &oct->response_list[OCTEON_DONE_SC_LIST]; 776 zombie_sc_list = &oct->response_list[OCTEON_ZOMBIE_SC_LIST]; 777 778 if (!atomic_read(&done_sc_list->pending_req_count)) 779 return 0; 780 781 sc_lists_lock = &oct->response_list[OCTEON_ORDERED_SC_LIST].lock; 782 783 spin_lock_bh(sc_lists_lock); 784 785 list_for_each_safe(tmp, tmp2, &done_sc_list->head) { 786 sc = list_entry(tmp, struct octeon_soft_command, node); 787 788 if (READ_ONCE(sc->caller_is_done)) { 789 list_del(&sc->node); 790 atomic_dec(&done_sc_list->pending_req_count); 791 792 if (*sc->status_word == COMPLETION_WORD_INIT) { 793 /* timeout; move sc to zombie list */ 794 list_add_tail(&sc->node, &zombie_sc_list->head); 795 atomic_inc(&zombie_sc_list->pending_req_count); 796 } else { 797 octeon_free_soft_command(oct, sc); 798 } 799 } 800 } 801 802 spin_unlock_bh(sc_lists_lock); 803 804 return 0; 805 } 806 EXPORT_SYMBOL_GPL(octeon_free_sc_done_list); 807 808 int octeon_free_sc_zombie_list(struct octeon_device *oct) 809 { 810 struct octeon_response_list *zombie_sc_list; 811 struct octeon_soft_command *sc; 812 struct list_head *tmp, *tmp2; 813 spinlock_t *sc_lists_lock; /* lock for response_list */ 814 815 zombie_sc_list = &oct->response_list[OCTEON_ZOMBIE_SC_LIST]; 816 sc_lists_lock = &oct->response_list[OCTEON_ORDERED_SC_LIST].lock; 817 818 spin_lock_bh(sc_lists_lock); 819 820 list_for_each_safe(tmp, tmp2, &zombie_sc_list->head) { 821 list_del(tmp); 822 atomic_dec(&zombie_sc_list->pending_req_count); 823 sc = list_entry(tmp, struct octeon_soft_command, node); 824 octeon_free_soft_command(oct, sc); 825 } 826 827 spin_unlock_bh(sc_lists_lock); 828 829 return 0; 830 } 831 EXPORT_SYMBOL_GPL(octeon_free_sc_zombie_list); 832 833 int octeon_free_sc_buffer_pool(struct octeon_device *oct) 834 { 835 struct list_head *tmp, *tmp2; 836 struct octeon_soft_command *sc; 837 838 octeon_free_sc_zombie_list(oct); 839 840 spin_lock_bh(&oct->sc_buf_pool.lock); 841 842 list_for_each_safe(tmp, tmp2, &oct->sc_buf_pool.head) { 843 list_del(tmp); 844 845 sc = (struct octeon_soft_command *)tmp; 846 847 lio_dma_free(oct, sc->size, sc, sc->dma_addr); 848 } 849 850 INIT_LIST_HEAD(&oct->sc_buf_pool.head); 851 852 spin_unlock_bh(&oct->sc_buf_pool.lock); 853 854 return 0; 855 } 856 EXPORT_SYMBOL_GPL(octeon_free_sc_buffer_pool); 857 858 struct octeon_soft_command *octeon_alloc_soft_command(struct octeon_device *oct, 859 u32 datasize, 860 u32 rdatasize, 861 u32 ctxsize) 862 { 863 u64 dma_addr; 864 u32 size; 865 u32 offset = sizeof(struct octeon_soft_command); 866 struct octeon_soft_command *sc = NULL; 867 struct list_head *tmp; 868 869 if (!rdatasize) 870 rdatasize = 16; 871 872 WARN_ON((offset + datasize + rdatasize + ctxsize) > 873 SOFT_COMMAND_BUFFER_SIZE); 874 875 spin_lock_bh(&oct->sc_buf_pool.lock); 876 877 if (list_empty(&oct->sc_buf_pool.head)) { 878 spin_unlock_bh(&oct->sc_buf_pool.lock); 879 return NULL; 880 } 881 882 list_for_each(tmp, &oct->sc_buf_pool.head) 883 break; 884 885 list_del(tmp); 886 887 atomic_inc(&oct->sc_buf_pool.alloc_buf_count); 888 889 spin_unlock_bh(&oct->sc_buf_pool.lock); 890 891 sc = (struct octeon_soft_command *)tmp; 892 893 dma_addr = sc->dma_addr; 894 size = sc->size; 895 896 memset(sc, 0, sc->size); 897 898 sc->dma_addr = dma_addr; 899 sc->size = size; 900 901 if (ctxsize) { 902 sc->ctxptr = (u8 *)sc + offset; 903 sc->ctxsize = ctxsize; 904 } 905 906 /* Start data at 128 byte boundary */ 907 offset = (offset + ctxsize + 127) & 0xffffff80; 908 909 if (datasize) { 910 sc->virtdptr = (u8 *)sc + offset; 911 sc->dmadptr = dma_addr + offset; 912 sc->datasize = datasize; 913 } 914 915 /* Start rdata at 128 byte boundary */ 916 offset = (offset + datasize + 127) & 0xffffff80; 917 918 if (rdatasize) { 919 WARN_ON(rdatasize < 16); 920 sc->virtrptr = (u8 *)sc + offset; 921 sc->dmarptr = dma_addr + offset; 922 sc->rdatasize = rdatasize; 923 sc->status_word = (u64 *)((u8 *)(sc->virtrptr) + rdatasize - 8); 924 } 925 926 return sc; 927 } 928 EXPORT_SYMBOL_GPL(octeon_alloc_soft_command); 929 930 void octeon_free_soft_command(struct octeon_device *oct, 931 struct octeon_soft_command *sc) 932 { 933 spin_lock_bh(&oct->sc_buf_pool.lock); 934 935 list_add_tail(&sc->node, &oct->sc_buf_pool.head); 936 937 atomic_dec(&oct->sc_buf_pool.alloc_buf_count); 938 939 spin_unlock_bh(&oct->sc_buf_pool.lock); 940 } 941 EXPORT_SYMBOL_GPL(octeon_free_soft_command); 942