1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Intel I/OAT DMA Linux driver 4 * Copyright(c) 2004 - 2015 Intel Corporation. 5 */ 6 7 /* 8 * This driver supports an Intel I/OAT DMA engine, which does asynchronous 9 * copy operations. 10 */ 11 12 #include <linux/init.h> 13 #include <linux/module.h> 14 #include <linux/slab.h> 15 #include <linux/pci.h> 16 #include <linux/interrupt.h> 17 #include <linux/dmaengine.h> 18 #include <linux/delay.h> 19 #include <linux/dma-mapping.h> 20 #include <linux/workqueue.h> 21 #include <linux/prefetch.h> 22 #include <linux/sizes.h> 23 #include "dma.h" 24 #include "registers.h" 25 #include "hw.h" 26 27 #include "../dmaengine.h" 28 29 static char *chanerr_str[] = { 30 "DMA Transfer Source Address Error", 31 "DMA Transfer Destination Address Error", 32 "Next Descriptor Address Error", 33 "Descriptor Error", 34 "Chan Address Value Error", 35 "CHANCMD Error", 36 "Chipset Uncorrectable Data Integrity Error", 37 "DMA Uncorrectable Data Integrity Error", 38 "Read Data Error", 39 "Write Data Error", 40 "Descriptor Control Error", 41 "Descriptor Transfer Size Error", 42 "Completion Address Error", 43 "Interrupt Configuration Error", 44 "Super extended descriptor Address Error", 45 "Unaffiliated Error", 46 "CRC or XOR P Error", 47 "XOR Q Error", 48 "Descriptor Count Error", 49 "DIF All F detect Error", 50 "Guard Tag verification Error", 51 "Application Tag verification Error", 52 "Reference Tag verification Error", 53 "Bundle Bit Error", 54 "Result DIF All F detect Error", 55 "Result Guard Tag verification Error", 56 "Result Application Tag verification Error", 57 "Result Reference Tag verification Error", 58 }; 59 60 static void ioat_eh(struct ioatdma_chan *ioat_chan); 61 62 static void ioat_print_chanerrs(struct ioatdma_chan *ioat_chan, u32 chanerr) 63 { 64 int i; 65 66 for (i = 0; i < ARRAY_SIZE(chanerr_str); i++) { 67 if ((chanerr >> i) & 1) { 68 dev_err(to_dev(ioat_chan), "Err(%d): %s\n", 69 i, chanerr_str[i]); 70 } 71 } 72 } 73 74 /** 75 * ioat_dma_do_interrupt - handler used for single vector interrupt mode 76 * @irq: interrupt id 77 * @data: interrupt data 78 */ 79 irqreturn_t ioat_dma_do_interrupt(int irq, void *data) 80 { 81 struct ioatdma_device *instance = data; 82 struct ioatdma_chan *ioat_chan; 83 unsigned long attnstatus; 84 int bit; 85 u8 intrctrl; 86 87 intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET); 88 89 if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN)) 90 return IRQ_NONE; 91 92 if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) { 93 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET); 94 return IRQ_NONE; 95 } 96 97 attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET); 98 for_each_set_bit(bit, &attnstatus, BITS_PER_LONG) { 99 ioat_chan = ioat_chan_by_index(instance, bit); 100 if (test_bit(IOAT_RUN, &ioat_chan->state)) 101 tasklet_schedule(&ioat_chan->cleanup_task); 102 } 103 104 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET); 105 return IRQ_HANDLED; 106 } 107 108 /** 109 * ioat_dma_do_interrupt_msix - handler used for vector-per-channel interrupt mode 110 * @irq: interrupt id 111 * @data: interrupt data 112 */ 113 irqreturn_t ioat_dma_do_interrupt_msix(int irq, void *data) 114 { 115 struct ioatdma_chan *ioat_chan = data; 116 117 if (test_bit(IOAT_RUN, &ioat_chan->state)) 118 tasklet_schedule(&ioat_chan->cleanup_task); 119 120 return IRQ_HANDLED; 121 } 122 123 void ioat_stop(struct ioatdma_chan *ioat_chan) 124 { 125 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 126 struct pci_dev *pdev = ioat_dma->pdev; 127 int chan_id = chan_num(ioat_chan); 128 struct msix_entry *msix; 129 130 /* 1/ stop irq from firing tasklets 131 * 2/ stop the tasklet from re-arming irqs 132 */ 133 clear_bit(IOAT_RUN, &ioat_chan->state); 134 135 /* flush inflight interrupts */ 136 switch (ioat_dma->irq_mode) { 137 case IOAT_MSIX: 138 msix = &ioat_dma->msix_entries[chan_id]; 139 synchronize_irq(msix->vector); 140 break; 141 case IOAT_MSI: 142 case IOAT_INTX: 143 synchronize_irq(pdev->irq); 144 break; 145 default: 146 break; 147 } 148 149 /* flush inflight timers */ 150 del_timer_sync(&ioat_chan->timer); 151 152 /* flush inflight tasklet runs */ 153 tasklet_kill(&ioat_chan->cleanup_task); 154 155 /* final cleanup now that everything is quiesced and can't re-arm */ 156 ioat_cleanup_event((unsigned long)&ioat_chan->dma_chan); 157 } 158 159 static void __ioat_issue_pending(struct ioatdma_chan *ioat_chan) 160 { 161 ioat_chan->dmacount += ioat_ring_pending(ioat_chan); 162 ioat_chan->issued = ioat_chan->head; 163 writew(ioat_chan->dmacount, 164 ioat_chan->reg_base + IOAT_CHAN_DMACOUNT_OFFSET); 165 dev_dbg(to_dev(ioat_chan), 166 "%s: head: %#x tail: %#x issued: %#x count: %#x\n", 167 __func__, ioat_chan->head, ioat_chan->tail, 168 ioat_chan->issued, ioat_chan->dmacount); 169 } 170 171 void ioat_issue_pending(struct dma_chan *c) 172 { 173 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 174 175 if (ioat_ring_pending(ioat_chan)) { 176 spin_lock_bh(&ioat_chan->prep_lock); 177 __ioat_issue_pending(ioat_chan); 178 spin_unlock_bh(&ioat_chan->prep_lock); 179 } 180 } 181 182 /** 183 * ioat_update_pending - log pending descriptors 184 * @ioat: ioat+ channel 185 * 186 * Check if the number of unsubmitted descriptors has exceeded the 187 * watermark. Called with prep_lock held 188 */ 189 static void ioat_update_pending(struct ioatdma_chan *ioat_chan) 190 { 191 if (ioat_ring_pending(ioat_chan) > ioat_pending_level) 192 __ioat_issue_pending(ioat_chan); 193 } 194 195 static void __ioat_start_null_desc(struct ioatdma_chan *ioat_chan) 196 { 197 struct ioat_ring_ent *desc; 198 struct ioat_dma_descriptor *hw; 199 200 if (ioat_ring_space(ioat_chan) < 1) { 201 dev_err(to_dev(ioat_chan), 202 "Unable to start null desc - ring full\n"); 203 return; 204 } 205 206 dev_dbg(to_dev(ioat_chan), 207 "%s: head: %#x tail: %#x issued: %#x\n", 208 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued); 209 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head); 210 211 hw = desc->hw; 212 hw->ctl = 0; 213 hw->ctl_f.null = 1; 214 hw->ctl_f.int_en = 1; 215 hw->ctl_f.compl_write = 1; 216 /* set size to non-zero value (channel returns error when size is 0) */ 217 hw->size = NULL_DESC_BUFFER_SIZE; 218 hw->src_addr = 0; 219 hw->dst_addr = 0; 220 async_tx_ack(&desc->txd); 221 ioat_set_chainaddr(ioat_chan, desc->txd.phys); 222 dump_desc_dbg(ioat_chan, desc); 223 /* make sure descriptors are written before we submit */ 224 wmb(); 225 ioat_chan->head += 1; 226 __ioat_issue_pending(ioat_chan); 227 } 228 229 void ioat_start_null_desc(struct ioatdma_chan *ioat_chan) 230 { 231 spin_lock_bh(&ioat_chan->prep_lock); 232 if (!test_bit(IOAT_CHAN_DOWN, &ioat_chan->state)) 233 __ioat_start_null_desc(ioat_chan); 234 spin_unlock_bh(&ioat_chan->prep_lock); 235 } 236 237 static void __ioat_restart_chan(struct ioatdma_chan *ioat_chan) 238 { 239 /* set the tail to be re-issued */ 240 ioat_chan->issued = ioat_chan->tail; 241 ioat_chan->dmacount = 0; 242 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 243 244 dev_dbg(to_dev(ioat_chan), 245 "%s: head: %#x tail: %#x issued: %#x count: %#x\n", 246 __func__, ioat_chan->head, ioat_chan->tail, 247 ioat_chan->issued, ioat_chan->dmacount); 248 249 if (ioat_ring_pending(ioat_chan)) { 250 struct ioat_ring_ent *desc; 251 252 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail); 253 ioat_set_chainaddr(ioat_chan, desc->txd.phys); 254 __ioat_issue_pending(ioat_chan); 255 } else 256 __ioat_start_null_desc(ioat_chan); 257 } 258 259 static int ioat_quiesce(struct ioatdma_chan *ioat_chan, unsigned long tmo) 260 { 261 unsigned long end = jiffies + tmo; 262 int err = 0; 263 u32 status; 264 265 status = ioat_chansts(ioat_chan); 266 if (is_ioat_active(status) || is_ioat_idle(status)) 267 ioat_suspend(ioat_chan); 268 while (is_ioat_active(status) || is_ioat_idle(status)) { 269 if (tmo && time_after(jiffies, end)) { 270 err = -ETIMEDOUT; 271 break; 272 } 273 status = ioat_chansts(ioat_chan); 274 cpu_relax(); 275 } 276 277 return err; 278 } 279 280 static int ioat_reset_sync(struct ioatdma_chan *ioat_chan, unsigned long tmo) 281 { 282 unsigned long end = jiffies + tmo; 283 int err = 0; 284 285 ioat_reset(ioat_chan); 286 while (ioat_reset_pending(ioat_chan)) { 287 if (end && time_after(jiffies, end)) { 288 err = -ETIMEDOUT; 289 break; 290 } 291 cpu_relax(); 292 } 293 294 return err; 295 } 296 297 static dma_cookie_t ioat_tx_submit_unlock(struct dma_async_tx_descriptor *tx) 298 __releases(&ioat_chan->prep_lock) 299 { 300 struct dma_chan *c = tx->chan; 301 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 302 dma_cookie_t cookie; 303 304 cookie = dma_cookie_assign(tx); 305 dev_dbg(to_dev(ioat_chan), "%s: cookie: %d\n", __func__, cookie); 306 307 if (!test_and_set_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state)) 308 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 309 310 /* make descriptor updates visible before advancing ioat->head, 311 * this is purposefully not smp_wmb() since we are also 312 * publishing the descriptor updates to a dma device 313 */ 314 wmb(); 315 316 ioat_chan->head += ioat_chan->produce; 317 318 ioat_update_pending(ioat_chan); 319 spin_unlock_bh(&ioat_chan->prep_lock); 320 321 return cookie; 322 } 323 324 static struct ioat_ring_ent * 325 ioat_alloc_ring_ent(struct dma_chan *chan, int idx, gfp_t flags) 326 { 327 struct ioat_dma_descriptor *hw; 328 struct ioat_ring_ent *desc; 329 struct ioatdma_chan *ioat_chan = to_ioat_chan(chan); 330 int chunk; 331 dma_addr_t phys; 332 u8 *pos; 333 off_t offs; 334 335 chunk = idx / IOAT_DESCS_PER_2M; 336 idx &= (IOAT_DESCS_PER_2M - 1); 337 offs = idx * IOAT_DESC_SZ; 338 pos = (u8 *)ioat_chan->descs[chunk].virt + offs; 339 phys = ioat_chan->descs[chunk].hw + offs; 340 hw = (struct ioat_dma_descriptor *)pos; 341 memset(hw, 0, sizeof(*hw)); 342 343 desc = kmem_cache_zalloc(ioat_cache, flags); 344 if (!desc) 345 return NULL; 346 347 dma_async_tx_descriptor_init(&desc->txd, chan); 348 desc->txd.tx_submit = ioat_tx_submit_unlock; 349 desc->hw = hw; 350 desc->txd.phys = phys; 351 return desc; 352 } 353 354 void ioat_free_ring_ent(struct ioat_ring_ent *desc, struct dma_chan *chan) 355 { 356 kmem_cache_free(ioat_cache, desc); 357 } 358 359 struct ioat_ring_ent ** 360 ioat_alloc_ring(struct dma_chan *c, int order, gfp_t flags) 361 { 362 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 363 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 364 struct ioat_ring_ent **ring; 365 int total_descs = 1 << order; 366 int i, chunks; 367 368 /* allocate the array to hold the software ring */ 369 ring = kcalloc(total_descs, sizeof(*ring), flags); 370 if (!ring) 371 return NULL; 372 373 ioat_chan->desc_chunks = chunks = (total_descs * IOAT_DESC_SZ) / SZ_2M; 374 375 for (i = 0; i < chunks; i++) { 376 struct ioat_descs *descs = &ioat_chan->descs[i]; 377 378 descs->virt = dma_alloc_coherent(to_dev(ioat_chan), 379 SZ_2M, &descs->hw, flags); 380 if (!descs->virt) { 381 int idx; 382 383 for (idx = 0; idx < i; idx++) { 384 descs = &ioat_chan->descs[idx]; 385 dma_free_coherent(to_dev(ioat_chan), SZ_2M, 386 descs->virt, descs->hw); 387 descs->virt = NULL; 388 descs->hw = 0; 389 } 390 391 ioat_chan->desc_chunks = 0; 392 kfree(ring); 393 return NULL; 394 } 395 } 396 397 for (i = 0; i < total_descs; i++) { 398 ring[i] = ioat_alloc_ring_ent(c, i, flags); 399 if (!ring[i]) { 400 int idx; 401 402 while (i--) 403 ioat_free_ring_ent(ring[i], c); 404 405 for (idx = 0; idx < ioat_chan->desc_chunks; idx++) { 406 dma_free_coherent(to_dev(ioat_chan), 407 SZ_2M, 408 ioat_chan->descs[idx].virt, 409 ioat_chan->descs[idx].hw); 410 ioat_chan->descs[idx].virt = NULL; 411 ioat_chan->descs[idx].hw = 0; 412 } 413 414 ioat_chan->desc_chunks = 0; 415 kfree(ring); 416 return NULL; 417 } 418 set_desc_id(ring[i], i); 419 } 420 421 /* link descs */ 422 for (i = 0; i < total_descs-1; i++) { 423 struct ioat_ring_ent *next = ring[i+1]; 424 struct ioat_dma_descriptor *hw = ring[i]->hw; 425 426 hw->next = next->txd.phys; 427 } 428 ring[i]->hw->next = ring[0]->txd.phys; 429 430 /* setup descriptor pre-fetching for v3.4 */ 431 if (ioat_dma->cap & IOAT_CAP_DPS) { 432 u16 drsctl = IOAT_CHAN_DRSZ_2MB | IOAT_CHAN_DRS_EN; 433 434 if (chunks == 1) 435 drsctl |= IOAT_CHAN_DRS_AUTOWRAP; 436 437 writew(drsctl, ioat_chan->reg_base + IOAT_CHAN_DRSCTL_OFFSET); 438 439 } 440 441 return ring; 442 } 443 444 /** 445 * ioat_check_space_lock - verify space and grab ring producer lock 446 * @ioat: ioat,3 channel (ring) to operate on 447 * @num_descs: allocation length 448 */ 449 int ioat_check_space_lock(struct ioatdma_chan *ioat_chan, int num_descs) 450 __acquires(&ioat_chan->prep_lock) 451 { 452 spin_lock_bh(&ioat_chan->prep_lock); 453 /* never allow the last descriptor to be consumed, we need at 454 * least one free at all times to allow for on-the-fly ring 455 * resizing. 456 */ 457 if (likely(ioat_ring_space(ioat_chan) > num_descs)) { 458 dev_dbg(to_dev(ioat_chan), "%s: num_descs: %d (%x:%x:%x)\n", 459 __func__, num_descs, ioat_chan->head, 460 ioat_chan->tail, ioat_chan->issued); 461 ioat_chan->produce = num_descs; 462 return 0; /* with ioat->prep_lock held */ 463 } 464 spin_unlock_bh(&ioat_chan->prep_lock); 465 466 dev_dbg_ratelimited(to_dev(ioat_chan), 467 "%s: ring full! num_descs: %d (%x:%x:%x)\n", 468 __func__, num_descs, ioat_chan->head, 469 ioat_chan->tail, ioat_chan->issued); 470 471 /* progress reclaim in the allocation failure case we may be 472 * called under bh_disabled so we need to trigger the timer 473 * event directly 474 */ 475 if (time_is_before_jiffies(ioat_chan->timer.expires) 476 && timer_pending(&ioat_chan->timer)) { 477 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 478 ioat_timer_event(&ioat_chan->timer); 479 } 480 481 return -ENOMEM; 482 } 483 484 static bool desc_has_ext(struct ioat_ring_ent *desc) 485 { 486 struct ioat_dma_descriptor *hw = desc->hw; 487 488 if (hw->ctl_f.op == IOAT_OP_XOR || 489 hw->ctl_f.op == IOAT_OP_XOR_VAL) { 490 struct ioat_xor_descriptor *xor = desc->xor; 491 492 if (src_cnt_to_sw(xor->ctl_f.src_cnt) > 5) 493 return true; 494 } else if (hw->ctl_f.op == IOAT_OP_PQ || 495 hw->ctl_f.op == IOAT_OP_PQ_VAL) { 496 struct ioat_pq_descriptor *pq = desc->pq; 497 498 if (src_cnt_to_sw(pq->ctl_f.src_cnt) > 3) 499 return true; 500 } 501 502 return false; 503 } 504 505 static void 506 ioat_free_sed(struct ioatdma_device *ioat_dma, struct ioat_sed_ent *sed) 507 { 508 if (!sed) 509 return; 510 511 dma_pool_free(ioat_dma->sed_hw_pool[sed->hw_pool], sed->hw, sed->dma); 512 kmem_cache_free(ioat_sed_cache, sed); 513 } 514 515 static u64 ioat_get_current_completion(struct ioatdma_chan *ioat_chan) 516 { 517 u64 phys_complete; 518 u64 completion; 519 520 completion = *ioat_chan->completion; 521 phys_complete = ioat_chansts_to_addr(completion); 522 523 dev_dbg(to_dev(ioat_chan), "%s: phys_complete: %#llx\n", __func__, 524 (unsigned long long) phys_complete); 525 526 return phys_complete; 527 } 528 529 static bool ioat_cleanup_preamble(struct ioatdma_chan *ioat_chan, 530 u64 *phys_complete) 531 { 532 *phys_complete = ioat_get_current_completion(ioat_chan); 533 if (*phys_complete == ioat_chan->last_completion) 534 return false; 535 536 clear_bit(IOAT_COMPLETION_ACK, &ioat_chan->state); 537 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 538 539 return true; 540 } 541 542 static void 543 desc_get_errstat(struct ioatdma_chan *ioat_chan, struct ioat_ring_ent *desc) 544 { 545 struct ioat_dma_descriptor *hw = desc->hw; 546 547 switch (hw->ctl_f.op) { 548 case IOAT_OP_PQ_VAL: 549 case IOAT_OP_PQ_VAL_16S: 550 { 551 struct ioat_pq_descriptor *pq = desc->pq; 552 553 /* check if there's error written */ 554 if (!pq->dwbes_f.wbes) 555 return; 556 557 /* need to set a chanerr var for checking to clear later */ 558 559 if (pq->dwbes_f.p_val_err) 560 *desc->result |= SUM_CHECK_P_RESULT; 561 562 if (pq->dwbes_f.q_val_err) 563 *desc->result |= SUM_CHECK_Q_RESULT; 564 565 return; 566 } 567 default: 568 return; 569 } 570 } 571 572 /** 573 * __cleanup - reclaim used descriptors 574 * @ioat: channel (ring) to clean 575 */ 576 static void __cleanup(struct ioatdma_chan *ioat_chan, dma_addr_t phys_complete) 577 { 578 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 579 struct ioat_ring_ent *desc; 580 bool seen_current = false; 581 int idx = ioat_chan->tail, i; 582 u16 active; 583 584 dev_dbg(to_dev(ioat_chan), "%s: head: %#x tail: %#x issued: %#x\n", 585 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued); 586 587 /* 588 * At restart of the channel, the completion address and the 589 * channel status will be 0 due to starting a new chain. Since 590 * it's new chain and the first descriptor "fails", there is 591 * nothing to clean up. We do not want to reap the entire submitted 592 * chain due to this 0 address value and then BUG. 593 */ 594 if (!phys_complete) 595 return; 596 597 active = ioat_ring_active(ioat_chan); 598 for (i = 0; i < active && !seen_current; i++) { 599 struct dma_async_tx_descriptor *tx; 600 601 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1)); 602 desc = ioat_get_ring_ent(ioat_chan, idx + i); 603 dump_desc_dbg(ioat_chan, desc); 604 605 /* set err stat if we are using dwbes */ 606 if (ioat_dma->cap & IOAT_CAP_DWBES) 607 desc_get_errstat(ioat_chan, desc); 608 609 tx = &desc->txd; 610 if (tx->cookie) { 611 dma_cookie_complete(tx); 612 dma_descriptor_unmap(tx); 613 dmaengine_desc_get_callback_invoke(tx, NULL); 614 tx->callback = NULL; 615 tx->callback_result = NULL; 616 } 617 618 if (tx->phys == phys_complete) 619 seen_current = true; 620 621 /* skip extended descriptors */ 622 if (desc_has_ext(desc)) { 623 BUG_ON(i + 1 >= active); 624 i++; 625 } 626 627 /* cleanup super extended descriptors */ 628 if (desc->sed) { 629 ioat_free_sed(ioat_dma, desc->sed); 630 desc->sed = NULL; 631 } 632 } 633 634 /* finish all descriptor reads before incrementing tail */ 635 smp_mb(); 636 ioat_chan->tail = idx + i; 637 /* no active descs have written a completion? */ 638 BUG_ON(active && !seen_current); 639 ioat_chan->last_completion = phys_complete; 640 641 if (active - i == 0) { 642 dev_dbg(to_dev(ioat_chan), "%s: cancel completion timeout\n", 643 __func__); 644 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT); 645 } 646 647 /* microsecond delay by sysfs variable per pending descriptor */ 648 if (ioat_chan->intr_coalesce != ioat_chan->prev_intr_coalesce) { 649 writew(min((ioat_chan->intr_coalesce * (active - i)), 650 IOAT_INTRDELAY_MASK), 651 ioat_chan->ioat_dma->reg_base + IOAT_INTRDELAY_OFFSET); 652 ioat_chan->prev_intr_coalesce = ioat_chan->intr_coalesce; 653 } 654 } 655 656 static void ioat_cleanup(struct ioatdma_chan *ioat_chan) 657 { 658 u64 phys_complete; 659 660 spin_lock_bh(&ioat_chan->cleanup_lock); 661 662 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 663 __cleanup(ioat_chan, phys_complete); 664 665 if (is_ioat_halted(*ioat_chan->completion)) { 666 u32 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 667 668 if (chanerr & 669 (IOAT_CHANERR_HANDLE_MASK | IOAT_CHANERR_RECOVER_MASK)) { 670 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT); 671 ioat_eh(ioat_chan); 672 } 673 } 674 675 spin_unlock_bh(&ioat_chan->cleanup_lock); 676 } 677 678 void ioat_cleanup_event(unsigned long data) 679 { 680 struct ioatdma_chan *ioat_chan = to_ioat_chan((void *)data); 681 682 ioat_cleanup(ioat_chan); 683 if (!test_bit(IOAT_RUN, &ioat_chan->state)) 684 return; 685 writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET); 686 } 687 688 static void ioat_restart_channel(struct ioatdma_chan *ioat_chan) 689 { 690 u64 phys_complete; 691 692 /* set the completion address register again */ 693 writel(lower_32_bits(ioat_chan->completion_dma), 694 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW); 695 writel(upper_32_bits(ioat_chan->completion_dma), 696 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH); 697 698 ioat_quiesce(ioat_chan, 0); 699 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 700 __cleanup(ioat_chan, phys_complete); 701 702 __ioat_restart_chan(ioat_chan); 703 } 704 705 706 static void ioat_abort_descs(struct ioatdma_chan *ioat_chan) 707 { 708 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 709 struct ioat_ring_ent *desc; 710 u16 active; 711 int idx = ioat_chan->tail, i; 712 713 /* 714 * We assume that the failed descriptor has been processed. 715 * Now we are just returning all the remaining submitted 716 * descriptors to abort. 717 */ 718 active = ioat_ring_active(ioat_chan); 719 720 /* we skip the failed descriptor that tail points to */ 721 for (i = 1; i < active; i++) { 722 struct dma_async_tx_descriptor *tx; 723 724 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1)); 725 desc = ioat_get_ring_ent(ioat_chan, idx + i); 726 727 tx = &desc->txd; 728 if (tx->cookie) { 729 struct dmaengine_result res; 730 731 dma_cookie_complete(tx); 732 dma_descriptor_unmap(tx); 733 res.result = DMA_TRANS_ABORTED; 734 dmaengine_desc_get_callback_invoke(tx, &res); 735 tx->callback = NULL; 736 tx->callback_result = NULL; 737 } 738 739 /* skip extended descriptors */ 740 if (desc_has_ext(desc)) { 741 WARN_ON(i + 1 >= active); 742 i++; 743 } 744 745 /* cleanup super extended descriptors */ 746 if (desc->sed) { 747 ioat_free_sed(ioat_dma, desc->sed); 748 desc->sed = NULL; 749 } 750 } 751 752 smp_mb(); /* finish all descriptor reads before incrementing tail */ 753 ioat_chan->tail = idx + active; 754 755 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail); 756 ioat_chan->last_completion = *ioat_chan->completion = desc->txd.phys; 757 } 758 759 static void ioat_eh(struct ioatdma_chan *ioat_chan) 760 { 761 struct pci_dev *pdev = to_pdev(ioat_chan); 762 struct ioat_dma_descriptor *hw; 763 struct dma_async_tx_descriptor *tx; 764 u64 phys_complete; 765 struct ioat_ring_ent *desc; 766 u32 err_handled = 0; 767 u32 chanerr_int; 768 u32 chanerr; 769 bool abort = false; 770 struct dmaengine_result res; 771 772 /* cleanup so tail points to descriptor that caused the error */ 773 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 774 __cleanup(ioat_chan, phys_complete); 775 776 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 777 pci_read_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, &chanerr_int); 778 779 dev_dbg(to_dev(ioat_chan), "%s: error = %x:%x\n", 780 __func__, chanerr, chanerr_int); 781 782 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail); 783 hw = desc->hw; 784 dump_desc_dbg(ioat_chan, desc); 785 786 switch (hw->ctl_f.op) { 787 case IOAT_OP_XOR_VAL: 788 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) { 789 *desc->result |= SUM_CHECK_P_RESULT; 790 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR; 791 } 792 break; 793 case IOAT_OP_PQ_VAL: 794 case IOAT_OP_PQ_VAL_16S: 795 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) { 796 *desc->result |= SUM_CHECK_P_RESULT; 797 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR; 798 } 799 if (chanerr & IOAT_CHANERR_XOR_Q_ERR) { 800 *desc->result |= SUM_CHECK_Q_RESULT; 801 err_handled |= IOAT_CHANERR_XOR_Q_ERR; 802 } 803 break; 804 } 805 806 if (chanerr & IOAT_CHANERR_RECOVER_MASK) { 807 if (chanerr & IOAT_CHANERR_READ_DATA_ERR) { 808 res.result = DMA_TRANS_READ_FAILED; 809 err_handled |= IOAT_CHANERR_READ_DATA_ERR; 810 } else if (chanerr & IOAT_CHANERR_WRITE_DATA_ERR) { 811 res.result = DMA_TRANS_WRITE_FAILED; 812 err_handled |= IOAT_CHANERR_WRITE_DATA_ERR; 813 } 814 815 abort = true; 816 } else 817 res.result = DMA_TRANS_NOERROR; 818 819 /* fault on unhandled error or spurious halt */ 820 if (chanerr ^ err_handled || chanerr == 0) { 821 dev_err(to_dev(ioat_chan), "%s: fatal error (%x:%x)\n", 822 __func__, chanerr, err_handled); 823 dev_err(to_dev(ioat_chan), "Errors handled:\n"); 824 ioat_print_chanerrs(ioat_chan, err_handled); 825 dev_err(to_dev(ioat_chan), "Errors not handled:\n"); 826 ioat_print_chanerrs(ioat_chan, (chanerr & ~err_handled)); 827 828 BUG(); 829 } 830 831 /* cleanup the faulty descriptor since we are continuing */ 832 tx = &desc->txd; 833 if (tx->cookie) { 834 dma_cookie_complete(tx); 835 dma_descriptor_unmap(tx); 836 dmaengine_desc_get_callback_invoke(tx, &res); 837 tx->callback = NULL; 838 tx->callback_result = NULL; 839 } 840 841 /* mark faulting descriptor as complete */ 842 *ioat_chan->completion = desc->txd.phys; 843 844 spin_lock_bh(&ioat_chan->prep_lock); 845 /* we need abort all descriptors */ 846 if (abort) { 847 ioat_abort_descs(ioat_chan); 848 /* clean up the channel, we could be in weird state */ 849 ioat_reset_hw(ioat_chan); 850 } 851 852 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 853 pci_write_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, chanerr_int); 854 855 ioat_restart_channel(ioat_chan); 856 spin_unlock_bh(&ioat_chan->prep_lock); 857 } 858 859 static void check_active(struct ioatdma_chan *ioat_chan) 860 { 861 if (ioat_ring_active(ioat_chan)) { 862 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 863 return; 864 } 865 866 if (test_and_clear_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state)) 867 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT); 868 } 869 870 void ioat_timer_event(struct timer_list *t) 871 { 872 struct ioatdma_chan *ioat_chan = from_timer(ioat_chan, t, timer); 873 dma_addr_t phys_complete; 874 u64 status; 875 876 status = ioat_chansts(ioat_chan); 877 878 /* when halted due to errors check for channel 879 * programming errors before advancing the completion state 880 */ 881 if (is_ioat_halted(status)) { 882 u32 chanerr; 883 884 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 885 dev_err(to_dev(ioat_chan), "%s: Channel halted (%x)\n", 886 __func__, chanerr); 887 dev_err(to_dev(ioat_chan), "Errors:\n"); 888 ioat_print_chanerrs(ioat_chan, chanerr); 889 890 if (test_bit(IOAT_RUN, &ioat_chan->state)) { 891 spin_lock_bh(&ioat_chan->cleanup_lock); 892 spin_lock_bh(&ioat_chan->prep_lock); 893 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 894 spin_unlock_bh(&ioat_chan->prep_lock); 895 896 ioat_abort_descs(ioat_chan); 897 dev_warn(to_dev(ioat_chan), "Reset channel...\n"); 898 ioat_reset_hw(ioat_chan); 899 dev_warn(to_dev(ioat_chan), "Restart channel...\n"); 900 ioat_restart_channel(ioat_chan); 901 902 spin_lock_bh(&ioat_chan->prep_lock); 903 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 904 spin_unlock_bh(&ioat_chan->prep_lock); 905 spin_unlock_bh(&ioat_chan->cleanup_lock); 906 } 907 908 return; 909 } 910 911 spin_lock_bh(&ioat_chan->cleanup_lock); 912 913 /* handle the no-actives case */ 914 if (!ioat_ring_active(ioat_chan)) { 915 spin_lock_bh(&ioat_chan->prep_lock); 916 check_active(ioat_chan); 917 spin_unlock_bh(&ioat_chan->prep_lock); 918 spin_unlock_bh(&ioat_chan->cleanup_lock); 919 return; 920 } 921 922 /* if we haven't made progress and we have already 923 * acknowledged a pending completion once, then be more 924 * forceful with a restart 925 */ 926 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 927 __cleanup(ioat_chan, phys_complete); 928 else if (test_bit(IOAT_COMPLETION_ACK, &ioat_chan->state)) { 929 u32 chanerr; 930 931 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 932 dev_err(to_dev(ioat_chan), "CHANSTS: %#Lx CHANERR: %#x\n", 933 status, chanerr); 934 dev_err(to_dev(ioat_chan), "Errors:\n"); 935 ioat_print_chanerrs(ioat_chan, chanerr); 936 937 dev_dbg(to_dev(ioat_chan), "Active descriptors: %d\n", 938 ioat_ring_active(ioat_chan)); 939 940 spin_lock_bh(&ioat_chan->prep_lock); 941 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 942 spin_unlock_bh(&ioat_chan->prep_lock); 943 944 ioat_abort_descs(ioat_chan); 945 dev_warn(to_dev(ioat_chan), "Resetting channel...\n"); 946 ioat_reset_hw(ioat_chan); 947 dev_warn(to_dev(ioat_chan), "Restarting channel...\n"); 948 ioat_restart_channel(ioat_chan); 949 950 spin_lock_bh(&ioat_chan->prep_lock); 951 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 952 spin_unlock_bh(&ioat_chan->prep_lock); 953 spin_unlock_bh(&ioat_chan->cleanup_lock); 954 return; 955 } else 956 set_bit(IOAT_COMPLETION_ACK, &ioat_chan->state); 957 958 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 959 spin_unlock_bh(&ioat_chan->cleanup_lock); 960 } 961 962 enum dma_status 963 ioat_tx_status(struct dma_chan *c, dma_cookie_t cookie, 964 struct dma_tx_state *txstate) 965 { 966 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 967 enum dma_status ret; 968 969 ret = dma_cookie_status(c, cookie, txstate); 970 if (ret == DMA_COMPLETE) 971 return ret; 972 973 ioat_cleanup(ioat_chan); 974 975 return dma_cookie_status(c, cookie, txstate); 976 } 977 978 int ioat_reset_hw(struct ioatdma_chan *ioat_chan) 979 { 980 /* throw away whatever the channel was doing and get it 981 * initialized, with ioat3 specific workarounds 982 */ 983 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 984 struct pci_dev *pdev = ioat_dma->pdev; 985 u32 chanerr; 986 u16 dev_id; 987 int err; 988 989 ioat_quiesce(ioat_chan, msecs_to_jiffies(100)); 990 991 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 992 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 993 994 if (ioat_dma->version < IOAT_VER_3_3) { 995 /* clear any pending errors */ 996 err = pci_read_config_dword(pdev, 997 IOAT_PCI_CHANERR_INT_OFFSET, &chanerr); 998 if (err) { 999 dev_err(&pdev->dev, 1000 "channel error register unreachable\n"); 1001 return err; 1002 } 1003 pci_write_config_dword(pdev, 1004 IOAT_PCI_CHANERR_INT_OFFSET, chanerr); 1005 1006 /* Clear DMAUNCERRSTS Cfg-Reg Parity Error status bit 1007 * (workaround for spurious config parity error after restart) 1008 */ 1009 pci_read_config_word(pdev, IOAT_PCI_DEVICE_ID_OFFSET, &dev_id); 1010 if (dev_id == PCI_DEVICE_ID_INTEL_IOAT_TBG0) { 1011 pci_write_config_dword(pdev, 1012 IOAT_PCI_DMAUNCERRSTS_OFFSET, 1013 0x10); 1014 } 1015 } 1016 1017 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) { 1018 ioat_dma->msixtba0 = readq(ioat_dma->reg_base + 0x1000); 1019 ioat_dma->msixdata0 = readq(ioat_dma->reg_base + 0x1008); 1020 ioat_dma->msixpba = readq(ioat_dma->reg_base + 0x1800); 1021 } 1022 1023 1024 err = ioat_reset_sync(ioat_chan, msecs_to_jiffies(200)); 1025 if (!err) { 1026 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) { 1027 writeq(ioat_dma->msixtba0, ioat_dma->reg_base + 0x1000); 1028 writeq(ioat_dma->msixdata0, ioat_dma->reg_base + 0x1008); 1029 writeq(ioat_dma->msixpba, ioat_dma->reg_base + 0x1800); 1030 } 1031 } 1032 1033 if (err) 1034 dev_err(&pdev->dev, "Failed to reset: %d\n", err); 1035 1036 return err; 1037 } 1038