1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Intel I/OAT DMA Linux driver 4 * Copyright(c) 2004 - 2015 Intel Corporation. 5 */ 6 7 /* 8 * This driver supports an Intel I/OAT DMA engine, which does asynchronous 9 * copy operations. 10 */ 11 12 #include <linux/init.h> 13 #include <linux/module.h> 14 #include <linux/slab.h> 15 #include <linux/pci.h> 16 #include <linux/interrupt.h> 17 #include <linux/dmaengine.h> 18 #include <linux/delay.h> 19 #include <linux/dma-mapping.h> 20 #include <linux/workqueue.h> 21 #include <linux/prefetch.h> 22 #include <linux/sizes.h> 23 #include "dma.h" 24 #include "registers.h" 25 #include "hw.h" 26 27 #include "../dmaengine.h" 28 29 static char *chanerr_str[] = { 30 "DMA Transfer Source Address Error", 31 "DMA Transfer Destination Address Error", 32 "Next Descriptor Address Error", 33 "Descriptor Error", 34 "Chan Address Value Error", 35 "CHANCMD Error", 36 "Chipset Uncorrectable Data Integrity Error", 37 "DMA Uncorrectable Data Integrity Error", 38 "Read Data Error", 39 "Write Data Error", 40 "Descriptor Control Error", 41 "Descriptor Transfer Size Error", 42 "Completion Address Error", 43 "Interrupt Configuration Error", 44 "Super extended descriptor Address Error", 45 "Unaffiliated Error", 46 "CRC or XOR P Error", 47 "XOR Q Error", 48 "Descriptor Count Error", 49 "DIF All F detect Error", 50 "Guard Tag verification Error", 51 "Application Tag verification Error", 52 "Reference Tag verification Error", 53 "Bundle Bit Error", 54 "Result DIF All F detect Error", 55 "Result Guard Tag verification Error", 56 "Result Application Tag verification Error", 57 "Result Reference Tag verification Error", 58 }; 59 60 static void ioat_eh(struct ioatdma_chan *ioat_chan); 61 62 static void ioat_print_chanerrs(struct ioatdma_chan *ioat_chan, u32 chanerr) 63 { 64 int i; 65 66 for (i = 0; i < ARRAY_SIZE(chanerr_str); i++) { 67 if ((chanerr >> i) & 1) { 68 dev_err(to_dev(ioat_chan), "Err(%d): %s\n", 69 i, chanerr_str[i]); 70 } 71 } 72 } 73 74 /** 75 * ioat_dma_do_interrupt - handler used for single vector interrupt mode 76 * @irq: interrupt id 77 * @data: interrupt data 78 */ 79 irqreturn_t ioat_dma_do_interrupt(int irq, void *data) 80 { 81 struct ioatdma_device *instance = data; 82 struct ioatdma_chan *ioat_chan; 83 unsigned long attnstatus; 84 int bit; 85 u8 intrctrl; 86 87 intrctrl = readb(instance->reg_base + IOAT_INTRCTRL_OFFSET); 88 89 if (!(intrctrl & IOAT_INTRCTRL_MASTER_INT_EN)) 90 return IRQ_NONE; 91 92 if (!(intrctrl & IOAT_INTRCTRL_INT_STATUS)) { 93 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET); 94 return IRQ_NONE; 95 } 96 97 attnstatus = readl(instance->reg_base + IOAT_ATTNSTATUS_OFFSET); 98 for_each_set_bit(bit, &attnstatus, BITS_PER_LONG) { 99 ioat_chan = ioat_chan_by_index(instance, bit); 100 if (test_bit(IOAT_RUN, &ioat_chan->state)) 101 tasklet_schedule(&ioat_chan->cleanup_task); 102 } 103 104 writeb(intrctrl, instance->reg_base + IOAT_INTRCTRL_OFFSET); 105 return IRQ_HANDLED; 106 } 107 108 /** 109 * ioat_dma_do_interrupt_msix - handler used for vector-per-channel interrupt mode 110 * @irq: interrupt id 111 * @data: interrupt data 112 */ 113 irqreturn_t ioat_dma_do_interrupt_msix(int irq, void *data) 114 { 115 struct ioatdma_chan *ioat_chan = data; 116 117 if (test_bit(IOAT_RUN, &ioat_chan->state)) 118 tasklet_schedule(&ioat_chan->cleanup_task); 119 120 return IRQ_HANDLED; 121 } 122 123 void ioat_stop(struct ioatdma_chan *ioat_chan) 124 { 125 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 126 struct pci_dev *pdev = ioat_dma->pdev; 127 int chan_id = chan_num(ioat_chan); 128 struct msix_entry *msix; 129 130 /* 1/ stop irq from firing tasklets 131 * 2/ stop the tasklet from re-arming irqs 132 */ 133 clear_bit(IOAT_RUN, &ioat_chan->state); 134 135 /* flush inflight interrupts */ 136 switch (ioat_dma->irq_mode) { 137 case IOAT_MSIX: 138 msix = &ioat_dma->msix_entries[chan_id]; 139 synchronize_irq(msix->vector); 140 break; 141 case IOAT_MSI: 142 case IOAT_INTX: 143 synchronize_irq(pdev->irq); 144 break; 145 default: 146 break; 147 } 148 149 /* flush inflight timers */ 150 del_timer_sync(&ioat_chan->timer); 151 152 /* flush inflight tasklet runs */ 153 tasklet_kill(&ioat_chan->cleanup_task); 154 155 /* final cleanup now that everything is quiesced and can't re-arm */ 156 ioat_cleanup_event((unsigned long)&ioat_chan->dma_chan); 157 } 158 159 static void __ioat_issue_pending(struct ioatdma_chan *ioat_chan) 160 { 161 ioat_chan->dmacount += ioat_ring_pending(ioat_chan); 162 ioat_chan->issued = ioat_chan->head; 163 writew(ioat_chan->dmacount, 164 ioat_chan->reg_base + IOAT_CHAN_DMACOUNT_OFFSET); 165 dev_dbg(to_dev(ioat_chan), 166 "%s: head: %#x tail: %#x issued: %#x count: %#x\n", 167 __func__, ioat_chan->head, ioat_chan->tail, 168 ioat_chan->issued, ioat_chan->dmacount); 169 } 170 171 void ioat_issue_pending(struct dma_chan *c) 172 { 173 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 174 175 if (ioat_ring_pending(ioat_chan)) { 176 spin_lock_bh(&ioat_chan->prep_lock); 177 __ioat_issue_pending(ioat_chan); 178 spin_unlock_bh(&ioat_chan->prep_lock); 179 } 180 } 181 182 /** 183 * ioat_update_pending - log pending descriptors 184 * @ioat: ioat+ channel 185 * 186 * Check if the number of unsubmitted descriptors has exceeded the 187 * watermark. Called with prep_lock held 188 */ 189 static void ioat_update_pending(struct ioatdma_chan *ioat_chan) 190 { 191 if (ioat_ring_pending(ioat_chan) > ioat_pending_level) 192 __ioat_issue_pending(ioat_chan); 193 } 194 195 static void __ioat_start_null_desc(struct ioatdma_chan *ioat_chan) 196 { 197 struct ioat_ring_ent *desc; 198 struct ioat_dma_descriptor *hw; 199 200 if (ioat_ring_space(ioat_chan) < 1) { 201 dev_err(to_dev(ioat_chan), 202 "Unable to start null desc - ring full\n"); 203 return; 204 } 205 206 dev_dbg(to_dev(ioat_chan), 207 "%s: head: %#x tail: %#x issued: %#x\n", 208 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued); 209 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->head); 210 211 hw = desc->hw; 212 hw->ctl = 0; 213 hw->ctl_f.null = 1; 214 hw->ctl_f.int_en = 1; 215 hw->ctl_f.compl_write = 1; 216 /* set size to non-zero value (channel returns error when size is 0) */ 217 hw->size = NULL_DESC_BUFFER_SIZE; 218 hw->src_addr = 0; 219 hw->dst_addr = 0; 220 async_tx_ack(&desc->txd); 221 ioat_set_chainaddr(ioat_chan, desc->txd.phys); 222 dump_desc_dbg(ioat_chan, desc); 223 /* make sure descriptors are written before we submit */ 224 wmb(); 225 ioat_chan->head += 1; 226 __ioat_issue_pending(ioat_chan); 227 } 228 229 void ioat_start_null_desc(struct ioatdma_chan *ioat_chan) 230 { 231 spin_lock_bh(&ioat_chan->prep_lock); 232 if (!test_bit(IOAT_CHAN_DOWN, &ioat_chan->state)) 233 __ioat_start_null_desc(ioat_chan); 234 spin_unlock_bh(&ioat_chan->prep_lock); 235 } 236 237 static void __ioat_restart_chan(struct ioatdma_chan *ioat_chan) 238 { 239 /* set the tail to be re-issued */ 240 ioat_chan->issued = ioat_chan->tail; 241 ioat_chan->dmacount = 0; 242 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 243 244 dev_dbg(to_dev(ioat_chan), 245 "%s: head: %#x tail: %#x issued: %#x count: %#x\n", 246 __func__, ioat_chan->head, ioat_chan->tail, 247 ioat_chan->issued, ioat_chan->dmacount); 248 249 if (ioat_ring_pending(ioat_chan)) { 250 struct ioat_ring_ent *desc; 251 252 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail); 253 ioat_set_chainaddr(ioat_chan, desc->txd.phys); 254 __ioat_issue_pending(ioat_chan); 255 } else 256 __ioat_start_null_desc(ioat_chan); 257 } 258 259 static int ioat_quiesce(struct ioatdma_chan *ioat_chan, unsigned long tmo) 260 { 261 unsigned long end = jiffies + tmo; 262 int err = 0; 263 u32 status; 264 265 status = ioat_chansts(ioat_chan); 266 if (is_ioat_active(status) || is_ioat_idle(status)) 267 ioat_suspend(ioat_chan); 268 while (is_ioat_active(status) || is_ioat_idle(status)) { 269 if (tmo && time_after(jiffies, end)) { 270 err = -ETIMEDOUT; 271 break; 272 } 273 status = ioat_chansts(ioat_chan); 274 cpu_relax(); 275 } 276 277 return err; 278 } 279 280 static int ioat_reset_sync(struct ioatdma_chan *ioat_chan, unsigned long tmo) 281 { 282 unsigned long end = jiffies + tmo; 283 int err = 0; 284 285 ioat_reset(ioat_chan); 286 while (ioat_reset_pending(ioat_chan)) { 287 if (end && time_after(jiffies, end)) { 288 err = -ETIMEDOUT; 289 break; 290 } 291 cpu_relax(); 292 } 293 294 return err; 295 } 296 297 static dma_cookie_t ioat_tx_submit_unlock(struct dma_async_tx_descriptor *tx) 298 __releases(&ioat_chan->prep_lock) 299 { 300 struct dma_chan *c = tx->chan; 301 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 302 dma_cookie_t cookie; 303 304 cookie = dma_cookie_assign(tx); 305 dev_dbg(to_dev(ioat_chan), "%s: cookie: %d\n", __func__, cookie); 306 307 if (!test_and_set_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state)) 308 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 309 310 /* make descriptor updates visible before advancing ioat->head, 311 * this is purposefully not smp_wmb() since we are also 312 * publishing the descriptor updates to a dma device 313 */ 314 wmb(); 315 316 ioat_chan->head += ioat_chan->produce; 317 318 ioat_update_pending(ioat_chan); 319 spin_unlock_bh(&ioat_chan->prep_lock); 320 321 return cookie; 322 } 323 324 static struct ioat_ring_ent * 325 ioat_alloc_ring_ent(struct dma_chan *chan, int idx, gfp_t flags) 326 { 327 struct ioat_dma_descriptor *hw; 328 struct ioat_ring_ent *desc; 329 struct ioatdma_chan *ioat_chan = to_ioat_chan(chan); 330 int chunk; 331 dma_addr_t phys; 332 u8 *pos; 333 off_t offs; 334 335 chunk = idx / IOAT_DESCS_PER_2M; 336 idx &= (IOAT_DESCS_PER_2M - 1); 337 offs = idx * IOAT_DESC_SZ; 338 pos = (u8 *)ioat_chan->descs[chunk].virt + offs; 339 phys = ioat_chan->descs[chunk].hw + offs; 340 hw = (struct ioat_dma_descriptor *)pos; 341 memset(hw, 0, sizeof(*hw)); 342 343 desc = kmem_cache_zalloc(ioat_cache, flags); 344 if (!desc) 345 return NULL; 346 347 dma_async_tx_descriptor_init(&desc->txd, chan); 348 desc->txd.tx_submit = ioat_tx_submit_unlock; 349 desc->hw = hw; 350 desc->txd.phys = phys; 351 return desc; 352 } 353 354 void ioat_free_ring_ent(struct ioat_ring_ent *desc, struct dma_chan *chan) 355 { 356 kmem_cache_free(ioat_cache, desc); 357 } 358 359 struct ioat_ring_ent ** 360 ioat_alloc_ring(struct dma_chan *c, int order, gfp_t flags) 361 { 362 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 363 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 364 struct ioat_ring_ent **ring; 365 int total_descs = 1 << order; 366 int i, chunks; 367 368 /* allocate the array to hold the software ring */ 369 ring = kcalloc(total_descs, sizeof(*ring), flags); 370 if (!ring) 371 return NULL; 372 373 ioat_chan->desc_chunks = chunks = (total_descs * IOAT_DESC_SZ) / SZ_2M; 374 375 for (i = 0; i < chunks; i++) { 376 struct ioat_descs *descs = &ioat_chan->descs[i]; 377 378 descs->virt = dma_alloc_coherent(to_dev(ioat_chan), 379 SZ_2M, &descs->hw, flags); 380 if (!descs->virt && (i > 0)) { 381 int idx; 382 383 for (idx = 0; idx < i; idx++) { 384 dma_free_coherent(to_dev(ioat_chan), SZ_2M, 385 descs->virt, descs->hw); 386 descs->virt = NULL; 387 descs->hw = 0; 388 } 389 390 ioat_chan->desc_chunks = 0; 391 kfree(ring); 392 return NULL; 393 } 394 } 395 396 for (i = 0; i < total_descs; i++) { 397 ring[i] = ioat_alloc_ring_ent(c, i, flags); 398 if (!ring[i]) { 399 int idx; 400 401 while (i--) 402 ioat_free_ring_ent(ring[i], c); 403 404 for (idx = 0; idx < ioat_chan->desc_chunks; idx++) { 405 dma_free_coherent(to_dev(ioat_chan), 406 SZ_2M, 407 ioat_chan->descs[idx].virt, 408 ioat_chan->descs[idx].hw); 409 ioat_chan->descs[idx].virt = NULL; 410 ioat_chan->descs[idx].hw = 0; 411 } 412 413 ioat_chan->desc_chunks = 0; 414 kfree(ring); 415 return NULL; 416 } 417 set_desc_id(ring[i], i); 418 } 419 420 /* link descs */ 421 for (i = 0; i < total_descs-1; i++) { 422 struct ioat_ring_ent *next = ring[i+1]; 423 struct ioat_dma_descriptor *hw = ring[i]->hw; 424 425 hw->next = next->txd.phys; 426 } 427 ring[i]->hw->next = ring[0]->txd.phys; 428 429 /* setup descriptor pre-fetching for v3.4 */ 430 if (ioat_dma->cap & IOAT_CAP_DPS) { 431 u16 drsctl = IOAT_CHAN_DRSZ_2MB | IOAT_CHAN_DRS_EN; 432 433 if (chunks == 1) 434 drsctl |= IOAT_CHAN_DRS_AUTOWRAP; 435 436 writew(drsctl, ioat_chan->reg_base + IOAT_CHAN_DRSCTL_OFFSET); 437 438 } 439 440 return ring; 441 } 442 443 /** 444 * ioat_check_space_lock - verify space and grab ring producer lock 445 * @ioat: ioat,3 channel (ring) to operate on 446 * @num_descs: allocation length 447 */ 448 int ioat_check_space_lock(struct ioatdma_chan *ioat_chan, int num_descs) 449 __acquires(&ioat_chan->prep_lock) 450 { 451 spin_lock_bh(&ioat_chan->prep_lock); 452 /* never allow the last descriptor to be consumed, we need at 453 * least one free at all times to allow for on-the-fly ring 454 * resizing. 455 */ 456 if (likely(ioat_ring_space(ioat_chan) > num_descs)) { 457 dev_dbg(to_dev(ioat_chan), "%s: num_descs: %d (%x:%x:%x)\n", 458 __func__, num_descs, ioat_chan->head, 459 ioat_chan->tail, ioat_chan->issued); 460 ioat_chan->produce = num_descs; 461 return 0; /* with ioat->prep_lock held */ 462 } 463 spin_unlock_bh(&ioat_chan->prep_lock); 464 465 dev_dbg_ratelimited(to_dev(ioat_chan), 466 "%s: ring full! num_descs: %d (%x:%x:%x)\n", 467 __func__, num_descs, ioat_chan->head, 468 ioat_chan->tail, ioat_chan->issued); 469 470 /* progress reclaim in the allocation failure case we may be 471 * called under bh_disabled so we need to trigger the timer 472 * event directly 473 */ 474 if (time_is_before_jiffies(ioat_chan->timer.expires) 475 && timer_pending(&ioat_chan->timer)) { 476 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 477 ioat_timer_event(&ioat_chan->timer); 478 } 479 480 return -ENOMEM; 481 } 482 483 static bool desc_has_ext(struct ioat_ring_ent *desc) 484 { 485 struct ioat_dma_descriptor *hw = desc->hw; 486 487 if (hw->ctl_f.op == IOAT_OP_XOR || 488 hw->ctl_f.op == IOAT_OP_XOR_VAL) { 489 struct ioat_xor_descriptor *xor = desc->xor; 490 491 if (src_cnt_to_sw(xor->ctl_f.src_cnt) > 5) 492 return true; 493 } else if (hw->ctl_f.op == IOAT_OP_PQ || 494 hw->ctl_f.op == IOAT_OP_PQ_VAL) { 495 struct ioat_pq_descriptor *pq = desc->pq; 496 497 if (src_cnt_to_sw(pq->ctl_f.src_cnt) > 3) 498 return true; 499 } 500 501 return false; 502 } 503 504 static void 505 ioat_free_sed(struct ioatdma_device *ioat_dma, struct ioat_sed_ent *sed) 506 { 507 if (!sed) 508 return; 509 510 dma_pool_free(ioat_dma->sed_hw_pool[sed->hw_pool], sed->hw, sed->dma); 511 kmem_cache_free(ioat_sed_cache, sed); 512 } 513 514 static u64 ioat_get_current_completion(struct ioatdma_chan *ioat_chan) 515 { 516 u64 phys_complete; 517 u64 completion; 518 519 completion = *ioat_chan->completion; 520 phys_complete = ioat_chansts_to_addr(completion); 521 522 dev_dbg(to_dev(ioat_chan), "%s: phys_complete: %#llx\n", __func__, 523 (unsigned long long) phys_complete); 524 525 return phys_complete; 526 } 527 528 static bool ioat_cleanup_preamble(struct ioatdma_chan *ioat_chan, 529 u64 *phys_complete) 530 { 531 *phys_complete = ioat_get_current_completion(ioat_chan); 532 if (*phys_complete == ioat_chan->last_completion) 533 return false; 534 535 clear_bit(IOAT_COMPLETION_ACK, &ioat_chan->state); 536 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 537 538 return true; 539 } 540 541 static void 542 desc_get_errstat(struct ioatdma_chan *ioat_chan, struct ioat_ring_ent *desc) 543 { 544 struct ioat_dma_descriptor *hw = desc->hw; 545 546 switch (hw->ctl_f.op) { 547 case IOAT_OP_PQ_VAL: 548 case IOAT_OP_PQ_VAL_16S: 549 { 550 struct ioat_pq_descriptor *pq = desc->pq; 551 552 /* check if there's error written */ 553 if (!pq->dwbes_f.wbes) 554 return; 555 556 /* need to set a chanerr var for checking to clear later */ 557 558 if (pq->dwbes_f.p_val_err) 559 *desc->result |= SUM_CHECK_P_RESULT; 560 561 if (pq->dwbes_f.q_val_err) 562 *desc->result |= SUM_CHECK_Q_RESULT; 563 564 return; 565 } 566 default: 567 return; 568 } 569 } 570 571 /** 572 * __cleanup - reclaim used descriptors 573 * @ioat: channel (ring) to clean 574 */ 575 static void __cleanup(struct ioatdma_chan *ioat_chan, dma_addr_t phys_complete) 576 { 577 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 578 struct ioat_ring_ent *desc; 579 bool seen_current = false; 580 int idx = ioat_chan->tail, i; 581 u16 active; 582 583 dev_dbg(to_dev(ioat_chan), "%s: head: %#x tail: %#x issued: %#x\n", 584 __func__, ioat_chan->head, ioat_chan->tail, ioat_chan->issued); 585 586 /* 587 * At restart of the channel, the completion address and the 588 * channel status will be 0 due to starting a new chain. Since 589 * it's new chain and the first descriptor "fails", there is 590 * nothing to clean up. We do not want to reap the entire submitted 591 * chain due to this 0 address value and then BUG. 592 */ 593 if (!phys_complete) 594 return; 595 596 active = ioat_ring_active(ioat_chan); 597 for (i = 0; i < active && !seen_current; i++) { 598 struct dma_async_tx_descriptor *tx; 599 600 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1)); 601 desc = ioat_get_ring_ent(ioat_chan, idx + i); 602 dump_desc_dbg(ioat_chan, desc); 603 604 /* set err stat if we are using dwbes */ 605 if (ioat_dma->cap & IOAT_CAP_DWBES) 606 desc_get_errstat(ioat_chan, desc); 607 608 tx = &desc->txd; 609 if (tx->cookie) { 610 dma_cookie_complete(tx); 611 dma_descriptor_unmap(tx); 612 dmaengine_desc_get_callback_invoke(tx, NULL); 613 tx->callback = NULL; 614 tx->callback_result = NULL; 615 } 616 617 if (tx->phys == phys_complete) 618 seen_current = true; 619 620 /* skip extended descriptors */ 621 if (desc_has_ext(desc)) { 622 BUG_ON(i + 1 >= active); 623 i++; 624 } 625 626 /* cleanup super extended descriptors */ 627 if (desc->sed) { 628 ioat_free_sed(ioat_dma, desc->sed); 629 desc->sed = NULL; 630 } 631 } 632 633 /* finish all descriptor reads before incrementing tail */ 634 smp_mb(); 635 ioat_chan->tail = idx + i; 636 /* no active descs have written a completion? */ 637 BUG_ON(active && !seen_current); 638 ioat_chan->last_completion = phys_complete; 639 640 if (active - i == 0) { 641 dev_dbg(to_dev(ioat_chan), "%s: cancel completion timeout\n", 642 __func__); 643 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT); 644 } 645 646 /* microsecond delay by sysfs variable per pending descriptor */ 647 if (ioat_chan->intr_coalesce != ioat_chan->prev_intr_coalesce) { 648 writew(min((ioat_chan->intr_coalesce * (active - i)), 649 IOAT_INTRDELAY_MASK), 650 ioat_chan->ioat_dma->reg_base + IOAT_INTRDELAY_OFFSET); 651 ioat_chan->prev_intr_coalesce = ioat_chan->intr_coalesce; 652 } 653 } 654 655 static void ioat_cleanup(struct ioatdma_chan *ioat_chan) 656 { 657 u64 phys_complete; 658 659 spin_lock_bh(&ioat_chan->cleanup_lock); 660 661 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 662 __cleanup(ioat_chan, phys_complete); 663 664 if (is_ioat_halted(*ioat_chan->completion)) { 665 u32 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 666 667 if (chanerr & 668 (IOAT_CHANERR_HANDLE_MASK | IOAT_CHANERR_RECOVER_MASK)) { 669 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT); 670 ioat_eh(ioat_chan); 671 } 672 } 673 674 spin_unlock_bh(&ioat_chan->cleanup_lock); 675 } 676 677 void ioat_cleanup_event(unsigned long data) 678 { 679 struct ioatdma_chan *ioat_chan = to_ioat_chan((void *)data); 680 681 ioat_cleanup(ioat_chan); 682 if (!test_bit(IOAT_RUN, &ioat_chan->state)) 683 return; 684 writew(IOAT_CHANCTRL_RUN, ioat_chan->reg_base + IOAT_CHANCTRL_OFFSET); 685 } 686 687 static void ioat_restart_channel(struct ioatdma_chan *ioat_chan) 688 { 689 u64 phys_complete; 690 691 /* set the completion address register again */ 692 writel(lower_32_bits(ioat_chan->completion_dma), 693 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_LOW); 694 writel(upper_32_bits(ioat_chan->completion_dma), 695 ioat_chan->reg_base + IOAT_CHANCMP_OFFSET_HIGH); 696 697 ioat_quiesce(ioat_chan, 0); 698 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 699 __cleanup(ioat_chan, phys_complete); 700 701 __ioat_restart_chan(ioat_chan); 702 } 703 704 705 static void ioat_abort_descs(struct ioatdma_chan *ioat_chan) 706 { 707 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 708 struct ioat_ring_ent *desc; 709 u16 active; 710 int idx = ioat_chan->tail, i; 711 712 /* 713 * We assume that the failed descriptor has been processed. 714 * Now we are just returning all the remaining submitted 715 * descriptors to abort. 716 */ 717 active = ioat_ring_active(ioat_chan); 718 719 /* we skip the failed descriptor that tail points to */ 720 for (i = 1; i < active; i++) { 721 struct dma_async_tx_descriptor *tx; 722 723 prefetch(ioat_get_ring_ent(ioat_chan, idx + i + 1)); 724 desc = ioat_get_ring_ent(ioat_chan, idx + i); 725 726 tx = &desc->txd; 727 if (tx->cookie) { 728 struct dmaengine_result res; 729 730 dma_cookie_complete(tx); 731 dma_descriptor_unmap(tx); 732 res.result = DMA_TRANS_ABORTED; 733 dmaengine_desc_get_callback_invoke(tx, &res); 734 tx->callback = NULL; 735 tx->callback_result = NULL; 736 } 737 738 /* skip extended descriptors */ 739 if (desc_has_ext(desc)) { 740 WARN_ON(i + 1 >= active); 741 i++; 742 } 743 744 /* cleanup super extended descriptors */ 745 if (desc->sed) { 746 ioat_free_sed(ioat_dma, desc->sed); 747 desc->sed = NULL; 748 } 749 } 750 751 smp_mb(); /* finish all descriptor reads before incrementing tail */ 752 ioat_chan->tail = idx + active; 753 754 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail); 755 ioat_chan->last_completion = *ioat_chan->completion = desc->txd.phys; 756 } 757 758 static void ioat_eh(struct ioatdma_chan *ioat_chan) 759 { 760 struct pci_dev *pdev = to_pdev(ioat_chan); 761 struct ioat_dma_descriptor *hw; 762 struct dma_async_tx_descriptor *tx; 763 u64 phys_complete; 764 struct ioat_ring_ent *desc; 765 u32 err_handled = 0; 766 u32 chanerr_int; 767 u32 chanerr; 768 bool abort = false; 769 struct dmaengine_result res; 770 771 /* cleanup so tail points to descriptor that caused the error */ 772 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 773 __cleanup(ioat_chan, phys_complete); 774 775 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 776 pci_read_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, &chanerr_int); 777 778 dev_dbg(to_dev(ioat_chan), "%s: error = %x:%x\n", 779 __func__, chanerr, chanerr_int); 780 781 desc = ioat_get_ring_ent(ioat_chan, ioat_chan->tail); 782 hw = desc->hw; 783 dump_desc_dbg(ioat_chan, desc); 784 785 switch (hw->ctl_f.op) { 786 case IOAT_OP_XOR_VAL: 787 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) { 788 *desc->result |= SUM_CHECK_P_RESULT; 789 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR; 790 } 791 break; 792 case IOAT_OP_PQ_VAL: 793 case IOAT_OP_PQ_VAL_16S: 794 if (chanerr & IOAT_CHANERR_XOR_P_OR_CRC_ERR) { 795 *desc->result |= SUM_CHECK_P_RESULT; 796 err_handled |= IOAT_CHANERR_XOR_P_OR_CRC_ERR; 797 } 798 if (chanerr & IOAT_CHANERR_XOR_Q_ERR) { 799 *desc->result |= SUM_CHECK_Q_RESULT; 800 err_handled |= IOAT_CHANERR_XOR_Q_ERR; 801 } 802 break; 803 } 804 805 if (chanerr & IOAT_CHANERR_RECOVER_MASK) { 806 if (chanerr & IOAT_CHANERR_READ_DATA_ERR) { 807 res.result = DMA_TRANS_READ_FAILED; 808 err_handled |= IOAT_CHANERR_READ_DATA_ERR; 809 } else if (chanerr & IOAT_CHANERR_WRITE_DATA_ERR) { 810 res.result = DMA_TRANS_WRITE_FAILED; 811 err_handled |= IOAT_CHANERR_WRITE_DATA_ERR; 812 } 813 814 abort = true; 815 } else 816 res.result = DMA_TRANS_NOERROR; 817 818 /* fault on unhandled error or spurious halt */ 819 if (chanerr ^ err_handled || chanerr == 0) { 820 dev_err(to_dev(ioat_chan), "%s: fatal error (%x:%x)\n", 821 __func__, chanerr, err_handled); 822 dev_err(to_dev(ioat_chan), "Errors handled:\n"); 823 ioat_print_chanerrs(ioat_chan, err_handled); 824 dev_err(to_dev(ioat_chan), "Errors not handled:\n"); 825 ioat_print_chanerrs(ioat_chan, (chanerr & ~err_handled)); 826 827 BUG(); 828 } 829 830 /* cleanup the faulty descriptor since we are continuing */ 831 tx = &desc->txd; 832 if (tx->cookie) { 833 dma_cookie_complete(tx); 834 dma_descriptor_unmap(tx); 835 dmaengine_desc_get_callback_invoke(tx, &res); 836 tx->callback = NULL; 837 tx->callback_result = NULL; 838 } 839 840 /* mark faulting descriptor as complete */ 841 *ioat_chan->completion = desc->txd.phys; 842 843 spin_lock_bh(&ioat_chan->prep_lock); 844 /* we need abort all descriptors */ 845 if (abort) { 846 ioat_abort_descs(ioat_chan); 847 /* clean up the channel, we could be in weird state */ 848 ioat_reset_hw(ioat_chan); 849 } 850 851 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 852 pci_write_config_dword(pdev, IOAT_PCI_CHANERR_INT_OFFSET, chanerr_int); 853 854 ioat_restart_channel(ioat_chan); 855 spin_unlock_bh(&ioat_chan->prep_lock); 856 } 857 858 static void check_active(struct ioatdma_chan *ioat_chan) 859 { 860 if (ioat_ring_active(ioat_chan)) { 861 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 862 return; 863 } 864 865 if (test_and_clear_bit(IOAT_CHAN_ACTIVE, &ioat_chan->state)) 866 mod_timer(&ioat_chan->timer, jiffies + IDLE_TIMEOUT); 867 } 868 869 void ioat_timer_event(struct timer_list *t) 870 { 871 struct ioatdma_chan *ioat_chan = from_timer(ioat_chan, t, timer); 872 dma_addr_t phys_complete; 873 u64 status; 874 875 status = ioat_chansts(ioat_chan); 876 877 /* when halted due to errors check for channel 878 * programming errors before advancing the completion state 879 */ 880 if (is_ioat_halted(status)) { 881 u32 chanerr; 882 883 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 884 dev_err(to_dev(ioat_chan), "%s: Channel halted (%x)\n", 885 __func__, chanerr); 886 dev_err(to_dev(ioat_chan), "Errors:\n"); 887 ioat_print_chanerrs(ioat_chan, chanerr); 888 889 if (test_bit(IOAT_RUN, &ioat_chan->state)) { 890 spin_lock_bh(&ioat_chan->cleanup_lock); 891 spin_lock_bh(&ioat_chan->prep_lock); 892 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 893 spin_unlock_bh(&ioat_chan->prep_lock); 894 895 ioat_abort_descs(ioat_chan); 896 dev_warn(to_dev(ioat_chan), "Reset channel...\n"); 897 ioat_reset_hw(ioat_chan); 898 dev_warn(to_dev(ioat_chan), "Restart channel...\n"); 899 ioat_restart_channel(ioat_chan); 900 901 spin_lock_bh(&ioat_chan->prep_lock); 902 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 903 spin_unlock_bh(&ioat_chan->prep_lock); 904 spin_unlock_bh(&ioat_chan->cleanup_lock); 905 } 906 907 return; 908 } 909 910 spin_lock_bh(&ioat_chan->cleanup_lock); 911 912 /* handle the no-actives case */ 913 if (!ioat_ring_active(ioat_chan)) { 914 spin_lock_bh(&ioat_chan->prep_lock); 915 check_active(ioat_chan); 916 spin_unlock_bh(&ioat_chan->prep_lock); 917 spin_unlock_bh(&ioat_chan->cleanup_lock); 918 return; 919 } 920 921 /* if we haven't made progress and we have already 922 * acknowledged a pending completion once, then be more 923 * forceful with a restart 924 */ 925 if (ioat_cleanup_preamble(ioat_chan, &phys_complete)) 926 __cleanup(ioat_chan, phys_complete); 927 else if (test_bit(IOAT_COMPLETION_ACK, &ioat_chan->state)) { 928 u32 chanerr; 929 930 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 931 dev_err(to_dev(ioat_chan), "CHANSTS: %#Lx CHANERR: %#x\n", 932 status, chanerr); 933 dev_err(to_dev(ioat_chan), "Errors:\n"); 934 ioat_print_chanerrs(ioat_chan, chanerr); 935 936 dev_dbg(to_dev(ioat_chan), "Active descriptors: %d\n", 937 ioat_ring_active(ioat_chan)); 938 939 spin_lock_bh(&ioat_chan->prep_lock); 940 set_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 941 spin_unlock_bh(&ioat_chan->prep_lock); 942 943 ioat_abort_descs(ioat_chan); 944 dev_warn(to_dev(ioat_chan), "Resetting channel...\n"); 945 ioat_reset_hw(ioat_chan); 946 dev_warn(to_dev(ioat_chan), "Restarting channel...\n"); 947 ioat_restart_channel(ioat_chan); 948 949 spin_lock_bh(&ioat_chan->prep_lock); 950 clear_bit(IOAT_CHAN_DOWN, &ioat_chan->state); 951 spin_unlock_bh(&ioat_chan->prep_lock); 952 spin_unlock_bh(&ioat_chan->cleanup_lock); 953 return; 954 } else 955 set_bit(IOAT_COMPLETION_ACK, &ioat_chan->state); 956 957 mod_timer(&ioat_chan->timer, jiffies + COMPLETION_TIMEOUT); 958 spin_unlock_bh(&ioat_chan->cleanup_lock); 959 } 960 961 enum dma_status 962 ioat_tx_status(struct dma_chan *c, dma_cookie_t cookie, 963 struct dma_tx_state *txstate) 964 { 965 struct ioatdma_chan *ioat_chan = to_ioat_chan(c); 966 enum dma_status ret; 967 968 ret = dma_cookie_status(c, cookie, txstate); 969 if (ret == DMA_COMPLETE) 970 return ret; 971 972 ioat_cleanup(ioat_chan); 973 974 return dma_cookie_status(c, cookie, txstate); 975 } 976 977 int ioat_reset_hw(struct ioatdma_chan *ioat_chan) 978 { 979 /* throw away whatever the channel was doing and get it 980 * initialized, with ioat3 specific workarounds 981 */ 982 struct ioatdma_device *ioat_dma = ioat_chan->ioat_dma; 983 struct pci_dev *pdev = ioat_dma->pdev; 984 u32 chanerr; 985 u16 dev_id; 986 int err; 987 988 ioat_quiesce(ioat_chan, msecs_to_jiffies(100)); 989 990 chanerr = readl(ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 991 writel(chanerr, ioat_chan->reg_base + IOAT_CHANERR_OFFSET); 992 993 if (ioat_dma->version < IOAT_VER_3_3) { 994 /* clear any pending errors */ 995 err = pci_read_config_dword(pdev, 996 IOAT_PCI_CHANERR_INT_OFFSET, &chanerr); 997 if (err) { 998 dev_err(&pdev->dev, 999 "channel error register unreachable\n"); 1000 return err; 1001 } 1002 pci_write_config_dword(pdev, 1003 IOAT_PCI_CHANERR_INT_OFFSET, chanerr); 1004 1005 /* Clear DMAUNCERRSTS Cfg-Reg Parity Error status bit 1006 * (workaround for spurious config parity error after restart) 1007 */ 1008 pci_read_config_word(pdev, IOAT_PCI_DEVICE_ID_OFFSET, &dev_id); 1009 if (dev_id == PCI_DEVICE_ID_INTEL_IOAT_TBG0) { 1010 pci_write_config_dword(pdev, 1011 IOAT_PCI_DMAUNCERRSTS_OFFSET, 1012 0x10); 1013 } 1014 } 1015 1016 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) { 1017 ioat_dma->msixtba0 = readq(ioat_dma->reg_base + 0x1000); 1018 ioat_dma->msixdata0 = readq(ioat_dma->reg_base + 0x1008); 1019 ioat_dma->msixpba = readq(ioat_dma->reg_base + 0x1800); 1020 } 1021 1022 1023 err = ioat_reset_sync(ioat_chan, msecs_to_jiffies(200)); 1024 if (!err) { 1025 if (is_bwd_ioat(pdev) && (ioat_dma->irq_mode == IOAT_MSIX)) { 1026 writeq(ioat_dma->msixtba0, ioat_dma->reg_base + 0x1000); 1027 writeq(ioat_dma->msixdata0, ioat_dma->reg_base + 0x1008); 1028 writeq(ioat_dma->msixpba, ioat_dma->reg_base + 0x1800); 1029 } 1030 } 1031 1032 if (err) 1033 dev_err(&pdev->dev, "Failed to reset: %d\n", err); 1034 1035 return err; 1036 } 1037