1 /* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License (the "License"). 6 * You may not use this file except in compliance with the License. 7 * 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9 * or http://www.opensolaris.org/os/licensing. 10 * See the License for the specific language governing permissions 11 * and limitations under the License. 12 * 13 * When distributing Covered Code, include this CDDL HEADER in each 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15 * If applicable, add the following below this CDDL HEADER, with the 16 * fields enclosed by brackets "[]" replaced with your own identifying 17 * information: Portions Copyright [yyyy] [name of copyright owner] 18 * 19 * CDDL HEADER END 20 */ 21 /* 22 * Copyright 2010 Sun Microsystems, Inc. All rights reserved. 23 * Use is subject to license terms. 24 */ 25 26 /* 27 * PX Fault Management Architecture 28 */ 29 #include <sys/types.h> 30 #include <sys/sunndi.h> 31 #include <sys/sunddi.h> 32 #include <sys/fm/protocol.h> 33 #include <sys/fm/util.h> 34 #include <sys/fm/io/pci.h> 35 #include <sys/membar.h> 36 #include "px_obj.h" 37 38 extern uint_t px_ranges_phi_mask; 39 40 #define PX_PCIE_PANIC_BITS \ 41 (PCIE_AER_UCE_DLP | PCIE_AER_UCE_FCP | PCIE_AER_UCE_TO | \ 42 PCIE_AER_UCE_RO | PCIE_AER_UCE_MTLP | PCIE_AER_UCE_ECRC) 43 #define PX_PCIE_NO_PANIC_BITS \ 44 (PCIE_AER_UCE_TRAINING | PCIE_AER_UCE_SD | PCIE_AER_UCE_CA | \ 45 PCIE_AER_UCE_UC | PCIE_AER_UCE_UR) 46 47 /* 48 * Global panicing state variabled used to control if further error handling 49 * should occur. If the system is already panic'ing or if PX itself has 50 * recommended panic'ing the system, no further error handling should occur to 51 * prevent the system from hanging. 52 */ 53 boolean_t px_panicing = B_FALSE; 54 55 static pf_data_t *px_get_pfd(px_t *px_p); 56 57 static int px_pcie_ptlp(dev_info_t *dip, ddi_fm_error_t *derr, 58 px_err_pcie_t *regs); 59 60 #if defined(DEBUG) 61 static void px_pcie_log(dev_info_t *dip, px_err_pcie_t *regs); 62 #else /* DEBUG */ 63 #define px_pcie_log 0 && 64 #endif /* DEBUG */ 65 66 /* 67 * Initialize px FMA support 68 */ 69 int 70 px_fm_attach(px_t *px_p) 71 { 72 int i; 73 dev_info_t *dip = px_p->px_dip; 74 pcie_bus_t *bus_p; 75 76 px_p->px_fm_cap = DDI_FM_EREPORT_CAPABLE | DDI_FM_ERRCB_CAPABLE | 77 DDI_FM_ACCCHK_CAPABLE | DDI_FM_DMACHK_CAPABLE; 78 79 /* 80 * check parents' capability 81 */ 82 ddi_fm_init(dip, &px_p->px_fm_cap, &px_p->px_fm_ibc); 83 84 /* 85 * parents need to be ereport and error handling capable 86 */ 87 ASSERT(px_p->px_fm_cap && 88 (DDI_FM_ERRCB_CAPABLE | DDI_FM_EREPORT_CAPABLE)); 89 90 /* 91 * Initialize lock to synchronize fabric error handling 92 */ 93 mutex_init(&px_p->px_fm_mutex, NULL, MUTEX_DRIVER, 94 (void *)px_p->px_fm_ibc); 95 96 px_p->px_pfd_idx = 0; 97 for (i = 0; i < 5; i++) 98 pcie_rc_init_pfd(dip, &px_p->px_pfd_arr[i]); 99 PCIE_DIP2PFD(dip) = px_p->px_pfd_arr; 100 101 bus_p = PCIE_DIP2BUS(dip); 102 bus_p->bus_rp_bdf = px_p->px_bdf; 103 bus_p->bus_rp_dip = dip; 104 105 /* 106 * register error callback in parent 107 */ 108 ddi_fm_handler_register(dip, px_fm_callback, px_p); 109 110 return (DDI_SUCCESS); 111 } 112 113 /* 114 * Deregister FMA 115 */ 116 void 117 px_fm_detach(px_t *px_p) 118 { 119 int i; 120 121 ddi_fm_handler_unregister(px_p->px_dip); 122 mutex_destroy(&px_p->px_fm_mutex); 123 ddi_fm_fini(px_p->px_dip); 124 for (i = 0; i < 5; i++) 125 pcie_rc_fini_pfd(&px_p->px_pfd_arr[i]); 126 } 127 128 /* 129 * Function used to setup access functions depending on level of desired 130 * protection. 131 */ 132 void 133 px_fm_acc_setup(ddi_map_req_t *mp, dev_info_t *rdip, pci_regspec_t *rp) 134 { 135 uchar_t fflag; 136 ndi_err_t *errp; 137 ddi_acc_hdl_t *hp; 138 ddi_acc_impl_t *ap; 139 140 hp = mp->map_handlep; 141 ap = (ddi_acc_impl_t *)hp->ah_platform_private; 142 fflag = ap->ahi_common.ah_acc.devacc_attr_access; 143 144 if (mp->map_op == DDI_MO_MAP_LOCKED) { 145 ndi_fmc_insert(rdip, ACC_HANDLE, (void *)hp, NULL); 146 switch (fflag) { 147 case DDI_FLAGERR_ACC: 148 ap->ahi_get8 = i_ddi_prot_get8; 149 ap->ahi_get16 = i_ddi_prot_get16; 150 ap->ahi_get32 = i_ddi_prot_get32; 151 ap->ahi_get64 = i_ddi_prot_get64; 152 ap->ahi_put8 = i_ddi_prot_put8; 153 ap->ahi_put16 = i_ddi_prot_put16; 154 ap->ahi_put32 = i_ddi_prot_put32; 155 ap->ahi_put64 = i_ddi_prot_put64; 156 ap->ahi_rep_get8 = i_ddi_prot_rep_get8; 157 ap->ahi_rep_get16 = i_ddi_prot_rep_get16; 158 ap->ahi_rep_get32 = i_ddi_prot_rep_get32; 159 ap->ahi_rep_get64 = i_ddi_prot_rep_get64; 160 ap->ahi_rep_put8 = i_ddi_prot_rep_put8; 161 ap->ahi_rep_put16 = i_ddi_prot_rep_put16; 162 ap->ahi_rep_put32 = i_ddi_prot_rep_put32; 163 ap->ahi_rep_put64 = i_ddi_prot_rep_put64; 164 impl_acc_err_init(hp); 165 errp = ((ddi_acc_impl_t *)hp)->ahi_err; 166 if ((rp->pci_phys_hi & PCI_REG_ADDR_M) == 167 PCI_ADDR_CONFIG) 168 errp->err_cf = px_err_cfg_hdl_check; 169 else 170 errp->err_cf = px_err_pio_hdl_check; 171 break; 172 case DDI_CAUTIOUS_ACC : 173 ap->ahi_get8 = i_ddi_caut_get8; 174 ap->ahi_get16 = i_ddi_caut_get16; 175 ap->ahi_get32 = i_ddi_caut_get32; 176 ap->ahi_get64 = i_ddi_caut_get64; 177 ap->ahi_put8 = i_ddi_caut_put8; 178 ap->ahi_put16 = i_ddi_caut_put16; 179 ap->ahi_put32 = i_ddi_caut_put32; 180 ap->ahi_put64 = i_ddi_caut_put64; 181 ap->ahi_rep_get8 = i_ddi_caut_rep_get8; 182 ap->ahi_rep_get16 = i_ddi_caut_rep_get16; 183 ap->ahi_rep_get32 = i_ddi_caut_rep_get32; 184 ap->ahi_rep_get64 = i_ddi_caut_rep_get64; 185 ap->ahi_rep_put8 = i_ddi_caut_rep_put8; 186 ap->ahi_rep_put16 = i_ddi_caut_rep_put16; 187 ap->ahi_rep_put32 = i_ddi_caut_rep_put32; 188 ap->ahi_rep_put64 = i_ddi_caut_rep_put64; 189 impl_acc_err_init(hp); 190 errp = ((ddi_acc_impl_t *)hp)->ahi_err; 191 if ((rp->pci_phys_hi & PCI_REG_ADDR_M) == 192 PCI_ADDR_CONFIG) 193 errp->err_cf = px_err_cfg_hdl_check; 194 else 195 errp->err_cf = px_err_pio_hdl_check; 196 break; 197 default: 198 /* Illegal state, remove the handle from cache */ 199 ndi_fmc_remove(rdip, ACC_HANDLE, (void *)hp); 200 break; 201 } 202 } else if (mp->map_op == DDI_MO_UNMAP) { 203 ndi_fmc_remove(rdip, ACC_HANDLE, (void *)hp); 204 } 205 } 206 207 /* 208 * Function used to initialize FMA for our children nodes. Called 209 * through pci busops when child node calls ddi_fm_init. 210 */ 211 /*ARGSUSED*/ 212 int 213 px_fm_init_child(dev_info_t *dip, dev_info_t *cdip, int cap, 214 ddi_iblock_cookie_t *ibc_p) 215 { 216 px_t *px_p = DIP_TO_STATE(dip); 217 218 ASSERT(ibc_p != NULL); 219 *ibc_p = px_p->px_fm_ibc; 220 221 return (px_p->px_fm_cap); 222 } 223 224 /* 225 * lock access for exclusive PCIe access 226 */ 227 void 228 px_bus_enter(dev_info_t *dip, ddi_acc_handle_t handle) 229 { 230 px_pec_t *pec_p = ((px_t *)DIP_TO_STATE(dip))->px_pec_p; 231 232 /* 233 * Exclusive access has been used for cautious put/get, 234 * Both utilize i_ddi_ontrap which, on sparcv9, implements 235 * similar protection as what on_trap() does, and which calls 236 * membar #Sync to flush out all cpu deferred errors 237 * prior to get/put operation, so here we're not calling 238 * membar #Sync - a difference from what's in pci_bus_enter(). 239 */ 240 mutex_enter(&pec_p->pec_pokefault_mutex); 241 pec_p->pec_acc_hdl = handle; 242 } 243 244 /* 245 * unlock access for exclusive PCIe access 246 */ 247 /* ARGSUSED */ 248 void 249 px_bus_exit(dev_info_t *dip, ddi_acc_handle_t handle) 250 { 251 px_t *px_p = DIP_TO_STATE(dip); 252 px_pec_t *pec_p = px_p->px_pec_p; 253 254 pec_p->pec_acc_hdl = NULL; 255 mutex_exit(&pec_p->pec_pokefault_mutex); 256 } 257 258 static uint64_t 259 px_in_addr_range(dev_info_t *dip, pci_ranges_t *ranges_p, uint64_t addr) 260 { 261 uint64_t addr_low, addr_high; 262 263 addr_low = (uint64_t)(ranges_p->parent_high & px_ranges_phi_mask) << 32; 264 addr_low |= (uint64_t)ranges_p->parent_low; 265 addr_high = addr_low + ((uint64_t)ranges_p->size_high << 32) + 266 (uint64_t)ranges_p->size_low; 267 268 DBG(DBG_ERR_INTR, dip, "Addr: 0x%llx high: 0x%llx low: 0x%llx\n", 269 addr, addr_high, addr_low); 270 271 if ((addr < addr_high) && (addr >= addr_low)) 272 return (addr_low); 273 274 return (0); 275 } 276 277 /* 278 * PCI error callback which is registered with our parent to call 279 * for PCIe logging when the CPU traps due to PCIe Uncorrectable Errors 280 * and PCI BERR/TO/UE on IO Loads. 281 */ 282 /*ARGSUSED*/ 283 int 284 px_fm_callback(dev_info_t *dip, ddi_fm_error_t *derr, const void *impl_data) 285 { 286 dev_info_t *pdip = ddi_get_parent(dip); 287 px_t *px_p = (px_t *)impl_data; 288 int i, acc_type = 0; 289 int lookup, rc_err, fab_err; 290 uint64_t addr, base_addr; 291 uint64_t fault_addr = (uint64_t)derr->fme_bus_specific; 292 pcie_req_id_t bdf = PCIE_INVALID_BDF; 293 pci_ranges_t *ranges_p; 294 int range_len; 295 296 /* 297 * If the current thread already owns the px_fm_mutex, then we 298 * have encountered an error while processing a previous 299 * error. Attempting to take the mutex again will cause the 300 * system to deadlock. 301 */ 302 if (px_p->px_fm_mutex_owner == curthread) 303 return (DDI_FM_FATAL); 304 305 i_ddi_fm_handler_exit(pdip); 306 if (px_fm_enter(px_p) != DDI_SUCCESS) { 307 i_ddi_fm_handler_enter(pdip); 308 return (DDI_FM_FATAL); 309 } 310 311 /* 312 * Make sure this failed load came from this PCIe port. Check by 313 * matching the upper 32 bits of the address with the ranges property. 314 */ 315 range_len = px_p->px_ranges_length / sizeof (pci_ranges_t); 316 i = 0; 317 for (ranges_p = px_p->px_ranges_p; i < range_len; i++, ranges_p++) { 318 base_addr = px_in_addr_range(dip, ranges_p, fault_addr); 319 if (base_addr) { 320 switch (ranges_p->child_high & PCI_ADDR_MASK) { 321 case PCI_ADDR_CONFIG: 322 acc_type = PF_ADDR_CFG; 323 addr = NULL; 324 bdf = (pcie_req_id_t)((fault_addr >> 12) & 325 0xFFFF); 326 break; 327 case PCI_ADDR_IO: 328 case PCI_ADDR_MEM64: 329 case PCI_ADDR_MEM32: 330 acc_type = PF_ADDR_PIO; 331 addr = fault_addr - base_addr; 332 bdf = PCIE_INVALID_BDF; 333 break; 334 } 335 break; 336 } 337 } 338 339 /* This address doesn't belong to this leaf, just return with OK */ 340 if (!acc_type) { 341 px_fm_exit(px_p); 342 i_ddi_fm_handler_enter(pdip); 343 return (DDI_FM_OK); 344 } 345 346 rc_err = px_err_cmn_intr(px_p, derr, PX_TRAP_CALL, PX_FM_BLOCK_ALL); 347 lookup = pf_hdl_lookup(dip, derr->fme_ena, acc_type, (uint64_t)addr, 348 bdf); 349 350 px_rp_en_q(px_p, bdf, addr, 351 (PCI_STAT_R_MAST_AB | PCI_STAT_R_TARG_AB)); 352 353 fab_err = px_scan_fabric(px_p, dip, derr); 354 355 px_fm_exit(px_p); 356 i_ddi_fm_handler_enter(pdip); 357 358 if (!px_die) 359 return (DDI_FM_OK); 360 361 if ((rc_err & (PX_PANIC | PX_PROTECTED)) || 362 (fab_err & PF_ERR_FATAL_FLAGS) || 363 (lookup == PF_HDL_NOTFOUND)) 364 return (DDI_FM_FATAL); 365 else if ((rc_err == PX_NO_ERROR) && (fab_err == PF_ERR_NO_ERROR)) 366 return (DDI_FM_OK); 367 368 return (DDI_FM_NONFATAL); 369 } 370 371 /* 372 * px_err_fabric_intr: 373 * Interrupt handler for PCIE fabric block. 374 * o lock 375 * o create derr 376 * o px_err_cmn_intr(leaf, with jbc) 377 * o send ereport(fire fmri, derr, payload = BDF) 378 * o dispatch (leaf) 379 * o unlock 380 * o handle error: fatal? fm_panic() : return INTR_CLAIMED) 381 */ 382 /* ARGSUSED */ 383 uint_t 384 px_err_fabric_intr(px_t *px_p, msgcode_t msg_code, pcie_req_id_t rid) 385 { 386 dev_info_t *rpdip = px_p->px_dip; 387 int rc_err, fab_err; 388 ddi_fm_error_t derr; 389 uint32_t rp_status; 390 uint16_t ce_source, ue_source; 391 392 if (px_fm_enter(px_p) != DDI_SUCCESS) 393 goto done; 394 395 /* Create the derr */ 396 bzero(&derr, sizeof (ddi_fm_error_t)); 397 derr.fme_version = DDI_FME_VERSION; 398 derr.fme_ena = fm_ena_generate(0, FM_ENA_FMT1); 399 derr.fme_flag = DDI_FM_ERR_UNEXPECTED; 400 401 px_err_safeacc_check(px_p, &derr); 402 403 if (msg_code == PCIE_MSG_CODE_ERR_COR) { 404 rp_status = PCIE_AER_RE_STS_CE_RCVD; 405 ce_source = rid; 406 ue_source = 0; 407 } else { 408 rp_status = PCIE_AER_RE_STS_FE_NFE_RCVD; 409 ce_source = 0; 410 ue_source = rid; 411 if (msg_code == PCIE_MSG_CODE_ERR_NONFATAL) 412 rp_status |= PCIE_AER_RE_STS_NFE_MSGS_RCVD; 413 else { 414 rp_status |= PCIE_AER_RE_STS_FE_MSGS_RCVD; 415 rp_status |= PCIE_AER_RE_STS_FIRST_UC_FATAL; 416 } 417 } 418 419 if (derr.fme_flag == DDI_FM_ERR_UNEXPECTED) { 420 ddi_fm_ereport_post(rpdip, PCI_ERROR_SUBCLASS "." PCIEX_FABRIC, 421 derr.fme_ena, 422 DDI_NOSLEEP, FM_VERSION, DATA_TYPE_UINT8, 0, 423 FIRE_PRIMARY, DATA_TYPE_BOOLEAN_VALUE, B_TRUE, 424 "pcie_adv_rp_status", DATA_TYPE_UINT32, rp_status, 425 "pcie_adv_rp_command", DATA_TYPE_UINT32, 0, 426 "pcie_adv_rp_ce_src_id", DATA_TYPE_UINT16, ce_source, 427 "pcie_adv_rp_ue_src_id", DATA_TYPE_UINT16, ue_source, 428 NULL); 429 } 430 431 /* Ensure that the rid of the fabric message will get scanned. */ 432 px_rp_en_q(px_p, rid, NULL, NULL); 433 434 rc_err = px_err_cmn_intr(px_p, &derr, PX_INTR_CALL, PX_FM_BLOCK_PCIE); 435 436 /* call rootport dispatch */ 437 fab_err = px_scan_fabric(px_p, rpdip, &derr); 438 439 px_err_panic(rc_err, PX_RC, fab_err, B_TRUE); 440 px_fm_exit(px_p); 441 px_err_panic(rc_err, PX_RC, fab_err, B_FALSE); 442 443 done: 444 return (DDI_INTR_CLAIMED); 445 } 446 447 /* 448 * px_scan_fabric: 449 * 450 * Check for drain state and if there is anything to scan. 451 */ 452 int 453 px_scan_fabric(px_t *px_p, dev_info_t *rpdip, ddi_fm_error_t *derr) { 454 int fab_err = 0; 455 456 ASSERT(MUTEX_HELD(&px_p->px_fm_mutex)); 457 458 if (!px_lib_is_in_drain_state(px_p) && px_p->px_pfd_idx) { 459 fab_err = pf_scan_fabric(rpdip, derr, px_p->px_pfd_arr); 460 px_p->px_pfd_idx = 0; 461 } 462 463 return (fab_err); 464 } 465 466 /* 467 * px_err_safeacc_check: 468 * Check to see if a peek/poke and cautious access is currently being 469 * done on a particular leaf. 470 * 471 * Safe access reads induced fire errors will be handled by cpu trap handler 472 * which will call px_fm_callback() which calls this function. In that 473 * case, the derr fields will be set by trap handler with the correct values. 474 * 475 * Safe access writes induced errors will be handled by px interrupt 476 * handlers, this function will fill in the derr fields. 477 * 478 * If a cpu trap does occur, it will quiesce all other interrupts allowing 479 * the cpu trap error handling to finish before Fire receives an interrupt. 480 * 481 * If fire does indeed have an error when a cpu trap occurs as a result of 482 * a safe access, a trap followed by a Mondo/Fabric interrupt will occur. 483 * In which case derr will be initialized as "UNEXPECTED" by the interrupt 484 * handler and this function will need to find if this error occured in the 485 * middle of a safe access operation. 486 * 487 * @param px_p leaf in which to check access 488 * @param derr fm err data structure to be updated 489 */ 490 void 491 px_err_safeacc_check(px_t *px_p, ddi_fm_error_t *derr) 492 { 493 px_pec_t *pec_p = px_p->px_pec_p; 494 int acctype = pec_p->pec_safeacc_type; 495 496 ASSERT(MUTEX_HELD(&px_p->px_fm_mutex)); 497 498 if (derr->fme_flag != DDI_FM_ERR_UNEXPECTED) { 499 return; 500 } 501 502 /* safe access checking */ 503 switch (acctype) { 504 case DDI_FM_ERR_EXPECTED: 505 /* 506 * cautious access protection, protected from all err. 507 */ 508 ddi_fm_acc_err_get(pec_p->pec_acc_hdl, derr, 509 DDI_FME_VERSION); 510 derr->fme_flag = acctype; 511 derr->fme_acc_handle = pec_p->pec_acc_hdl; 512 break; 513 case DDI_FM_ERR_POKE: 514 /* 515 * ddi_poke protection, check nexus and children for 516 * expected errors. 517 */ 518 membar_sync(); 519 derr->fme_flag = acctype; 520 break; 521 case DDI_FM_ERR_PEEK: 522 derr->fme_flag = acctype; 523 break; 524 } 525 } 526 527 /* 528 * Suggest panic if any EQ (except CE q) has overflown. 529 */ 530 int 531 px_err_check_eq(dev_info_t *dip) 532 { 533 px_t *px_p = DIP_TO_STATE(dip); 534 px_msiq_state_t *msiq_state_p = &px_p->px_ib_p->ib_msiq_state; 535 px_pec_t *pec_p = px_p->px_pec_p; 536 msiqid_t eq_no = msiq_state_p->msiq_1st_msiq_id; 537 pci_msiq_state_t msiq_state; 538 int i; 539 540 for (i = 0; i < msiq_state_p->msiq_cnt; i++) { 541 if (i + eq_no == pec_p->pec_corr_msg_msiq_id) /* skip CE q */ 542 continue; 543 if ((px_lib_msiq_getstate(dip, i + eq_no, &msiq_state) != 544 DDI_SUCCESS) || msiq_state == PCI_MSIQ_STATE_ERROR) 545 return (PX_PANIC); 546 } 547 return (PX_NO_PANIC); 548 } 549 550 /* ARGSUSED */ 551 int 552 px_err_check_pcie(dev_info_t *dip, ddi_fm_error_t *derr, px_err_pcie_t *regs) 553 { 554 px_t *px_p = DIP_TO_STATE(dip); 555 pf_data_t *pfd_p = px_get_pfd(px_p); 556 int i; 557 pf_pcie_adv_err_regs_t *adv_reg = PCIE_ADV_REG(pfd_p); 558 559 /* 560 * set RC s_status in PCI term to coordinate with downstream fabric 561 * errors ananlysis. 562 */ 563 if (regs->primary_ue & PCIE_AER_UCE_UR) 564 PCI_BDG_ERR_REG(pfd_p)->pci_bdg_sec_stat = PCI_STAT_R_MAST_AB; 565 if (regs->primary_ue & PCIE_AER_UCE_CA) 566 PCI_BDG_ERR_REG(pfd_p)->pci_bdg_sec_stat = PCI_STAT_R_TARG_AB; 567 if (regs->primary_ue & (PCIE_AER_UCE_PTLP | PCIE_AER_UCE_ECRC)) 568 PCI_BDG_ERR_REG(pfd_p)->pci_bdg_sec_stat = PCI_STAT_PERROR; 569 570 if (!regs->primary_ue) 571 goto done; 572 573 adv_reg->pcie_ce_status = regs->ce_reg; 574 adv_reg->pcie_ue_status = regs->ue_reg | regs->primary_ue; 575 PCIE_ADV_HDR(pfd_p, 0) = regs->rx_hdr1; 576 PCIE_ADV_HDR(pfd_p, 1) = regs->rx_hdr2; 577 PCIE_ADV_HDR(pfd_p, 2) = regs->rx_hdr3; 578 PCIE_ADV_HDR(pfd_p, 3) = regs->rx_hdr4; 579 for (i = regs->primary_ue; i != 1; i = i >> 1) 580 adv_reg->pcie_adv_ctl++; 581 582 if (regs->primary_ue & (PCIE_AER_UCE_UR | PCIE_AER_UCE_CA)) { 583 if (pf_tlp_decode(PCIE_DIP2BUS(dip), adv_reg) == DDI_SUCCESS) 584 PCIE_ROOT_FAULT(pfd_p)->scan_bdf = 585 adv_reg->pcie_ue_tgt_bdf; 586 } else if (regs->primary_ue & PCIE_AER_UCE_PTLP) { 587 if (pf_tlp_decode(PCIE_DIP2BUS(dip), adv_reg) == DDI_SUCCESS) { 588 PCIE_ROOT_FAULT(pfd_p)->scan_bdf = 589 adv_reg->pcie_ue_tgt_bdf; 590 if (adv_reg->pcie_ue_tgt_trans == 591 PF_ADDR_PIO) 592 PCIE_ROOT_FAULT(pfd_p)->scan_addr = 593 adv_reg->pcie_ue_tgt_addr; 594 } 595 596 /* 597 * Normally for Poisoned Completion TLPs we can look at the 598 * transmit log header for the original request and the original 599 * address, however this doesn't seem to be working. HW BUG. 600 */ 601 } 602 603 done: 604 px_pcie_log(dip, regs); 605 606 /* Return No Error here and let the pcie misc module analyse it */ 607 return (PX_NO_ERROR); 608 } 609 610 #if defined(DEBUG) 611 static void 612 px_pcie_log(dev_info_t *dip, px_err_pcie_t *regs) 613 { 614 DBG(DBG_ERR_INTR, dip, 615 "A PCIe RC error has occured\n" 616 "\tCE: 0x%x UE: 0x%x Primary UE: 0x%x\n" 617 "\tTX Hdr: 0x%x 0x%x 0x%x 0x%x\n\tRX Hdr: 0x%x 0x%x 0x%x 0x%x\n", 618 regs->ce_reg, regs->ue_reg, regs->primary_ue, 619 regs->tx_hdr1, regs->tx_hdr2, regs->tx_hdr3, regs->tx_hdr4, 620 regs->rx_hdr1, regs->rx_hdr2, regs->rx_hdr3, regs->rx_hdr4); 621 } 622 #endif 623 624 /* 625 * look through poisoned TLP cases and suggest panic/no panic depend on 626 * handle lookup. 627 */ 628 static int 629 px_pcie_ptlp(dev_info_t *dip, ddi_fm_error_t *derr, px_err_pcie_t *regs) 630 { 631 pf_pcie_adv_err_regs_t adv_reg; 632 pcie_req_id_t bdf; 633 uint64_t addr; 634 uint32_t trans_type; 635 int tlp_sts, tlp_cmd; 636 int lookup = PF_HDL_NOTFOUND; 637 638 if (regs->primary_ue != PCIE_AER_UCE_PTLP) 639 return (PX_PANIC); 640 641 if (!regs->rx_hdr1) 642 goto done; 643 644 adv_reg.pcie_ue_hdr[0] = regs->rx_hdr1; 645 adv_reg.pcie_ue_hdr[1] = regs->rx_hdr2; 646 adv_reg.pcie_ue_hdr[2] = regs->rx_hdr3; 647 adv_reg.pcie_ue_hdr[3] = regs->rx_hdr4; 648 649 tlp_sts = pf_tlp_decode(PCIE_DIP2BUS(dip), &adv_reg); 650 tlp_cmd = ((pcie_tlp_hdr_t *)(adv_reg.pcie_ue_hdr))->type; 651 652 if (tlp_sts == DDI_FAILURE) 653 goto done; 654 655 bdf = adv_reg.pcie_ue_tgt_bdf; 656 addr = adv_reg.pcie_ue_tgt_addr; 657 trans_type = adv_reg.pcie_ue_tgt_trans; 658 659 switch (tlp_cmd) { 660 case PCIE_TLP_TYPE_CPL: 661 case PCIE_TLP_TYPE_CPLLK: 662 /* 663 * Usually a PTLP is a CPL with data. Grab the completer BDF 664 * from the RX TLP, and the original address from the TX TLP. 665 */ 666 if (regs->tx_hdr1) { 667 adv_reg.pcie_ue_hdr[0] = regs->tx_hdr1; 668 adv_reg.pcie_ue_hdr[1] = regs->tx_hdr2; 669 adv_reg.pcie_ue_hdr[2] = regs->tx_hdr3; 670 adv_reg.pcie_ue_hdr[3] = regs->tx_hdr4; 671 672 lookup = pf_tlp_decode(PCIE_DIP2BUS(dip), &adv_reg); 673 if (lookup != DDI_SUCCESS) 674 break; 675 addr = adv_reg.pcie_ue_tgt_addr; 676 trans_type = adv_reg.pcie_ue_tgt_trans; 677 } /* FALLTHRU */ 678 case PCIE_TLP_TYPE_IO: 679 case PCIE_TLP_TYPE_MEM: 680 case PCIE_TLP_TYPE_MEMLK: 681 lookup = pf_hdl_lookup(dip, derr->fme_ena, trans_type, addr, 682 bdf); 683 break; 684 default: 685 lookup = PF_HDL_NOTFOUND; 686 } 687 done: 688 return (lookup == PF_HDL_FOUND ? PX_NO_PANIC : PX_PANIC); 689 } 690 691 /* 692 * px_get_pdf automatically allocates a RC pf_data_t and returns a pointer to 693 * it. This function should be used when an error requires a fabric scan. 694 */ 695 static pf_data_t * 696 px_get_pfd(px_t *px_p) { 697 int idx = px_p->px_pfd_idx++; 698 pf_data_t *pfd_p = &px_p->px_pfd_arr[idx]; 699 700 /* Clear Old Data */ 701 PCIE_ROOT_FAULT(pfd_p)->scan_bdf = PCIE_INVALID_BDF; 702 PCIE_ROOT_FAULT(pfd_p)->scan_addr = 0; 703 PCI_BDG_ERR_REG(pfd_p)->pci_bdg_sec_stat = 0; 704 PCIE_ADV_REG(pfd_p)->pcie_ce_status = 0; 705 PCIE_ADV_REG(pfd_p)->pcie_ue_status = 0; 706 707 pfd_p->pe_next = NULL; 708 709 if (idx > 0) { 710 px_p->px_pfd_arr[idx - 1].pe_next = pfd_p; 711 pfd_p->pe_prev = &px_p->px_pfd_arr[idx - 1]; 712 } else { 713 pfd_p->pe_prev = NULL; 714 } 715 716 pfd_p->pe_valid = B_TRUE; 717 718 return (pfd_p); 719 } 720 721 /* 722 * This function appends a pf_data structure to the error q which is used later 723 * during PCIe fabric scan. It signifies: 724 * o errs rcvd in RC, that may have been propagated to/from the fabric 725 * o the fabric scan code should scan the device path of fault bdf/addr 726 * 727 * scan_bdf: The bdf that caused the fault, which may have error bits set. 728 * scan_addr: The PIO addr that caused the fault, such as failed PIO, but not 729 * failed DMAs. 730 * s_status: Secondary Status equivalent to why the fault occured. 731 * (ie S-TA/MA, R-TA) 732 * Either the scan bdf or addr may be NULL, but not both. 733 */ 734 void 735 px_rp_en_q(px_t *px_p, pcie_req_id_t scan_bdf, uint32_t scan_addr, 736 uint16_t s_status) 737 { 738 pf_data_t *pfd_p; 739 740 if (!PCIE_CHECK_VALID_BDF(scan_bdf) && !scan_addr) 741 return; 742 743 pfd_p = px_get_pfd(px_p); 744 745 PCIE_ROOT_FAULT(pfd_p)->scan_bdf = scan_bdf; 746 PCIE_ROOT_FAULT(pfd_p)->scan_addr = (uint64_t)scan_addr; 747 PCI_BDG_ERR_REG(pfd_p)->pci_bdg_sec_stat = s_status; 748 } 749 750 751 /* 752 * Find and Mark CFG Handles as failed associated with the given BDF. We should 753 * always know the BDF for CFG accesses, since it is encoded in the address of 754 * the TLP. Since there can be multiple cfg handles, mark them all as failed. 755 */ 756 /* ARGSUSED */ 757 int 758 px_err_cfg_hdl_check(dev_info_t *dip, const void *handle, const void *arg1, 759 const void *arg2) 760 { 761 int status = DDI_FM_FATAL; 762 uint32_t addr = *(uint32_t *)arg1; 763 uint16_t bdf = *(uint16_t *)arg2; 764 pcie_bus_t *bus_p; 765 766 DBG(DBG_ERR_INTR, dip, "Check CFG Hdl: dip 0x%p addr 0x%x bdf=0x%x\n", 767 dip, addr, bdf); 768 769 bus_p = PCIE_DIP2BUS(dip); 770 771 /* 772 * Because CFG and IO Acc Handlers are on the same cache list and both 773 * types of hdls gets called for both types of errors. For this checker 774 * only mark the device as "Non-Fatal" if the addr == NULL and bdf != 775 * NULL. 776 */ 777 status = (!addr && (PCIE_CHECK_VALID_BDF(bdf) && 778 (bus_p->bus_bdf == bdf))) ? DDI_FM_NONFATAL : DDI_FM_FATAL; 779 780 return (status); 781 } 782 783 /* 784 * Find and Mark all ACC Handles associated with a give address and BDF as 785 * failed. If the BDF != NULL, then check to see if the device has a ACC Handle 786 * associated with ADDR. If the handle is not found, mark all the handles as 787 * failed. If the BDF == NULL, mark the handle as failed if it is associated 788 * with ADDR. 789 */ 790 int 791 px_err_pio_hdl_check(dev_info_t *dip, const void *handle, const void *arg1, 792 const void *arg2) 793 { 794 dev_info_t *px_dip; 795 px_t *px_p; 796 pci_ranges_t *ranges_p; 797 int range_len; 798 ddi_acc_handle_t ap = (ddi_acc_handle_t)handle; 799 ddi_acc_hdl_t *hp = impl_acc_hdl_get(ap); 800 int i, status = DDI_FM_FATAL; 801 uint64_t fault_addr = *(uint64_t *)arg1; 802 uint16_t bdf = *(uint16_t *)arg2; 803 uint64_t base_addr, range_addr; 804 uint_t size; 805 806 /* 807 * Find the correct px dip. On system with a real Root Port, it's the 808 * node above the root port. On systems without a real Root Port the px 809 * dip is the bus_rp_dip. 810 */ 811 px_dip = PCIE_DIP2BUS(dip)->bus_rp_dip; 812 813 if (!PCIE_IS_RC(PCIE_DIP2BUS(px_dip))) 814 px_dip = ddi_get_parent(px_dip); 815 816 ASSERT(PCIE_IS_RC(PCIE_DIP2BUS(px_dip))); 817 px_p = INST_TO_STATE(ddi_get_instance(px_dip)); 818 819 DBG(DBG_ERR_INTR, dip, "Check PIO Hdl: dip 0x%x addr 0x%x bdf=0x%x\n", 820 dip, fault_addr, bdf); 821 822 /* Normalize the base addr to the addr and strip off the HB info. */ 823 base_addr = (hp->ah_pfn << MMU_PAGESHIFT) + hp->ah_offset; 824 range_len = px_p->px_ranges_length / sizeof (pci_ranges_t); 825 i = 0; 826 for (ranges_p = px_p->px_ranges_p; i < range_len; i++, ranges_p++) { 827 range_addr = px_in_addr_range(dip, ranges_p, base_addr); 828 if (range_addr) { 829 switch (ranges_p->child_high & PCI_ADDR_MASK) { 830 case PCI_ADDR_IO: 831 case PCI_ADDR_MEM64: 832 case PCI_ADDR_MEM32: 833 base_addr = base_addr - range_addr; 834 break; 835 } 836 break; 837 } 838 } 839 840 /* 841 * Mark the handle as failed if the ADDR is mapped, or if we 842 * know the BDF and ADDR == 0. 843 */ 844 size = hp->ah_len; 845 if (((fault_addr >= base_addr) && (fault_addr < (base_addr + size))) || 846 ((fault_addr == NULL) && (PCIE_CHECK_VALID_BDF(bdf) && 847 (bdf == PCIE_DIP2BUS(dip)->bus_bdf)))) 848 status = DDI_FM_NONFATAL; 849 850 return (status); 851 } 852 853 /* 854 * Find and Mark all DNA Handles associated with a give address and BDF as 855 * failed. If the BDF != NULL, then check to see if the device has a DMA Handle 856 * associated with ADDR. If the handle is not found, mark all the handles as 857 * failed. If the BDF == NULL, mark the handle as failed if it is associated 858 * with ADDR. 859 */ 860 int 861 px_err_dma_hdl_check(dev_info_t *dip, const void *handle, const void *arg1, 862 const void *arg2) 863 { 864 ddi_dma_impl_t *pcie_dp; 865 int status = DDI_FM_FATAL; 866 uint32_t addr = *(uint32_t *)arg1; 867 uint16_t bdf = *(uint16_t *)arg2; 868 uint32_t base_addr; 869 uint_t size; 870 871 DBG(DBG_ERR_INTR, dip, "Check PIO Hdl: dip 0x%x addr 0x%x bdf=0x%x\n", 872 dip, addr, bdf); 873 874 pcie_dp = (ddi_dma_impl_t *)handle; 875 base_addr = (uint32_t)pcie_dp->dmai_mapping; 876 size = pcie_dp->dmai_size; 877 878 /* 879 * Mark the handle as failed if the ADDR is mapped, or if we 880 * know the BDF and ADDR == 0. 881 */ 882 if (((addr >= base_addr) && (addr < (base_addr + size))) || 883 ((addr == NULL) && PCIE_CHECK_VALID_BDF(bdf))) 884 status = DDI_FM_NONFATAL; 885 886 return (status); 887 } 888 889 int 890 px_fm_enter(px_t *px_p) { 891 if (px_panicing || (px_p->px_fm_mutex_owner == curthread)) 892 return (DDI_FAILURE); 893 894 mutex_enter(&px_p->px_fm_mutex); 895 /* 896 * In rare cases when trap occurs and in the middle of scanning the 897 * fabric, a PIO will fail in the scan fabric. The CPU error handling 898 * code will correctly panic the system, while a mondo for the failed 899 * PIO may also show up. Normally the mondo will try to grab the mutex 900 * and wait until the callback finishes. But in this rare case, 901 * mutex_enter actually suceeds also continues to scan the fabric. 902 * 903 * This code below is designed specifically to check for this case. If 904 * we successfully grab the px_fm_mutex, the px_fm_mutex_owner better be 905 * NULL. If it isn't that means we are in the rare corner case. Return 906 * DDI_FAILURE, this should prevent PX from doing anymore error 907 * handling. 908 */ 909 if (px_p->px_fm_mutex_owner) { 910 return (DDI_FAILURE); 911 } 912 913 px_p->px_fm_mutex_owner = curthread; 914 915 if (px_panicing) { 916 px_fm_exit(px_p); 917 return (DDI_FAILURE); 918 } 919 return (DDI_SUCCESS); 920 } 921 922 void 923 px_fm_exit(px_t *px_p) { 924 px_p->px_fm_mutex_owner = NULL; 925 mutex_exit(&px_p->px_fm_mutex); 926 } 927 928 /* 929 * Panic if the err tunable is set and that we are not already in the middle 930 * of panic'ing. 931 * 932 * rc_err = Error severity of PX specific errors 933 * msg = Where the error was detected 934 * fabric_err = Error severity of PCIe Fabric errors 935 * isTest = Test if error severity causes panic 936 */ 937 #define MSZ (sizeof (fm_msg) -strlen(fm_msg) - 1) 938 void 939 px_err_panic(int rc_err, int msg, int fabric_err, boolean_t isTest) 940 { 941 char fm_msg[96] = ""; 942 int ferr = PX_NO_ERROR; 943 944 if (panicstr) { 945 px_panicing = B_TRUE; 946 return; 947 } 948 949 if (!(rc_err & px_die)) 950 goto fabric; 951 if (msg & PX_RC) 952 (void) strncat(fm_msg, px_panic_rc_msg, MSZ); 953 if (msg & PX_RP) 954 (void) strncat(fm_msg, px_panic_rp_msg, MSZ); 955 if (msg & PX_HB) 956 (void) strncat(fm_msg, px_panic_hb_msg, MSZ); 957 958 fabric: 959 if (fabric_err & PF_ERR_FATAL_FLAGS) 960 ferr = PX_PANIC; 961 else if (fabric_err & ~(PF_ERR_FATAL_FLAGS | PF_ERR_NO_ERROR)) 962 ferr = PX_NO_PANIC; 963 964 if (ferr & px_die) { 965 if (strlen(fm_msg)) { 966 (void) strncat(fm_msg, " and", MSZ); 967 } 968 (void) strncat(fm_msg, px_panic_fab_msg, MSZ); 969 } 970 971 if (strlen(fm_msg)) { 972 px_panicing = B_TRUE; 973 if (!isTest) 974 fm_panic("Fatal error has occured in:%s.(0x%x)(0x%x)", 975 fm_msg, rc_err, fabric_err); 976 } 977 } 978