1 /*- 2 * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 3 * 4 * Copyright 2019 Justin Hibbits 5 * 6 * Redistribution and use in source and binary forms, with or without 7 * modification, are permitted provided that the following conditions 8 * are met: 9 * 1. Redistributions of source code must retain the above copyright 10 * notice, this list of conditions and the following disclaimer. 11 * 2. Redistributions in binary form must reproduce the above copyright 12 * notice, this list of conditions and the following disclaimer in the 13 * documentation and/or other materials provided with the distribution. 14 * 15 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR 16 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES 17 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. 18 * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, 19 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, 20 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; 21 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED 22 * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, 23 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 24 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 25 * SUCH DAMAGE. 26 */ 27 28 #include <sys/cdefs.h> 29 __FBSDID("$FreeBSD$"); 30 31 #include "opt_platform.h" 32 33 #include <sys/param.h> 34 #include <sys/systm.h> 35 #include <sys/module.h> 36 #include <sys/bus.h> 37 #include <sys/conf.h> 38 #include <sys/endian.h> 39 #include <sys/kernel.h> 40 #include <sys/lock.h> 41 #include <sys/malloc.h> 42 #include <sys/mutex.h> 43 #include <sys/smp.h> 44 45 #include <vm/vm.h> 46 #include <vm/pmap.h> 47 48 #include <machine/bus.h> 49 #include <machine/intr_machdep.h> 50 #include <machine/md_var.h> 51 52 #include <dev/ofw/ofw_bus.h> 53 #include <dev/ofw/ofw_bus_subr.h> 54 55 #ifdef POWERNV 56 #include <powerpc/powernv/opal.h> 57 #endif 58 59 #include "pic_if.h" 60 61 #define XIVE_PRIORITY 7 /* Random non-zero number */ 62 #define MAX_XIVE_IRQS (1<<24) /* 24-bit XIRR field */ 63 64 /* Registers */ 65 #define XIVE_TM_QW1_OS 0x010 /* Guest OS registers */ 66 #define XIVE_TM_QW2_HV_POOL 0x020 /* Hypervisor pool registers */ 67 #define XIVE_TM_QW3_HV 0x030 /* Hypervisor registers */ 68 69 #define XIVE_TM_NSR 0x00 70 #define XIVE_TM_CPPR 0x01 71 #define XIVE_TM_IPB 0x02 72 #define XIVE_TM_LSMFB 0x03 73 #define XIVE_TM_ACK_CNT 0x04 74 #define XIVE_TM_INC 0x05 75 #define XIVE_TM_AGE 0x06 76 #define XIVE_TM_PIPR 0x07 77 78 #define TM_WORD0 0x0 79 #define TM_WORD2 0x8 80 #define TM_QW2W2_VP 0x80000000 81 82 #define XIVE_TM_SPC_ACK 0x800 83 #define TM_QW3NSR_HE_SHIFT 14 84 #define TM_QW3_NSR_HE_NONE 0 85 #define TM_QW3_NSR_HE_POOL 1 86 #define TM_QW3_NSR_HE_PHYS 2 87 #define TM_QW3_NSR_HE_LSI 3 88 #define XIVE_TM_SPC_PULL_POOL_CTX 0x828 89 90 #define XIVE_IRQ_LOAD_EOI 0x000 91 #define XIVE_IRQ_STORE_EOI 0x400 92 #define XIVE_IRQ_PQ_00 0xc00 93 #define XIVE_IRQ_PQ_01 0xd00 94 95 #define XIVE_IRQ_VAL_P 0x02 96 #define XIVE_IRQ_VAL_Q 0x01 97 98 struct xive_softc; 99 struct xive_irq; 100 101 extern void (*powernv_smp_ap_extra_init)(void); 102 103 /* Private support */ 104 static void xive_setup_cpu(void); 105 static void xive_smp_cpu_startup(void); 106 static void xive_init_irq(struct xive_irq *irqd, u_int irq); 107 static struct xive_irq *xive_configure_irq(u_int irq); 108 static int xive_provision_page(struct xive_softc *sc); 109 110 /* Interfaces */ 111 static int xive_probe(device_t); 112 static int xive_attach(device_t); 113 static int xics_probe(device_t); 114 static int xics_attach(device_t); 115 116 static void xive_bind(device_t, u_int, cpuset_t, void **); 117 static void xive_dispatch(device_t, struct trapframe *); 118 static void xive_enable(device_t, u_int, u_int, void **); 119 static void xive_eoi(device_t, u_int, void *); 120 static void xive_ipi(device_t, u_int); 121 static void xive_mask(device_t, u_int, void *); 122 static void xive_unmask(device_t, u_int, void *); 123 static void xive_translate_code(device_t dev, u_int irq, int code, 124 enum intr_trigger *trig, enum intr_polarity *pol); 125 126 static device_method_t xive_methods[] = { 127 /* Device interface */ 128 DEVMETHOD(device_probe, xive_probe), 129 DEVMETHOD(device_attach, xive_attach), 130 131 /* PIC interface */ 132 DEVMETHOD(pic_bind, xive_bind), 133 DEVMETHOD(pic_dispatch, xive_dispatch), 134 DEVMETHOD(pic_enable, xive_enable), 135 DEVMETHOD(pic_eoi, xive_eoi), 136 DEVMETHOD(pic_ipi, xive_ipi), 137 DEVMETHOD(pic_mask, xive_mask), 138 DEVMETHOD(pic_unmask, xive_unmask), 139 DEVMETHOD(pic_translate_code, xive_translate_code), 140 141 DEVMETHOD_END 142 }; 143 144 static device_method_t xics_methods[] = { 145 /* Device interface */ 146 DEVMETHOD(device_probe, xics_probe), 147 DEVMETHOD(device_attach, xics_attach), 148 149 DEVMETHOD_END 150 }; 151 152 struct xive_softc { 153 struct mtx sc_mtx; 154 struct resource *sc_mem; 155 vm_size_t sc_prov_page_size; 156 uint32_t sc_offset; 157 }; 158 159 struct xive_queue { 160 uint32_t *q_page; 161 uint32_t *q_eoi_page; 162 uint32_t q_toggle; 163 uint32_t q_size; 164 uint32_t q_index; 165 uint32_t q_mask; 166 }; 167 168 struct xive_irq { 169 uint32_t girq; 170 uint32_t lirq; 171 uint64_t vp; 172 uint64_t flags; 173 #define OPAL_XIVE_IRQ_EOI_VIA_FW 0x00000020 174 #define OPAL_XIVE_IRQ_MASK_VIA_FW 0x00000010 175 #define OPAL_XIVE_IRQ_SHIFT_BUG 0x00000008 176 #define OPAL_XIVE_IRQ_LSI 0x00000004 177 #define OPAL_XIVE_IRQ_STORE_EOI 0x00000002 178 #define OPAL_XIVE_IRQ_TRIGGER_PAGE 0x00000001 179 uint8_t prio; 180 vm_offset_t eoi_page; 181 vm_offset_t trig_page; 182 vm_size_t esb_size; 183 int chip; 184 }; 185 186 struct xive_cpu { 187 uint64_t vp; 188 uint64_t flags; 189 struct xive_irq ipi_data; 190 struct xive_queue queue; /* We only use a single queue for now. */ 191 uint64_t cam; 192 uint32_t chip; 193 }; 194 195 static driver_t xive_driver = { 196 "xive", 197 xive_methods, 198 sizeof(struct xive_softc) 199 }; 200 201 static driver_t xics_driver = { 202 "xivevc", 203 xics_methods, 204 0 205 }; 206 207 static devclass_t xive_devclass; 208 static devclass_t xics_devclass; 209 210 EARLY_DRIVER_MODULE(xive, ofwbus, xive_driver, xive_devclass, 0, 0, 211 BUS_PASS_INTERRUPT-1); 212 EARLY_DRIVER_MODULE(xivevc, ofwbus, xics_driver, xics_devclass, 0, 0, 213 BUS_PASS_INTERRUPT); 214 215 MALLOC_DEFINE(M_XIVE, "xive", "XIVE Memory"); 216 217 DPCPU_DEFINE_STATIC(struct xive_cpu, xive_cpu_data); 218 219 static int xive_ipi_vector = -1; 220 221 /* 222 * XIVE Exploitation mode driver. 223 * 224 * The XIVE, present in the POWER9 CPU, can run in two modes: XICS emulation 225 * mode, and "Exploitation mode". XICS emulation mode is compatible with the 226 * POWER8 and earlier XICS interrupt controller, using OPAL calls to emulate 227 * hypervisor calls and memory accesses. Exploitation mode gives us raw access 228 * to the XIVE MMIO, improving performance significantly. 229 * 230 * The XIVE controller is a very bizarre interrupt controller. It uses queues 231 * in memory to pass interrupts around, and maps itself into 512GB of physical 232 * device address space, giving each interrupt in the system one or more pages 233 * of address space. An IRQ is tied to a virtual processor, which could be a 234 * physical CPU thread, or a guest CPU thread (LPAR running on a physical 235 * thread). Thus, the controller can route interrupts directly to guest OSes 236 * bypassing processing by the hypervisor, thereby improving performance of the 237 * guest OS. 238 * 239 * An IRQ, in addition to being tied to a virtual processor, has one or two 240 * page mappings: an EOI page, and an optional trigger page. The trigger page 241 * could be the same as the EOI page. Level-sensitive interrupts (LSIs) don't 242 * have a trigger page, as they're external interrupts controlled by physical 243 * lines. MSIs and IPIs have trigger pages. An IPI is really just another IRQ 244 * in the XIVE, which is triggered by software. 245 * 246 * An interesting behavior of the XIVE controller is that oftentimes the 247 * contents of an address location don't actually matter, but the direction of 248 * the action is the signifier (read vs write), and the address is significant. 249 * Hence, masking and unmasking an interrupt is done by reading different 250 * addresses in the EOI page, and triggering an interrupt consists of writing to 251 * the trigger page. 252 * 253 * Additionally, the MMIO region mapped is CPU-sensitive, just like the 254 * per-processor register space (private access) in OpenPIC. In order for a CPU 255 * to receive interrupts it must itself configure its CPPR (Current Processor 256 * Priority Register), it cannot be set by any other processor. This 257 * necessitates the xive_smp_cpu_startup() function. 258 * 259 * Queues are pages of memory, sized powers-of-two, that are shared with the 260 * XIVE. The XIVE writes into the queue with an alternating polarity bit, which 261 * flips when the queue wraps. 262 */ 263 264 /* 265 * Offset-based read/write interfaces. 266 */ 267 static uint16_t 268 xive_read_2(struct xive_softc *sc, bus_size_t offset) 269 { 270 271 return (bus_read_2(sc->sc_mem, sc->sc_offset + offset)); 272 } 273 274 static void 275 xive_write_1(struct xive_softc *sc, bus_size_t offset, uint8_t val) 276 { 277 278 bus_write_1(sc->sc_mem, sc->sc_offset + offset, val); 279 } 280 281 /* EOI and Trigger page access interfaces. */ 282 static uint64_t 283 xive_read_mmap8(vm_offset_t addr) 284 { 285 return (*(volatile uint64_t *)addr); 286 } 287 288 static void 289 xive_write_mmap8(vm_offset_t addr, uint64_t val) 290 { 291 *(uint64_t *)(addr) = val; 292 } 293 294 /* Device interfaces. */ 295 static int 296 xive_probe(device_t dev) 297 { 298 299 if (!ofw_bus_is_compatible(dev, "ibm,opal-xive-pe")) 300 return (ENXIO); 301 302 device_set_desc(dev, "External Interrupt Virtualization Engine"); 303 304 /* Make sure we always win against the xicp driver. */ 305 return (BUS_PROBE_DEFAULT); 306 } 307 308 static int 309 xics_probe(device_t dev) 310 { 311 312 if (!ofw_bus_is_compatible(dev, "ibm,opal-xive-vc")) 313 return (ENXIO); 314 315 device_set_desc(dev, "External Interrupt Virtualization Engine Root"); 316 return (BUS_PROBE_DEFAULT); 317 } 318 319 static int 320 xive_attach(device_t dev) 321 { 322 struct xive_softc *sc = device_get_softc(dev); 323 struct xive_cpu *xive_cpud; 324 phandle_t phandle = ofw_bus_get_node(dev); 325 int64_t vp_block; 326 int error; 327 int rid; 328 int i, order; 329 uint64_t vp_id; 330 int64_t ipi_irq; 331 332 opal_call(OPAL_XIVE_RESET, OPAL_XIVE_XICS_MODE_EXP); 333 334 error = OF_getencprop(phandle, "ibm,xive-provision-page-size", 335 (pcell_t *)&sc->sc_prov_page_size, sizeof(sc->sc_prov_page_size)); 336 337 rid = 1; /* Get the Hypervisor-level register set. */ 338 sc->sc_mem = bus_alloc_resource_any(dev, SYS_RES_MEMORY, 339 &rid, RF_ACTIVE); 340 sc->sc_offset = XIVE_TM_QW3_HV; 341 342 mtx_init(&sc->sc_mtx, "XIVE", NULL, MTX_DEF); 343 344 /* Workaround for qemu single-thread powernv */ 345 if (mp_maxid == 0) 346 order = 1; 347 else 348 order = fls(mp_maxid + (mp_maxid - 1)) - 1; 349 350 do { 351 vp_block = opal_call(OPAL_XIVE_ALLOCATE_VP_BLOCK, order); 352 if (vp_block == OPAL_BUSY) 353 DELAY(10); 354 else if (vp_block == OPAL_XIVE_PROVISIONING) 355 xive_provision_page(sc); 356 else 357 break; 358 } while (1); 359 360 if (vp_block < 0) { 361 device_printf(dev, 362 "Unable to allocate VP block. Opal error %d\n", 363 (int)vp_block); 364 bus_release_resource(dev, SYS_RES_MEMORY, rid, sc->sc_mem); 365 return (ENXIO); 366 } 367 368 /* 369 * Set up the VPs. Try to do as much as we can in attach, to lessen 370 * what's needed at AP spawn time. 371 */ 372 CPU_FOREACH(i) { 373 vp_id = pcpu_find(i)->pc_hwref; 374 375 xive_cpud = DPCPU_ID_PTR(i, xive_cpu_data); 376 xive_cpud->vp = vp_id + vp_block; 377 opal_call(OPAL_XIVE_GET_VP_INFO, xive_cpud->vp, NULL, 378 vtophys(&xive_cpud->cam), NULL, vtophys(&xive_cpud->chip)); 379 380 xive_cpud->cam = be64toh(xive_cpud->cam); 381 xive_cpud->chip = be64toh(xive_cpud->chip); 382 383 /* Allocate the queue page and populate the queue state data. */ 384 xive_cpud->queue.q_page = contigmalloc(PAGE_SIZE, M_XIVE, 385 M_ZERO | M_WAITOK, 0, BUS_SPACE_MAXADDR, PAGE_SIZE, 0); 386 xive_cpud->queue.q_size = 1 << PAGE_SHIFT; 387 xive_cpud->queue.q_mask = 388 ((xive_cpud->queue.q_size / sizeof(int)) - 1); 389 xive_cpud->queue.q_toggle = 0; 390 xive_cpud->queue.q_index = 0; 391 do { 392 error = opal_call(OPAL_XIVE_SET_VP_INFO, xive_cpud->vp, 393 OPAL_XIVE_VP_ENABLED, 0); 394 } while (error == OPAL_BUSY); 395 error = opal_call(OPAL_XIVE_SET_QUEUE_INFO, vp_id, 396 XIVE_PRIORITY, vtophys(xive_cpud->queue.q_page), PAGE_SHIFT, 397 OPAL_XIVE_EQ_ALWAYS_NOTIFY | OPAL_XIVE_EQ_ENABLED); 398 399 do { 400 ipi_irq = opal_call(OPAL_XIVE_ALLOCATE_IRQ, 401 xive_cpud->chip); 402 } while (ipi_irq == OPAL_BUSY); 403 404 if (ipi_irq < 0) 405 device_printf(root_pic, 406 "Failed allocating IPI. OPAL error %d\n", 407 (int)ipi_irq); 408 else { 409 xive_init_irq(&xive_cpud->ipi_data, ipi_irq); 410 xive_cpud->ipi_data.vp = vp_id; 411 xive_cpud->ipi_data.lirq = MAX_XIVE_IRQS; 412 opal_call(OPAL_XIVE_SET_IRQ_CONFIG, ipi_irq, 413 xive_cpud->ipi_data.vp, XIVE_PRIORITY, 414 MAX_XIVE_IRQS); 415 } 416 } 417 418 powerpc_register_pic(dev, OF_xref_from_node(phandle), MAX_XIVE_IRQS, 419 1 /* Number of IPIs */, FALSE); 420 root_pic = dev; 421 422 xive_setup_cpu(); 423 powernv_smp_ap_extra_init = xive_smp_cpu_startup; 424 425 return (0); 426 } 427 428 static int 429 xics_attach(device_t dev) 430 { 431 phandle_t phandle = ofw_bus_get_node(dev); 432 433 /* The XIVE (root PIC) will handle all our interrupts */ 434 powerpc_register_pic(root_pic, OF_xref_from_node(phandle), 435 MAX_XIVE_IRQS, 1 /* Number of IPIs */, FALSE); 436 437 return (0); 438 } 439 440 /* 441 * PIC I/F methods. 442 */ 443 444 static void 445 xive_bind(device_t dev, u_int irq, cpuset_t cpumask, void **priv) 446 { 447 struct xive_irq *irqd; 448 int cpu; 449 int ncpus, i, error; 450 451 if (*priv == NULL) 452 *priv = xive_configure_irq(irq); 453 454 irqd = *priv; 455 456 /* 457 * This doesn't appear to actually support affinity groups, so pick a 458 * random CPU. 459 */ 460 ncpus = 0; 461 CPU_FOREACH(cpu) 462 if (CPU_ISSET(cpu, &cpumask)) ncpus++; 463 464 i = mftb() % ncpus; 465 ncpus = 0; 466 CPU_FOREACH(cpu) { 467 if (!CPU_ISSET(cpu, &cpumask)) 468 continue; 469 if (ncpus == i) 470 break; 471 ncpus++; 472 } 473 474 opal_call(OPAL_XIVE_SYNC, OPAL_XIVE_SYNC_QUEUE, irq); 475 476 irqd->vp = pcpu_find(cpu)->pc_hwref; 477 error = opal_call(OPAL_XIVE_SET_IRQ_CONFIG, irq, irqd->vp, 478 XIVE_PRIORITY, irqd->lirq); 479 480 if (error < 0) 481 panic("Cannot bind interrupt %d to CPU %d", irq, cpu); 482 483 xive_eoi(dev, irq, irqd); 484 } 485 486 /* Read the next entry in the queue page and update the index. */ 487 static int 488 xive_read_eq(struct xive_queue *q) 489 { 490 uint32_t i = be32toh(q->q_page[q->q_index]); 491 492 /* Check validity, using current queue polarity. */ 493 if ((i >> 31) == q->q_toggle) 494 return (0); 495 496 q->q_index = (q->q_index + 1) & q->q_mask; 497 498 if (q->q_index == 0) 499 q->q_toggle ^= 1; 500 501 return (i & 0x7fffffff); 502 } 503 504 static void 505 xive_dispatch(device_t dev, struct trapframe *tf) 506 { 507 struct xive_softc *sc; 508 struct xive_cpu *xive_cpud; 509 uint32_t vector; 510 uint16_t ack; 511 uint8_t cppr, he; 512 513 sc = device_get_softc(dev); 514 515 xive_cpud = DPCPU_PTR(xive_cpu_data); 516 for (;;) { 517 ack = xive_read_2(sc, XIVE_TM_SPC_ACK); 518 cppr = (ack & 0xff); 519 520 he = ack >> TM_QW3NSR_HE_SHIFT; 521 522 if (he == TM_QW3_NSR_HE_NONE) 523 break; 524 525 else if (__predict_false(he != TM_QW3_NSR_HE_PHYS)) { 526 /* 527 * We don't support TM_QW3_NSR_HE_POOL or 528 * TM_QW3_NSR_HE_LSI interrupts. 529 */ 530 device_printf(dev, 531 "Unexpected interrupt he type: %d\n", he); 532 goto end; 533 } 534 535 xive_write_1(sc, XIVE_TM_CPPR, cppr); 536 537 for (;;) { 538 vector = xive_read_eq(&xive_cpud->queue); 539 540 if (vector == 0) 541 break; 542 543 if (vector == MAX_XIVE_IRQS) 544 vector = xive_ipi_vector; 545 546 powerpc_dispatch_intr(vector, tf); 547 } 548 } 549 end: 550 xive_write_1(sc, XIVE_TM_CPPR, 0xff); 551 } 552 553 static void 554 xive_enable(device_t dev, u_int irq, u_int vector, void **priv) 555 { 556 struct xive_irq *irqd; 557 cell_t status, cpu; 558 559 if (irq == MAX_XIVE_IRQS) { 560 if (xive_ipi_vector == -1) 561 xive_ipi_vector = vector; 562 return; 563 } 564 if (*priv == NULL) 565 *priv = xive_configure_irq(irq); 566 567 irqd = *priv; 568 569 /* Bind to this CPU to start */ 570 cpu = PCPU_GET(hwref); 571 irqd->lirq = vector; 572 573 for (;;) { 574 status = opal_call(OPAL_XIVE_SET_IRQ_CONFIG, irq, cpu, 575 XIVE_PRIORITY, vector); 576 if (status != OPAL_BUSY) 577 break; 578 DELAY(10); 579 } 580 581 if (status != 0) 582 panic("OPAL_SET_XIVE IRQ %d -> cpu %d failed: %d", irq, 583 cpu, status); 584 585 xive_unmask(dev, irq, *priv); 586 } 587 588 static void 589 xive_eoi(device_t dev, u_int irq, void *priv) 590 { 591 struct xive_irq *rirq; 592 struct xive_cpu *cpud; 593 uint8_t eoi_val; 594 595 if (irq == MAX_XIVE_IRQS) { 596 cpud = DPCPU_PTR(xive_cpu_data); 597 rirq = &cpud->ipi_data; 598 } else 599 rirq = priv; 600 601 if (rirq->flags & OPAL_XIVE_IRQ_EOI_VIA_FW) 602 opal_call(OPAL_INT_EOI, irq); 603 else if (rirq->flags & OPAL_XIVE_IRQ_STORE_EOI) 604 xive_write_mmap8(rirq->eoi_page + XIVE_IRQ_STORE_EOI, 0); 605 else if (rirq->flags & OPAL_XIVE_IRQ_LSI) 606 xive_read_mmap8(rirq->eoi_page + XIVE_IRQ_LOAD_EOI); 607 else { 608 eoi_val = xive_read_mmap8(rirq->eoi_page + XIVE_IRQ_PQ_00); 609 if ((eoi_val & XIVE_IRQ_VAL_Q) && rirq->trig_page != 0) 610 xive_write_mmap8(rirq->trig_page, 0); 611 } 612 } 613 614 static void 615 xive_ipi(device_t dev, u_int cpu) 616 { 617 struct xive_cpu *xive_cpud; 618 619 xive_cpud = DPCPU_ID_PTR(cpu, xive_cpu_data); 620 621 if (xive_cpud->ipi_data.trig_page == 0) 622 return; 623 xive_write_mmap8(xive_cpud->ipi_data.trig_page, 0); 624 } 625 626 static void 627 xive_mask(device_t dev, u_int irq, void *priv) 628 { 629 struct xive_irq *rirq; 630 631 /* Never mask IPIs */ 632 if (irq == MAX_XIVE_IRQS) 633 return; 634 635 rirq = priv; 636 637 if (!(rirq->flags & OPAL_XIVE_IRQ_LSI)) 638 return; 639 xive_read_mmap8(rirq->eoi_page + XIVE_IRQ_PQ_01); 640 } 641 642 static void 643 xive_unmask(device_t dev, u_int irq, void *priv) 644 { 645 struct xive_irq *rirq; 646 647 rirq = priv; 648 649 xive_read_mmap8(rirq->eoi_page + XIVE_IRQ_PQ_00); 650 } 651 652 static void 653 xive_translate_code(device_t dev, u_int irq, int code, 654 enum intr_trigger *trig, enum intr_polarity *pol) 655 { 656 switch (code) { 657 case 0: 658 /* L to H edge */ 659 *trig = INTR_TRIGGER_EDGE; 660 *pol = INTR_POLARITY_HIGH; 661 break; 662 case 1: 663 /* Active L level */ 664 *trig = INTR_TRIGGER_LEVEL; 665 *pol = INTR_POLARITY_LOW; 666 break; 667 default: 668 *trig = INTR_TRIGGER_CONFORM; 669 *pol = INTR_POLARITY_CONFORM; 670 } 671 } 672 673 /* Private functions. */ 674 /* 675 * Setup the current CPU. Called by the BSP at driver attachment, and by each 676 * AP at wakeup (via xive_smp_cpu_startup()). 677 */ 678 static void 679 xive_setup_cpu(void) 680 { 681 struct xive_softc *sc; 682 struct xive_cpu *cpup; 683 uint32_t val; 684 685 cpup = DPCPU_PTR(xive_cpu_data); 686 687 sc = device_get_softc(root_pic); 688 689 val = bus_read_4(sc->sc_mem, XIVE_TM_QW2_HV_POOL + TM_WORD2); 690 if (val & TM_QW2W2_VP) 691 bus_read_8(sc->sc_mem, XIVE_TM_SPC_PULL_POOL_CTX); 692 693 bus_write_4(sc->sc_mem, XIVE_TM_QW2_HV_POOL + TM_WORD0, 0xff); 694 bus_write_4(sc->sc_mem, XIVE_TM_QW2_HV_POOL + TM_WORD2, 695 TM_QW2W2_VP | cpup->cam); 696 697 xive_unmask(root_pic, cpup->ipi_data.girq, &cpup->ipi_data); 698 xive_write_1(sc, XIVE_TM_CPPR, 0xff); 699 } 700 701 /* Populate an IRQ structure, mapping the EOI and trigger pages. */ 702 static void 703 xive_init_irq(struct xive_irq *irqd, u_int irq) 704 { 705 uint64_t eoi_phys, trig_phys; 706 uint32_t esb_shift; 707 708 opal_call(OPAL_XIVE_GET_IRQ_INFO, irq, 709 vtophys(&irqd->flags), vtophys(&eoi_phys), 710 vtophys(&trig_phys), vtophys(&esb_shift), 711 vtophys(&irqd->chip)); 712 713 irqd->flags = be64toh(irqd->flags); 714 eoi_phys = be64toh(eoi_phys); 715 trig_phys = be64toh(trig_phys); 716 esb_shift = be32toh(esb_shift); 717 irqd->chip = be32toh(irqd->chip); 718 719 irqd->girq = irq; 720 irqd->esb_size = 1 << esb_shift; 721 irqd->eoi_page = (vm_offset_t)pmap_mapdev(eoi_phys, irqd->esb_size); 722 723 if (eoi_phys == trig_phys) 724 irqd->trig_page = irqd->eoi_page; 725 else if (trig_phys != 0) 726 irqd->trig_page = (vm_offset_t)pmap_mapdev(trig_phys, 727 irqd->esb_size); 728 else 729 irqd->trig_page = 0; 730 731 opal_call(OPAL_XIVE_GET_IRQ_CONFIG, irq, vtophys(&irqd->vp), 732 vtophys(&irqd->prio), vtophys(&irqd->lirq)); 733 734 irqd->vp = be64toh(irqd->vp); 735 irqd->prio = be64toh(irqd->prio); 736 irqd->lirq = be32toh(irqd->lirq); 737 } 738 739 /* Allocate an IRQ struct before populating it. */ 740 static struct xive_irq * 741 xive_configure_irq(u_int irq) 742 { 743 struct xive_irq *irqd; 744 745 irqd = malloc(sizeof(struct xive_irq), M_XIVE, M_WAITOK); 746 747 xive_init_irq(irqd, irq); 748 749 return (irqd); 750 } 751 752 /* 753 * Part of the OPAL API. OPAL_XIVE_ALLOCATE_VP_BLOCK might require more pages, 754 * provisioned through this call. 755 */ 756 static int 757 xive_provision_page(struct xive_softc *sc) 758 { 759 void *prov_page; 760 int error; 761 762 do { 763 prov_page = contigmalloc(sc->sc_prov_page_size, M_XIVE, 0, 764 0, BUS_SPACE_MAXADDR, 765 sc->sc_prov_page_size, sc->sc_prov_page_size); 766 767 error = opal_call(OPAL_XIVE_DONATE_PAGE, -1, 768 vtophys(prov_page)); 769 } while (error == OPAL_XIVE_PROVISIONING); 770 771 return (0); 772 } 773 774 /* The XIVE_TM_CPPR register must be set by each thread */ 775 static void 776 xive_smp_cpu_startup(void) 777 { 778 779 xive_setup_cpu(); 780 } 781