1366f6083SPeter Grehan /*- 2c49761ddSPedro F. Giffuni * SPDX-License-Identifier: BSD-2-Clause-FreeBSD 3c49761ddSPedro F. Giffuni * 4366f6083SPeter Grehan * Copyright (c) 2011 NetApp, Inc. 5366f6083SPeter Grehan * All rights reserved. 6366f6083SPeter Grehan * 7366f6083SPeter Grehan * Redistribution and use in source and binary forms, with or without 8366f6083SPeter Grehan * modification, are permitted provided that the following conditions 9366f6083SPeter Grehan * are met: 10366f6083SPeter Grehan * 1. Redistributions of source code must retain the above copyright 11366f6083SPeter Grehan * notice, this list of conditions and the following disclaimer. 12366f6083SPeter Grehan * 2. Redistributions in binary form must reproduce the above copyright 13366f6083SPeter Grehan * notice, this list of conditions and the following disclaimer in the 14366f6083SPeter Grehan * documentation and/or other materials provided with the distribution. 15366f6083SPeter Grehan * 16366f6083SPeter Grehan * THIS SOFTWARE IS PROVIDED BY NETAPP, INC ``AS IS'' AND 17366f6083SPeter Grehan * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 18366f6083SPeter Grehan * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 19366f6083SPeter Grehan * ARE DISCLAIMED. IN NO EVENT SHALL NETAPP, INC OR CONTRIBUTORS BE LIABLE 20366f6083SPeter Grehan * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 21366f6083SPeter Grehan * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 22366f6083SPeter Grehan * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 23366f6083SPeter Grehan * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 24366f6083SPeter Grehan * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 25366f6083SPeter Grehan * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 26366f6083SPeter Grehan * SUCH DAMAGE. 27366f6083SPeter Grehan * 28366f6083SPeter Grehan * $FreeBSD$ 29366f6083SPeter Grehan */ 30366f6083SPeter Grehan 31366f6083SPeter Grehan #include <sys/cdefs.h> 32366f6083SPeter Grehan __FBSDID("$FreeBSD$"); 33366f6083SPeter Grehan 34366f6083SPeter Grehan #include <sys/param.h> 35366f6083SPeter Grehan #include <sys/systm.h> 36366f6083SPeter Grehan #include <sys/kernel.h> 37cd942e0fSPeter Grehan #include <sys/malloc.h> 38366f6083SPeter Grehan #include <sys/module.h> 39366f6083SPeter Grehan #include <sys/bus.h> 40366f6083SPeter Grehan #include <sys/pciio.h> 41366f6083SPeter Grehan #include <sys/rman.h> 42a5615c90SPeter Grehan #include <sys/smp.h> 4351f45d01SNeel Natu #include <sys/sysctl.h> 44366f6083SPeter Grehan 45366f6083SPeter Grehan #include <dev/pci/pcivar.h> 46366f6083SPeter Grehan #include <dev/pci/pcireg.h> 47366f6083SPeter Grehan 48366f6083SPeter Grehan #include <machine/resource.h> 49366f6083SPeter Grehan 50366f6083SPeter Grehan #include <machine/vmm.h> 51366f6083SPeter Grehan #include <machine/vmm_dev.h> 52366f6083SPeter Grehan 53366f6083SPeter Grehan #include "vmm_lapic.h" 54366f6083SPeter Grehan #include "vmm_ktr.h" 55366f6083SPeter Grehan 56366f6083SPeter Grehan #include "iommu.h" 57366f6083SPeter Grehan #include "ppt.h" 58366f6083SPeter Grehan 5975dd3366SNeel Natu /* XXX locking */ 6075dd3366SNeel Natu 61366f6083SPeter Grehan #define MAX_MSIMSGS 32 62366f6083SPeter Grehan 632b89a044SNeel Natu /* 642b89a044SNeel Natu * If the MSI-X table is located in the middle of a BAR then that MMIO 652b89a044SNeel Natu * region gets split into two segments - one segment above the MSI-X table 662b89a044SNeel Natu * and the other segment below the MSI-X table - with a hole in place of 672b89a044SNeel Natu * the MSI-X table so accesses to it can be trapped and emulated. 682b89a044SNeel Natu * 692b89a044SNeel Natu * So, allocate a MMIO segment for each BAR register + 1 additional segment. 702b89a044SNeel Natu */ 712b89a044SNeel Natu #define MAX_MMIOSEGS ((PCIR_MAX_BAR_0 + 1) + 1) 722b89a044SNeel Natu 73cd942e0fSPeter Grehan MALLOC_DEFINE(M_PPTMSIX, "pptmsix", "Passthru MSI-X resources"); 74cd942e0fSPeter Grehan 75366f6083SPeter Grehan struct pptintr_arg { /* pptintr(pptintr_arg) */ 76366f6083SPeter Grehan struct pptdev *pptdev; 774f8be175SNeel Natu uint64_t addr; 784f8be175SNeel Natu uint64_t msg_data; 79366f6083SPeter Grehan }; 80366f6083SPeter Grehan 819b1aa8d6SNeel Natu struct pptseg { 829b1aa8d6SNeel Natu vm_paddr_t gpa; 839b1aa8d6SNeel Natu size_t len; 849b1aa8d6SNeel Natu int wired; 859b1aa8d6SNeel Natu }; 869b1aa8d6SNeel Natu 87a15f820aSRyan Stone struct pptdev { 88366f6083SPeter Grehan device_t dev; 89366f6083SPeter Grehan struct vm *vm; /* owner of this device */ 90a15f820aSRyan Stone TAILQ_ENTRY(pptdev) next; 919b1aa8d6SNeel Natu struct pptseg mmio[MAX_MMIOSEGS]; 92366f6083SPeter Grehan struct { 93366f6083SPeter Grehan int num_msgs; /* guest state */ 94366f6083SPeter Grehan 95366f6083SPeter Grehan int startrid; /* host state */ 96366f6083SPeter Grehan struct resource *res[MAX_MSIMSGS]; 97366f6083SPeter Grehan void *cookie[MAX_MSIMSGS]; 98366f6083SPeter Grehan struct pptintr_arg arg[MAX_MSIMSGS]; 99366f6083SPeter Grehan } msi; 100cd942e0fSPeter Grehan 101cd942e0fSPeter Grehan struct { 102cd942e0fSPeter Grehan int num_msgs; 103cd942e0fSPeter Grehan int startrid; 104cd942e0fSPeter Grehan int msix_table_rid; 1050d1fd6e5SJohn Baldwin int msix_pba_rid; 106cd942e0fSPeter Grehan struct resource *msix_table_res; 1070d1fd6e5SJohn Baldwin struct resource *msix_pba_res; 108cd942e0fSPeter Grehan struct resource **res; 109cd942e0fSPeter Grehan void **cookie; 110cd942e0fSPeter Grehan struct pptintr_arg *arg; 111cd942e0fSPeter Grehan } msix; 112a15f820aSRyan Stone }; 113366f6083SPeter Grehan 11451f45d01SNeel Natu SYSCTL_DECL(_hw_vmm); 115*b40598c5SPawel Biernacki SYSCTL_NODE(_hw_vmm, OID_AUTO, ppt, CTLFLAG_RW | CTLFLAG_MPSAFE, 0, 116*b40598c5SPawel Biernacki "bhyve passthru devices"); 11751f45d01SNeel Natu 118366f6083SPeter Grehan static int num_pptdevs; 11951f45d01SNeel Natu SYSCTL_INT(_hw_vmm_ppt, OID_AUTO, devices, CTLFLAG_RD, &num_pptdevs, 0, 12051f45d01SNeel Natu "number of pci passthru devices"); 121366f6083SPeter Grehan 122a15f820aSRyan Stone static TAILQ_HEAD(, pptdev) pptdev_list = TAILQ_HEAD_INITIALIZER(pptdev_list); 123a15f820aSRyan Stone 124366f6083SPeter Grehan static int 125366f6083SPeter Grehan ppt_probe(device_t dev) 126366f6083SPeter Grehan { 127366f6083SPeter Grehan int bus, slot, func; 128366f6083SPeter Grehan struct pci_devinfo *dinfo; 129366f6083SPeter Grehan 130366f6083SPeter Grehan dinfo = (struct pci_devinfo *)device_get_ivars(dev); 131366f6083SPeter Grehan 132366f6083SPeter Grehan bus = pci_get_bus(dev); 133366f6083SPeter Grehan slot = pci_get_slot(dev); 134366f6083SPeter Grehan func = pci_get_function(dev); 135366f6083SPeter Grehan 136366f6083SPeter Grehan /* 137366f6083SPeter Grehan * To qualify as a pci passthrough device a device must: 138366f6083SPeter Grehan * - be allowed by administrator to be used in this role 139366f6083SPeter Grehan * - be an endpoint device 140366f6083SPeter Grehan */ 141a15f820aSRyan Stone if ((dinfo->cfg.hdrtype & PCIM_HDRTYPE) != PCIM_HDRTYPE_NORMAL) 142a15f820aSRyan Stone return (ENXIO); 143a15f820aSRyan Stone else if (vmm_is_pptdev(bus, slot, func)) 144366f6083SPeter Grehan return (0); 145366f6083SPeter Grehan else 146a15f820aSRyan Stone /* 147a15f820aSRyan Stone * Returning BUS_PROBE_NOWILDCARD here matches devices that the 148a15f820aSRyan Stone * SR-IOV infrastructure specified as "ppt" passthrough devices. 149a15f820aSRyan Stone * All normal devices that did not have "ppt" specified as their 150a15f820aSRyan Stone * driver will not be matched by this. 151a15f820aSRyan Stone */ 152a15f820aSRyan Stone return (BUS_PROBE_NOWILDCARD); 153366f6083SPeter Grehan } 154366f6083SPeter Grehan 155366f6083SPeter Grehan static int 156366f6083SPeter Grehan ppt_attach(device_t dev) 157366f6083SPeter Grehan { 158a15f820aSRyan Stone struct pptdev *ppt; 159366f6083SPeter Grehan 160a15f820aSRyan Stone ppt = device_get_softc(dev); 161366f6083SPeter Grehan 1626db55a0fSJohn Baldwin iommu_remove_device(iommu_host_domain(), pci_get_rid(dev)); 163a15f820aSRyan Stone num_pptdevs++; 164a15f820aSRyan Stone TAILQ_INSERT_TAIL(&pptdev_list, ppt, next); 165a15f820aSRyan Stone ppt->dev = dev; 166366f6083SPeter Grehan 167366f6083SPeter Grehan if (bootverbose) 168366f6083SPeter Grehan device_printf(dev, "attached\n"); 169366f6083SPeter Grehan 170366f6083SPeter Grehan return (0); 171366f6083SPeter Grehan } 172366f6083SPeter Grehan 173366f6083SPeter Grehan static int 174366f6083SPeter Grehan ppt_detach(device_t dev) 175366f6083SPeter Grehan { 176a15f820aSRyan Stone struct pptdev *ppt; 177a15f820aSRyan Stone 178a15f820aSRyan Stone ppt = device_get_softc(dev); 179a15f820aSRyan Stone 180a15f820aSRyan Stone if (ppt->vm != NULL) 181a15f820aSRyan Stone return (EBUSY); 182a15f820aSRyan Stone num_pptdevs--; 183a15f820aSRyan Stone TAILQ_REMOVE(&pptdev_list, ppt, next); 1846db55a0fSJohn Baldwin pci_disable_busmaster(dev); 1856db55a0fSJohn Baldwin iommu_add_device(iommu_host_domain(), pci_get_rid(dev)); 186366f6083SPeter Grehan 187366f6083SPeter Grehan return (0); 188366f6083SPeter Grehan } 189366f6083SPeter Grehan 190366f6083SPeter Grehan static device_method_t ppt_methods[] = { 191366f6083SPeter Grehan /* Device interface */ 192366f6083SPeter Grehan DEVMETHOD(device_probe, ppt_probe), 193366f6083SPeter Grehan DEVMETHOD(device_attach, ppt_attach), 194366f6083SPeter Grehan DEVMETHOD(device_detach, ppt_detach), 195366f6083SPeter Grehan {0, 0} 196366f6083SPeter Grehan }; 197366f6083SPeter Grehan 198366f6083SPeter Grehan static devclass_t ppt_devclass; 199a15f820aSRyan Stone DEFINE_CLASS_0(ppt, ppt_driver, ppt_methods, sizeof(struct pptdev)); 200366f6083SPeter Grehan DRIVER_MODULE(ppt, pci, ppt_driver, ppt_devclass, NULL, NULL); 201366f6083SPeter Grehan 202366f6083SPeter Grehan static struct pptdev * 203366f6083SPeter Grehan ppt_find(int bus, int slot, int func) 204366f6083SPeter Grehan { 205366f6083SPeter Grehan device_t dev; 206a15f820aSRyan Stone struct pptdev *ppt; 207a15f820aSRyan Stone int b, s, f; 208366f6083SPeter Grehan 209a15f820aSRyan Stone TAILQ_FOREACH(ppt, &pptdev_list, next) { 210a15f820aSRyan Stone dev = ppt->dev; 211366f6083SPeter Grehan b = pci_get_bus(dev); 212366f6083SPeter Grehan s = pci_get_slot(dev); 213366f6083SPeter Grehan f = pci_get_function(dev); 214366f6083SPeter Grehan if (bus == b && slot == s && func == f) 215a15f820aSRyan Stone return (ppt); 216366f6083SPeter Grehan } 217366f6083SPeter Grehan return (NULL); 218366f6083SPeter Grehan } 219366f6083SPeter Grehan 220366f6083SPeter Grehan static void 221366f6083SPeter Grehan ppt_unmap_mmio(struct vm *vm, struct pptdev *ppt) 222366f6083SPeter Grehan { 223366f6083SPeter Grehan int i; 2249b1aa8d6SNeel Natu struct pptseg *seg; 225366f6083SPeter Grehan 226366f6083SPeter Grehan for (i = 0; i < MAX_MMIOSEGS; i++) { 227366f6083SPeter Grehan seg = &ppt->mmio[i]; 228366f6083SPeter Grehan if (seg->len == 0) 229366f6083SPeter Grehan continue; 230366f6083SPeter Grehan (void)vm_unmap_mmio(vm, seg->gpa, seg->len); 2319b1aa8d6SNeel Natu bzero(seg, sizeof(struct pptseg)); 232366f6083SPeter Grehan } 233366f6083SPeter Grehan } 234366f6083SPeter Grehan 235366f6083SPeter Grehan static void 236366f6083SPeter Grehan ppt_teardown_msi(struct pptdev *ppt) 237366f6083SPeter Grehan { 238366f6083SPeter Grehan int i, rid; 239366f6083SPeter Grehan void *cookie; 240366f6083SPeter Grehan struct resource *res; 241366f6083SPeter Grehan 242366f6083SPeter Grehan if (ppt->msi.num_msgs == 0) 243366f6083SPeter Grehan return; 244366f6083SPeter Grehan 245366f6083SPeter Grehan for (i = 0; i < ppt->msi.num_msgs; i++) { 246366f6083SPeter Grehan rid = ppt->msi.startrid + i; 247366f6083SPeter Grehan res = ppt->msi.res[i]; 248366f6083SPeter Grehan cookie = ppt->msi.cookie[i]; 249366f6083SPeter Grehan 250366f6083SPeter Grehan if (cookie != NULL) 251366f6083SPeter Grehan bus_teardown_intr(ppt->dev, res, cookie); 252366f6083SPeter Grehan 253366f6083SPeter Grehan if (res != NULL) 254366f6083SPeter Grehan bus_release_resource(ppt->dev, SYS_RES_IRQ, rid, res); 255366f6083SPeter Grehan 256366f6083SPeter Grehan ppt->msi.res[i] = NULL; 257366f6083SPeter Grehan ppt->msi.cookie[i] = NULL; 258366f6083SPeter Grehan } 259366f6083SPeter Grehan 260366f6083SPeter Grehan if (ppt->msi.startrid == 1) 261366f6083SPeter Grehan pci_release_msi(ppt->dev); 262366f6083SPeter Grehan 263366f6083SPeter Grehan ppt->msi.num_msgs = 0; 264366f6083SPeter Grehan } 265366f6083SPeter Grehan 266cd942e0fSPeter Grehan static void 267cd942e0fSPeter Grehan ppt_teardown_msix_intr(struct pptdev *ppt, int idx) 268cd942e0fSPeter Grehan { 269cd942e0fSPeter Grehan int rid; 270cd942e0fSPeter Grehan struct resource *res; 271cd942e0fSPeter Grehan void *cookie; 272cd942e0fSPeter Grehan 273cd942e0fSPeter Grehan rid = ppt->msix.startrid + idx; 274cd942e0fSPeter Grehan res = ppt->msix.res[idx]; 275cd942e0fSPeter Grehan cookie = ppt->msix.cookie[idx]; 276cd942e0fSPeter Grehan 277cd942e0fSPeter Grehan if (cookie != NULL) 278cd942e0fSPeter Grehan bus_teardown_intr(ppt->dev, res, cookie); 279cd942e0fSPeter Grehan 280cd942e0fSPeter Grehan if (res != NULL) 281cd942e0fSPeter Grehan bus_release_resource(ppt->dev, SYS_RES_IRQ, rid, res); 282cd942e0fSPeter Grehan 283cd942e0fSPeter Grehan ppt->msix.res[idx] = NULL; 284cd942e0fSPeter Grehan ppt->msix.cookie[idx] = NULL; 285cd942e0fSPeter Grehan } 286cd942e0fSPeter Grehan 287cd942e0fSPeter Grehan static void 288cd942e0fSPeter Grehan ppt_teardown_msix(struct pptdev *ppt) 289cd942e0fSPeter Grehan { 290920bc340SNeel Natu int i; 291cd942e0fSPeter Grehan 292cd942e0fSPeter Grehan if (ppt->msix.num_msgs == 0) 293cd942e0fSPeter Grehan return; 294cd942e0fSPeter Grehan 295cd942e0fSPeter Grehan for (i = 0; i < ppt->msix.num_msgs; i++) 296cd942e0fSPeter Grehan ppt_teardown_msix_intr(ppt, i); 297cd942e0fSPeter Grehan 2980d1fd6e5SJohn Baldwin free(ppt->msix.res, M_PPTMSIX); 2990d1fd6e5SJohn Baldwin free(ppt->msix.cookie, M_PPTMSIX); 3000d1fd6e5SJohn Baldwin free(ppt->msix.arg, M_PPTMSIX); 3010d1fd6e5SJohn Baldwin 3020d1fd6e5SJohn Baldwin pci_release_msi(ppt->dev); 3030d1fd6e5SJohn Baldwin 304cd942e0fSPeter Grehan if (ppt->msix.msix_table_res) { 305cd942e0fSPeter Grehan bus_release_resource(ppt->dev, SYS_RES_MEMORY, 306cd942e0fSPeter Grehan ppt->msix.msix_table_rid, 307cd942e0fSPeter Grehan ppt->msix.msix_table_res); 308cd942e0fSPeter Grehan ppt->msix.msix_table_res = NULL; 309cd942e0fSPeter Grehan ppt->msix.msix_table_rid = 0; 310cd942e0fSPeter Grehan } 3110d1fd6e5SJohn Baldwin if (ppt->msix.msix_pba_res) { 3120d1fd6e5SJohn Baldwin bus_release_resource(ppt->dev, SYS_RES_MEMORY, 3130d1fd6e5SJohn Baldwin ppt->msix.msix_pba_rid, 3140d1fd6e5SJohn Baldwin ppt->msix.msix_pba_res); 3150d1fd6e5SJohn Baldwin ppt->msix.msix_pba_res = NULL; 3160d1fd6e5SJohn Baldwin ppt->msix.msix_pba_rid = 0; 3170d1fd6e5SJohn Baldwin } 318cd942e0fSPeter Grehan 319cd942e0fSPeter Grehan ppt->msix.num_msgs = 0; 320cd942e0fSPeter Grehan } 321cd942e0fSPeter Grehan 322366f6083SPeter Grehan int 32351f45d01SNeel Natu ppt_avail_devices(void) 32451f45d01SNeel Natu { 32551f45d01SNeel Natu 32651f45d01SNeel Natu return (num_pptdevs); 32751f45d01SNeel Natu } 32851f45d01SNeel Natu 32951f45d01SNeel Natu int 33051f45d01SNeel Natu ppt_assigned_devices(struct vm *vm) 331318224bbSNeel Natu { 332a15f820aSRyan Stone struct pptdev *ppt; 333a15f820aSRyan Stone int num; 334318224bbSNeel Natu 335318224bbSNeel Natu num = 0; 336a15f820aSRyan Stone TAILQ_FOREACH(ppt, &pptdev_list, next) { 337a15f820aSRyan Stone if (ppt->vm == vm) 338318224bbSNeel Natu num++; 339318224bbSNeel Natu } 340318224bbSNeel Natu return (num); 341318224bbSNeel Natu } 342318224bbSNeel Natu 343490d56c5SEd Maste bool 344318224bbSNeel Natu ppt_is_mmio(struct vm *vm, vm_paddr_t gpa) 345318224bbSNeel Natu { 346a15f820aSRyan Stone int i; 347318224bbSNeel Natu struct pptdev *ppt; 3489b1aa8d6SNeel Natu struct pptseg *seg; 349318224bbSNeel Natu 350a15f820aSRyan Stone TAILQ_FOREACH(ppt, &pptdev_list, next) { 351318224bbSNeel Natu if (ppt->vm != vm) 352318224bbSNeel Natu continue; 353318224bbSNeel Natu 354318224bbSNeel Natu for (i = 0; i < MAX_MMIOSEGS; i++) { 355318224bbSNeel Natu seg = &ppt->mmio[i]; 356318224bbSNeel Natu if (seg->len == 0) 357318224bbSNeel Natu continue; 358318224bbSNeel Natu if (gpa >= seg->gpa && gpa < seg->gpa + seg->len) 359490d56c5SEd Maste return (true); 360318224bbSNeel Natu } 361318224bbSNeel Natu } 362318224bbSNeel Natu 363490d56c5SEd Maste return (false); 364318224bbSNeel Natu } 365318224bbSNeel Natu 366adb947a6SPeter Grehan static void 367adb947a6SPeter Grehan ppt_pci_reset(device_t dev) 368adb947a6SPeter Grehan { 369adb947a6SPeter Grehan 370adb947a6SPeter Grehan if (pcie_flr(dev, 3715db2a4a8SKonstantin Belousov max(pcie_get_max_completion_timeout(dev) / 1000, 10), true)) 372adb947a6SPeter Grehan return; 373adb947a6SPeter Grehan 3745db2a4a8SKonstantin Belousov pci_power_reset(dev); 375adb947a6SPeter Grehan } 376adb947a6SPeter Grehan 377318224bbSNeel Natu int 378366f6083SPeter Grehan ppt_assign_device(struct vm *vm, int bus, int slot, int func) 379366f6083SPeter Grehan { 380366f6083SPeter Grehan struct pptdev *ppt; 381366f6083SPeter Grehan 382366f6083SPeter Grehan ppt = ppt_find(bus, slot, func); 383366f6083SPeter Grehan if (ppt != NULL) { 384366f6083SPeter Grehan /* 385366f6083SPeter Grehan * If this device is owned by a different VM then we 386366f6083SPeter Grehan * cannot change its owner. 387366f6083SPeter Grehan */ 388366f6083SPeter Grehan if (ppt->vm != NULL && ppt->vm != vm) 389366f6083SPeter Grehan return (EBUSY); 390366f6083SPeter Grehan 391da0fc925SJohn Baldwin pci_save_state(ppt->dev); 392adb947a6SPeter Grehan ppt_pci_reset(ppt->dev); 393da0fc925SJohn Baldwin pci_restore_state(ppt->dev); 394366f6083SPeter Grehan ppt->vm = vm; 395a8667250SRyan Stone iommu_add_device(vm_iommu_domain(vm), pci_get_rid(ppt->dev)); 396366f6083SPeter Grehan return (0); 397366f6083SPeter Grehan } 398366f6083SPeter Grehan return (ENOENT); 399366f6083SPeter Grehan } 400366f6083SPeter Grehan 401366f6083SPeter Grehan int 402366f6083SPeter Grehan ppt_unassign_device(struct vm *vm, int bus, int slot, int func) 403366f6083SPeter Grehan { 404366f6083SPeter Grehan struct pptdev *ppt; 405366f6083SPeter Grehan 406366f6083SPeter Grehan ppt = ppt_find(bus, slot, func); 407366f6083SPeter Grehan if (ppt != NULL) { 408366f6083SPeter Grehan /* 409366f6083SPeter Grehan * If this device is not owned by this 'vm' then bail out. 410366f6083SPeter Grehan */ 411366f6083SPeter Grehan if (ppt->vm != vm) 412366f6083SPeter Grehan return (EBUSY); 413da0fc925SJohn Baldwin 414da0fc925SJohn Baldwin pci_save_state(ppt->dev); 415adb947a6SPeter Grehan ppt_pci_reset(ppt->dev); 416da0fc925SJohn Baldwin pci_restore_state(ppt->dev); 417366f6083SPeter Grehan ppt_unmap_mmio(vm, ppt); 418366f6083SPeter Grehan ppt_teardown_msi(ppt); 419cd942e0fSPeter Grehan ppt_teardown_msix(ppt); 420a8667250SRyan Stone iommu_remove_device(vm_iommu_domain(vm), pci_get_rid(ppt->dev)); 421366f6083SPeter Grehan ppt->vm = NULL; 422366f6083SPeter Grehan return (0); 423366f6083SPeter Grehan } 424366f6083SPeter Grehan return (ENOENT); 425366f6083SPeter Grehan } 426366f6083SPeter Grehan 427366f6083SPeter Grehan int 428366f6083SPeter Grehan ppt_unassign_all(struct vm *vm) 429366f6083SPeter Grehan { 430a15f820aSRyan Stone struct pptdev *ppt; 431a15f820aSRyan Stone int bus, slot, func; 432366f6083SPeter Grehan device_t dev; 433366f6083SPeter Grehan 434a15f820aSRyan Stone TAILQ_FOREACH(ppt, &pptdev_list, next) { 435a15f820aSRyan Stone if (ppt->vm == vm) { 436a15f820aSRyan Stone dev = ppt->dev; 437366f6083SPeter Grehan bus = pci_get_bus(dev); 438366f6083SPeter Grehan slot = pci_get_slot(dev); 439366f6083SPeter Grehan func = pci_get_function(dev); 440318224bbSNeel Natu vm_unassign_pptdev(vm, bus, slot, func); 441366f6083SPeter Grehan } 442366f6083SPeter Grehan } 443366f6083SPeter Grehan 444366f6083SPeter Grehan return (0); 445366f6083SPeter Grehan } 446366f6083SPeter Grehan 447366f6083SPeter Grehan int 448366f6083SPeter Grehan ppt_map_mmio(struct vm *vm, int bus, int slot, int func, 449366f6083SPeter Grehan vm_paddr_t gpa, size_t len, vm_paddr_t hpa) 450366f6083SPeter Grehan { 451366f6083SPeter Grehan int i, error; 4529b1aa8d6SNeel Natu struct pptseg *seg; 453366f6083SPeter Grehan struct pptdev *ppt; 454366f6083SPeter Grehan 455366f6083SPeter Grehan ppt = ppt_find(bus, slot, func); 456366f6083SPeter Grehan if (ppt != NULL) { 457366f6083SPeter Grehan if (ppt->vm != vm) 458366f6083SPeter Grehan return (EBUSY); 459366f6083SPeter Grehan 460366f6083SPeter Grehan for (i = 0; i < MAX_MMIOSEGS; i++) { 461366f6083SPeter Grehan seg = &ppt->mmio[i]; 462366f6083SPeter Grehan if (seg->len == 0) { 463366f6083SPeter Grehan error = vm_map_mmio(vm, gpa, len, hpa); 464366f6083SPeter Grehan if (error == 0) { 465366f6083SPeter Grehan seg->gpa = gpa; 466366f6083SPeter Grehan seg->len = len; 467366f6083SPeter Grehan } 468366f6083SPeter Grehan return (error); 469366f6083SPeter Grehan } 470366f6083SPeter Grehan } 471366f6083SPeter Grehan return (ENOSPC); 472366f6083SPeter Grehan } 473366f6083SPeter Grehan return (ENOENT); 474366f6083SPeter Grehan } 475366f6083SPeter Grehan 476366f6083SPeter Grehan static int 477366f6083SPeter Grehan pptintr(void *arg) 478366f6083SPeter Grehan { 479366f6083SPeter Grehan struct pptdev *ppt; 480366f6083SPeter Grehan struct pptintr_arg *pptarg; 481366f6083SPeter Grehan 482366f6083SPeter Grehan pptarg = arg; 483366f6083SPeter Grehan ppt = pptarg->pptdev; 484366f6083SPeter Grehan 485366f6083SPeter Grehan if (ppt->vm != NULL) 4864f8be175SNeel Natu lapic_intr_msi(ppt->vm, pptarg->addr, pptarg->msg_data); 487366f6083SPeter Grehan else { 488366f6083SPeter Grehan /* 489366f6083SPeter Grehan * XXX 490366f6083SPeter Grehan * This is not expected to happen - panic? 491366f6083SPeter Grehan */ 492366f6083SPeter Grehan } 493366f6083SPeter Grehan 494366f6083SPeter Grehan /* 495366f6083SPeter Grehan * For legacy interrupts give other filters a chance in case 496366f6083SPeter Grehan * the interrupt was not generated by the passthrough device. 497366f6083SPeter Grehan */ 498366f6083SPeter Grehan if (ppt->msi.startrid == 0) 499366f6083SPeter Grehan return (FILTER_STRAY); 500366f6083SPeter Grehan else 501366f6083SPeter Grehan return (FILTER_HANDLED); 502366f6083SPeter Grehan } 503366f6083SPeter Grehan 504366f6083SPeter Grehan int 505366f6083SPeter Grehan ppt_setup_msi(struct vm *vm, int vcpu, int bus, int slot, int func, 5064f8be175SNeel Natu uint64_t addr, uint64_t msg, int numvec) 507366f6083SPeter Grehan { 508366f6083SPeter Grehan int i, rid, flags; 509366f6083SPeter Grehan int msi_count, startrid, error, tmp; 510366f6083SPeter Grehan struct pptdev *ppt; 511366f6083SPeter Grehan 5124f8be175SNeel Natu if (numvec < 0 || numvec > MAX_MSIMSGS) 513366f6083SPeter Grehan return (EINVAL); 514366f6083SPeter Grehan 515366f6083SPeter Grehan ppt = ppt_find(bus, slot, func); 516366f6083SPeter Grehan if (ppt == NULL) 517366f6083SPeter Grehan return (ENOENT); 518366f6083SPeter Grehan if (ppt->vm != vm) /* Make sure we own this device */ 519366f6083SPeter Grehan return (EBUSY); 520366f6083SPeter Grehan 521366f6083SPeter Grehan /* Free any allocated resources */ 522485b3300SNeel Natu ppt_teardown_msi(ppt); 523366f6083SPeter Grehan 524366f6083SPeter Grehan if (numvec == 0) /* nothing more to do */ 525366f6083SPeter Grehan return (0); 526366f6083SPeter Grehan 527366f6083SPeter Grehan flags = RF_ACTIVE; 528366f6083SPeter Grehan msi_count = pci_msi_count(ppt->dev); 529366f6083SPeter Grehan if (msi_count == 0) { 530366f6083SPeter Grehan startrid = 0; /* legacy interrupt */ 531366f6083SPeter Grehan msi_count = 1; 532366f6083SPeter Grehan flags |= RF_SHAREABLE; 533366f6083SPeter Grehan } else 534366f6083SPeter Grehan startrid = 1; /* MSI */ 535366f6083SPeter Grehan 536366f6083SPeter Grehan /* 537366f6083SPeter Grehan * The device must be capable of supporting the number of vectors 538366f6083SPeter Grehan * the guest wants to allocate. 539366f6083SPeter Grehan */ 540366f6083SPeter Grehan if (numvec > msi_count) 541366f6083SPeter Grehan return (EINVAL); 542366f6083SPeter Grehan 543366f6083SPeter Grehan /* 544366f6083SPeter Grehan * Make sure that we can allocate all the MSI vectors that are needed 545366f6083SPeter Grehan * by the guest. 546366f6083SPeter Grehan */ 547366f6083SPeter Grehan if (startrid == 1) { 548366f6083SPeter Grehan tmp = numvec; 549366f6083SPeter Grehan error = pci_alloc_msi(ppt->dev, &tmp); 550366f6083SPeter Grehan if (error) 551366f6083SPeter Grehan return (error); 552366f6083SPeter Grehan else if (tmp != numvec) { 553366f6083SPeter Grehan pci_release_msi(ppt->dev); 554366f6083SPeter Grehan return (ENOSPC); 555366f6083SPeter Grehan } else { 556366f6083SPeter Grehan /* success */ 557366f6083SPeter Grehan } 558366f6083SPeter Grehan } 559366f6083SPeter Grehan 560366f6083SPeter Grehan ppt->msi.startrid = startrid; 561366f6083SPeter Grehan 562366f6083SPeter Grehan /* 563366f6083SPeter Grehan * Allocate the irq resource and attach it to the interrupt handler. 564366f6083SPeter Grehan */ 565366f6083SPeter Grehan for (i = 0; i < numvec; i++) { 566366f6083SPeter Grehan ppt->msi.num_msgs = i + 1; 567366f6083SPeter Grehan ppt->msi.cookie[i] = NULL; 568366f6083SPeter Grehan 569366f6083SPeter Grehan rid = startrid + i; 570366f6083SPeter Grehan ppt->msi.res[i] = bus_alloc_resource_any(ppt->dev, SYS_RES_IRQ, 571366f6083SPeter Grehan &rid, flags); 572366f6083SPeter Grehan if (ppt->msi.res[i] == NULL) 573366f6083SPeter Grehan break; 574366f6083SPeter Grehan 575366f6083SPeter Grehan ppt->msi.arg[i].pptdev = ppt; 5764f8be175SNeel Natu ppt->msi.arg[i].addr = addr; 5774f8be175SNeel Natu ppt->msi.arg[i].msg_data = msg + i; 578366f6083SPeter Grehan 579366f6083SPeter Grehan error = bus_setup_intr(ppt->dev, ppt->msi.res[i], 58034a6b2d6SJohn Baldwin INTR_TYPE_NET | INTR_MPSAFE, 581366f6083SPeter Grehan pptintr, NULL, &ppt->msi.arg[i], 582366f6083SPeter Grehan &ppt->msi.cookie[i]); 583366f6083SPeter Grehan if (error != 0) 584366f6083SPeter Grehan break; 585366f6083SPeter Grehan } 586366f6083SPeter Grehan 587366f6083SPeter Grehan if (i < numvec) { 588485b3300SNeel Natu ppt_teardown_msi(ppt); 589366f6083SPeter Grehan return (ENXIO); 590366f6083SPeter Grehan } 591366f6083SPeter Grehan 592366f6083SPeter Grehan return (0); 593366f6083SPeter Grehan } 594cd942e0fSPeter Grehan 595cd942e0fSPeter Grehan int 596cd942e0fSPeter Grehan ppt_setup_msix(struct vm *vm, int vcpu, int bus, int slot, int func, 5974f8be175SNeel Natu int idx, uint64_t addr, uint64_t msg, uint32_t vector_control) 598cd942e0fSPeter Grehan { 599cd942e0fSPeter Grehan struct pptdev *ppt; 600cd942e0fSPeter Grehan struct pci_devinfo *dinfo; 601920bc340SNeel Natu int numvec, alloced, rid, error; 602cd942e0fSPeter Grehan size_t res_size, cookie_size, arg_size; 603cd942e0fSPeter Grehan 604cd942e0fSPeter Grehan ppt = ppt_find(bus, slot, func); 605cd942e0fSPeter Grehan if (ppt == NULL) 606cd942e0fSPeter Grehan return (ENOENT); 607cd942e0fSPeter Grehan if (ppt->vm != vm) /* Make sure we own this device */ 608cd942e0fSPeter Grehan return (EBUSY); 609cd942e0fSPeter Grehan 610cd942e0fSPeter Grehan dinfo = device_get_ivars(ppt->dev); 611cd942e0fSPeter Grehan if (!dinfo) 612cd942e0fSPeter Grehan return (ENXIO); 613cd942e0fSPeter Grehan 614cd942e0fSPeter Grehan /* 615cd942e0fSPeter Grehan * First-time configuration: 616cd942e0fSPeter Grehan * Allocate the MSI-X table 617cd942e0fSPeter Grehan * Allocate the IRQ resources 618cd942e0fSPeter Grehan * Set up some variables in ppt->msix 619cd942e0fSPeter Grehan */ 620920bc340SNeel Natu if (ppt->msix.num_msgs == 0) { 621920bc340SNeel Natu numvec = pci_msix_count(ppt->dev); 622920bc340SNeel Natu if (numvec <= 0) 623920bc340SNeel Natu return (EINVAL); 624cd942e0fSPeter Grehan 625cd942e0fSPeter Grehan ppt->msix.startrid = 1; 626920bc340SNeel Natu ppt->msix.num_msgs = numvec; 627cd942e0fSPeter Grehan 628cd942e0fSPeter Grehan res_size = numvec * sizeof(ppt->msix.res[0]); 629cd942e0fSPeter Grehan cookie_size = numvec * sizeof(ppt->msix.cookie[0]); 630cd942e0fSPeter Grehan arg_size = numvec * sizeof(ppt->msix.arg[0]); 631cd942e0fSPeter Grehan 632920bc340SNeel Natu ppt->msix.res = malloc(res_size, M_PPTMSIX, M_WAITOK | M_ZERO); 633920bc340SNeel Natu ppt->msix.cookie = malloc(cookie_size, M_PPTMSIX, 634920bc340SNeel Natu M_WAITOK | M_ZERO); 635920bc340SNeel Natu ppt->msix.arg = malloc(arg_size, M_PPTMSIX, M_WAITOK | M_ZERO); 636920bc340SNeel Natu 637920bc340SNeel Natu rid = dinfo->cfg.msix.msix_table_bar; 638920bc340SNeel Natu ppt->msix.msix_table_res = bus_alloc_resource_any(ppt->dev, 639920bc340SNeel Natu SYS_RES_MEMORY, &rid, RF_ACTIVE); 640920bc340SNeel Natu 641920bc340SNeel Natu if (ppt->msix.msix_table_res == NULL) { 642cd942e0fSPeter Grehan ppt_teardown_msix(ppt); 643cd942e0fSPeter Grehan return (ENOSPC); 644cd942e0fSPeter Grehan } 645920bc340SNeel Natu ppt->msix.msix_table_rid = rid; 646920bc340SNeel Natu 6470d1fd6e5SJohn Baldwin if (dinfo->cfg.msix.msix_table_bar != 6480d1fd6e5SJohn Baldwin dinfo->cfg.msix.msix_pba_bar) { 6490d1fd6e5SJohn Baldwin rid = dinfo->cfg.msix.msix_pba_bar; 6500d1fd6e5SJohn Baldwin ppt->msix.msix_pba_res = bus_alloc_resource_any( 6510d1fd6e5SJohn Baldwin ppt->dev, SYS_RES_MEMORY, &rid, RF_ACTIVE); 6520d1fd6e5SJohn Baldwin 6530d1fd6e5SJohn Baldwin if (ppt->msix.msix_pba_res == NULL) { 6540d1fd6e5SJohn Baldwin ppt_teardown_msix(ppt); 6550d1fd6e5SJohn Baldwin return (ENOSPC); 6560d1fd6e5SJohn Baldwin } 6570d1fd6e5SJohn Baldwin ppt->msix.msix_pba_rid = rid; 6580d1fd6e5SJohn Baldwin } 6590d1fd6e5SJohn Baldwin 660920bc340SNeel Natu alloced = numvec; 661920bc340SNeel Natu error = pci_alloc_msix(ppt->dev, &alloced); 662920bc340SNeel Natu if (error || alloced != numvec) { 663920bc340SNeel Natu ppt_teardown_msix(ppt); 664920bc340SNeel Natu return (error == 0 ? ENOSPC: error); 665920bc340SNeel Natu } 666cd942e0fSPeter Grehan } 667cd942e0fSPeter Grehan 668cd942e0fSPeter Grehan if ((vector_control & PCIM_MSIX_VCTRL_MASK) == 0) { 669cd942e0fSPeter Grehan /* Tear down the IRQ if it's already set up */ 670cd942e0fSPeter Grehan ppt_teardown_msix_intr(ppt, idx); 671cd942e0fSPeter Grehan 672cd942e0fSPeter Grehan /* Allocate the IRQ resource */ 673cd942e0fSPeter Grehan ppt->msix.cookie[idx] = NULL; 674cd942e0fSPeter Grehan rid = ppt->msix.startrid + idx; 675cd942e0fSPeter Grehan ppt->msix.res[idx] = bus_alloc_resource_any(ppt->dev, SYS_RES_IRQ, 676cd942e0fSPeter Grehan &rid, RF_ACTIVE); 677cd942e0fSPeter Grehan if (ppt->msix.res[idx] == NULL) 678cd942e0fSPeter Grehan return (ENXIO); 679cd942e0fSPeter Grehan 680cd942e0fSPeter Grehan ppt->msix.arg[idx].pptdev = ppt; 6814f8be175SNeel Natu ppt->msix.arg[idx].addr = addr; 6824f8be175SNeel Natu ppt->msix.arg[idx].msg_data = msg; 683cd942e0fSPeter Grehan 684cd942e0fSPeter Grehan /* Setup the MSI-X interrupt */ 685cd942e0fSPeter Grehan error = bus_setup_intr(ppt->dev, ppt->msix.res[idx], 686cd942e0fSPeter Grehan INTR_TYPE_NET | INTR_MPSAFE, 687cd942e0fSPeter Grehan pptintr, NULL, &ppt->msix.arg[idx], 688cd942e0fSPeter Grehan &ppt->msix.cookie[idx]); 689cd942e0fSPeter Grehan 690cd942e0fSPeter Grehan if (error != 0) { 691cd942e0fSPeter Grehan bus_release_resource(ppt->dev, SYS_RES_IRQ, rid, ppt->msix.res[idx]); 692cd942e0fSPeter Grehan ppt->msix.cookie[idx] = NULL; 693cd942e0fSPeter Grehan ppt->msix.res[idx] = NULL; 694cd942e0fSPeter Grehan return (ENXIO); 695cd942e0fSPeter Grehan } 696cd942e0fSPeter Grehan } else { 697cd942e0fSPeter Grehan /* Masked, tear it down if it's already been set up */ 698cd942e0fSPeter Grehan ppt_teardown_msix_intr(ppt, idx); 699cd942e0fSPeter Grehan } 700cd942e0fSPeter Grehan 701cd942e0fSPeter Grehan return (0); 702cd942e0fSPeter Grehan } 703