1d1b054daSYu Zhao /* 2d1b054daSYu Zhao * drivers/pci/iov.c 3d1b054daSYu Zhao * 4d1b054daSYu Zhao * Copyright (C) 2009 Intel Corporation, Yu Zhao <yu.zhao@intel.com> 5d1b054daSYu Zhao * 6d1b054daSYu Zhao * PCI Express I/O Virtualization (IOV) support. 7d1b054daSYu Zhao * Single Root IOV 1.0 8302b4215SYu Zhao * Address Translation Service 1.0 9d1b054daSYu Zhao */ 10d1b054daSYu Zhao 11d1b054daSYu Zhao #include <linux/pci.h> 125a0e3ad6STejun Heo #include <linux/slab.h> 13d1b054daSYu Zhao #include <linux/mutex.h> 14363c75dbSPaul Gortmaker #include <linux/export.h> 15d1b054daSYu Zhao #include <linux/string.h> 16d1b054daSYu Zhao #include <linux/delay.h> 175cdede24SJoerg Roedel #include <linux/pci-ats.h> 18d1b054daSYu Zhao #include "pci.h" 19d1b054daSYu Zhao 20dd7cc44dSYu Zhao #define VIRTFN_ID_LEN 16 21d1b054daSYu Zhao 22a28724b0SYu Zhao static inline u8 virtfn_bus(struct pci_dev *dev, int id) 23a28724b0SYu Zhao { 24a28724b0SYu Zhao return dev->bus->number + ((dev->devfn + dev->sriov->offset + 25a28724b0SYu Zhao dev->sriov->stride * id) >> 8); 26a28724b0SYu Zhao } 27a28724b0SYu Zhao 28a28724b0SYu Zhao static inline u8 virtfn_devfn(struct pci_dev *dev, int id) 29a28724b0SYu Zhao { 30a28724b0SYu Zhao return (dev->devfn + dev->sriov->offset + 31a28724b0SYu Zhao dev->sriov->stride * id) & 0xff; 32a28724b0SYu Zhao } 33a28724b0SYu Zhao 34dd7cc44dSYu Zhao static struct pci_bus *virtfn_add_bus(struct pci_bus *bus, int busnr) 35dd7cc44dSYu Zhao { 36dd7cc44dSYu Zhao int rc; 37dd7cc44dSYu Zhao struct pci_bus *child; 38dd7cc44dSYu Zhao 39dd7cc44dSYu Zhao if (bus->number == busnr) 40dd7cc44dSYu Zhao return bus; 41dd7cc44dSYu Zhao 42dd7cc44dSYu Zhao child = pci_find_bus(pci_domain_nr(bus), busnr); 43dd7cc44dSYu Zhao if (child) 44dd7cc44dSYu Zhao return child; 45dd7cc44dSYu Zhao 46dd7cc44dSYu Zhao child = pci_add_new_bus(bus, NULL, busnr); 47dd7cc44dSYu Zhao if (!child) 48dd7cc44dSYu Zhao return NULL; 49dd7cc44dSYu Zhao 50dd7cc44dSYu Zhao child->subordinate = busnr; 51dd7cc44dSYu Zhao child->dev.parent = bus->bridge; 52dd7cc44dSYu Zhao rc = pci_bus_add_child(child); 53dd7cc44dSYu Zhao if (rc) { 54dd7cc44dSYu Zhao pci_remove_bus(child); 55dd7cc44dSYu Zhao return NULL; 56dd7cc44dSYu Zhao } 57dd7cc44dSYu Zhao 58dd7cc44dSYu Zhao return child; 59dd7cc44dSYu Zhao } 60dd7cc44dSYu Zhao 61dd7cc44dSYu Zhao static void virtfn_remove_bus(struct pci_bus *bus, int busnr) 62dd7cc44dSYu Zhao { 63dd7cc44dSYu Zhao struct pci_bus *child; 64dd7cc44dSYu Zhao 65dd7cc44dSYu Zhao if (bus->number == busnr) 66dd7cc44dSYu Zhao return; 67dd7cc44dSYu Zhao 68dd7cc44dSYu Zhao child = pci_find_bus(pci_domain_nr(bus), busnr); 69dd7cc44dSYu Zhao BUG_ON(!child); 70dd7cc44dSYu Zhao 71dd7cc44dSYu Zhao if (list_empty(&child->devices)) 72dd7cc44dSYu Zhao pci_remove_bus(child); 73dd7cc44dSYu Zhao } 74dd7cc44dSYu Zhao 75dd7cc44dSYu Zhao static int virtfn_add(struct pci_dev *dev, int id, int reset) 76dd7cc44dSYu Zhao { 77dd7cc44dSYu Zhao int i; 78dd7cc44dSYu Zhao int rc; 79dd7cc44dSYu Zhao u64 size; 80dd7cc44dSYu Zhao char buf[VIRTFN_ID_LEN]; 81dd7cc44dSYu Zhao struct pci_dev *virtfn; 82dd7cc44dSYu Zhao struct resource *res; 83dd7cc44dSYu Zhao struct pci_sriov *iov = dev->sriov; 84dd7cc44dSYu Zhao 85dd7cc44dSYu Zhao virtfn = alloc_pci_dev(); 86dd7cc44dSYu Zhao if (!virtfn) 87dd7cc44dSYu Zhao return -ENOMEM; 88dd7cc44dSYu Zhao 89dd7cc44dSYu Zhao mutex_lock(&iov->dev->sriov->lock); 90dd7cc44dSYu Zhao virtfn->bus = virtfn_add_bus(dev->bus, virtfn_bus(dev, id)); 91dd7cc44dSYu Zhao if (!virtfn->bus) { 92dd7cc44dSYu Zhao kfree(virtfn); 93dd7cc44dSYu Zhao mutex_unlock(&iov->dev->sriov->lock); 94dd7cc44dSYu Zhao return -ENOMEM; 95dd7cc44dSYu Zhao } 96dd7cc44dSYu Zhao virtfn->devfn = virtfn_devfn(dev, id); 97dd7cc44dSYu Zhao virtfn->vendor = dev->vendor; 98dd7cc44dSYu Zhao pci_read_config_word(dev, iov->pos + PCI_SRIOV_VF_DID, &virtfn->device); 99dd7cc44dSYu Zhao pci_setup_device(virtfn); 100dd7cc44dSYu Zhao virtfn->dev.parent = dev->dev.parent; 101dd7cc44dSYu Zhao 102dd7cc44dSYu Zhao for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) { 103dd7cc44dSYu Zhao res = dev->resource + PCI_IOV_RESOURCES + i; 104dd7cc44dSYu Zhao if (!res->parent) 105dd7cc44dSYu Zhao continue; 106dd7cc44dSYu Zhao virtfn->resource[i].name = pci_name(virtfn); 107dd7cc44dSYu Zhao virtfn->resource[i].flags = res->flags; 108dd7cc44dSYu Zhao size = resource_size(res); 109dd7cc44dSYu Zhao do_div(size, iov->total); 110dd7cc44dSYu Zhao virtfn->resource[i].start = res->start + size * id; 111dd7cc44dSYu Zhao virtfn->resource[i].end = virtfn->resource[i].start + size - 1; 112dd7cc44dSYu Zhao rc = request_resource(res, &virtfn->resource[i]); 113dd7cc44dSYu Zhao BUG_ON(rc); 114dd7cc44dSYu Zhao } 115dd7cc44dSYu Zhao 116dd7cc44dSYu Zhao if (reset) 1178c1c699fSYu Zhao __pci_reset_function(virtfn); 118dd7cc44dSYu Zhao 119dd7cc44dSYu Zhao pci_device_add(virtfn, virtfn->bus); 120dd7cc44dSYu Zhao mutex_unlock(&iov->dev->sriov->lock); 121dd7cc44dSYu Zhao 122dd7cc44dSYu Zhao virtfn->physfn = pci_dev_get(dev); 123dd7cc44dSYu Zhao virtfn->is_virtfn = 1; 124dd7cc44dSYu Zhao 125dd7cc44dSYu Zhao rc = pci_bus_add_device(virtfn); 126dd7cc44dSYu Zhao if (rc) 127dd7cc44dSYu Zhao goto failed1; 128dd7cc44dSYu Zhao sprintf(buf, "virtfn%u", id); 129dd7cc44dSYu Zhao rc = sysfs_create_link(&dev->dev.kobj, &virtfn->dev.kobj, buf); 130dd7cc44dSYu Zhao if (rc) 131dd7cc44dSYu Zhao goto failed1; 132dd7cc44dSYu Zhao rc = sysfs_create_link(&virtfn->dev.kobj, &dev->dev.kobj, "physfn"); 133dd7cc44dSYu Zhao if (rc) 134dd7cc44dSYu Zhao goto failed2; 135dd7cc44dSYu Zhao 136dd7cc44dSYu Zhao kobject_uevent(&virtfn->dev.kobj, KOBJ_CHANGE); 137dd7cc44dSYu Zhao 138dd7cc44dSYu Zhao return 0; 139dd7cc44dSYu Zhao 140dd7cc44dSYu Zhao failed2: 141dd7cc44dSYu Zhao sysfs_remove_link(&dev->dev.kobj, buf); 142dd7cc44dSYu Zhao failed1: 143dd7cc44dSYu Zhao pci_dev_put(dev); 144dd7cc44dSYu Zhao mutex_lock(&iov->dev->sriov->lock); 145*210647afSYinghai Lu pci_stop_and_remove_bus_device(virtfn); 146dd7cc44dSYu Zhao virtfn_remove_bus(dev->bus, virtfn_bus(dev, id)); 147dd7cc44dSYu Zhao mutex_unlock(&iov->dev->sriov->lock); 148dd7cc44dSYu Zhao 149dd7cc44dSYu Zhao return rc; 150dd7cc44dSYu Zhao } 151dd7cc44dSYu Zhao 152dd7cc44dSYu Zhao static void virtfn_remove(struct pci_dev *dev, int id, int reset) 153dd7cc44dSYu Zhao { 154dd7cc44dSYu Zhao char buf[VIRTFN_ID_LEN]; 155dd7cc44dSYu Zhao struct pci_bus *bus; 156dd7cc44dSYu Zhao struct pci_dev *virtfn; 157dd7cc44dSYu Zhao struct pci_sriov *iov = dev->sriov; 158dd7cc44dSYu Zhao 159dd7cc44dSYu Zhao bus = pci_find_bus(pci_domain_nr(dev->bus), virtfn_bus(dev, id)); 160dd7cc44dSYu Zhao if (!bus) 161dd7cc44dSYu Zhao return; 162dd7cc44dSYu Zhao 163dd7cc44dSYu Zhao virtfn = pci_get_slot(bus, virtfn_devfn(dev, id)); 164dd7cc44dSYu Zhao if (!virtfn) 165dd7cc44dSYu Zhao return; 166dd7cc44dSYu Zhao 167dd7cc44dSYu Zhao pci_dev_put(virtfn); 168dd7cc44dSYu Zhao 169dd7cc44dSYu Zhao if (reset) { 170dd7cc44dSYu Zhao device_release_driver(&virtfn->dev); 1718c1c699fSYu Zhao __pci_reset_function(virtfn); 172dd7cc44dSYu Zhao } 173dd7cc44dSYu Zhao 174dd7cc44dSYu Zhao sprintf(buf, "virtfn%u", id); 175dd7cc44dSYu Zhao sysfs_remove_link(&dev->dev.kobj, buf); 17609cedbefSYinghai Lu /* 17709cedbefSYinghai Lu * pci_stop_dev() could have been called for this virtfn already, 17809cedbefSYinghai Lu * so the directory for the virtfn may have been removed before. 17909cedbefSYinghai Lu * Double check to avoid spurious sysfs warnings. 18009cedbefSYinghai Lu */ 18109cedbefSYinghai Lu if (virtfn->dev.kobj.sd) 182dd7cc44dSYu Zhao sysfs_remove_link(&virtfn->dev.kobj, "physfn"); 183dd7cc44dSYu Zhao 184dd7cc44dSYu Zhao mutex_lock(&iov->dev->sriov->lock); 185*210647afSYinghai Lu pci_stop_and_remove_bus_device(virtfn); 186dd7cc44dSYu Zhao virtfn_remove_bus(dev->bus, virtfn_bus(dev, id)); 187dd7cc44dSYu Zhao mutex_unlock(&iov->dev->sriov->lock); 188dd7cc44dSYu Zhao 189dd7cc44dSYu Zhao pci_dev_put(dev); 190dd7cc44dSYu Zhao } 191dd7cc44dSYu Zhao 19274bb1bccSYu Zhao static int sriov_migration(struct pci_dev *dev) 19374bb1bccSYu Zhao { 19474bb1bccSYu Zhao u16 status; 19574bb1bccSYu Zhao struct pci_sriov *iov = dev->sriov; 19674bb1bccSYu Zhao 19774bb1bccSYu Zhao if (!iov->nr_virtfn) 19874bb1bccSYu Zhao return 0; 19974bb1bccSYu Zhao 20074bb1bccSYu Zhao if (!(iov->cap & PCI_SRIOV_CAP_VFM)) 20174bb1bccSYu Zhao return 0; 20274bb1bccSYu Zhao 20374bb1bccSYu Zhao pci_read_config_word(dev, iov->pos + PCI_SRIOV_STATUS, &status); 20474bb1bccSYu Zhao if (!(status & PCI_SRIOV_STATUS_VFM)) 20574bb1bccSYu Zhao return 0; 20674bb1bccSYu Zhao 20774bb1bccSYu Zhao schedule_work(&iov->mtask); 20874bb1bccSYu Zhao 20974bb1bccSYu Zhao return 1; 21074bb1bccSYu Zhao } 21174bb1bccSYu Zhao 21274bb1bccSYu Zhao static void sriov_migration_task(struct work_struct *work) 21374bb1bccSYu Zhao { 21474bb1bccSYu Zhao int i; 21574bb1bccSYu Zhao u8 state; 21674bb1bccSYu Zhao u16 status; 21774bb1bccSYu Zhao struct pci_sriov *iov = container_of(work, struct pci_sriov, mtask); 21874bb1bccSYu Zhao 21974bb1bccSYu Zhao for (i = iov->initial; i < iov->nr_virtfn; i++) { 22074bb1bccSYu Zhao state = readb(iov->mstate + i); 22174bb1bccSYu Zhao if (state == PCI_SRIOV_VFM_MI) { 22274bb1bccSYu Zhao writeb(PCI_SRIOV_VFM_AV, iov->mstate + i); 22374bb1bccSYu Zhao state = readb(iov->mstate + i); 22474bb1bccSYu Zhao if (state == PCI_SRIOV_VFM_AV) 22574bb1bccSYu Zhao virtfn_add(iov->self, i, 1); 22674bb1bccSYu Zhao } else if (state == PCI_SRIOV_VFM_MO) { 22774bb1bccSYu Zhao virtfn_remove(iov->self, i, 1); 22874bb1bccSYu Zhao writeb(PCI_SRIOV_VFM_UA, iov->mstate + i); 22974bb1bccSYu Zhao state = readb(iov->mstate + i); 23074bb1bccSYu Zhao if (state == PCI_SRIOV_VFM_AV) 23174bb1bccSYu Zhao virtfn_add(iov->self, i, 0); 23274bb1bccSYu Zhao } 23374bb1bccSYu Zhao } 23474bb1bccSYu Zhao 23574bb1bccSYu Zhao pci_read_config_word(iov->self, iov->pos + PCI_SRIOV_STATUS, &status); 23674bb1bccSYu Zhao status &= ~PCI_SRIOV_STATUS_VFM; 23774bb1bccSYu Zhao pci_write_config_word(iov->self, iov->pos + PCI_SRIOV_STATUS, status); 23874bb1bccSYu Zhao } 23974bb1bccSYu Zhao 24074bb1bccSYu Zhao static int sriov_enable_migration(struct pci_dev *dev, int nr_virtfn) 24174bb1bccSYu Zhao { 24274bb1bccSYu Zhao int bir; 24374bb1bccSYu Zhao u32 table; 24474bb1bccSYu Zhao resource_size_t pa; 24574bb1bccSYu Zhao struct pci_sriov *iov = dev->sriov; 24674bb1bccSYu Zhao 24774bb1bccSYu Zhao if (nr_virtfn <= iov->initial) 24874bb1bccSYu Zhao return 0; 24974bb1bccSYu Zhao 25074bb1bccSYu Zhao pci_read_config_dword(dev, iov->pos + PCI_SRIOV_VFM, &table); 25174bb1bccSYu Zhao bir = PCI_SRIOV_VFM_BIR(table); 25274bb1bccSYu Zhao if (bir > PCI_STD_RESOURCE_END) 25374bb1bccSYu Zhao return -EIO; 25474bb1bccSYu Zhao 25574bb1bccSYu Zhao table = PCI_SRIOV_VFM_OFFSET(table); 25674bb1bccSYu Zhao if (table + nr_virtfn > pci_resource_len(dev, bir)) 25774bb1bccSYu Zhao return -EIO; 25874bb1bccSYu Zhao 25974bb1bccSYu Zhao pa = pci_resource_start(dev, bir) + table; 26074bb1bccSYu Zhao iov->mstate = ioremap(pa, nr_virtfn); 26174bb1bccSYu Zhao if (!iov->mstate) 26274bb1bccSYu Zhao return -ENOMEM; 26374bb1bccSYu Zhao 26474bb1bccSYu Zhao INIT_WORK(&iov->mtask, sriov_migration_task); 26574bb1bccSYu Zhao 26674bb1bccSYu Zhao iov->ctrl |= PCI_SRIOV_CTRL_VFM | PCI_SRIOV_CTRL_INTR; 26774bb1bccSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl); 26874bb1bccSYu Zhao 26974bb1bccSYu Zhao return 0; 27074bb1bccSYu Zhao } 27174bb1bccSYu Zhao 27274bb1bccSYu Zhao static void sriov_disable_migration(struct pci_dev *dev) 27374bb1bccSYu Zhao { 27474bb1bccSYu Zhao struct pci_sriov *iov = dev->sriov; 27574bb1bccSYu Zhao 27674bb1bccSYu Zhao iov->ctrl &= ~(PCI_SRIOV_CTRL_VFM | PCI_SRIOV_CTRL_INTR); 27774bb1bccSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl); 27874bb1bccSYu Zhao 27974bb1bccSYu Zhao cancel_work_sync(&iov->mtask); 28074bb1bccSYu Zhao iounmap(iov->mstate); 28174bb1bccSYu Zhao } 28274bb1bccSYu Zhao 283dd7cc44dSYu Zhao static int sriov_enable(struct pci_dev *dev, int nr_virtfn) 284dd7cc44dSYu Zhao { 285dd7cc44dSYu Zhao int rc; 286dd7cc44dSYu Zhao int i, j; 287dd7cc44dSYu Zhao int nres; 288dd7cc44dSYu Zhao u16 offset, stride, initial; 289dd7cc44dSYu Zhao struct resource *res; 290dd7cc44dSYu Zhao struct pci_dev *pdev; 291dd7cc44dSYu Zhao struct pci_sriov *iov = dev->sriov; 292bbef98abSRam Pai int bars = 0; 293dd7cc44dSYu Zhao 294dd7cc44dSYu Zhao if (!nr_virtfn) 295dd7cc44dSYu Zhao return 0; 296dd7cc44dSYu Zhao 297dd7cc44dSYu Zhao if (iov->nr_virtfn) 298dd7cc44dSYu Zhao return -EINVAL; 299dd7cc44dSYu Zhao 300dd7cc44dSYu Zhao pci_read_config_word(dev, iov->pos + PCI_SRIOV_INITIAL_VF, &initial); 301dd7cc44dSYu Zhao if (initial > iov->total || 302dd7cc44dSYu Zhao (!(iov->cap & PCI_SRIOV_CAP_VFM) && (initial != iov->total))) 303dd7cc44dSYu Zhao return -EIO; 304dd7cc44dSYu Zhao 305dd7cc44dSYu Zhao if (nr_virtfn < 0 || nr_virtfn > iov->total || 306dd7cc44dSYu Zhao (!(iov->cap & PCI_SRIOV_CAP_VFM) && (nr_virtfn > initial))) 307dd7cc44dSYu Zhao return -EINVAL; 308dd7cc44dSYu Zhao 309dd7cc44dSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_NUM_VF, nr_virtfn); 310dd7cc44dSYu Zhao pci_read_config_word(dev, iov->pos + PCI_SRIOV_VF_OFFSET, &offset); 311dd7cc44dSYu Zhao pci_read_config_word(dev, iov->pos + PCI_SRIOV_VF_STRIDE, &stride); 312dd7cc44dSYu Zhao if (!offset || (nr_virtfn > 1 && !stride)) 313dd7cc44dSYu Zhao return -EIO; 314dd7cc44dSYu Zhao 315dd7cc44dSYu Zhao nres = 0; 316dd7cc44dSYu Zhao for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) { 317bbef98abSRam Pai bars |= (1 << (i + PCI_IOV_RESOURCES)); 318dd7cc44dSYu Zhao res = dev->resource + PCI_IOV_RESOURCES + i; 319dd7cc44dSYu Zhao if (res->parent) 320dd7cc44dSYu Zhao nres++; 321dd7cc44dSYu Zhao } 322dd7cc44dSYu Zhao if (nres != iov->nres) { 323dd7cc44dSYu Zhao dev_err(&dev->dev, "not enough MMIO resources for SR-IOV\n"); 324dd7cc44dSYu Zhao return -ENOMEM; 325dd7cc44dSYu Zhao } 326dd7cc44dSYu Zhao 327dd7cc44dSYu Zhao iov->offset = offset; 328dd7cc44dSYu Zhao iov->stride = stride; 329dd7cc44dSYu Zhao 330dd7cc44dSYu Zhao if (virtfn_bus(dev, nr_virtfn - 1) > dev->bus->subordinate) { 331dd7cc44dSYu Zhao dev_err(&dev->dev, "SR-IOV: bus number out of range\n"); 332dd7cc44dSYu Zhao return -ENOMEM; 333dd7cc44dSYu Zhao } 334dd7cc44dSYu Zhao 335bbef98abSRam Pai if (pci_enable_resources(dev, bars)) { 336bbef98abSRam Pai dev_err(&dev->dev, "SR-IOV: IOV BARS not allocated\n"); 337bbef98abSRam Pai return -ENOMEM; 338bbef98abSRam Pai } 339bbef98abSRam Pai 340dd7cc44dSYu Zhao if (iov->link != dev->devfn) { 341dd7cc44dSYu Zhao pdev = pci_get_slot(dev->bus, iov->link); 342dd7cc44dSYu Zhao if (!pdev) 343dd7cc44dSYu Zhao return -ENODEV; 344dd7cc44dSYu Zhao 345dd7cc44dSYu Zhao pci_dev_put(pdev); 346dd7cc44dSYu Zhao 347dd7cc44dSYu Zhao if (!pdev->is_physfn) 348dd7cc44dSYu Zhao return -ENODEV; 349dd7cc44dSYu Zhao 350dd7cc44dSYu Zhao rc = sysfs_create_link(&dev->dev.kobj, 351dd7cc44dSYu Zhao &pdev->dev.kobj, "dep_link"); 352dd7cc44dSYu Zhao if (rc) 353dd7cc44dSYu Zhao return rc; 354dd7cc44dSYu Zhao } 355dd7cc44dSYu Zhao 356dd7cc44dSYu Zhao iov->ctrl |= PCI_SRIOV_CTRL_VFE | PCI_SRIOV_CTRL_MSE; 357fb51ccbfSJan Kiszka pci_cfg_access_lock(dev); 358dd7cc44dSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl); 359dd7cc44dSYu Zhao msleep(100); 360fb51ccbfSJan Kiszka pci_cfg_access_unlock(dev); 361dd7cc44dSYu Zhao 362dd7cc44dSYu Zhao iov->initial = initial; 363dd7cc44dSYu Zhao if (nr_virtfn < initial) 364dd7cc44dSYu Zhao initial = nr_virtfn; 365dd7cc44dSYu Zhao 366dd7cc44dSYu Zhao for (i = 0; i < initial; i++) { 367dd7cc44dSYu Zhao rc = virtfn_add(dev, i, 0); 368dd7cc44dSYu Zhao if (rc) 369dd7cc44dSYu Zhao goto failed; 370dd7cc44dSYu Zhao } 371dd7cc44dSYu Zhao 37274bb1bccSYu Zhao if (iov->cap & PCI_SRIOV_CAP_VFM) { 37374bb1bccSYu Zhao rc = sriov_enable_migration(dev, nr_virtfn); 37474bb1bccSYu Zhao if (rc) 37574bb1bccSYu Zhao goto failed; 37674bb1bccSYu Zhao } 37774bb1bccSYu Zhao 378dd7cc44dSYu Zhao kobject_uevent(&dev->dev.kobj, KOBJ_CHANGE); 379dd7cc44dSYu Zhao iov->nr_virtfn = nr_virtfn; 380dd7cc44dSYu Zhao 381dd7cc44dSYu Zhao return 0; 382dd7cc44dSYu Zhao 383dd7cc44dSYu Zhao failed: 384dd7cc44dSYu Zhao for (j = 0; j < i; j++) 385dd7cc44dSYu Zhao virtfn_remove(dev, j, 0); 386dd7cc44dSYu Zhao 387dd7cc44dSYu Zhao iov->ctrl &= ~(PCI_SRIOV_CTRL_VFE | PCI_SRIOV_CTRL_MSE); 388fb51ccbfSJan Kiszka pci_cfg_access_lock(dev); 389dd7cc44dSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl); 390dd7cc44dSYu Zhao ssleep(1); 391fb51ccbfSJan Kiszka pci_cfg_access_unlock(dev); 392dd7cc44dSYu Zhao 393dd7cc44dSYu Zhao if (iov->link != dev->devfn) 394dd7cc44dSYu Zhao sysfs_remove_link(&dev->dev.kobj, "dep_link"); 395dd7cc44dSYu Zhao 396dd7cc44dSYu Zhao return rc; 397dd7cc44dSYu Zhao } 398dd7cc44dSYu Zhao 399dd7cc44dSYu Zhao static void sriov_disable(struct pci_dev *dev) 400dd7cc44dSYu Zhao { 401dd7cc44dSYu Zhao int i; 402dd7cc44dSYu Zhao struct pci_sriov *iov = dev->sriov; 403dd7cc44dSYu Zhao 404dd7cc44dSYu Zhao if (!iov->nr_virtfn) 405dd7cc44dSYu Zhao return; 406dd7cc44dSYu Zhao 40774bb1bccSYu Zhao if (iov->cap & PCI_SRIOV_CAP_VFM) 40874bb1bccSYu Zhao sriov_disable_migration(dev); 40974bb1bccSYu Zhao 410dd7cc44dSYu Zhao for (i = 0; i < iov->nr_virtfn; i++) 411dd7cc44dSYu Zhao virtfn_remove(dev, i, 0); 412dd7cc44dSYu Zhao 413dd7cc44dSYu Zhao iov->ctrl &= ~(PCI_SRIOV_CTRL_VFE | PCI_SRIOV_CTRL_MSE); 414fb51ccbfSJan Kiszka pci_cfg_access_lock(dev); 415dd7cc44dSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl); 416dd7cc44dSYu Zhao ssleep(1); 417fb51ccbfSJan Kiszka pci_cfg_access_unlock(dev); 418dd7cc44dSYu Zhao 419dd7cc44dSYu Zhao if (iov->link != dev->devfn) 420dd7cc44dSYu Zhao sysfs_remove_link(&dev->dev.kobj, "dep_link"); 421dd7cc44dSYu Zhao 422dd7cc44dSYu Zhao iov->nr_virtfn = 0; 423dd7cc44dSYu Zhao } 424dd7cc44dSYu Zhao 425d1b054daSYu Zhao static int sriov_init(struct pci_dev *dev, int pos) 426d1b054daSYu Zhao { 427d1b054daSYu Zhao int i; 428d1b054daSYu Zhao int rc; 429d1b054daSYu Zhao int nres; 430d1b054daSYu Zhao u32 pgsz; 431d1b054daSYu Zhao u16 ctrl, total, offset, stride; 432d1b054daSYu Zhao struct pci_sriov *iov; 433d1b054daSYu Zhao struct resource *res; 434d1b054daSYu Zhao struct pci_dev *pdev; 435d1b054daSYu Zhao 436d1b054daSYu Zhao if (dev->pcie_type != PCI_EXP_TYPE_RC_END && 437d1b054daSYu Zhao dev->pcie_type != PCI_EXP_TYPE_ENDPOINT) 438d1b054daSYu Zhao return -ENODEV; 439d1b054daSYu Zhao 440d1b054daSYu Zhao pci_read_config_word(dev, pos + PCI_SRIOV_CTRL, &ctrl); 441d1b054daSYu Zhao if (ctrl & PCI_SRIOV_CTRL_VFE) { 442d1b054daSYu Zhao pci_write_config_word(dev, pos + PCI_SRIOV_CTRL, 0); 443d1b054daSYu Zhao ssleep(1); 444d1b054daSYu Zhao } 445d1b054daSYu Zhao 446d1b054daSYu Zhao pci_read_config_word(dev, pos + PCI_SRIOV_TOTAL_VF, &total); 447d1b054daSYu Zhao if (!total) 448d1b054daSYu Zhao return 0; 449d1b054daSYu Zhao 450d1b054daSYu Zhao ctrl = 0; 451d1b054daSYu Zhao list_for_each_entry(pdev, &dev->bus->devices, bus_list) 452d1b054daSYu Zhao if (pdev->is_physfn) 453d1b054daSYu Zhao goto found; 454d1b054daSYu Zhao 455d1b054daSYu Zhao pdev = NULL; 456d1b054daSYu Zhao if (pci_ari_enabled(dev->bus)) 457d1b054daSYu Zhao ctrl |= PCI_SRIOV_CTRL_ARI; 458d1b054daSYu Zhao 459d1b054daSYu Zhao found: 460d1b054daSYu Zhao pci_write_config_word(dev, pos + PCI_SRIOV_CTRL, ctrl); 461d1b054daSYu Zhao pci_read_config_word(dev, pos + PCI_SRIOV_VF_OFFSET, &offset); 462d1b054daSYu Zhao pci_read_config_word(dev, pos + PCI_SRIOV_VF_STRIDE, &stride); 463d1b054daSYu Zhao if (!offset || (total > 1 && !stride)) 464d1b054daSYu Zhao return -EIO; 465d1b054daSYu Zhao 466d1b054daSYu Zhao pci_read_config_dword(dev, pos + PCI_SRIOV_SUP_PGSIZE, &pgsz); 467d1b054daSYu Zhao i = PAGE_SHIFT > 12 ? PAGE_SHIFT - 12 : 0; 468d1b054daSYu Zhao pgsz &= ~((1 << i) - 1); 469d1b054daSYu Zhao if (!pgsz) 470d1b054daSYu Zhao return -EIO; 471d1b054daSYu Zhao 472d1b054daSYu Zhao pgsz &= ~(pgsz - 1); 4738161fe91SVaidyanathan Srinivasan pci_write_config_dword(dev, pos + PCI_SRIOV_SYS_PGSIZE, pgsz); 474d1b054daSYu Zhao 475d1b054daSYu Zhao nres = 0; 476d1b054daSYu Zhao for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) { 477d1b054daSYu Zhao res = dev->resource + PCI_IOV_RESOURCES + i; 478d1b054daSYu Zhao i += __pci_read_base(dev, pci_bar_unknown, res, 479d1b054daSYu Zhao pos + PCI_SRIOV_BAR + i * 4); 480d1b054daSYu Zhao if (!res->flags) 481d1b054daSYu Zhao continue; 482d1b054daSYu Zhao if (resource_size(res) & (PAGE_SIZE - 1)) { 483d1b054daSYu Zhao rc = -EIO; 484d1b054daSYu Zhao goto failed; 485d1b054daSYu Zhao } 486d1b054daSYu Zhao res->end = res->start + resource_size(res) * total - 1; 487d1b054daSYu Zhao nres++; 488d1b054daSYu Zhao } 489d1b054daSYu Zhao 490d1b054daSYu Zhao iov = kzalloc(sizeof(*iov), GFP_KERNEL); 491d1b054daSYu Zhao if (!iov) { 492d1b054daSYu Zhao rc = -ENOMEM; 493d1b054daSYu Zhao goto failed; 494d1b054daSYu Zhao } 495d1b054daSYu Zhao 496d1b054daSYu Zhao iov->pos = pos; 497d1b054daSYu Zhao iov->nres = nres; 498d1b054daSYu Zhao iov->ctrl = ctrl; 499d1b054daSYu Zhao iov->total = total; 500d1b054daSYu Zhao iov->offset = offset; 501d1b054daSYu Zhao iov->stride = stride; 502d1b054daSYu Zhao iov->pgsz = pgsz; 503d1b054daSYu Zhao iov->self = dev; 504d1b054daSYu Zhao pci_read_config_dword(dev, pos + PCI_SRIOV_CAP, &iov->cap); 505d1b054daSYu Zhao pci_read_config_byte(dev, pos + PCI_SRIOV_FUNC_LINK, &iov->link); 5064d135dbeSYu Zhao if (dev->pcie_type == PCI_EXP_TYPE_RC_END) 5074d135dbeSYu Zhao iov->link = PCI_DEVFN(PCI_SLOT(dev->devfn), iov->link); 508d1b054daSYu Zhao 509d1b054daSYu Zhao if (pdev) 510d1b054daSYu Zhao iov->dev = pci_dev_get(pdev); 511e277d2fcSYu Zhao else 512d1b054daSYu Zhao iov->dev = dev; 513e277d2fcSYu Zhao 514d1b054daSYu Zhao mutex_init(&iov->lock); 515d1b054daSYu Zhao 516d1b054daSYu Zhao dev->sriov = iov; 517d1b054daSYu Zhao dev->is_physfn = 1; 518d1b054daSYu Zhao 519d1b054daSYu Zhao return 0; 520d1b054daSYu Zhao 521d1b054daSYu Zhao failed: 522d1b054daSYu Zhao for (i = 0; i < PCI_SRIOV_NUM_BARS; i++) { 523d1b054daSYu Zhao res = dev->resource + PCI_IOV_RESOURCES + i; 524d1b054daSYu Zhao res->flags = 0; 525d1b054daSYu Zhao } 526d1b054daSYu Zhao 527d1b054daSYu Zhao return rc; 528d1b054daSYu Zhao } 529d1b054daSYu Zhao 530d1b054daSYu Zhao static void sriov_release(struct pci_dev *dev) 531d1b054daSYu Zhao { 532dd7cc44dSYu Zhao BUG_ON(dev->sriov->nr_virtfn); 533dd7cc44dSYu Zhao 534e277d2fcSYu Zhao if (dev != dev->sriov->dev) 535d1b054daSYu Zhao pci_dev_put(dev->sriov->dev); 536d1b054daSYu Zhao 537e277d2fcSYu Zhao mutex_destroy(&dev->sriov->lock); 538e277d2fcSYu Zhao 539d1b054daSYu Zhao kfree(dev->sriov); 540d1b054daSYu Zhao dev->sriov = NULL; 541d1b054daSYu Zhao } 542d1b054daSYu Zhao 5438c5cdb6aSYu Zhao static void sriov_restore_state(struct pci_dev *dev) 5448c5cdb6aSYu Zhao { 5458c5cdb6aSYu Zhao int i; 5468c5cdb6aSYu Zhao u16 ctrl; 5478c5cdb6aSYu Zhao struct pci_sriov *iov = dev->sriov; 5488c5cdb6aSYu Zhao 5498c5cdb6aSYu Zhao pci_read_config_word(dev, iov->pos + PCI_SRIOV_CTRL, &ctrl); 5508c5cdb6aSYu Zhao if (ctrl & PCI_SRIOV_CTRL_VFE) 5518c5cdb6aSYu Zhao return; 5528c5cdb6aSYu Zhao 5538c5cdb6aSYu Zhao for (i = PCI_IOV_RESOURCES; i <= PCI_IOV_RESOURCE_END; i++) 5548c5cdb6aSYu Zhao pci_update_resource(dev, i); 5558c5cdb6aSYu Zhao 5568c5cdb6aSYu Zhao pci_write_config_dword(dev, iov->pos + PCI_SRIOV_SYS_PGSIZE, iov->pgsz); 557dd7cc44dSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_NUM_VF, iov->nr_virtfn); 5588c5cdb6aSYu Zhao pci_write_config_word(dev, iov->pos + PCI_SRIOV_CTRL, iov->ctrl); 5598c5cdb6aSYu Zhao if (iov->ctrl & PCI_SRIOV_CTRL_VFE) 5608c5cdb6aSYu Zhao msleep(100); 5618c5cdb6aSYu Zhao } 5628c5cdb6aSYu Zhao 563d1b054daSYu Zhao /** 564d1b054daSYu Zhao * pci_iov_init - initialize the IOV capability 565d1b054daSYu Zhao * @dev: the PCI device 566d1b054daSYu Zhao * 567d1b054daSYu Zhao * Returns 0 on success, or negative on failure. 568d1b054daSYu Zhao */ 569d1b054daSYu Zhao int pci_iov_init(struct pci_dev *dev) 570d1b054daSYu Zhao { 571d1b054daSYu Zhao int pos; 572d1b054daSYu Zhao 5735f4d91a1SKenji Kaneshige if (!pci_is_pcie(dev)) 574d1b054daSYu Zhao return -ENODEV; 575d1b054daSYu Zhao 576d1b054daSYu Zhao pos = pci_find_ext_capability(dev, PCI_EXT_CAP_ID_SRIOV); 577d1b054daSYu Zhao if (pos) 578d1b054daSYu Zhao return sriov_init(dev, pos); 579d1b054daSYu Zhao 580d1b054daSYu Zhao return -ENODEV; 581d1b054daSYu Zhao } 582d1b054daSYu Zhao 583d1b054daSYu Zhao /** 584d1b054daSYu Zhao * pci_iov_release - release resources used by the IOV capability 585d1b054daSYu Zhao * @dev: the PCI device 586d1b054daSYu Zhao */ 587d1b054daSYu Zhao void pci_iov_release(struct pci_dev *dev) 588d1b054daSYu Zhao { 589d1b054daSYu Zhao if (dev->is_physfn) 590d1b054daSYu Zhao sriov_release(dev); 591d1b054daSYu Zhao } 592d1b054daSYu Zhao 593d1b054daSYu Zhao /** 594d1b054daSYu Zhao * pci_iov_resource_bar - get position of the SR-IOV BAR 595d1b054daSYu Zhao * @dev: the PCI device 596d1b054daSYu Zhao * @resno: the resource number 597d1b054daSYu Zhao * @type: the BAR type to be filled in 598d1b054daSYu Zhao * 599d1b054daSYu Zhao * Returns position of the BAR encapsulated in the SR-IOV capability. 600d1b054daSYu Zhao */ 601d1b054daSYu Zhao int pci_iov_resource_bar(struct pci_dev *dev, int resno, 602d1b054daSYu Zhao enum pci_bar_type *type) 603d1b054daSYu Zhao { 604d1b054daSYu Zhao if (resno < PCI_IOV_RESOURCES || resno > PCI_IOV_RESOURCE_END) 605d1b054daSYu Zhao return 0; 606d1b054daSYu Zhao 607d1b054daSYu Zhao BUG_ON(!dev->is_physfn); 608d1b054daSYu Zhao 609d1b054daSYu Zhao *type = pci_bar_unknown; 610d1b054daSYu Zhao 611d1b054daSYu Zhao return dev->sriov->pos + PCI_SRIOV_BAR + 612d1b054daSYu Zhao 4 * (resno - PCI_IOV_RESOURCES); 613d1b054daSYu Zhao } 6148c5cdb6aSYu Zhao 6158c5cdb6aSYu Zhao /** 6166faf17f6SChris Wright * pci_sriov_resource_alignment - get resource alignment for VF BAR 6176faf17f6SChris Wright * @dev: the PCI device 6186faf17f6SChris Wright * @resno: the resource number 6196faf17f6SChris Wright * 6206faf17f6SChris Wright * Returns the alignment of the VF BAR found in the SR-IOV capability. 6216faf17f6SChris Wright * This is not the same as the resource size which is defined as 6226faf17f6SChris Wright * the VF BAR size multiplied by the number of VFs. The alignment 6236faf17f6SChris Wright * is just the VF BAR size. 6246faf17f6SChris Wright */ 6250e52247aSCam Macdonell resource_size_t pci_sriov_resource_alignment(struct pci_dev *dev, int resno) 6266faf17f6SChris Wright { 6276faf17f6SChris Wright struct resource tmp; 6286faf17f6SChris Wright enum pci_bar_type type; 6296faf17f6SChris Wright int reg = pci_iov_resource_bar(dev, resno, &type); 6306faf17f6SChris Wright 6316faf17f6SChris Wright if (!reg) 6326faf17f6SChris Wright return 0; 6336faf17f6SChris Wright 6346faf17f6SChris Wright __pci_read_base(dev, type, &tmp, reg); 6356faf17f6SChris Wright return resource_alignment(&tmp); 6366faf17f6SChris Wright } 6376faf17f6SChris Wright 6386faf17f6SChris Wright /** 6398c5cdb6aSYu Zhao * pci_restore_iov_state - restore the state of the IOV capability 6408c5cdb6aSYu Zhao * @dev: the PCI device 6418c5cdb6aSYu Zhao */ 6428c5cdb6aSYu Zhao void pci_restore_iov_state(struct pci_dev *dev) 6438c5cdb6aSYu Zhao { 6448c5cdb6aSYu Zhao if (dev->is_physfn) 6458c5cdb6aSYu Zhao sriov_restore_state(dev); 6468c5cdb6aSYu Zhao } 647a28724b0SYu Zhao 648a28724b0SYu Zhao /** 649a28724b0SYu Zhao * pci_iov_bus_range - find bus range used by Virtual Function 650a28724b0SYu Zhao * @bus: the PCI bus 651a28724b0SYu Zhao * 652a28724b0SYu Zhao * Returns max number of buses (exclude current one) used by Virtual 653a28724b0SYu Zhao * Functions. 654a28724b0SYu Zhao */ 655a28724b0SYu Zhao int pci_iov_bus_range(struct pci_bus *bus) 656a28724b0SYu Zhao { 657a28724b0SYu Zhao int max = 0; 658a28724b0SYu Zhao u8 busnr; 659a28724b0SYu Zhao struct pci_dev *dev; 660a28724b0SYu Zhao 661a28724b0SYu Zhao list_for_each_entry(dev, &bus->devices, bus_list) { 662a28724b0SYu Zhao if (!dev->is_physfn) 663a28724b0SYu Zhao continue; 664a28724b0SYu Zhao busnr = virtfn_bus(dev, dev->sriov->total - 1); 665a28724b0SYu Zhao if (busnr > max) 666a28724b0SYu Zhao max = busnr; 667a28724b0SYu Zhao } 668a28724b0SYu Zhao 669a28724b0SYu Zhao return max ? max - bus->number : 0; 670a28724b0SYu Zhao } 671dd7cc44dSYu Zhao 672dd7cc44dSYu Zhao /** 673dd7cc44dSYu Zhao * pci_enable_sriov - enable the SR-IOV capability 674dd7cc44dSYu Zhao * @dev: the PCI device 67552a8873bSRandy Dunlap * @nr_virtfn: number of virtual functions to enable 676dd7cc44dSYu Zhao * 677dd7cc44dSYu Zhao * Returns 0 on success, or negative on failure. 678dd7cc44dSYu Zhao */ 679dd7cc44dSYu Zhao int pci_enable_sriov(struct pci_dev *dev, int nr_virtfn) 680dd7cc44dSYu Zhao { 681dd7cc44dSYu Zhao might_sleep(); 682dd7cc44dSYu Zhao 683dd7cc44dSYu Zhao if (!dev->is_physfn) 684dd7cc44dSYu Zhao return -ENODEV; 685dd7cc44dSYu Zhao 686dd7cc44dSYu Zhao return sriov_enable(dev, nr_virtfn); 687dd7cc44dSYu Zhao } 688dd7cc44dSYu Zhao EXPORT_SYMBOL_GPL(pci_enable_sriov); 689dd7cc44dSYu Zhao 690dd7cc44dSYu Zhao /** 691dd7cc44dSYu Zhao * pci_disable_sriov - disable the SR-IOV capability 692dd7cc44dSYu Zhao * @dev: the PCI device 693dd7cc44dSYu Zhao */ 694dd7cc44dSYu Zhao void pci_disable_sriov(struct pci_dev *dev) 695dd7cc44dSYu Zhao { 696dd7cc44dSYu Zhao might_sleep(); 697dd7cc44dSYu Zhao 698dd7cc44dSYu Zhao if (!dev->is_physfn) 699dd7cc44dSYu Zhao return; 700dd7cc44dSYu Zhao 701dd7cc44dSYu Zhao sriov_disable(dev); 702dd7cc44dSYu Zhao } 703dd7cc44dSYu Zhao EXPORT_SYMBOL_GPL(pci_disable_sriov); 70474bb1bccSYu Zhao 70574bb1bccSYu Zhao /** 70674bb1bccSYu Zhao * pci_sriov_migration - notify SR-IOV core of Virtual Function Migration 70774bb1bccSYu Zhao * @dev: the PCI device 70874bb1bccSYu Zhao * 70974bb1bccSYu Zhao * Returns IRQ_HANDLED if the IRQ is handled, or IRQ_NONE if not. 71074bb1bccSYu Zhao * 71174bb1bccSYu Zhao * Physical Function driver is responsible to register IRQ handler using 71274bb1bccSYu Zhao * VF Migration Interrupt Message Number, and call this function when the 71374bb1bccSYu Zhao * interrupt is generated by the hardware. 71474bb1bccSYu Zhao */ 71574bb1bccSYu Zhao irqreturn_t pci_sriov_migration(struct pci_dev *dev) 71674bb1bccSYu Zhao { 71774bb1bccSYu Zhao if (!dev->is_physfn) 71874bb1bccSYu Zhao return IRQ_NONE; 71974bb1bccSYu Zhao 72074bb1bccSYu Zhao return sriov_migration(dev) ? IRQ_HANDLED : IRQ_NONE; 72174bb1bccSYu Zhao } 72274bb1bccSYu Zhao EXPORT_SYMBOL_GPL(pci_sriov_migration); 723302b4215SYu Zhao 724fb8a0d9dSWilliams, Mitch A /** 725fb8a0d9dSWilliams, Mitch A * pci_num_vf - return number of VFs associated with a PF device_release_driver 726fb8a0d9dSWilliams, Mitch A * @dev: the PCI device 727fb8a0d9dSWilliams, Mitch A * 728fb8a0d9dSWilliams, Mitch A * Returns number of VFs, or 0 if SR-IOV is not enabled. 729fb8a0d9dSWilliams, Mitch A */ 730fb8a0d9dSWilliams, Mitch A int pci_num_vf(struct pci_dev *dev) 731fb8a0d9dSWilliams, Mitch A { 732fb8a0d9dSWilliams, Mitch A if (!dev || !dev->is_physfn) 733fb8a0d9dSWilliams, Mitch A return 0; 734fb8a0d9dSWilliams, Mitch A else 735fb8a0d9dSWilliams, Mitch A return dev->sriov->nr_virtfn; 736fb8a0d9dSWilliams, Mitch A } 737fb8a0d9dSWilliams, Mitch A EXPORT_SYMBOL_GPL(pci_num_vf); 738