1 /* 2 * PCI Stub Driver - Grabs devices in backend to be exported later 3 * 4 * Ryan Wilson <hap9@epoch.ncsc.mil> 5 * Chris Bookholt <hap10@epoch.ncsc.mil> 6 */ 7 #include <linux/module.h> 8 #include <linux/init.h> 9 #include <linux/rwsem.h> 10 #include <linux/list.h> 11 #include <linux/spinlock.h> 12 #include <linux/kref.h> 13 #include <linux/pci.h> 14 #include <linux/wait.h> 15 #include <linux/sched.h> 16 #include <linux/atomic.h> 17 #include <xen/events.h> 18 #include <asm/xen/pci.h> 19 #include <asm/xen/hypervisor.h> 20 #include "pciback.h" 21 #include "conf_space.h" 22 #include "conf_space_quirks.h" 23 24 static char *pci_devs_to_hide; 25 wait_queue_head_t xen_pcibk_aer_wait_queue; 26 /*Add sem for sync AER handling and xen_pcibk remove/reconfigue ops, 27 * We want to avoid in middle of AER ops, xen_pcibk devices is being removed 28 */ 29 static DECLARE_RWSEM(pcistub_sem); 30 module_param_named(hide, pci_devs_to_hide, charp, 0444); 31 32 struct pcistub_device_id { 33 struct list_head slot_list; 34 int domain; 35 unsigned char bus; 36 unsigned int devfn; 37 }; 38 static LIST_HEAD(pcistub_device_ids); 39 static DEFINE_SPINLOCK(device_ids_lock); 40 41 struct pcistub_device { 42 struct kref kref; 43 struct list_head dev_list; 44 spinlock_t lock; 45 46 struct pci_dev *dev; 47 struct xen_pcibk_device *pdev;/* non-NULL if struct pci_dev is in use */ 48 }; 49 50 /* Access to pcistub_devices & seized_devices lists and the initialize_devices 51 * flag must be locked with pcistub_devices_lock 52 */ 53 static DEFINE_SPINLOCK(pcistub_devices_lock); 54 static LIST_HEAD(pcistub_devices); 55 56 /* wait for device_initcall before initializing our devices 57 * (see pcistub_init_devices_late) 58 */ 59 static int initialize_devices; 60 static LIST_HEAD(seized_devices); 61 62 static struct pcistub_device *pcistub_device_alloc(struct pci_dev *dev) 63 { 64 struct pcistub_device *psdev; 65 66 dev_dbg(&dev->dev, "pcistub_device_alloc\n"); 67 68 psdev = kzalloc(sizeof(*psdev), GFP_ATOMIC); 69 if (!psdev) 70 return NULL; 71 72 psdev->dev = pci_dev_get(dev); 73 if (!psdev->dev) { 74 kfree(psdev); 75 return NULL; 76 } 77 78 kref_init(&psdev->kref); 79 spin_lock_init(&psdev->lock); 80 81 return psdev; 82 } 83 84 /* Don't call this directly as it's called by pcistub_device_put */ 85 static void pcistub_device_release(struct kref *kref) 86 { 87 struct pcistub_device *psdev; 88 89 psdev = container_of(kref, struct pcistub_device, kref); 90 91 dev_dbg(&psdev->dev->dev, "pcistub_device_release\n"); 92 93 xen_unregister_device_domain_owner(psdev->dev); 94 95 /* Clean-up the device */ 96 xen_pcibk_reset_device(psdev->dev); 97 xen_pcibk_config_free_dyn_fields(psdev->dev); 98 xen_pcibk_config_free_dev(psdev->dev); 99 kfree(pci_get_drvdata(psdev->dev)); 100 pci_set_drvdata(psdev->dev, NULL); 101 102 psdev->dev->dev_flags &= ~PCI_DEV_FLAGS_ASSIGNED; 103 pci_dev_put(psdev->dev); 104 105 kfree(psdev); 106 } 107 108 static inline void pcistub_device_get(struct pcistub_device *psdev) 109 { 110 kref_get(&psdev->kref); 111 } 112 113 static inline void pcistub_device_put(struct pcistub_device *psdev) 114 { 115 kref_put(&psdev->kref, pcistub_device_release); 116 } 117 118 static struct pcistub_device *pcistub_device_find(int domain, int bus, 119 int slot, int func) 120 { 121 struct pcistub_device *psdev = NULL; 122 unsigned long flags; 123 124 spin_lock_irqsave(&pcistub_devices_lock, flags); 125 126 list_for_each_entry(psdev, &pcistub_devices, dev_list) { 127 if (psdev->dev != NULL 128 && domain == pci_domain_nr(psdev->dev->bus) 129 && bus == psdev->dev->bus->number 130 && PCI_DEVFN(slot, func) == psdev->dev->devfn) { 131 pcistub_device_get(psdev); 132 goto out; 133 } 134 } 135 136 /* didn't find it */ 137 psdev = NULL; 138 139 out: 140 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 141 return psdev; 142 } 143 144 static struct pci_dev *pcistub_device_get_pci_dev(struct xen_pcibk_device *pdev, 145 struct pcistub_device *psdev) 146 { 147 struct pci_dev *pci_dev = NULL; 148 unsigned long flags; 149 150 pcistub_device_get(psdev); 151 152 spin_lock_irqsave(&psdev->lock, flags); 153 if (!psdev->pdev) { 154 psdev->pdev = pdev; 155 pci_dev = psdev->dev; 156 } 157 spin_unlock_irqrestore(&psdev->lock, flags); 158 159 if (!pci_dev) 160 pcistub_device_put(psdev); 161 162 return pci_dev; 163 } 164 165 struct pci_dev *pcistub_get_pci_dev_by_slot(struct xen_pcibk_device *pdev, 166 int domain, int bus, 167 int slot, int func) 168 { 169 struct pcistub_device *psdev; 170 struct pci_dev *found_dev = NULL; 171 unsigned long flags; 172 173 spin_lock_irqsave(&pcistub_devices_lock, flags); 174 175 list_for_each_entry(psdev, &pcistub_devices, dev_list) { 176 if (psdev->dev != NULL 177 && domain == pci_domain_nr(psdev->dev->bus) 178 && bus == psdev->dev->bus->number 179 && PCI_DEVFN(slot, func) == psdev->dev->devfn) { 180 found_dev = pcistub_device_get_pci_dev(pdev, psdev); 181 break; 182 } 183 } 184 185 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 186 return found_dev; 187 } 188 189 struct pci_dev *pcistub_get_pci_dev(struct xen_pcibk_device *pdev, 190 struct pci_dev *dev) 191 { 192 struct pcistub_device *psdev; 193 struct pci_dev *found_dev = NULL; 194 unsigned long flags; 195 196 spin_lock_irqsave(&pcistub_devices_lock, flags); 197 198 list_for_each_entry(psdev, &pcistub_devices, dev_list) { 199 if (psdev->dev == dev) { 200 found_dev = pcistub_device_get_pci_dev(pdev, psdev); 201 break; 202 } 203 } 204 205 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 206 return found_dev; 207 } 208 209 void pcistub_put_pci_dev(struct pci_dev *dev) 210 { 211 struct pcistub_device *psdev, *found_psdev = NULL; 212 unsigned long flags; 213 214 spin_lock_irqsave(&pcistub_devices_lock, flags); 215 216 list_for_each_entry(psdev, &pcistub_devices, dev_list) { 217 if (psdev->dev == dev) { 218 found_psdev = psdev; 219 break; 220 } 221 } 222 223 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 224 if (WARN_ON(!found_psdev)) 225 return; 226 227 /*hold this lock for avoiding breaking link between 228 * pcistub and xen_pcibk when AER is in processing 229 */ 230 down_write(&pcistub_sem); 231 /* Cleanup our device 232 * (so it's ready for the next domain) 233 */ 234 xen_pcibk_reset_device(found_psdev->dev); 235 xen_pcibk_config_free_dyn_fields(found_psdev->dev); 236 xen_pcibk_config_reset_dev(found_psdev->dev); 237 238 xen_unregister_device_domain_owner(found_psdev->dev); 239 240 spin_lock_irqsave(&found_psdev->lock, flags); 241 found_psdev->pdev = NULL; 242 spin_unlock_irqrestore(&found_psdev->lock, flags); 243 244 pcistub_device_put(found_psdev); 245 up_write(&pcistub_sem); 246 } 247 248 static int __devinit pcistub_match_one(struct pci_dev *dev, 249 struct pcistub_device_id *pdev_id) 250 { 251 /* Match the specified device by domain, bus, slot, func and also if 252 * any of the device's parent bridges match. 253 */ 254 for (; dev != NULL; dev = dev->bus->self) { 255 if (pci_domain_nr(dev->bus) == pdev_id->domain 256 && dev->bus->number == pdev_id->bus 257 && dev->devfn == pdev_id->devfn) 258 return 1; 259 260 /* Sometimes topmost bridge links to itself. */ 261 if (dev == dev->bus->self) 262 break; 263 } 264 265 return 0; 266 } 267 268 static int __devinit pcistub_match(struct pci_dev *dev) 269 { 270 struct pcistub_device_id *pdev_id; 271 unsigned long flags; 272 int found = 0; 273 274 spin_lock_irqsave(&device_ids_lock, flags); 275 list_for_each_entry(pdev_id, &pcistub_device_ids, slot_list) { 276 if (pcistub_match_one(dev, pdev_id)) { 277 found = 1; 278 break; 279 } 280 } 281 spin_unlock_irqrestore(&device_ids_lock, flags); 282 283 return found; 284 } 285 286 static int __devinit pcistub_init_device(struct pci_dev *dev) 287 { 288 struct xen_pcibk_dev_data *dev_data; 289 int err = 0; 290 291 dev_dbg(&dev->dev, "initializing...\n"); 292 293 /* The PCI backend is not intended to be a module (or to work with 294 * removable PCI devices (yet). If it were, xen_pcibk_config_free() 295 * would need to be called somewhere to free the memory allocated 296 * here and then to call kfree(pci_get_drvdata(psdev->dev)). 297 */ 298 dev_data = kzalloc(sizeof(*dev_data) + strlen(DRV_NAME "[]") 299 + strlen(pci_name(dev)) + 1, GFP_ATOMIC); 300 if (!dev_data) { 301 err = -ENOMEM; 302 goto out; 303 } 304 pci_set_drvdata(dev, dev_data); 305 306 /* 307 * Setup name for fake IRQ handler. It will only be enabled 308 * once the device is turned on by the guest. 309 */ 310 sprintf(dev_data->irq_name, DRV_NAME "[%s]", pci_name(dev)); 311 312 dev_dbg(&dev->dev, "initializing config\n"); 313 314 init_waitqueue_head(&xen_pcibk_aer_wait_queue); 315 err = xen_pcibk_config_init_dev(dev); 316 if (err) 317 goto out; 318 319 /* HACK: Force device (& ACPI) to determine what IRQ it's on - we 320 * must do this here because pcibios_enable_device may specify 321 * the pci device's true irq (and possibly its other resources) 322 * if they differ from what's in the configuration space. 323 * This makes the assumption that the device's resources won't 324 * change after this point (otherwise this code may break!) 325 */ 326 dev_dbg(&dev->dev, "enabling device\n"); 327 err = pci_enable_device(dev); 328 if (err) 329 goto config_release; 330 331 /* Now disable the device (this also ensures some private device 332 * data is setup before we export) 333 */ 334 dev_dbg(&dev->dev, "reset device\n"); 335 xen_pcibk_reset_device(dev); 336 337 dev->dev_flags |= PCI_DEV_FLAGS_ASSIGNED; 338 return 0; 339 340 config_release: 341 xen_pcibk_config_free_dev(dev); 342 343 out: 344 pci_set_drvdata(dev, NULL); 345 kfree(dev_data); 346 return err; 347 } 348 349 /* 350 * Because some initialization still happens on 351 * devices during fs_initcall, we need to defer 352 * full initialization of our devices until 353 * device_initcall. 354 */ 355 static int __init pcistub_init_devices_late(void) 356 { 357 struct pcistub_device *psdev; 358 unsigned long flags; 359 int err = 0; 360 361 pr_debug(DRV_NAME ": pcistub_init_devices_late\n"); 362 363 spin_lock_irqsave(&pcistub_devices_lock, flags); 364 365 while (!list_empty(&seized_devices)) { 366 psdev = container_of(seized_devices.next, 367 struct pcistub_device, dev_list); 368 list_del(&psdev->dev_list); 369 370 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 371 372 err = pcistub_init_device(psdev->dev); 373 if (err) { 374 dev_err(&psdev->dev->dev, 375 "error %d initializing device\n", err); 376 kfree(psdev); 377 psdev = NULL; 378 } 379 380 spin_lock_irqsave(&pcistub_devices_lock, flags); 381 382 if (psdev) 383 list_add_tail(&psdev->dev_list, &pcistub_devices); 384 } 385 386 initialize_devices = 1; 387 388 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 389 390 return 0; 391 } 392 393 static int __devinit pcistub_seize(struct pci_dev *dev) 394 { 395 struct pcistub_device *psdev; 396 unsigned long flags; 397 int err = 0; 398 399 psdev = pcistub_device_alloc(dev); 400 if (!psdev) 401 return -ENOMEM; 402 403 spin_lock_irqsave(&pcistub_devices_lock, flags); 404 405 if (initialize_devices) { 406 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 407 408 /* don't want irqs disabled when calling pcistub_init_device */ 409 err = pcistub_init_device(psdev->dev); 410 411 spin_lock_irqsave(&pcistub_devices_lock, flags); 412 413 if (!err) 414 list_add(&psdev->dev_list, &pcistub_devices); 415 } else { 416 dev_dbg(&dev->dev, "deferring initialization\n"); 417 list_add(&psdev->dev_list, &seized_devices); 418 } 419 420 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 421 422 if (err) 423 pcistub_device_put(psdev); 424 425 return err; 426 } 427 428 static int __devinit pcistub_probe(struct pci_dev *dev, 429 const struct pci_device_id *id) 430 { 431 int err = 0; 432 433 dev_dbg(&dev->dev, "probing...\n"); 434 435 if (pcistub_match(dev)) { 436 437 if (dev->hdr_type != PCI_HEADER_TYPE_NORMAL 438 && dev->hdr_type != PCI_HEADER_TYPE_BRIDGE) { 439 dev_err(&dev->dev, "can't export pci devices that " 440 "don't have a normal (0) or bridge (1) " 441 "header type!\n"); 442 err = -ENODEV; 443 goto out; 444 } 445 446 dev_info(&dev->dev, "seizing device\n"); 447 err = pcistub_seize(dev); 448 } else 449 /* Didn't find the device */ 450 err = -ENODEV; 451 452 out: 453 return err; 454 } 455 456 static void pcistub_remove(struct pci_dev *dev) 457 { 458 struct pcistub_device *psdev, *found_psdev = NULL; 459 unsigned long flags; 460 461 dev_dbg(&dev->dev, "removing\n"); 462 463 spin_lock_irqsave(&pcistub_devices_lock, flags); 464 465 xen_pcibk_config_quirk_release(dev); 466 467 list_for_each_entry(psdev, &pcistub_devices, dev_list) { 468 if (psdev->dev == dev) { 469 found_psdev = psdev; 470 break; 471 } 472 } 473 474 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 475 476 if (found_psdev) { 477 dev_dbg(&dev->dev, "found device to remove - in use? %p\n", 478 found_psdev->pdev); 479 480 if (found_psdev->pdev) { 481 printk(KERN_WARNING DRV_NAME ": ****** removing device " 482 "%s while still in-use! ******\n", 483 pci_name(found_psdev->dev)); 484 printk(KERN_WARNING DRV_NAME ": ****** driver domain may" 485 " still access this device's i/o resources!\n"); 486 printk(KERN_WARNING DRV_NAME ": ****** shutdown driver " 487 "domain before binding device\n"); 488 printk(KERN_WARNING DRV_NAME ": ****** to other drivers " 489 "or domains\n"); 490 491 xen_pcibk_release_pci_dev(found_psdev->pdev, 492 found_psdev->dev); 493 } 494 495 spin_lock_irqsave(&pcistub_devices_lock, flags); 496 list_del(&found_psdev->dev_list); 497 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 498 499 /* the final put for releasing from the list */ 500 pcistub_device_put(found_psdev); 501 } 502 } 503 504 static DEFINE_PCI_DEVICE_TABLE(pcistub_ids) = { 505 { 506 .vendor = PCI_ANY_ID, 507 .device = PCI_ANY_ID, 508 .subvendor = PCI_ANY_ID, 509 .subdevice = PCI_ANY_ID, 510 }, 511 {0,}, 512 }; 513 514 #define PCI_NODENAME_MAX 40 515 static void kill_domain_by_device(struct pcistub_device *psdev) 516 { 517 struct xenbus_transaction xbt; 518 int err; 519 char nodename[PCI_NODENAME_MAX]; 520 521 BUG_ON(!psdev); 522 snprintf(nodename, PCI_NODENAME_MAX, "/local/domain/0/backend/pci/%d/0", 523 psdev->pdev->xdev->otherend_id); 524 525 again: 526 err = xenbus_transaction_start(&xbt); 527 if (err) { 528 dev_err(&psdev->dev->dev, 529 "error %d when start xenbus transaction\n", err); 530 return; 531 } 532 /*PV AER handlers will set this flag*/ 533 xenbus_printf(xbt, nodename, "aerState" , "aerfail"); 534 err = xenbus_transaction_end(xbt, 0); 535 if (err) { 536 if (err == -EAGAIN) 537 goto again; 538 dev_err(&psdev->dev->dev, 539 "error %d when end xenbus transaction\n", err); 540 return; 541 } 542 } 543 544 /* For each aer recovery step error_detected, mmio_enabled, etc, front_end and 545 * backend need to have cooperation. In xen_pcibk, those steps will do similar 546 * jobs: send service request and waiting for front_end response. 547 */ 548 static pci_ers_result_t common_process(struct pcistub_device *psdev, 549 pci_channel_state_t state, int aer_cmd, 550 pci_ers_result_t result) 551 { 552 pci_ers_result_t res = result; 553 struct xen_pcie_aer_op *aer_op; 554 int ret; 555 556 /*with PV AER drivers*/ 557 aer_op = &(psdev->pdev->sh_info->aer_op); 558 aer_op->cmd = aer_cmd ; 559 /*useful for error_detected callback*/ 560 aer_op->err = state; 561 /*pcifront_end BDF*/ 562 ret = xen_pcibk_get_pcifront_dev(psdev->dev, psdev->pdev, 563 &aer_op->domain, &aer_op->bus, &aer_op->devfn); 564 if (!ret) { 565 dev_err(&psdev->dev->dev, 566 DRV_NAME ": failed to get pcifront device\n"); 567 return PCI_ERS_RESULT_NONE; 568 } 569 wmb(); 570 571 dev_dbg(&psdev->dev->dev, 572 DRV_NAME ": aer_op %x dom %x bus %x devfn %x\n", 573 aer_cmd, aer_op->domain, aer_op->bus, aer_op->devfn); 574 /*local flag to mark there's aer request, xen_pcibk callback will use 575 * this flag to judge whether we need to check pci-front give aer 576 * service ack signal 577 */ 578 set_bit(_PCIB_op_pending, (unsigned long *)&psdev->pdev->flags); 579 580 /*It is possible that a pcifront conf_read_write ops request invokes 581 * the callback which cause the spurious execution of wake_up. 582 * Yet it is harmless and better than a spinlock here 583 */ 584 set_bit(_XEN_PCIB_active, 585 (unsigned long *)&psdev->pdev->sh_info->flags); 586 wmb(); 587 notify_remote_via_irq(psdev->pdev->evtchn_irq); 588 589 ret = wait_event_timeout(xen_pcibk_aer_wait_queue, 590 !(test_bit(_XEN_PCIB_active, (unsigned long *) 591 &psdev->pdev->sh_info->flags)), 300*HZ); 592 593 if (!ret) { 594 if (test_bit(_XEN_PCIB_active, 595 (unsigned long *)&psdev->pdev->sh_info->flags)) { 596 dev_err(&psdev->dev->dev, 597 "pcifront aer process not responding!\n"); 598 clear_bit(_XEN_PCIB_active, 599 (unsigned long *)&psdev->pdev->sh_info->flags); 600 aer_op->err = PCI_ERS_RESULT_NONE; 601 return res; 602 } 603 } 604 clear_bit(_PCIB_op_pending, (unsigned long *)&psdev->pdev->flags); 605 606 if (test_bit(_XEN_PCIF_active, 607 (unsigned long *)&psdev->pdev->sh_info->flags)) { 608 dev_dbg(&psdev->dev->dev, 609 "schedule pci_conf service in " DRV_NAME "\n"); 610 xen_pcibk_test_and_schedule_op(psdev->pdev); 611 } 612 613 res = (pci_ers_result_t)aer_op->err; 614 return res; 615 } 616 617 /* 618 * xen_pcibk_slot_reset: it will send the slot_reset request to pcifront in case 619 * of the device driver could provide this service, and then wait for pcifront 620 * ack. 621 * @dev: pointer to PCI devices 622 * return value is used by aer_core do_recovery policy 623 */ 624 static pci_ers_result_t xen_pcibk_slot_reset(struct pci_dev *dev) 625 { 626 struct pcistub_device *psdev; 627 pci_ers_result_t result; 628 629 result = PCI_ERS_RESULT_RECOVERED; 630 dev_dbg(&dev->dev, "xen_pcibk_slot_reset(bus:%x,devfn:%x)\n", 631 dev->bus->number, dev->devfn); 632 633 down_write(&pcistub_sem); 634 psdev = pcistub_device_find(pci_domain_nr(dev->bus), 635 dev->bus->number, 636 PCI_SLOT(dev->devfn), 637 PCI_FUNC(dev->devfn)); 638 639 if (!psdev || !psdev->pdev) { 640 dev_err(&dev->dev, 641 DRV_NAME " device is not found/assigned\n"); 642 goto end; 643 } 644 645 if (!psdev->pdev->sh_info) { 646 dev_err(&dev->dev, DRV_NAME " device is not connected or owned" 647 " by HVM, kill it\n"); 648 kill_domain_by_device(psdev); 649 goto release; 650 } 651 652 if (!test_bit(_XEN_PCIB_AERHANDLER, 653 (unsigned long *)&psdev->pdev->sh_info->flags)) { 654 dev_err(&dev->dev, 655 "guest with no AER driver should have been killed\n"); 656 goto release; 657 } 658 result = common_process(psdev, 1, XEN_PCI_OP_aer_slotreset, result); 659 660 if (result == PCI_ERS_RESULT_NONE || 661 result == PCI_ERS_RESULT_DISCONNECT) { 662 dev_dbg(&dev->dev, 663 "No AER slot_reset service or disconnected!\n"); 664 kill_domain_by_device(psdev); 665 } 666 release: 667 pcistub_device_put(psdev); 668 end: 669 up_write(&pcistub_sem); 670 return result; 671 672 } 673 674 675 /*xen_pcibk_mmio_enabled: it will send the mmio_enabled request to pcifront 676 * in case of the device driver could provide this service, and then wait 677 * for pcifront ack 678 * @dev: pointer to PCI devices 679 * return value is used by aer_core do_recovery policy 680 */ 681 682 static pci_ers_result_t xen_pcibk_mmio_enabled(struct pci_dev *dev) 683 { 684 struct pcistub_device *psdev; 685 pci_ers_result_t result; 686 687 result = PCI_ERS_RESULT_RECOVERED; 688 dev_dbg(&dev->dev, "xen_pcibk_mmio_enabled(bus:%x,devfn:%x)\n", 689 dev->bus->number, dev->devfn); 690 691 down_write(&pcistub_sem); 692 psdev = pcistub_device_find(pci_domain_nr(dev->bus), 693 dev->bus->number, 694 PCI_SLOT(dev->devfn), 695 PCI_FUNC(dev->devfn)); 696 697 if (!psdev || !psdev->pdev) { 698 dev_err(&dev->dev, 699 DRV_NAME " device is not found/assigned\n"); 700 goto end; 701 } 702 703 if (!psdev->pdev->sh_info) { 704 dev_err(&dev->dev, DRV_NAME " device is not connected or owned" 705 " by HVM, kill it\n"); 706 kill_domain_by_device(psdev); 707 goto release; 708 } 709 710 if (!test_bit(_XEN_PCIB_AERHANDLER, 711 (unsigned long *)&psdev->pdev->sh_info->flags)) { 712 dev_err(&dev->dev, 713 "guest with no AER driver should have been killed\n"); 714 goto release; 715 } 716 result = common_process(psdev, 1, XEN_PCI_OP_aer_mmio, result); 717 718 if (result == PCI_ERS_RESULT_NONE || 719 result == PCI_ERS_RESULT_DISCONNECT) { 720 dev_dbg(&dev->dev, 721 "No AER mmio_enabled service or disconnected!\n"); 722 kill_domain_by_device(psdev); 723 } 724 release: 725 pcistub_device_put(psdev); 726 end: 727 up_write(&pcistub_sem); 728 return result; 729 } 730 731 /*xen_pcibk_error_detected: it will send the error_detected request to pcifront 732 * in case of the device driver could provide this service, and then wait 733 * for pcifront ack. 734 * @dev: pointer to PCI devices 735 * @error: the current PCI connection state 736 * return value is used by aer_core do_recovery policy 737 */ 738 739 static pci_ers_result_t xen_pcibk_error_detected(struct pci_dev *dev, 740 pci_channel_state_t error) 741 { 742 struct pcistub_device *psdev; 743 pci_ers_result_t result; 744 745 result = PCI_ERS_RESULT_CAN_RECOVER; 746 dev_dbg(&dev->dev, "xen_pcibk_error_detected(bus:%x,devfn:%x)\n", 747 dev->bus->number, dev->devfn); 748 749 down_write(&pcistub_sem); 750 psdev = pcistub_device_find(pci_domain_nr(dev->bus), 751 dev->bus->number, 752 PCI_SLOT(dev->devfn), 753 PCI_FUNC(dev->devfn)); 754 755 if (!psdev || !psdev->pdev) { 756 dev_err(&dev->dev, 757 DRV_NAME " device is not found/assigned\n"); 758 goto end; 759 } 760 761 if (!psdev->pdev->sh_info) { 762 dev_err(&dev->dev, DRV_NAME " device is not connected or owned" 763 " by HVM, kill it\n"); 764 kill_domain_by_device(psdev); 765 goto release; 766 } 767 768 /*Guest owns the device yet no aer handler regiested, kill guest*/ 769 if (!test_bit(_XEN_PCIB_AERHANDLER, 770 (unsigned long *)&psdev->pdev->sh_info->flags)) { 771 dev_dbg(&dev->dev, "guest may have no aer driver, kill it\n"); 772 kill_domain_by_device(psdev); 773 goto release; 774 } 775 result = common_process(psdev, error, XEN_PCI_OP_aer_detected, result); 776 777 if (result == PCI_ERS_RESULT_NONE || 778 result == PCI_ERS_RESULT_DISCONNECT) { 779 dev_dbg(&dev->dev, 780 "No AER error_detected service or disconnected!\n"); 781 kill_domain_by_device(psdev); 782 } 783 release: 784 pcistub_device_put(psdev); 785 end: 786 up_write(&pcistub_sem); 787 return result; 788 } 789 790 /*xen_pcibk_error_resume: it will send the error_resume request to pcifront 791 * in case of the device driver could provide this service, and then wait 792 * for pcifront ack. 793 * @dev: pointer to PCI devices 794 */ 795 796 static void xen_pcibk_error_resume(struct pci_dev *dev) 797 { 798 struct pcistub_device *psdev; 799 800 dev_dbg(&dev->dev, "xen_pcibk_error_resume(bus:%x,devfn:%x)\n", 801 dev->bus->number, dev->devfn); 802 803 down_write(&pcistub_sem); 804 psdev = pcistub_device_find(pci_domain_nr(dev->bus), 805 dev->bus->number, 806 PCI_SLOT(dev->devfn), 807 PCI_FUNC(dev->devfn)); 808 809 if (!psdev || !psdev->pdev) { 810 dev_err(&dev->dev, 811 DRV_NAME " device is not found/assigned\n"); 812 goto end; 813 } 814 815 if (!psdev->pdev->sh_info) { 816 dev_err(&dev->dev, DRV_NAME " device is not connected or owned" 817 " by HVM, kill it\n"); 818 kill_domain_by_device(psdev); 819 goto release; 820 } 821 822 if (!test_bit(_XEN_PCIB_AERHANDLER, 823 (unsigned long *)&psdev->pdev->sh_info->flags)) { 824 dev_err(&dev->dev, 825 "guest with no AER driver should have been killed\n"); 826 kill_domain_by_device(psdev); 827 goto release; 828 } 829 common_process(psdev, 1, XEN_PCI_OP_aer_resume, 830 PCI_ERS_RESULT_RECOVERED); 831 release: 832 pcistub_device_put(psdev); 833 end: 834 up_write(&pcistub_sem); 835 return; 836 } 837 838 /*add xen_pcibk AER handling*/ 839 static struct pci_error_handlers xen_pcibk_error_handler = { 840 .error_detected = xen_pcibk_error_detected, 841 .mmio_enabled = xen_pcibk_mmio_enabled, 842 .slot_reset = xen_pcibk_slot_reset, 843 .resume = xen_pcibk_error_resume, 844 }; 845 846 /* 847 * Note: There is no MODULE_DEVICE_TABLE entry here because this isn't 848 * for a normal device. I don't want it to be loaded automatically. 849 */ 850 851 static struct pci_driver xen_pcibk_pci_driver = { 852 /* The name should be xen_pciback, but until the tools are updated 853 * we will keep it as pciback. */ 854 .name = "pciback", 855 .id_table = pcistub_ids, 856 .probe = pcistub_probe, 857 .remove = pcistub_remove, 858 .err_handler = &xen_pcibk_error_handler, 859 }; 860 861 static inline int str_to_slot(const char *buf, int *domain, int *bus, 862 int *slot, int *func) 863 { 864 int err; 865 866 err = sscanf(buf, " %x:%x:%x.%x", domain, bus, slot, func); 867 if (err == 4) 868 return 0; 869 else if (err < 0) 870 return -EINVAL; 871 872 /* try again without domain */ 873 *domain = 0; 874 err = sscanf(buf, " %x:%x.%x", bus, slot, func); 875 if (err == 3) 876 return 0; 877 878 return -EINVAL; 879 } 880 881 static inline int str_to_quirk(const char *buf, int *domain, int *bus, int 882 *slot, int *func, int *reg, int *size, int *mask) 883 { 884 int err; 885 886 err = 887 sscanf(buf, " %04x:%02x:%02x.%1x-%08x:%1x:%08x", domain, bus, slot, 888 func, reg, size, mask); 889 if (err == 7) 890 return 0; 891 return -EINVAL; 892 } 893 894 static int pcistub_device_id_add(int domain, int bus, int slot, int func) 895 { 896 struct pcistub_device_id *pci_dev_id; 897 unsigned long flags; 898 899 pci_dev_id = kmalloc(sizeof(*pci_dev_id), GFP_KERNEL); 900 if (!pci_dev_id) 901 return -ENOMEM; 902 903 pci_dev_id->domain = domain; 904 pci_dev_id->bus = bus; 905 pci_dev_id->devfn = PCI_DEVFN(slot, func); 906 907 pr_debug(DRV_NAME ": wants to seize %04x:%02x:%02x.%01x\n", 908 domain, bus, slot, func); 909 910 spin_lock_irqsave(&device_ids_lock, flags); 911 list_add_tail(&pci_dev_id->slot_list, &pcistub_device_ids); 912 spin_unlock_irqrestore(&device_ids_lock, flags); 913 914 return 0; 915 } 916 917 static int pcistub_device_id_remove(int domain, int bus, int slot, int func) 918 { 919 struct pcistub_device_id *pci_dev_id, *t; 920 int devfn = PCI_DEVFN(slot, func); 921 int err = -ENOENT; 922 unsigned long flags; 923 924 spin_lock_irqsave(&device_ids_lock, flags); 925 list_for_each_entry_safe(pci_dev_id, t, &pcistub_device_ids, 926 slot_list) { 927 if (pci_dev_id->domain == domain 928 && pci_dev_id->bus == bus && pci_dev_id->devfn == devfn) { 929 /* Don't break; here because it's possible the same 930 * slot could be in the list more than once 931 */ 932 list_del(&pci_dev_id->slot_list); 933 kfree(pci_dev_id); 934 935 err = 0; 936 937 pr_debug(DRV_NAME ": removed %04x:%02x:%02x.%01x from " 938 "seize list\n", domain, bus, slot, func); 939 } 940 } 941 spin_unlock_irqrestore(&device_ids_lock, flags); 942 943 return err; 944 } 945 946 static int pcistub_reg_add(int domain, int bus, int slot, int func, int reg, 947 int size, int mask) 948 { 949 int err = 0; 950 struct pcistub_device *psdev; 951 struct pci_dev *dev; 952 struct config_field *field; 953 954 psdev = pcistub_device_find(domain, bus, slot, func); 955 if (!psdev || !psdev->dev) { 956 err = -ENODEV; 957 goto out; 958 } 959 dev = psdev->dev; 960 961 field = kzalloc(sizeof(*field), GFP_ATOMIC); 962 if (!field) { 963 err = -ENOMEM; 964 goto out; 965 } 966 967 field->offset = reg; 968 field->size = size; 969 field->mask = mask; 970 field->init = NULL; 971 field->reset = NULL; 972 field->release = NULL; 973 field->clean = xen_pcibk_config_field_free; 974 975 err = xen_pcibk_config_quirks_add_field(dev, field); 976 if (err) 977 kfree(field); 978 out: 979 return err; 980 } 981 982 static ssize_t pcistub_slot_add(struct device_driver *drv, const char *buf, 983 size_t count) 984 { 985 int domain, bus, slot, func; 986 int err; 987 988 err = str_to_slot(buf, &domain, &bus, &slot, &func); 989 if (err) 990 goto out; 991 992 err = pcistub_device_id_add(domain, bus, slot, func); 993 994 out: 995 if (!err) 996 err = count; 997 return err; 998 } 999 static DRIVER_ATTR(new_slot, S_IWUSR, NULL, pcistub_slot_add); 1000 1001 static ssize_t pcistub_slot_remove(struct device_driver *drv, const char *buf, 1002 size_t count) 1003 { 1004 int domain, bus, slot, func; 1005 int err; 1006 1007 err = str_to_slot(buf, &domain, &bus, &slot, &func); 1008 if (err) 1009 goto out; 1010 1011 err = pcistub_device_id_remove(domain, bus, slot, func); 1012 1013 out: 1014 if (!err) 1015 err = count; 1016 return err; 1017 } 1018 static DRIVER_ATTR(remove_slot, S_IWUSR, NULL, pcistub_slot_remove); 1019 1020 static ssize_t pcistub_slot_show(struct device_driver *drv, char *buf) 1021 { 1022 struct pcistub_device_id *pci_dev_id; 1023 size_t count = 0; 1024 unsigned long flags; 1025 1026 spin_lock_irqsave(&device_ids_lock, flags); 1027 list_for_each_entry(pci_dev_id, &pcistub_device_ids, slot_list) { 1028 if (count >= PAGE_SIZE) 1029 break; 1030 1031 count += scnprintf(buf + count, PAGE_SIZE - count, 1032 "%04x:%02x:%02x.%01x\n", 1033 pci_dev_id->domain, pci_dev_id->bus, 1034 PCI_SLOT(pci_dev_id->devfn), 1035 PCI_FUNC(pci_dev_id->devfn)); 1036 } 1037 spin_unlock_irqrestore(&device_ids_lock, flags); 1038 1039 return count; 1040 } 1041 static DRIVER_ATTR(slots, S_IRUSR, pcistub_slot_show, NULL); 1042 1043 static ssize_t pcistub_irq_handler_show(struct device_driver *drv, char *buf) 1044 { 1045 struct pcistub_device *psdev; 1046 struct xen_pcibk_dev_data *dev_data; 1047 size_t count = 0; 1048 unsigned long flags; 1049 1050 spin_lock_irqsave(&pcistub_devices_lock, flags); 1051 list_for_each_entry(psdev, &pcistub_devices, dev_list) { 1052 if (count >= PAGE_SIZE) 1053 break; 1054 if (!psdev->dev) 1055 continue; 1056 dev_data = pci_get_drvdata(psdev->dev); 1057 if (!dev_data) 1058 continue; 1059 count += 1060 scnprintf(buf + count, PAGE_SIZE - count, 1061 "%s:%s:%sing:%ld\n", 1062 pci_name(psdev->dev), 1063 dev_data->isr_on ? "on" : "off", 1064 dev_data->ack_intr ? "ack" : "not ack", 1065 dev_data->handled); 1066 } 1067 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 1068 return count; 1069 } 1070 static DRIVER_ATTR(irq_handlers, S_IRUSR, pcistub_irq_handler_show, NULL); 1071 1072 static ssize_t pcistub_irq_handler_switch(struct device_driver *drv, 1073 const char *buf, 1074 size_t count) 1075 { 1076 struct pcistub_device *psdev; 1077 struct xen_pcibk_dev_data *dev_data; 1078 int domain, bus, slot, func; 1079 int err = -ENOENT; 1080 1081 err = str_to_slot(buf, &domain, &bus, &slot, &func); 1082 if (err) 1083 goto out; 1084 1085 psdev = pcistub_device_find(domain, bus, slot, func); 1086 1087 if (!psdev) 1088 goto out; 1089 1090 dev_data = pci_get_drvdata(psdev->dev); 1091 if (!dev_data) 1092 goto out; 1093 1094 dev_dbg(&psdev->dev->dev, "%s fake irq handler: %d->%d\n", 1095 dev_data->irq_name, dev_data->isr_on, 1096 !dev_data->isr_on); 1097 1098 dev_data->isr_on = !(dev_data->isr_on); 1099 if (dev_data->isr_on) 1100 dev_data->ack_intr = 1; 1101 out: 1102 if (!err) 1103 err = count; 1104 return err; 1105 } 1106 static DRIVER_ATTR(irq_handler_state, S_IWUSR, NULL, 1107 pcistub_irq_handler_switch); 1108 1109 static ssize_t pcistub_quirk_add(struct device_driver *drv, const char *buf, 1110 size_t count) 1111 { 1112 int domain, bus, slot, func, reg, size, mask; 1113 int err; 1114 1115 err = str_to_quirk(buf, &domain, &bus, &slot, &func, ®, &size, 1116 &mask); 1117 if (err) 1118 goto out; 1119 1120 err = pcistub_reg_add(domain, bus, slot, func, reg, size, mask); 1121 1122 out: 1123 if (!err) 1124 err = count; 1125 return err; 1126 } 1127 1128 static ssize_t pcistub_quirk_show(struct device_driver *drv, char *buf) 1129 { 1130 int count = 0; 1131 unsigned long flags; 1132 struct xen_pcibk_config_quirk *quirk; 1133 struct xen_pcibk_dev_data *dev_data; 1134 const struct config_field *field; 1135 const struct config_field_entry *cfg_entry; 1136 1137 spin_lock_irqsave(&device_ids_lock, flags); 1138 list_for_each_entry(quirk, &xen_pcibk_quirks, quirks_list) { 1139 if (count >= PAGE_SIZE) 1140 goto out; 1141 1142 count += scnprintf(buf + count, PAGE_SIZE - count, 1143 "%02x:%02x.%01x\n\t%04x:%04x:%04x:%04x\n", 1144 quirk->pdev->bus->number, 1145 PCI_SLOT(quirk->pdev->devfn), 1146 PCI_FUNC(quirk->pdev->devfn), 1147 quirk->devid.vendor, quirk->devid.device, 1148 quirk->devid.subvendor, 1149 quirk->devid.subdevice); 1150 1151 dev_data = pci_get_drvdata(quirk->pdev); 1152 1153 list_for_each_entry(cfg_entry, &dev_data->config_fields, list) { 1154 field = cfg_entry->field; 1155 if (count >= PAGE_SIZE) 1156 goto out; 1157 1158 count += scnprintf(buf + count, PAGE_SIZE - count, 1159 "\t\t%08x:%01x:%08x\n", 1160 cfg_entry->base_offset + 1161 field->offset, field->size, 1162 field->mask); 1163 } 1164 } 1165 1166 out: 1167 spin_unlock_irqrestore(&device_ids_lock, flags); 1168 1169 return count; 1170 } 1171 static DRIVER_ATTR(quirks, S_IRUSR | S_IWUSR, pcistub_quirk_show, 1172 pcistub_quirk_add); 1173 1174 static ssize_t permissive_add(struct device_driver *drv, const char *buf, 1175 size_t count) 1176 { 1177 int domain, bus, slot, func; 1178 int err; 1179 struct pcistub_device *psdev; 1180 struct xen_pcibk_dev_data *dev_data; 1181 err = str_to_slot(buf, &domain, &bus, &slot, &func); 1182 if (err) 1183 goto out; 1184 psdev = pcistub_device_find(domain, bus, slot, func); 1185 if (!psdev) { 1186 err = -ENODEV; 1187 goto out; 1188 } 1189 if (!psdev->dev) { 1190 err = -ENODEV; 1191 goto release; 1192 } 1193 dev_data = pci_get_drvdata(psdev->dev); 1194 /* the driver data for a device should never be null at this point */ 1195 if (!dev_data) { 1196 err = -ENXIO; 1197 goto release; 1198 } 1199 if (!dev_data->permissive) { 1200 dev_data->permissive = 1; 1201 /* Let user know that what they're doing could be unsafe */ 1202 dev_warn(&psdev->dev->dev, "enabling permissive mode " 1203 "configuration space accesses!\n"); 1204 dev_warn(&psdev->dev->dev, 1205 "permissive mode is potentially unsafe!\n"); 1206 } 1207 release: 1208 pcistub_device_put(psdev); 1209 out: 1210 if (!err) 1211 err = count; 1212 return err; 1213 } 1214 1215 static ssize_t permissive_show(struct device_driver *drv, char *buf) 1216 { 1217 struct pcistub_device *psdev; 1218 struct xen_pcibk_dev_data *dev_data; 1219 size_t count = 0; 1220 unsigned long flags; 1221 spin_lock_irqsave(&pcistub_devices_lock, flags); 1222 list_for_each_entry(psdev, &pcistub_devices, dev_list) { 1223 if (count >= PAGE_SIZE) 1224 break; 1225 if (!psdev->dev) 1226 continue; 1227 dev_data = pci_get_drvdata(psdev->dev); 1228 if (!dev_data || !dev_data->permissive) 1229 continue; 1230 count += 1231 scnprintf(buf + count, PAGE_SIZE - count, "%s\n", 1232 pci_name(psdev->dev)); 1233 } 1234 spin_unlock_irqrestore(&pcistub_devices_lock, flags); 1235 return count; 1236 } 1237 static DRIVER_ATTR(permissive, S_IRUSR | S_IWUSR, permissive_show, 1238 permissive_add); 1239 1240 static void pcistub_exit(void) 1241 { 1242 driver_remove_file(&xen_pcibk_pci_driver.driver, &driver_attr_new_slot); 1243 driver_remove_file(&xen_pcibk_pci_driver.driver, 1244 &driver_attr_remove_slot); 1245 driver_remove_file(&xen_pcibk_pci_driver.driver, &driver_attr_slots); 1246 driver_remove_file(&xen_pcibk_pci_driver.driver, &driver_attr_quirks); 1247 driver_remove_file(&xen_pcibk_pci_driver.driver, 1248 &driver_attr_permissive); 1249 driver_remove_file(&xen_pcibk_pci_driver.driver, 1250 &driver_attr_irq_handlers); 1251 driver_remove_file(&xen_pcibk_pci_driver.driver, 1252 &driver_attr_irq_handler_state); 1253 pci_unregister_driver(&xen_pcibk_pci_driver); 1254 } 1255 1256 static int __init pcistub_init(void) 1257 { 1258 int pos = 0; 1259 int err = 0; 1260 int domain, bus, slot, func; 1261 int parsed; 1262 1263 if (pci_devs_to_hide && *pci_devs_to_hide) { 1264 do { 1265 parsed = 0; 1266 1267 err = sscanf(pci_devs_to_hide + pos, 1268 " (%x:%x:%x.%x) %n", 1269 &domain, &bus, &slot, &func, &parsed); 1270 if (err != 4) { 1271 domain = 0; 1272 err = sscanf(pci_devs_to_hide + pos, 1273 " (%x:%x.%x) %n", 1274 &bus, &slot, &func, &parsed); 1275 if (err != 3) 1276 goto parse_error; 1277 } 1278 1279 err = pcistub_device_id_add(domain, bus, slot, func); 1280 if (err) 1281 goto out; 1282 1283 /* if parsed<=0, we've reached the end of the string */ 1284 pos += parsed; 1285 } while (parsed > 0 && pci_devs_to_hide[pos]); 1286 } 1287 1288 /* If we're the first PCI Device Driver to register, we're the 1289 * first one to get offered PCI devices as they become 1290 * available (and thus we can be the first to grab them) 1291 */ 1292 err = pci_register_driver(&xen_pcibk_pci_driver); 1293 if (err < 0) 1294 goto out; 1295 1296 err = driver_create_file(&xen_pcibk_pci_driver.driver, 1297 &driver_attr_new_slot); 1298 if (!err) 1299 err = driver_create_file(&xen_pcibk_pci_driver.driver, 1300 &driver_attr_remove_slot); 1301 if (!err) 1302 err = driver_create_file(&xen_pcibk_pci_driver.driver, 1303 &driver_attr_slots); 1304 if (!err) 1305 err = driver_create_file(&xen_pcibk_pci_driver.driver, 1306 &driver_attr_quirks); 1307 if (!err) 1308 err = driver_create_file(&xen_pcibk_pci_driver.driver, 1309 &driver_attr_permissive); 1310 1311 if (!err) 1312 err = driver_create_file(&xen_pcibk_pci_driver.driver, 1313 &driver_attr_irq_handlers); 1314 if (!err) 1315 err = driver_create_file(&xen_pcibk_pci_driver.driver, 1316 &driver_attr_irq_handler_state); 1317 if (err) 1318 pcistub_exit(); 1319 1320 out: 1321 return err; 1322 1323 parse_error: 1324 printk(KERN_ERR DRV_NAME ": Error parsing pci_devs_to_hide at \"%s\"\n", 1325 pci_devs_to_hide + pos); 1326 return -EINVAL; 1327 } 1328 1329 #ifndef MODULE 1330 /* 1331 * fs_initcall happens before device_initcall 1332 * so xen_pcibk *should* get called first (b/c we 1333 * want to suck up any device before other drivers 1334 * get a chance by being the first pci device 1335 * driver to register) 1336 */ 1337 fs_initcall(pcistub_init); 1338 #endif 1339 1340 static int __init xen_pcibk_init(void) 1341 { 1342 int err; 1343 1344 if (!xen_initial_domain()) 1345 return -ENODEV; 1346 1347 err = xen_pcibk_config_init(); 1348 if (err) 1349 return err; 1350 1351 #ifdef MODULE 1352 err = pcistub_init(); 1353 if (err < 0) 1354 return err; 1355 #endif 1356 1357 pcistub_init_devices_late(); 1358 err = xen_pcibk_xenbus_register(); 1359 if (err) 1360 pcistub_exit(); 1361 1362 return err; 1363 } 1364 1365 static void __exit xen_pcibk_cleanup(void) 1366 { 1367 xen_pcibk_xenbus_unregister(); 1368 pcistub_exit(); 1369 } 1370 1371 module_init(xen_pcibk_init); 1372 module_exit(xen_pcibk_cleanup); 1373 1374 MODULE_LICENSE("Dual BSD/GPL"); 1375 MODULE_ALIAS("xen-backend:pci"); 1376