2 * PCI Stub Driver - Grabs devices in backend to be exported later
4 * Ryan Wilson <hap9@epoch.ncsc.mil>
5 * Chris Bookholt <hap10@epoch.ncsc.mil>
8 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
10 #include <linux/module.h>
11 #include <linux/init.h>
12 #include <linux/rwsem.h>
13 #include <linux/list.h>
14 #include <linux/spinlock.h>
15 #include <linux/kref.h>
16 #include <linux/pci.h>
17 #include <linux/wait.h>
18 #include <linux/sched.h>
19 #include <linux/atomic.h>
20 #include <xen/events.h>
21 #include <asm/xen/pci.h>
22 #include <asm/xen/hypervisor.h>
23 #include <xen/interface/physdev.h>
25 #include "conf_space.h"
26 #include "conf_space_quirks.h"
/*
 * pci_devs_to_hide backs the "hide" module parameter; pcistub_init() parses
 * it and registers each listed slot via pcistub_device_id_add().
 * xen_pcibk_aer_wait_queue is the queue common_process() waits on until
 * _XEN_PCIB_active is cleared or the wait times out.
 */
28 static char *pci_devs_to_hide;
29 wait_queue_head_t xen_pcibk_aer_wait_queue;
30 /*Add sem to synchronize AER handling with xen_pcibk remove/reconfigure ops.
31 * We want to avoid xen_pcibk devices being removed in the middle of AER ops.
/*
 * pcistub_sem is taken for writing by pcistub_put_pci_dev() and by each AER
 * callback (error_detected, mmio_enabled, slot_reset, resume) in this file.
 * The second line exposes pci_devs_to_hide as the "hide" parameter (charp,
 * mode 0444).
 */
33 static DECLARE_RWSEM(pcistub_sem);
34 module_param_named(hide, pci_devs_to_hide, charp, 0444);
/*
 * Entries of this type are linked through slot_list into pcistub_device_ids.
 * pcistub_match_one() compares an entry's domain, bus and devfn against a
 * device. The list is walked and modified under device_ids_lock.
 */
36 struct pcistub_device_id {
37 struct list_head slot_list;
42 static LIST_HEAD(pcistub_device_ids);
43 static DEFINE_SPINLOCK(device_ids_lock);
/*
 * Bookkeeping for one PCI device held by the stub driver. dev_list links the
 * entry into seized_devices (initialisation deferred) or pcistub_devices.
 */
45 struct pcistub_device {
47 struct list_head dev_list;
51 struct xen_pcibk_device *pdev;/* non-NULL if struct pci_dev is in use */
54 /* Access to pcistub_devices & seized_devices lists and the initialize_devices
55 * flag must be locked with pcistub_devices_lock
/*
 * pcistub_devices_lock is the spinlock taken (IRQ-safe) around the walks and
 * updates of pcistub_devices and seized_devices in this file.
 * pcistub_devices is the list searched by the lookup helpers.
 */
57 static DEFINE_SPINLOCK(pcistub_devices_lock);
58 static LIST_HEAD(pcistub_devices);
60 /* wait for device_initcall before initializing our devices
61 * (see pcistub_init_devices_late)
/*
 * initialize_devices is set to 1 at the end of pcistub_init_devices_late().
 * Until then pcistub_seize() parks new devices on seized_devices instead of
 * initialising them immediately.
 */
63 static int initialize_devices;
64 static LIST_HEAD(seized_devices);
/*
 * pcistub_device_alloc - create the stub bookkeeping object for @dev.
 *
 * Allocates a zeroed struct pcistub_device with GFP_ATOMIC, stores a counted
 * reference to @dev (pci_dev_get) in it, and initialises its kref and its
 * spinlock.
 */
66 static struct pcistub_device *pcistub_device_alloc(struct pci_dev *dev)
68 struct pcistub_device *psdev;
70 dev_dbg(&dev->dev, "pcistub_device_alloc\n");
72 psdev = kzalloc(sizeof(*psdev), GFP_ATOMIC);
76 psdev->dev = pci_dev_get(dev);
82 kref_init(&psdev->kref);
83 spin_lock_init(&psdev->lock);
88 /* Don't call this directly as it's called by pcistub_device_put */
/*
 * pcistub_device_release - kref release callback for a struct pcistub_device
 * (handed to kref_put() by pcistub_device_put()).
 *
 * Recovers the pcistub_device from @kref, drops the Xen domain-owner
 * registration, resets the function with __pci_reset_function_locked(),
 * reloads or restores the saved PCI state, issues PHYSDEVOP_release_msix to
 * the hypervisor (warning on failure), disables the device through
 * xen_pcibk_reset_device(), clears the driver data pointer, frees the
 * emulated config-space fields and clears PCI_DEV_FLAGS_ASSIGNED.
 *
 * NOTE(review): dev_data comes from pci_get_drvdata() and its
 * pci_saved_state member is used with no NULL check visible here, while
 * pcistub_init_device() also calls pci_set_drvdata(dev, NULL) - confirm this
 * function cannot run with dev_data == NULL.
 */
89 static void pcistub_device_release(struct kref *kref)
91 struct pcistub_device *psdev;
93 struct xen_pcibk_dev_data *dev_data;
95 psdev = container_of(kref, struct pcistub_device, kref);
97 dev_data = pci_get_drvdata(dev);
99 dev_dbg(&dev->dev, "pcistub_device_release\n");
101 xen_unregister_device_domain_owner(dev);
103 /* Call the reset function which does not take lock as this
104 * is called from "unbind" which takes a device_lock mutex.
106 __pci_reset_function_locked(dev);
107 if (pci_load_and_free_saved_state(dev, &dev_data->pci_saved_state))
108 dev_dbg(&dev->dev, "Could not reload PCI state\n");
110 pci_restore_state(dev);
113 struct physdev_pci_device ppdev = {
114 .seg = pci_domain_nr(dev->bus),
115 .bus = dev->bus->number,
118 int err = HYPERVISOR_physdev_op(PHYSDEVOP_release_msix,
122 dev_warn(&dev->dev, "MSI-X release failed (%d)\n",
126 /* Disable the device */
127 xen_pcibk_reset_device(dev);
130 pci_set_drvdata(dev, NULL);
132 /* Clean-up the device */
133 xen_pcibk_config_free_dyn_fields(dev);
134 xen_pcibk_config_free_dev(dev);
136 dev->dev_flags &= ~PCI_DEV_FLAGS_ASSIGNED;
/* Take an additional reference on @psdev (kref_get on its embedded kref). */
142 static inline void pcistub_device_get(struct pcistub_device *psdev)
144 kref_get(&psdev->kref);
/*
 * Drop one reference on @psdev. pcistub_device_release() is the release
 * callback given to kref_put().
 */
147 static inline void pcistub_device_put(struct pcistub_device *psdev)
149 kref_put(&psdev->kref, pcistub_device_release);
/*
 * pcistub_device_find - look up a stub device by domain/bus/slot/function.
 *
 * Walks pcistub_devices under pcistub_devices_lock (IRQ-safe) and takes a
 * reference with pcistub_device_get() on the entry whose pci_dev matches all
 * four coordinates. Callers in this file release that reference with
 * pcistub_device_put().
 */
152 static struct pcistub_device *pcistub_device_find(int domain, int bus,
155 struct pcistub_device *psdev = NULL;
158 spin_lock_irqsave(&pcistub_devices_lock, flags);
160 list_for_each_entry(psdev, &pcistub_devices, dev_list) {
161 if (psdev->dev != NULL
162 && domain == pci_domain_nr(psdev->dev->bus)
163 && bus == psdev->dev->bus->number
164 && slot == PCI_SLOT(psdev->dev->devfn)
165 && func == PCI_FUNC(psdev->dev->devfn)) {
166 pcistub_device_get(psdev);
175 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
/*
 * pcistub_device_get_pci_dev - hand out the pci_dev held by @psdev.
 *
 * Takes a reference on @psdev, reads psdev->dev under psdev->lock, and also
 * contains a pcistub_device_put() call.
 *
 * NOTE(review): presumably @pdev is recorded as the new owner and the put
 * only runs when no device is handed out - confirm against the full source.
 */
179 static struct pci_dev *pcistub_device_get_pci_dev(struct xen_pcibk_device *pdev,
180 struct pcistub_device *psdev)
182 struct pci_dev *pci_dev = NULL;
185 pcistub_device_get(psdev);
187 spin_lock_irqsave(&psdev->lock, flags);
190 pci_dev = psdev->dev;
192 spin_unlock_irqrestore(&psdev->lock, flags);
195 pcistub_device_put(psdev);
/*
 * pcistub_get_pci_dev_by_slot - obtain a stub-held pci_dev for backend @pdev
 * by its PCI coordinates.
 *
 * Walks pcistub_devices under pcistub_devices_lock; for the entry whose
 * domain, bus, slot and function all match, the pci_dev is obtained through
 * pcistub_device_get_pci_dev(). found_dev starts out NULL.
 */
200 struct pci_dev *pcistub_get_pci_dev_by_slot(struct xen_pcibk_device *pdev,
204 struct pcistub_device *psdev;
205 struct pci_dev *found_dev = NULL;
208 spin_lock_irqsave(&pcistub_devices_lock, flags);
210 list_for_each_entry(psdev, &pcistub_devices, dev_list) {
211 if (psdev->dev != NULL
212 && domain == pci_domain_nr(psdev->dev->bus)
213 && bus == psdev->dev->bus->number
214 && slot == PCI_SLOT(psdev->dev->devfn)
215 && func == PCI_FUNC(psdev->dev->devfn)) {
216 found_dev = pcistub_device_get_pci_dev(pdev, psdev);
221 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
/*
 * pcistub_get_pci_dev - obtain a stub-held pci_dev for backend @pdev by
 * pointer identity.
 *
 * Walks pcistub_devices under pcistub_devices_lock; for the entry whose dev
 * pointer equals the requested device, the pci_dev is obtained through
 * pcistub_device_get_pci_dev(). found_dev starts out NULL.
 */
225 struct pci_dev *pcistub_get_pci_dev(struct xen_pcibk_device *pdev,
228 struct pcistub_device *psdev;
229 struct pci_dev *found_dev = NULL;
232 spin_lock_irqsave(&pcistub_devices_lock, flags);
234 list_for_each_entry(psdev, &pcistub_devices, dev_list) {
235 if (psdev->dev == dev) {
236 found_dev = pcistub_device_get_pci_dev(pdev, psdev);
241 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
/*
 * pcistub_put_pci_dev - give @dev back to the stub.
 *
 * Looks up the entry for @dev in pcistub_devices under the list lock and
 * WARNs if there is none. Then, with pcistub_sem held for writing, it resets
 * the function (pci_reset_function), restores PCI state, disables the device
 * through xen_pcibk_reset_device(), resets and frees the emulated
 * config-space fields, drops the Xen domain-owner registration, clears
 * found_psdev->pdev under the per-device lock and drops one reference.
 */
245 void pcistub_put_pci_dev(struct pci_dev *dev)
247 struct pcistub_device *psdev, *found_psdev = NULL;
250 spin_lock_irqsave(&pcistub_devices_lock, flags);
252 list_for_each_entry(psdev, &pcistub_devices, dev_list) {
253 if (psdev->dev == dev) {
259 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
260 if (WARN_ON(!found_psdev))
263 /*hold this lock for avoiding breaking link between
264 * pcistub and xen_pcibk when AER is in processing
266 down_write(&pcistub_sem);
267 /* Cleanup our device
268 * (so it's ready for the next domain)
271 /* This is OK - we are running from workqueue context
272 * and want to inhibit the user from fiddling with 'reset'
274 pci_reset_function(dev);
275 pci_restore_state(dev);
277 /* This disables the device. */
278 xen_pcibk_reset_device(dev);
280 /* And cleanup up our emulated fields. */
281 xen_pcibk_config_reset_dev(dev);
282 xen_pcibk_config_free_dyn_fields(dev);
284 xen_unregister_device_domain_owner(dev);
286 spin_lock_irqsave(&found_psdev->lock, flags);
287 found_psdev->pdev = NULL;
288 spin_unlock_irqrestore(&found_psdev->lock, flags);
290 pcistub_device_put(found_psdev);
291 up_write(&pcistub_sem);
/*
 * pcistub_match_one - test @dev, and each bridge above it, against @pdev_id.
 *
 * Starting at @dev and following dev->bus->self upwards, compares the PCI
 * domain, bus number and devfn with the values stored in @pdev_id. The walk
 * has a separate check for a bridge that links to itself.
 */
294 static int pcistub_match_one(struct pci_dev *dev,
295 struct pcistub_device_id *pdev_id)
297 /* Match the specified device by domain, bus, slot, func and also if
298 * any of the device's parent bridges match.
300 for (; dev != NULL; dev = dev->bus->self) {
301 if (pci_domain_nr(dev->bus) == pdev_id->domain
302 && dev->bus->number == pdev_id->bus
303 && dev->devfn == pdev_id->devfn)
306 /* Sometimes topmost bridge links to itself. */
307 if (dev == dev->bus->self)
/*
 * pcistub_match - check @dev against the list of device ids to seize.
 *
 * Runs pcistub_match_one() for every entry of pcistub_device_ids while
 * holding device_ids_lock.
 */
314 static int pcistub_match(struct pci_dev *dev)
316 struct pcistub_device_id *pdev_id;
320 spin_lock_irqsave(&device_ids_lock, flags);
321 list_for_each_entry(pdev_id, &pcistub_device_ids, slot_list) {
322 if (pcistub_match_one(dev, pdev_id)) {
327 spin_unlock_irqrestore(&device_ids_lock, flags);
/*
 * pcistub_init_device - prepare a seized device for export.
 *
 * Allocates the per-device xen_pcibk_dev_data (GFP_ATOMIC) with room for the
 * DRV_NAME "[<pci name>]" IRQ name that sprintf() then writes into irq_name,
 * and stores it as driver data. It then initialises the emulated config
 * space, enables the device, issues PHYSDEVOP_prepare_msix to the
 * hypervisor, saves the PCI state, resets the function with
 * __pci_reset_function_locked(), restores the state, disables the device
 * via xen_pcibk_reset_device() and sets PCI_DEV_FLAGS_ASSIGNED. The trailing
 * xen_pcibk_config_free_dev() / pci_set_drvdata(dev, NULL) calls undo the
 * setup (presumably the error path - confirm).
 *
 * NOTE(review): init_waitqueue_head() on the global
 * xen_pcibk_aer_wait_queue runs on every call, i.e. once per device -
 * confirm re-initialising it is safe if a waiter could already be queued.
 */
332 static int pcistub_init_device(struct pci_dev *dev)
334 struct xen_pcibk_dev_data *dev_data;
337 dev_dbg(&dev->dev, "initializing...\n");
339 /* The PCI backend is not intended to be a module (or to work with
340 * removable PCI devices (yet). If it were, xen_pcibk_config_free()
341 * would need to be called somewhere to free the memory allocated
342 * here and then to call kfree(pci_get_drvdata(psdev->dev)).
344 dev_data = kzalloc(sizeof(*dev_data) + strlen(DRV_NAME "[]")
345 + strlen(pci_name(dev)) + 1, GFP_ATOMIC);
350 pci_set_drvdata(dev, dev_data);
353 * Setup name for fake IRQ handler. It will only be enabled
354 * once the device is turned on by the guest.
356 sprintf(dev_data->irq_name, DRV_NAME "[%s]", pci_name(dev));
358 dev_dbg(&dev->dev, "initializing config\n");
360 init_waitqueue_head(&xen_pcibk_aer_wait_queue);
361 err = xen_pcibk_config_init_dev(dev);
365 /* HACK: Force device (& ACPI) to determine what IRQ it's on - we
366 * must do this here because pcibios_enable_device may specify
367 * the pci device's true irq (and possibly its other resources)
368 * if they differ from what's in the configuration space.
369 * This makes the assumption that the device's resources won't
370 * change after this point (otherwise this code may break!)
372 dev_dbg(&dev->dev, "enabling device\n");
373 err = pci_enable_device(dev);
378 struct physdev_pci_device ppdev = {
379 .seg = pci_domain_nr(dev->bus),
380 .bus = dev->bus->number,
384 err = HYPERVISOR_physdev_op(PHYSDEVOP_prepare_msix, &ppdev);
386 dev_err(&dev->dev, "MSI-X preparation failed (%d)\n",
390 /* We need the device active to save the state. */
391 dev_dbg(&dev->dev, "save state of device\n");
393 dev_data->pci_saved_state = pci_store_saved_state(dev);
394 if (!dev_data->pci_saved_state)
395 dev_err(&dev->dev, "Could not store PCI conf saved state!\n");
397 dev_dbg(&dev->dev, "resetting (FLR, D3, etc) the device\n");
398 __pci_reset_function_locked(dev);
399 pci_restore_state(dev);
401 /* Now disable the device (this also ensures some private device
402 * data is setup before we export)
404 dev_dbg(&dev->dev, "reset device\n");
405 xen_pcibk_reset_device(dev);
407 dev->dev_flags |= PCI_DEV_FLAGS_ASSIGNED;
411 xen_pcibk_config_free_dev(dev);
414 pci_set_drvdata(dev, NULL);
420 * Because some initialization still happens on
421 * devices during fs_initcall, we need to defer
422 * full initialization of our devices until
/*
 * pcistub_init_devices_late - initialise the devices parked on
 * seized_devices.
 *
 * Each entry is unlinked under pcistub_devices_lock, initialised with
 * pcistub_init_device() while the lock is dropped (a failure is logged with
 * dev_err), and the lock is retaken before list_add_tail() onto
 * pcistub_devices. Once the list is drained, initialize_devices is set to 1
 * so that pcistub_seize() initialises later devices immediately.
 */
425 static int __init pcistub_init_devices_late(void)
427 struct pcistub_device *psdev;
431 spin_lock_irqsave(&pcistub_devices_lock, flags);
433 while (!list_empty(&seized_devices)) {
434 psdev = container_of(seized_devices.next,
435 struct pcistub_device, dev_list);
436 list_del(&psdev->dev_list);
438 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
440 err = pcistub_init_device(psdev->dev);
442 dev_err(&psdev->dev->dev,
443 "error %d initializing device\n", err);
448 spin_lock_irqsave(&pcistub_devices_lock, flags);
451 list_add_tail(&psdev->dev_list, &pcistub_devices);
454 initialize_devices = 1;
456 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
/*
 * pcistub_seize - take ownership of @dev on behalf of the stub driver.
 *
 * Allocates the bookkeeping object with pcistub_device_alloc(). If
 * initialize_devices is already set, the device is initialised right away
 * (with pcistub_devices_lock dropped around pcistub_init_device()) and put
 * on pcistub_devices; otherwise it is parked on seized_devices for
 * pcistub_init_devices_late(). The function also contains a
 * pcistub_device_put() call (presumably the failure path - confirm).
 */
461 static int pcistub_seize(struct pci_dev *dev)
463 struct pcistub_device *psdev;
467 psdev = pcistub_device_alloc(dev);
471 spin_lock_irqsave(&pcistub_devices_lock, flags);
473 if (initialize_devices) {
474 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
476 /* don't want irqs disabled when calling pcistub_init_device */
477 err = pcistub_init_device(psdev->dev);
479 spin_lock_irqsave(&pcistub_devices_lock, flags);
482 list_add(&psdev->dev_list, &pcistub_devices);
484 dev_dbg(&dev->dev, "deferring initialization\n");
485 list_add(&psdev->dev_list, &seized_devices);
488 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
491 pcistub_device_put(psdev);
496 /* Called when 'bind'. This means we must _NOT_ call pci_reset_function or
497 * other functions that take the sysfs lock. */
/*
 * pcistub_probe - .probe callback of xen_pcibk_pci_driver.
 *
 * If @dev is on the seize list (pcistub_match), devices whose header type is
 * neither PCI_HEADER_TYPE_NORMAL nor PCI_HEADER_TYPE_BRIDGE are rejected
 * with an error message; other matches are seized with pcistub_seize().
 */
498 static int pcistub_probe(struct pci_dev *dev, const struct pci_device_id *id)
502 dev_dbg(&dev->dev, "probing...\n");
504 if (pcistub_match(dev)) {
506 if (dev->hdr_type != PCI_HEADER_TYPE_NORMAL
507 && dev->hdr_type != PCI_HEADER_TYPE_BRIDGE) {
508 dev_err(&dev->dev, "can't export pci devices that "
509 "don't have a normal (0) or bridge (1) "
515 dev_info(&dev->dev, "seizing device\n");
516 err = pcistub_seize(dev);
518 /* Didn't find the device */
525 /* Called when 'unbind'. This means we must _NOT_ call pci_reset_function or
526 * other functions that take the sysfs lock. */
/*
 * pcistub_remove - .remove callback of xen_pcibk_pci_driver.
 *
 * Under pcistub_devices_lock it releases the device's config quirk and
 * looks up the matching entry in pcistub_devices. If the entry is still
 * attached to a backend (found_psdev->pdev is set) it prints warnings and
 * releases the device from that backend with xen_pcibk_release_pci_dev().
 * The entry is then unlinked from the list under the lock and the list's
 * reference is dropped.
 */
527 static void pcistub_remove(struct pci_dev *dev)
529 struct pcistub_device *psdev, *found_psdev = NULL;
532 dev_dbg(&dev->dev, "removing\n");
534 spin_lock_irqsave(&pcistub_devices_lock, flags);
536 xen_pcibk_config_quirk_release(dev);
538 list_for_each_entry(psdev, &pcistub_devices, dev_list) {
539 if (psdev->dev == dev) {
545 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
548 dev_dbg(&dev->dev, "found device to remove - in use? %p\n",
551 if (found_psdev->pdev) {
552 pr_warn("****** removing device %s while still in-use! ******\n",
553 pci_name(found_psdev->dev));
554 pr_warn("****** driver domain may still access this device's i/o resources!\n");
555 pr_warn("****** shutdown driver domain before binding device\n");
556 pr_warn("****** to other drivers or domains\n");
558 /* N.B. This ends up calling pcistub_put_pci_dev which ends up
560 xen_pcibk_release_pci_dev(found_psdev->pdev,
564 spin_lock_irqsave(&pcistub_devices_lock, flags);
565 list_del(&found_psdev->dev_list);
566 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
568 /* the final put for releasing from the list */
569 pcistub_device_put(found_psdev);
/*
 * Id table with vendor, device, subvendor and subdevice all set to
 * PCI_ANY_ID. It is installed as the driver's id_table; pcistub_probe() then
 * filters devices with pcistub_match().
 */
573 static DEFINE_PCI_DEVICE_TABLE(pcistub_ids) = {
575 .vendor = PCI_ANY_ID,
576 .device = PCI_ANY_ID,
577 .subvendor = PCI_ANY_ID,
578 .subdevice = PCI_ANY_ID,
/*
 * PCI_NODENAME_MAX is the size of the buffer that holds the xenstore node
 * path built in kill_domain_by_device().
 *
 * kill_domain_by_device - flag an AER failure for the guest owning @psdev.
 *
 * Builds the path "/local/domain/0/backend/pci/<otherend_id>/0" and, inside
 * a xenbus transaction, writes "aerfail" to its "aerState" key. Errors from
 * starting or ending the transaction are logged with dev_err().
 */
583 #define PCI_NODENAME_MAX 40
584 static void kill_domain_by_device(struct pcistub_device *psdev)
586 struct xenbus_transaction xbt;
588 char nodename[PCI_NODENAME_MAX];
591 snprintf(nodename, PCI_NODENAME_MAX, "/local/domain/0/backend/pci/%d/0",
592 psdev->pdev->xdev->otherend_id);
595 err = xenbus_transaction_start(&xbt);
597 dev_err(&psdev->dev->dev,
598 "error %d when start xenbus transaction\n", err);
601 /*PV AER handlers will set this flag*/
602 xenbus_printf(xbt, nodename, "aerState" , "aerfail");
603 err = xenbus_transaction_end(xbt, 0);
607 dev_err(&psdev->dev->dev,
608 "error %d when end xenbus transaction\n", err);
613 /* For each AER recovery step (error_detected, mmio_enabled, etc.), the front end
614 * and the backend need to cooperate. In xen_pcibk, those steps all do similar
615 * jobs: send a service request and wait for the front-end response.
/*
 * common_process - forward one AER step to pcifront and collect its answer.
 * @psdev:   stub device the error was reported for
 * @state:   channel state supplied by the AER callback
 * @aer_cmd: XEN_PCI_OP_aer_* command to place in the shared aer_op
 * @result:  initial value of the result
 *
 * Fills the aer_op in the shared info page with @aer_cmd and the frontend's
 * domain/bus/devfn from xen_pcibk_get_pcifront_dev(); the visible early
 * return yields PCI_ERS_RESULT_NONE after logging that the pcifront device
 * could not be obtained. It then sets _PCIB_op_pending and
 * _XEN_PCIB_active, notifies the frontend over the event channel and waits
 * up to 300*HZ jiffies for _XEN_PCIB_active to clear. If the flag is still
 * set afterwards, an error is logged, the flag is cleared and aer_op->err
 * becomes PCI_ERS_RESULT_NONE. Finally _PCIB_op_pending is cleared, a
 * pending config-space request (_XEN_PCIF_active) is scheduled, and the
 * result is taken from aer_op->err.
 */
617 static pci_ers_result_t common_process(struct pcistub_device *psdev,
618 pci_channel_state_t state, int aer_cmd,
619 pci_ers_result_t result)
621 pci_ers_result_t res = result;
622 struct xen_pcie_aer_op *aer_op;
625 /*with PV AER drivers*/
626 aer_op = &(psdev->pdev->sh_info->aer_op);
627 aer_op->cmd = aer_cmd ;
628 /*useful for error_detected callback*/
631 ret = xen_pcibk_get_pcifront_dev(psdev->dev, psdev->pdev,
632 &aer_op->domain, &aer_op->bus, &aer_op->devfn);
634 dev_err(&psdev->dev->dev,
635 DRV_NAME ": failed to get pcifront device\n");
636 return PCI_ERS_RESULT_NONE;
640 dev_dbg(&psdev->dev->dev,
641 DRV_NAME ": aer_op %x dom %x bus %x devfn %x\n",
642 aer_cmd, aer_op->domain, aer_op->bus, aer_op->devfn);
643 /*local flag to mark there's aer request, xen_pcibk callback will use
644 * this flag to judge whether we need to check pci-front give aer
647 set_bit(_PCIB_op_pending, (unsigned long *)&psdev->pdev->flags);
649 /*It is possible that a pcifront conf_read_write ops request invokes
650 * the callback which cause the spurious execution of wake_up.
651 * Yet it is harmless and better than a spinlock here
653 set_bit(_XEN_PCIB_active,
654 (unsigned long *)&psdev->pdev->sh_info->flags);
656 notify_remote_via_irq(psdev->pdev->evtchn_irq);
658 ret = wait_event_timeout(xen_pcibk_aer_wait_queue,
659 !(test_bit(_XEN_PCIB_active, (unsigned long *)
660 &psdev->pdev->sh_info->flags)), 300*HZ);
663 if (test_bit(_XEN_PCIB_active,
664 (unsigned long *)&psdev->pdev->sh_info->flags)) {
665 dev_err(&psdev->dev->dev,
666 "pcifront aer process not responding!\n");
667 clear_bit(_XEN_PCIB_active,
668 (unsigned long *)&psdev->pdev->sh_info->flags);
669 aer_op->err = PCI_ERS_RESULT_NONE;
673 clear_bit(_PCIB_op_pending, (unsigned long *)&psdev->pdev->flags);
675 if (test_bit(_XEN_PCIF_active,
676 (unsigned long *)&psdev->pdev->sh_info->flags)) {
677 dev_dbg(&psdev->dev->dev,
678 "schedule pci_conf service in " DRV_NAME "\n");
679 xen_pcibk_test_and_schedule_op(psdev->pdev);
682 res = (pci_ers_result_t)aer_op->err;
687 * xen_pcibk_slot_reset: it will send the slot_reset request to pcifront in case
688 * the device driver can provide this service, and then wait for pcifront
690 * @dev: pointer to PCI devices
691 * return value is used by aer_core do_recovery policy
/*
 * AER .slot_reset callback.
 *
 * With pcistub_sem held for writing, looks up the stub entry for @dev; the
 * result starts as PCI_ERS_RESULT_RECOVERED. An entry that is missing or not
 * assigned to a backend is reported. A backend without a shared info page
 * leads to kill_domain_by_device(). A frontend that did not set
 * _XEN_PCIB_AERHANDLER is reported. Otherwise XEN_PCI_OP_aer_slotreset is
 * forwarded through common_process(); a NONE or DISCONNECT answer leads to
 * kill_domain_by_device(). The lookup reference is dropped and the
 * semaphore released at the end.
 *
 * NOTE(review): psdev may be NULL after the lookup - confirm the final
 * pcistub_device_put() is guarded.
 */
693 static pci_ers_result_t xen_pcibk_slot_reset(struct pci_dev *dev)
695 struct pcistub_device *psdev;
696 pci_ers_result_t result;
698 result = PCI_ERS_RESULT_RECOVERED;
699 dev_dbg(&dev->dev, "xen_pcibk_slot_reset(bus:%x,devfn:%x)\n",
700 dev->bus->number, dev->devfn);
702 down_write(&pcistub_sem);
703 psdev = pcistub_device_find(pci_domain_nr(dev->bus),
705 PCI_SLOT(dev->devfn),
706 PCI_FUNC(dev->devfn));
708 if (!psdev || !psdev->pdev) {
710 DRV_NAME " device is not found/assigned\n");
714 if (!psdev->pdev->sh_info) {
715 dev_err(&dev->dev, DRV_NAME " device is not connected or owned"
716 " by HVM, kill it\n");
717 kill_domain_by_device(psdev);
721 if (!test_bit(_XEN_PCIB_AERHANDLER,
722 (unsigned long *)&psdev->pdev->sh_info->flags)) {
724 "guest with no AER driver should have been killed\n");
727 result = common_process(psdev, 1, XEN_PCI_OP_aer_slotreset, result);
729 if (result == PCI_ERS_RESULT_NONE ||
730 result == PCI_ERS_RESULT_DISCONNECT) {
732 "No AER slot_reset service or disconnected!\n");
733 kill_domain_by_device(psdev);
737 pcistub_device_put(psdev);
738 up_write(&pcistub_sem);
744 /*xen_pcibk_mmio_enabled: it will send the mmio_enabled request to pcifront
745 * in case the device driver can provide this service, and then wait
747 * @dev: pointer to PCI devices
748 * return value is used by aer_core do_recovery policy
/*
 * AER .mmio_enabled callback.
 *
 * With pcistub_sem held for writing, looks up the stub entry for @dev; the
 * result starts as PCI_ERS_RESULT_RECOVERED. An entry that is missing or not
 * assigned to a backend is reported. A backend without a shared info page
 * leads to kill_domain_by_device(). A frontend that did not set
 * _XEN_PCIB_AERHANDLER is reported. Otherwise XEN_PCI_OP_aer_mmio is
 * forwarded through common_process(); a NONE or DISCONNECT answer leads to
 * kill_domain_by_device(). The lookup reference is dropped and the
 * semaphore released at the end.
 *
 * NOTE(review): psdev may be NULL after the lookup - confirm the final
 * pcistub_device_put() is guarded.
 */
751 static pci_ers_result_t xen_pcibk_mmio_enabled(struct pci_dev *dev)
753 struct pcistub_device *psdev;
754 pci_ers_result_t result;
756 result = PCI_ERS_RESULT_RECOVERED;
757 dev_dbg(&dev->dev, "xen_pcibk_mmio_enabled(bus:%x,devfn:%x)\n",
758 dev->bus->number, dev->devfn);
760 down_write(&pcistub_sem);
761 psdev = pcistub_device_find(pci_domain_nr(dev->bus),
763 PCI_SLOT(dev->devfn),
764 PCI_FUNC(dev->devfn));
766 if (!psdev || !psdev->pdev) {
768 DRV_NAME " device is not found/assigned\n");
772 if (!psdev->pdev->sh_info) {
773 dev_err(&dev->dev, DRV_NAME " device is not connected or owned"
774 " by HVM, kill it\n");
775 kill_domain_by_device(psdev);
779 if (!test_bit(_XEN_PCIB_AERHANDLER,
780 (unsigned long *)&psdev->pdev->sh_info->flags)) {
782 "guest with no AER driver should have been killed\n");
785 result = common_process(psdev, 1, XEN_PCI_OP_aer_mmio, result);
787 if (result == PCI_ERS_RESULT_NONE ||
788 result == PCI_ERS_RESULT_DISCONNECT) {
790 "No AER mmio_enabled service or disconnected!\n");
791 kill_domain_by_device(psdev);
795 pcistub_device_put(psdev);
796 up_write(&pcistub_sem);
800 /*xen_pcibk_error_detected: it will send the error_detected request to pcifront
801 * in case the device driver can provide this service, and then wait
803 * @dev: pointer to PCI devices
804 * @error: the current PCI connection state
805 * return value is used by aer_core do_recovery policy
/*
 * AER .error_detected callback.
 *
 * With pcistub_sem held for writing, looks up the stub entry for @dev; the
 * result starts as PCI_ERS_RESULT_CAN_RECOVER. An entry that is missing or
 * not assigned to a backend is reported. A backend without a shared info
 * page, or a frontend that did not set _XEN_PCIB_AERHANDLER, leads to
 * kill_domain_by_device(). Otherwise XEN_PCI_OP_aer_detected is forwarded
 * through common_process() together with @error; a NONE or DISCONNECT
 * answer also leads to kill_domain_by_device(). The lookup reference is
 * dropped and the semaphore released at the end.
 *
 * NOTE(review): psdev may be NULL after the lookup - confirm the final
 * pcistub_device_put() is guarded.
 */
808 static pci_ers_result_t xen_pcibk_error_detected(struct pci_dev *dev,
809 pci_channel_state_t error)
811 struct pcistub_device *psdev;
812 pci_ers_result_t result;
814 result = PCI_ERS_RESULT_CAN_RECOVER;
815 dev_dbg(&dev->dev, "xen_pcibk_error_detected(bus:%x,devfn:%x)\n",
816 dev->bus->number, dev->devfn);
818 down_write(&pcistub_sem);
819 psdev = pcistub_device_find(pci_domain_nr(dev->bus),
821 PCI_SLOT(dev->devfn),
822 PCI_FUNC(dev->devfn));
824 if (!psdev || !psdev->pdev) {
826 DRV_NAME " device is not found/assigned\n");
830 if (!psdev->pdev->sh_info) {
831 dev_err(&dev->dev, DRV_NAME " device is not connected or owned"
832 " by HVM, kill it\n");
833 kill_domain_by_device(psdev);
837 /*Guest owns the device yet no aer handler registered, kill guest*/
838 if (!test_bit(_XEN_PCIB_AERHANDLER,
839 (unsigned long *)&psdev->pdev->sh_info->flags)) {
840 dev_dbg(&dev->dev, "guest may have no aer driver, kill it\n");
841 kill_domain_by_device(psdev);
844 result = common_process(psdev, error, XEN_PCI_OP_aer_detected, result);
846 if (result == PCI_ERS_RESULT_NONE ||
847 result == PCI_ERS_RESULT_DISCONNECT) {
849 "No AER error_detected service or disconnected!\n");
850 kill_domain_by_device(psdev);
854 pcistub_device_put(psdev);
855 up_write(&pcistub_sem);
859 /*xen_pcibk_error_resume: it will send the error_resume request to pcifront
860 * in case the device driver can provide this service, and then wait
862 * @dev: pointer to PCI devices
/*
 * AER .resume callback.
 *
 * With pcistub_sem held for writing, looks up the stub entry for @dev. An
 * entry that is missing or not assigned to a backend is reported. A backend
 * without a shared info page, or a frontend that did not set
 * _XEN_PCIB_AERHANDLER, leads to kill_domain_by_device(). Otherwise
 * XEN_PCI_OP_aer_resume is forwarded through common_process(), whose return
 * value is not used here. The lookup reference is dropped and the semaphore
 * released at the end.
 *
 * NOTE(review): psdev may be NULL after the lookup - confirm the final
 * pcistub_device_put() is guarded.
 */
865 static void xen_pcibk_error_resume(struct pci_dev *dev)
867 struct pcistub_device *psdev;
869 dev_dbg(&dev->dev, "xen_pcibk_error_resume(bus:%x,devfn:%x)\n",
870 dev->bus->number, dev->devfn);
872 down_write(&pcistub_sem);
873 psdev = pcistub_device_find(pci_domain_nr(dev->bus),
875 PCI_SLOT(dev->devfn),
876 PCI_FUNC(dev->devfn));
878 if (!psdev || !psdev->pdev) {
880 DRV_NAME " device is not found/assigned\n");
884 if (!psdev->pdev->sh_info) {
885 dev_err(&dev->dev, DRV_NAME " device is not connected or owned"
886 " by HVM, kill it\n");
887 kill_domain_by_device(psdev);
891 if (!test_bit(_XEN_PCIB_AERHANDLER,
892 (unsigned long *)&psdev->pdev->sh_info->flags)) {
894 "guest with no AER driver should have been killed\n");
895 kill_domain_by_device(psdev);
898 common_process(psdev, 1, XEN_PCI_OP_aer_resume,
899 PCI_ERS_RESULT_RECOVERED);
902 pcistub_device_put(psdev);
903 up_write(&pcistub_sem);
907 /*add xen_pcibk AER handling*/
/*
 * Table of PCI error-recovery callbacks; installed as .err_handler of
 * xen_pcibk_pci_driver. Each entry points at the matching xen_pcibk_*
 * function defined in this file.
 */
908 static const struct pci_error_handlers xen_pcibk_error_handler = {
909 .error_detected = xen_pcibk_error_detected,
910 .mmio_enabled = xen_pcibk_mmio_enabled,
911 .slot_reset = xen_pcibk_slot_reset,
912 .resume = xen_pcibk_error_resume,
916 * Note: There is no MODULE_DEVICE_TABLE entry here because this isn't
917 * for a normal device. I don't want it to be loaded automatically.
/*
 * The PCI driver object registered by pcistub_init(): match-all id table,
 * pcistub_probe()/pcistub_remove() as bind/unbind callbacks, and the AER
 * handler table above as err_handler.
 */
920 static struct pci_driver xen_pcibk_pci_driver = {
921 /* The name should be xen_pciback, but until the tools are updated
922 * we will keep it as pciback. */
924 .id_table = pcistub_ids,
925 .probe = pcistub_probe,
926 .remove = pcistub_remove,
927 .err_handler = &xen_pcibk_error_handler,
/*
 * str_to_slot - parse a PCI slot specification from @buf.
 *
 * All numbers are hexadecimal (%x). Formats tried in order:
 *   "dom:bus:slot.func", "dom:bus:slot.*", "dom:bus:*.*",
 * then, without a domain:
 *   "bus:slot.func", "bus:slot.*", "bus:*.*".
 * A parse is accepted only when %n shows that the whole string was consumed
 * (parsed is non-zero and buf[parsed] is the terminating NUL).
 */
930 static inline int str_to_slot(const char *buf, int *domain, int *bus,
931 int *slot, int *func)
935 switch (sscanf(buf, " %x:%x:%x.%x %n", domain, bus, slot, func,
939 sscanf(buf, " %x:%x:%x.* %n", domain, bus, slot, &parsed);
943 sscanf(buf, " %x:%x:*.* %n", domain, bus, &parsed);
946 if (parsed && !buf[parsed])
949 /* try again without domain */
951 switch (sscanf(buf, " %x:%x.%x %n", bus, slot, func, &parsed)) {
954 sscanf(buf, " %x:%x.* %n", bus, slot, &parsed);
958 sscanf(buf, " %x:*.* %n", bus, &parsed);
961 if (parsed && !buf[parsed])
/*
 * str_to_quirk - parse a quirk specification from @buf.
 *
 * Expects "dom:bus:slot.func-reg:size:mask" (all hexadecimal) and falls back
 * to the same format without the domain. As in str_to_slot(), a parse is
 * accepted only when %n shows that the whole string was consumed.
 */
967 static inline int str_to_quirk(const char *buf, int *domain, int *bus, int
968 *slot, int *func, int *reg, int *size, int *mask)
972 sscanf(buf, " %x:%x:%x.%x-%x:%x:%x %n", domain, bus, slot, func,
973 reg, size, mask, &parsed);
974 if (parsed && !buf[parsed])
977 /* try again without domain */
979 sscanf(buf, " %x:%x.%x-%x:%x:%x %n", bus, slot, func, reg, size,
981 if (parsed && !buf[parsed])
/*
 * pcistub_device_id_add - put domain:bus:slot.func on the seize list.
 *
 * The function calls itself for every slot 0..31 and for every function
 * 0..7, stopping at the first non-zero rc (presumably these loops run when
 * the caller passed a wildcard, i.e. a negative slot or func - confirm).
 * A concrete address is validated: domain within 0..0xffff (with a
 * pci_domains_supported special case under the preprocessor guard), bus
 * within 0..0xff, and slot/func must survive the round trip through
 * PCI_DEVFN(). A new pcistub_device_id is then allocated with GFP_KERNEL,
 * filled in and appended to pcistub_device_ids under device_ids_lock.
 */
987 static int pcistub_device_id_add(int domain, int bus, int slot, int func)
989 struct pcistub_device_id *pci_dev_id;
991 int rc = 0, devfn = PCI_DEVFN(slot, func);
994 for (slot = 0; !rc && slot < 32; ++slot)
995 rc = pcistub_device_id_add(domain, bus, slot, func);
1000 for (func = 0; !rc && func < 8; ++func)
1001 rc = pcistub_device_id_add(domain, bus, slot, func);
1006 #if !defined(MODULE) /* pci_domains_supported is not being exported */ \
1007 || !defined(CONFIG_PCI_DOMAINS)
1008 !pci_domains_supported ? domain :
1010 domain < 0 || domain > 0xffff)
1011 || bus < 0 || bus > 0xff
1012 || PCI_SLOT(devfn) != slot
1013 || PCI_FUNC(devfn) != func)
1016 pci_dev_id = kmalloc(sizeof(*pci_dev_id), GFP_KERNEL);
1020 pci_dev_id->domain = domain;
1021 pci_dev_id->bus = bus;
1022 pci_dev_id->devfn = devfn;
1024 pr_debug("wants to seize %04x:%02x:%02x.%d\n",
1025 domain, bus, slot, func);
1027 spin_lock_irqsave(&device_ids_lock, flags);
1028 list_add_tail(&pci_dev_id->slot_list, &pcistub_device_ids);
1029 spin_unlock_irqrestore(&device_ids_lock, flags);
/*
 * pcistub_device_id_remove - take matching entries off the seize list.
 *
 * Under device_ids_lock, walks pcistub_device_ids with the _safe iterator
 * and unlinks every entry whose domain and bus match; a negative @slot or
 * @func matches any slot or function. The walk deliberately continues after
 * a hit because the same slot may be listed more than once.
 */
1034 static int pcistub_device_id_remove(int domain, int bus, int slot, int func)
1036 struct pcistub_device_id *pci_dev_id, *t;
1038 unsigned long flags;
1040 spin_lock_irqsave(&device_ids_lock, flags);
1041 list_for_each_entry_safe(pci_dev_id, t, &pcistub_device_ids,
1043 if (pci_dev_id->domain == domain && pci_dev_id->bus == bus
1044 && (slot < 0 || PCI_SLOT(pci_dev_id->devfn) == slot)
1045 && (func < 0 || PCI_FUNC(pci_dev_id->devfn) == func)) {
1046 /* Don't break; here because it's possible the same
1047 * slot could be in the list more than once
1049 list_del(&pci_dev_id->slot_list);
1054 pr_debug("removed %04x:%02x:%02x.%d from seize list\n",
1055 domain, bus, slot, func);
1058 spin_unlock_irqrestore(&device_ids_lock, flags);
/*
 * pcistub_reg_add - add a quirk config-space field for one stub device.
 *
 * Input check: @reg above 0xfff is rejected, and for @size below 4 the mask
 * may not have bits beyond @size bytes. Looks up the device with
 * pcistub_device_find() (which takes a reference), allocates a zeroed
 * config_field with GFP_ATOMIC, sets its offset to @reg, leaves the reset
 * and release hooks NULL, uses xen_pcibk_config_field_free as the clean
 * hook, and registers it with xen_pcibk_config_quirks_add_field(). The
 * lookup reference is dropped before returning.
 */
1063 static int pcistub_reg_add(int domain, int bus, int slot, int func,
1064 unsigned int reg, unsigned int size,
1068 struct pcistub_device *psdev;
1069 struct pci_dev *dev;
1070 struct config_field *field;
1072 if (reg > 0xfff || (size < 4 && (mask >> (size * 8))))
1075 psdev = pcistub_device_find(domain, bus, slot, func);
1082 field = kzalloc(sizeof(*field), GFP_ATOMIC);
1088 field->offset = reg;
1092 field->reset = NULL;
1093 field->release = NULL;
1094 field->clean = xen_pcibk_config_field_free;
1096 err = xen_pcibk_config_quirks_add_field(dev, field);
1101 pcistub_device_put(psdev);
/*
 * Store handler of the write-only (S_IWUSR) "new_slot" driver attribute:
 * parses @buf with str_to_slot() and adds the slot to the seize list with
 * pcistub_device_id_add().
 */
1105 static ssize_t pcistub_slot_add(struct device_driver *drv, const char *buf,
1108 int domain, bus, slot, func;
1111 err = str_to_slot(buf, &domain, &bus, &slot, &func);
1115 err = pcistub_device_id_add(domain, bus, slot, func);
1122 static DRIVER_ATTR(new_slot, S_IWUSR, NULL, pcistub_slot_add);
/*
 * Store handler of the write-only (S_IWUSR) "remove_slot" driver attribute:
 * parses @buf with str_to_slot() and removes the slot from the seize list
 * with pcistub_device_id_remove().
 */
1124 static ssize_t pcistub_slot_remove(struct device_driver *drv, const char *buf,
1127 int domain, bus, slot, func;
1130 err = str_to_slot(buf, &domain, &bus, &slot, &func);
1134 err = pcistub_device_id_remove(domain, bus, slot, func);
1141 static DRIVER_ATTR(remove_slot, S_IWUSR, NULL, pcistub_slot_remove);
/*
 * Show handler of the read-only (S_IRUSR) "slots" driver attribute.
 *
 * Under device_ids_lock, prints one "dddd:bb:ss.f" line per entry of
 * pcistub_device_ids into @buf. Output is bounded by PAGE_SIZE: scnprintf()
 * is given the remaining space and the count is checked each iteration.
 */
1143 static ssize_t pcistub_slot_show(struct device_driver *drv, char *buf)
1145 struct pcistub_device_id *pci_dev_id;
1147 unsigned long flags;
1149 spin_lock_irqsave(&device_ids_lock, flags);
1150 list_for_each_entry(pci_dev_id, &pcistub_device_ids, slot_list) {
1151 if (count >= PAGE_SIZE)
1154 count += scnprintf(buf + count, PAGE_SIZE - count,
1155 "%04x:%02x:%02x.%d\n",
1156 pci_dev_id->domain, pci_dev_id->bus,
1157 PCI_SLOT(pci_dev_id->devfn),
1158 PCI_FUNC(pci_dev_id->devfn));
1160 spin_unlock_irqrestore(&device_ids_lock, flags);
1164 static DRIVER_ATTR(slots, S_IRUSR, pcistub_slot_show, NULL);
/*
 * Show handler of the read-only (S_IRUSR) "irq_handlers" driver attribute.
 *
 * Under pcistub_devices_lock, walks pcistub_devices and prints for each
 * device its PCI name, whether the fake ISR is "on" or "off", and whether
 * it is "ack"ing or "not ack"ing interrupts, followed by a %ld value.
 * Output is bounded by PAGE_SIZE.
 */
1166 static ssize_t pcistub_irq_handler_show(struct device_driver *drv, char *buf)
1168 struct pcistub_device *psdev;
1169 struct xen_pcibk_dev_data *dev_data;
1171 unsigned long flags;
1173 spin_lock_irqsave(&pcistub_devices_lock, flags);
1174 list_for_each_entry(psdev, &pcistub_devices, dev_list) {
1175 if (count >= PAGE_SIZE)
1179 dev_data = pci_get_drvdata(psdev->dev);
1183 scnprintf(buf + count, PAGE_SIZE - count,
1184 "%s:%s:%sing:%ld\n",
1185 pci_name(psdev->dev),
1186 dev_data->isr_on ? "on" : "off",
1187 dev_data->ack_intr ? "ack" : "not ack",
1190 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
1193 static DRIVER_ATTR(irq_handlers, S_IRUSR, pcistub_irq_handler_show, NULL);
/*
 * Store handler of the write-only (S_IWUSR) "irq_handler_state" driver
 * attribute.
 *
 * Parses a slot from @buf, looks up the stub device (taking a reference),
 * and toggles dev_data->isr_on; when the handler ends up on, ack_intr is
 * set to 1. The lookup reference is dropped before returning.
 */
1195 static ssize_t pcistub_irq_handler_switch(struct device_driver *drv,
1199 struct pcistub_device *psdev;
1200 struct xen_pcibk_dev_data *dev_data;
1201 int domain, bus, slot, func;
1204 err = str_to_slot(buf, &domain, &bus, &slot, &func);
1208 psdev = pcistub_device_find(domain, bus, slot, func);
1214 dev_data = pci_get_drvdata(psdev->dev);
1220 dev_dbg(&psdev->dev->dev, "%s fake irq handler: %d->%d\n",
1221 dev_data->irq_name, dev_data->isr_on,
1224 dev_data->isr_on = !(dev_data->isr_on);
1225 if (dev_data->isr_on)
1226 dev_data->ack_intr = 1;
1229 pcistub_device_put(psdev);
1234 static DRIVER_ATTR(irq_handler_state, S_IWUSR, NULL,
1235 pcistub_irq_handler_switch);
/*
 * Store handler for the "quirks" driver attribute: parses
 * "[dom:]bus:slot.func-reg:size:mask" with str_to_quirk() and registers the
 * field with pcistub_reg_add().
 *
 * NOTE(review): the sixth argument of the str_to_quirk() call below looks
 * mis-encoded; presumably it should be the address of reg - confirm and
 * repair the source text.
 */
1237 static ssize_t pcistub_quirk_add(struct device_driver *drv, const char *buf,
1240 int domain, bus, slot, func, reg, size, mask;
1243 err = str_to_quirk(buf, &domain, &bus, &slot, &func, ®, &size,
1248 err = pcistub_reg_add(domain, bus, slot, func, reg, size, mask);
/*
 * Show handler for the "quirks" driver attribute (mode S_IRUSR | S_IWUSR).
 *
 * For each entry of xen_pcibk_quirks prints the device address
 * (bus:slot.func) and the vendor/device/subvendor/subdevice ids, followed
 * by one line per entry of that device's config_fields list. Output is
 * bounded by PAGE_SIZE.
 *
 * NOTE(review): the walk over xen_pcibk_quirks is done while holding
 * device_ids_lock - confirm that this is the lock meant to protect the
 * quirks list.
 */
1256 static ssize_t pcistub_quirk_show(struct device_driver *drv, char *buf)
1259 unsigned long flags;
1260 struct xen_pcibk_config_quirk *quirk;
1261 struct xen_pcibk_dev_data *dev_data;
1262 const struct config_field *field;
1263 const struct config_field_entry *cfg_entry;
1265 spin_lock_irqsave(&device_ids_lock, flags);
1266 list_for_each_entry(quirk, &xen_pcibk_quirks, quirks_list) {
1267 if (count >= PAGE_SIZE)
1270 count += scnprintf(buf + count, PAGE_SIZE - count,
1271 "%02x:%02x.%01x\n\t%04x:%04x:%04x:%04x\n",
1272 quirk->pdev->bus->number,
1273 PCI_SLOT(quirk->pdev->devfn),
1274 PCI_FUNC(quirk->pdev->devfn),
1275 quirk->devid.vendor, quirk->devid.device,
1276 quirk->devid.subvendor,
1277 quirk->devid.subdevice);
1279 dev_data = pci_get_drvdata(quirk->pdev);
1281 list_for_each_entry(cfg_entry, &dev_data->config_fields, list) {
1282 field = cfg_entry->field;
1283 if (count >= PAGE_SIZE)
1286 count += scnprintf(buf + count, PAGE_SIZE - count,
1287 "\t\t%08x:%01x:%08x\n",
1288 cfg_entry->base_offset +
1289 field->offset, field->size,
1295 spin_unlock_irqrestore(&device_ids_lock, flags);
1299 static DRIVER_ATTR(quirks, S_IRUSR | S_IWUSR, pcistub_quirk_show,
/*
 * Store handler for the "permissive" driver attribute.
 *
 * Parses a slot from @buf, looks up the stub device (taking a reference)
 * and, if its dev_data is not yet permissive, sets dev_data->permissive to
 * 1 and warns twice that permissive config-space access is potentially
 * unsafe. The lookup reference is dropped before returning.
 */
1302 static ssize_t permissive_add(struct device_driver *drv, const char *buf,
1305 int domain, bus, slot, func;
1307 struct pcistub_device *psdev;
1308 struct xen_pcibk_dev_data *dev_data;
1310 err = str_to_slot(buf, &domain, &bus, &slot, &func);
1314 psdev = pcistub_device_find(domain, bus, slot, func);
1320 dev_data = pci_get_drvdata(psdev->dev);
1321 /* the driver data for a device should never be null at this point */
1326 if (!dev_data->permissive) {
1327 dev_data->permissive = 1;
1328 /* Let user know that what they're doing could be unsafe */
1329 dev_warn(&psdev->dev->dev, "enabling permissive mode "
1330 "configuration space accesses!\n");
1331 dev_warn(&psdev->dev->dev,
1332 "permissive mode is potentially unsafe!\n");
1335 pcistub_device_put(psdev);
/*
 * Show handler for the "permissive" driver attribute (mode
 * S_IRUSR | S_IWUSR).
 *
 * Under pcistub_devices_lock, walks pcistub_devices and prints the PCI name
 * of each device; the walk tests for missing dev_data or a clear permissive
 * flag first (presumably to skip such devices - confirm). Output is bounded
 * by PAGE_SIZE.
 */
1342 static ssize_t permissive_show(struct device_driver *drv, char *buf)
1344 struct pcistub_device *psdev;
1345 struct xen_pcibk_dev_data *dev_data;
1347 unsigned long flags;
1348 spin_lock_irqsave(&pcistub_devices_lock, flags);
1349 list_for_each_entry(psdev, &pcistub_devices, dev_list) {
1350 if (count >= PAGE_SIZE)
1354 dev_data = pci_get_drvdata(psdev->dev);
1355 if (!dev_data || !dev_data->permissive)
1358 scnprintf(buf + count, PAGE_SIZE - count, "%s\n",
1359 pci_name(psdev->dev));
1361 spin_unlock_irqrestore(&pcistub_devices_lock, flags);
1364 static DRIVER_ATTR(permissive, S_IRUSR | S_IWUSR, permissive_show,
/*
 * pcistub_exit - undo pcistub_init(): remove the seven driver attribute
 * files (new_slot, remove_slot, slots, quirks, permissive, irq_handlers,
 * irq_handler_state) and unregister the PCI driver.
 */
1367 static void pcistub_exit(void)
1369 driver_remove_file(&xen_pcibk_pci_driver.driver, &driver_attr_new_slot);
1370 driver_remove_file(&xen_pcibk_pci_driver.driver,
1371 &driver_attr_remove_slot);
1372 driver_remove_file(&xen_pcibk_pci_driver.driver, &driver_attr_slots);
1373 driver_remove_file(&xen_pcibk_pci_driver.driver, &driver_attr_quirks);
1374 driver_remove_file(&xen_pcibk_pci_driver.driver,
1375 &driver_attr_permissive);
1376 driver_remove_file(&xen_pcibk_pci_driver.driver,
1377 &driver_attr_irq_handlers);
1378 driver_remove_file(&xen_pcibk_pci_driver.driver,
1379 &driver_attr_irq_handler_state);
1380 pci_unregister_driver(&xen_pcibk_pci_driver);
/*
 * pcistub_init - parse the "hide" parameter and register the stub driver.
 *
 * If pci_devs_to_hide is a non-empty string, it is parsed group by group
 * (the first pattern tried is " (dom:bus:slot.func) ", hexadecimal), and
 * each parsed slot is added with pcistub_device_id_add(); the loop runs
 * while characters remain. The PCI driver is then registered and the seven
 * driver attribute files are created. The trailing pr_err() reports the
 * position at which parsing of pci_devs_to_hide failed.
 */
1383 static int __init pcistub_init(void)
1387 int domain, bus, slot, func;
1390 if (pci_devs_to_hide && *pci_devs_to_hide) {
1394 err = sscanf(pci_devs_to_hide + pos,
1395 " (%x:%x:%x.%x) %n",
1396 &domain, &bus, &slot, &func, &parsed);
1400 sscanf(pci_devs_to_hide + pos,
1402 &domain, &bus, &slot, &parsed);
1406 sscanf(pci_devs_to_hide + pos,
1408 &domain, &bus, &parsed);
1414 err = sscanf(pci_devs_to_hide + pos,
1416 &bus, &slot, &func, &parsed);
1420 sscanf(pci_devs_to_hide + pos,
1422 &bus, &slot, &parsed);
1426 sscanf(pci_devs_to_hide + pos,
1436 err = pcistub_device_id_add(domain, bus, slot, func);
1441 } while (pci_devs_to_hide[pos]);
1444 /* If we're the first PCI Device Driver to register, we're the
1445 * first one to get offered PCI devices as they become
1446 * available (and thus we can be the first to grab them)
1448 err = pci_register_driver(&xen_pcibk_pci_driver);
1452 err = driver_create_file(&xen_pcibk_pci_driver.driver,
1453 &driver_attr_new_slot);
1455 err = driver_create_file(&xen_pcibk_pci_driver.driver,
1456 &driver_attr_remove_slot);
1458 err = driver_create_file(&xen_pcibk_pci_driver.driver,
1459 &driver_attr_slots);
1461 err = driver_create_file(&xen_pcibk_pci_driver.driver,
1462 &driver_attr_quirks);
1464 err = driver_create_file(&xen_pcibk_pci_driver.driver,
1465 &driver_attr_permissive);
1468 err = driver_create_file(&xen_pcibk_pci_driver.driver,
1469 &driver_attr_irq_handlers);
1471 err = driver_create_file(&xen_pcibk_pci_driver.driver,
1472 &driver_attr_irq_handler_state);
1480 pr_err("Error parsing pci_devs_to_hide at \"%s\"\n",
1481 pci_devs_to_hide + pos);
1487 * fs_initcall happens before device_initcall
1488 * so xen_pcibk *should* get called first (b/c we
1489 * want to suck up any device before other drivers
1490 * get a chance by being the first pci device
1491 * driver to register)
/*
 * Registers pcistub_init() as an fs_initcall.
 * NOTE(review): xen_pcibk_init() also calls pcistub_init() directly;
 * presumably the two are selected by a MODULE preprocessor guard - confirm.
 */
1493 fs_initcall(pcistub_init);
/*
 * xen_pcibk_init - module entry point.
 *
 * Checks xen_initial_domain() first, then initialises the config-space
 * emulation (xen_pcibk_config_init), calls pcistub_init() and
 * pcistub_init_devices_late(), and finally registers the xenbus backend.
 */
1496 static int __init xen_pcibk_init(void)
1500 if (!xen_initial_domain())
1503 err = xen_pcibk_config_init();
1508 err = pcistub_init();
1513 pcistub_init_devices_late();
1514 err = xen_pcibk_xenbus_register();
/* xen_pcibk_cleanup - module exit point: unregisters the xenbus backend. */
1521 static void __exit xen_pcibk_cleanup(void)
1523 xen_pcibk_xenbus_unregister();
/*
 * Module registration: entry and exit points, licence string, and the
 * "xen-backend:pci" module alias.
 */
1527 module_init(xen_pcibk_init);
1528 module_exit(xen_pcibk_cleanup);
1530 MODULE_LICENSE("Dual BSD/GPL");
1531 MODULE_ALIAS("xen-backend:pci");