1 // SPDX-License-Identifier: GPL-2.0
5 * Author: Ryan Wilson <hap9@epoch.ncsc.mil>
7 #include <linux/module.h>
8 #include <linux/init.h>
10 #include <xen/xenbus.h>
11 #include <xen/events.h>
12 #include <xen/grant_table.h>
14 #include <linux/spinlock.h>
15 #include <linux/pci.h>
16 #include <linux/msi.h>
17 #include <xen/interface/io/pciif.h>
18 #include <asm/xen/pci.h>
19 #include <linux/interrupt.h>
20 #include <linux/atomic.h>
21 #include <linux/workqueue.h>
22 #include <linux/bitops.h>
23 #include <linux/time.h>
24 #include <linux/ktime.h>
25 #include <xen/platform_pci.h>
27 #include <asm/xen/swiotlb-xen.h>
29 #define INVALID_EVTCHN (-1)
31 struct pci_bus_entry
{
32 struct list_head list
;
36 #define _PDEVB_op_active (0)
37 #define PDEVB_op_active (1 << (_PDEVB_op_active))
39 struct pcifront_device
{
40 struct xenbus_device
*xdev
;
41 struct list_head root_buses
;
48 /* Lock this when doing any operations in sh_info */
49 spinlock_t sh_info_lock
;
50 struct xen_pci_sharedinfo
*sh_info
;
51 struct work_struct op_work
;
57 struct pci_sysdata sd
;
58 struct pcifront_device
*pdev
;
61 static inline struct pcifront_device
*
62 pcifront_get_pdev(struct pcifront_sd
*sd
)
67 static inline void pcifront_init_sd(struct pcifront_sd
*sd
,
68 unsigned int domain
, unsigned int bus
,
69 struct pcifront_device
*pdev
)
71 /* Because we do not expose that information via XenBus. */
72 sd
->sd
.node
= first_online_node
;
73 sd
->sd
.domain
= domain
;
77 static DEFINE_SPINLOCK(pcifront_dev_lock
);
78 static struct pcifront_device
*pcifront_dev
;
80 static int errno_to_pcibios_err(int errno
)
83 case XEN_PCI_ERR_success
:
84 return PCIBIOS_SUCCESSFUL
;
86 case XEN_PCI_ERR_dev_not_found
:
87 return PCIBIOS_DEVICE_NOT_FOUND
;
89 case XEN_PCI_ERR_invalid_offset
:
90 case XEN_PCI_ERR_op_failed
:
91 return PCIBIOS_BAD_REGISTER_NUMBER
;
93 case XEN_PCI_ERR_not_implemented
:
94 return PCIBIOS_FUNC_NOT_SUPPORTED
;
96 case XEN_PCI_ERR_access_denied
:
97 return PCIBIOS_SET_FAILED
;
102 static inline void schedule_pcifront_aer_op(struct pcifront_device
*pdev
)
104 if (test_bit(_XEN_PCIB_active
, (unsigned long *)&pdev
->sh_info
->flags
)
105 && !test_and_set_bit(_PDEVB_op_active
, &pdev
->flags
)) {
106 dev_dbg(&pdev
->xdev
->dev
, "schedule aer frontend job\n");
107 schedule_work(&pdev
->op_work
);
111 static int do_pci_op(struct pcifront_device
*pdev
, struct xen_pci_op
*op
)
114 struct xen_pci_op
*active_op
= &pdev
->sh_info
->op
;
115 unsigned long irq_flags
;
116 evtchn_port_t port
= pdev
->evtchn
;
117 unsigned int irq
= pdev
->irq
;
120 spin_lock_irqsave(&pdev
->sh_info_lock
, irq_flags
);
122 memcpy(active_op
, op
, sizeof(struct xen_pci_op
));
126 set_bit(_XEN_PCIF_active
, (unsigned long *)&pdev
->sh_info
->flags
);
127 notify_remote_via_evtchn(port
);
130 * We set a poll timeout of 3 seconds but give up on return after
131 * 2 seconds. It is better to time out too late rather than too early
132 * (in the latter case we end up continually re-executing poll() with a
133 * timeout in the past). 1s difference gives plenty of slack for error.
135 ns_timeout
= ktime_get_ns() + 2 * (s64
)NSEC_PER_SEC
;
137 xen_clear_irq_pending(irq
);
139 while (test_bit(_XEN_PCIF_active
,
140 (unsigned long *)&pdev
->sh_info
->flags
)) {
141 xen_poll_irq_timeout(irq
, jiffies
+ 3*HZ
);
142 xen_clear_irq_pending(irq
);
144 if (ns
> ns_timeout
) {
145 dev_err(&pdev
->xdev
->dev
,
146 "pciback not responding!!!\n");
147 clear_bit(_XEN_PCIF_active
,
148 (unsigned long *)&pdev
->sh_info
->flags
);
149 err
= XEN_PCI_ERR_dev_not_found
;
155 * We might lose backend service request since we
156 * reuse same evtchn with pci_conf backend response. So re-schedule
157 * aer pcifront service.
159 if (test_bit(_XEN_PCIB_active
,
160 (unsigned long *)&pdev
->sh_info
->flags
)) {
161 dev_err(&pdev
->xdev
->dev
,
162 "schedule aer pcifront service\n");
163 schedule_pcifront_aer_op(pdev
);
166 memcpy(op
, active_op
, sizeof(struct xen_pci_op
));
170 spin_unlock_irqrestore(&pdev
->sh_info_lock
, irq_flags
);
174 /* Access to this function is spinlocked in drivers/pci/access.c */
175 static int pcifront_bus_read(struct pci_bus
*bus
, unsigned int devfn
,
176 int where
, int size
, u32
*val
)
179 struct xen_pci_op op
= {
180 .cmd
= XEN_PCI_OP_conf_read
,
181 .domain
= pci_domain_nr(bus
),
187 struct pcifront_sd
*sd
= bus
->sysdata
;
188 struct pcifront_device
*pdev
= pcifront_get_pdev(sd
);
190 dev_dbg(&pdev
->xdev
->dev
,
191 "read dev=%04x:%02x:%02x.%d - offset %x size %d\n",
192 pci_domain_nr(bus
), bus
->number
, PCI_SLOT(devfn
),
193 PCI_FUNC(devfn
), where
, size
);
195 err
= do_pci_op(pdev
, &op
);
198 dev_dbg(&pdev
->xdev
->dev
, "read got back value %x\n",
202 } else if (err
== -ENODEV
) {
203 /* No device here, pretend that it just returned 0 */
208 return errno_to_pcibios_err(err
);
211 /* Access to this function is spinlocked in drivers/pci/access.c */
212 static int pcifront_bus_write(struct pci_bus
*bus
, unsigned int devfn
,
213 int where
, int size
, u32 val
)
215 struct xen_pci_op op
= {
216 .cmd
= XEN_PCI_OP_conf_write
,
217 .domain
= pci_domain_nr(bus
),
224 struct pcifront_sd
*sd
= bus
->sysdata
;
225 struct pcifront_device
*pdev
= pcifront_get_pdev(sd
);
227 dev_dbg(&pdev
->xdev
->dev
,
228 "write dev=%04x:%02x:%02x.%d - offset %x size %d val %x\n",
229 pci_domain_nr(bus
), bus
->number
,
230 PCI_SLOT(devfn
), PCI_FUNC(devfn
), where
, size
, val
);
232 return errno_to_pcibios_err(do_pci_op(pdev
, &op
));
235 static struct pci_ops pcifront_bus_ops
= {
236 .read
= pcifront_bus_read
,
237 .write
= pcifront_bus_write
,
240 #ifdef CONFIG_PCI_MSI
241 static int pci_frontend_enable_msix(struct pci_dev
*dev
,
242 int vector
[], int nvec
)
246 struct xen_pci_op op
= {
247 .cmd
= XEN_PCI_OP_enable_msix
,
248 .domain
= pci_domain_nr(dev
->bus
),
249 .bus
= dev
->bus
->number
,
253 struct pcifront_sd
*sd
= dev
->bus
->sysdata
;
254 struct pcifront_device
*pdev
= pcifront_get_pdev(sd
);
255 struct msi_desc
*entry
;
257 if (nvec
> SH_INFO_MAX_VEC
) {
258 pci_err(dev
, "too many vectors (0x%x) for PCI frontend:"
259 " Increase SH_INFO_MAX_VEC\n", nvec
);
264 msi_for_each_desc(entry
, &dev
->dev
, MSI_DESC_NOTASSOCIATED
) {
265 op
.msix_entries
[i
].entry
= entry
->msi_index
;
266 /* Vector is useless at this point. */
267 op
.msix_entries
[i
].vector
= -1;
271 err
= do_pci_op(pdev
, &op
);
274 if (likely(!op
.value
)) {
275 /* we get the result */
276 for (i
= 0; i
< nvec
; i
++) {
277 if (op
.msix_entries
[i
].vector
<= 0) {
278 pci_warn(dev
, "MSI-X entry %d is invalid: %d!\n",
279 i
, op
.msix_entries
[i
].vector
);
284 vector
[i
] = op
.msix_entries
[i
].vector
;
287 pr_info("enable msix get value %x\n", op
.value
);
291 pci_err(dev
, "enable msix get err %x\n", err
);
296 static void pci_frontend_disable_msix(struct pci_dev
*dev
)
299 struct xen_pci_op op
= {
300 .cmd
= XEN_PCI_OP_disable_msix
,
301 .domain
= pci_domain_nr(dev
->bus
),
302 .bus
= dev
->bus
->number
,
305 struct pcifront_sd
*sd
= dev
->bus
->sysdata
;
306 struct pcifront_device
*pdev
= pcifront_get_pdev(sd
);
308 err
= do_pci_op(pdev
, &op
);
310 /* What should do for error ? */
312 pci_err(dev
, "pci_disable_msix get err %x\n", err
);
315 static int pci_frontend_enable_msi(struct pci_dev
*dev
, int vector
[])
318 struct xen_pci_op op
= {
319 .cmd
= XEN_PCI_OP_enable_msi
,
320 .domain
= pci_domain_nr(dev
->bus
),
321 .bus
= dev
->bus
->number
,
324 struct pcifront_sd
*sd
= dev
->bus
->sysdata
;
325 struct pcifront_device
*pdev
= pcifront_get_pdev(sd
);
327 err
= do_pci_op(pdev
, &op
);
329 vector
[0] = op
.value
;
331 pci_warn(dev
, "MSI entry is invalid: %d!\n",
337 pci_err(dev
, "pci frontend enable msi failed for dev "
338 "%x:%x\n", op
.bus
, op
.devfn
);
344 static void pci_frontend_disable_msi(struct pci_dev
*dev
)
347 struct xen_pci_op op
= {
348 .cmd
= XEN_PCI_OP_disable_msi
,
349 .domain
= pci_domain_nr(dev
->bus
),
350 .bus
= dev
->bus
->number
,
353 struct pcifront_sd
*sd
= dev
->bus
->sysdata
;
354 struct pcifront_device
*pdev
= pcifront_get_pdev(sd
);
356 err
= do_pci_op(pdev
, &op
);
357 if (err
== XEN_PCI_ERR_dev_not_found
) {
358 /* XXX No response from backend, what shall we do? */
359 pr_info("get no response from backend for disable MSI\n");
363 /* how can pciback notify us fail? */
364 pr_info("get fake response from backend\n");
367 static struct xen_pci_frontend_ops pci_frontend_ops
= {
368 .enable_msi
= pci_frontend_enable_msi
,
369 .disable_msi
= pci_frontend_disable_msi
,
370 .enable_msix
= pci_frontend_enable_msix
,
371 .disable_msix
= pci_frontend_disable_msix
,
374 static void pci_frontend_registrar(int enable
)
377 xen_pci_frontend
= &pci_frontend_ops
;
379 xen_pci_frontend
= NULL
;
382 static inline void pci_frontend_registrar(int enable
) { };
383 #endif /* CONFIG_PCI_MSI */
385 /* Claim resources for the PCI frontend as-is, backend won't allow changes */
386 static int pcifront_claim_resource(struct pci_dev
*dev
, void *data
)
388 struct pcifront_device
*pdev
= data
;
392 pci_dev_for_each_resource(dev
, r
, i
) {
393 if (!r
->parent
&& r
->start
&& r
->flags
) {
394 dev_info(&pdev
->xdev
->dev
, "claiming resource %s/%d\n",
396 if (pci_claim_resource(dev
, i
)) {
397 dev_err(&pdev
->xdev
->dev
, "Could not claim resource %s/%d! "
398 "Device offline. Try using e820_host=1 in the guest config.\n",
407 static int pcifront_scan_bus(struct pcifront_device
*pdev
,
408 unsigned int domain
, unsigned int bus
,
415 * Scan the bus for functions and add.
416 * We omit handling of PCI bridge attachment because pciback prevents
417 * bridges from being exported.
419 for (devfn
= 0; devfn
< 0x100; devfn
++) {
420 d
= pci_get_slot(b
, devfn
);
422 /* Device is already known. */
427 d
= pci_scan_single_device(b
, devfn
);
429 dev_info(&pdev
->xdev
->dev
, "New device on "
430 "%04x:%02x:%02x.%d found.\n", domain
, bus
,
431 PCI_SLOT(devfn
), PCI_FUNC(devfn
));
437 static int pcifront_scan_root(struct pcifront_device
*pdev
,
438 unsigned int domain
, unsigned int bus
)
441 LIST_HEAD(resources
);
442 struct pcifront_sd
*sd
= NULL
;
443 struct pci_bus_entry
*bus_entry
= NULL
;
445 static struct resource busn_res
= {
448 .flags
= IORESOURCE_BUS
,
451 #ifndef CONFIG_PCI_DOMAINS
453 dev_err(&pdev
->xdev
->dev
,
454 "PCI Root in non-zero PCI Domain! domain=%d\n", domain
);
455 dev_err(&pdev
->xdev
->dev
,
456 "Please compile with CONFIG_PCI_DOMAINS\n");
462 dev_info(&pdev
->xdev
->dev
, "Creating PCI Frontend Bus %04x:%02x\n",
465 bus_entry
= kzalloc(sizeof(*bus_entry
), GFP_KERNEL
);
466 sd
= kzalloc(sizeof(*sd
), GFP_KERNEL
);
467 if (!bus_entry
|| !sd
) {
471 pci_add_resource(&resources
, &ioport_resource
);
472 pci_add_resource(&resources
, &iomem_resource
);
473 pci_add_resource(&resources
, &busn_res
);
474 pcifront_init_sd(sd
, domain
, bus
, pdev
);
476 pci_lock_rescan_remove();
478 b
= pci_scan_root_bus(&pdev
->xdev
->dev
, bus
,
479 &pcifront_bus_ops
, sd
, &resources
);
481 dev_err(&pdev
->xdev
->dev
,
482 "Error creating PCI Frontend Bus!\n");
484 pci_unlock_rescan_remove();
485 pci_free_resource_list(&resources
);
491 list_add(&bus_entry
->list
, &pdev
->root_buses
);
494 * pci_scan_root_bus skips devices which do not have a
495 * devfn==0. The pcifront_scan_bus enumerates all devfn.
497 err
= pcifront_scan_bus(pdev
, domain
, bus
, b
);
499 /* Claim resources before going "live" with our devices */
500 pci_walk_bus(b
, pcifront_claim_resource
, pdev
);
502 /* Create SysFS and notify udev of the devices. Aka: "going live" */
503 pci_bus_add_devices(b
);
505 pci_unlock_rescan_remove();
515 static int pcifront_rescan_root(struct pcifront_device
*pdev
,
516 unsigned int domain
, unsigned int bus
)
521 b
= pci_find_bus(domain
, bus
);
523 /* If the bus is unknown, create it. */
524 return pcifront_scan_root(pdev
, domain
, bus
);
526 dev_info(&pdev
->xdev
->dev
, "Rescanning PCI Frontend Bus %04x:%02x\n",
529 err
= pcifront_scan_bus(pdev
, domain
, bus
, b
);
531 /* Claim resources before going "live" with our devices */
532 pci_walk_bus(b
, pcifront_claim_resource
, pdev
);
534 /* Create SysFS and notify udev of the devices. Aka: "going live" */
535 pci_bus_add_devices(b
);
540 static void free_root_bus_devs(struct pci_bus
*bus
)
544 while (!list_empty(&bus
->devices
)) {
545 dev
= container_of(bus
->devices
.next
, struct pci_dev
,
547 pci_dbg(dev
, "removing device\n");
548 pci_stop_and_remove_bus_device(dev
);
552 static void pcifront_free_roots(struct pcifront_device
*pdev
)
554 struct pci_bus_entry
*bus_entry
, *t
;
556 dev_dbg(&pdev
->xdev
->dev
, "cleaning up root buses\n");
558 pci_lock_rescan_remove();
559 list_for_each_entry_safe(bus_entry
, t
, &pdev
->root_buses
, list
) {
560 list_del(&bus_entry
->list
);
562 free_root_bus_devs(bus_entry
->bus
);
564 kfree(bus_entry
->bus
->sysdata
);
566 device_unregister(bus_entry
->bus
->bridge
);
567 pci_remove_bus(bus_entry
->bus
);
571 pci_unlock_rescan_remove();
574 static pci_ers_result_t
pcifront_common_process(int cmd
,
575 struct pcifront_device
*pdev
,
576 pci_channel_state_t state
)
578 struct pci_driver
*pdrv
;
579 int bus
= pdev
->sh_info
->aer_op
.bus
;
580 int devfn
= pdev
->sh_info
->aer_op
.devfn
;
581 int domain
= pdev
->sh_info
->aer_op
.domain
;
582 struct pci_dev
*pcidev
;
584 dev_dbg(&pdev
->xdev
->dev
,
585 "pcifront AER process: cmd %x (bus:%x, devfn%x)",
588 pcidev
= pci_get_domain_bus_and_slot(domain
, bus
, devfn
);
589 if (!pcidev
|| !pcidev
->dev
.driver
) {
590 dev_err(&pdev
->xdev
->dev
, "device or AER driver is NULL\n");
592 return PCI_ERS_RESULT_NONE
;
594 pdrv
= to_pci_driver(pcidev
->dev
.driver
);
596 if (pdrv
->err_handler
&& pdrv
->err_handler
->error_detected
) {
597 pci_dbg(pcidev
, "trying to call AER service\n");
599 case XEN_PCI_OP_aer_detected
:
600 return pdrv
->err_handler
->error_detected(pcidev
, state
);
601 case XEN_PCI_OP_aer_mmio
:
602 return pdrv
->err_handler
->mmio_enabled(pcidev
);
603 case XEN_PCI_OP_aer_slotreset
:
604 return pdrv
->err_handler
->slot_reset(pcidev
);
605 case XEN_PCI_OP_aer_resume
:
606 pdrv
->err_handler
->resume(pcidev
);
607 return PCI_ERS_RESULT_NONE
;
609 dev_err(&pdev
->xdev
->dev
,
610 "bad request in aer recovery operation!\n");
614 return PCI_ERS_RESULT_NONE
;
618 static void pcifront_do_aer(struct work_struct
*data
)
620 struct pcifront_device
*pdev
=
621 container_of(data
, struct pcifront_device
, op_work
);
622 int cmd
= pdev
->sh_info
->aer_op
.cmd
;
623 pci_channel_state_t state
=
624 (pci_channel_state_t
)pdev
->sh_info
->aer_op
.err
;
627 * If a pci_conf op is in progress, we have to wait until it is done
628 * before service aer op
630 dev_dbg(&pdev
->xdev
->dev
,
631 "pcifront service aer bus %x devfn %x\n",
632 pdev
->sh_info
->aer_op
.bus
, pdev
->sh_info
->aer_op
.devfn
);
634 pdev
->sh_info
->aer_op
.err
= pcifront_common_process(cmd
, pdev
, state
);
636 /* Post the operation to the guest. */
638 clear_bit(_XEN_PCIB_active
, (unsigned long *)&pdev
->sh_info
->flags
);
639 notify_remote_via_evtchn(pdev
->evtchn
);
641 /*in case of we lost an aer request in four lines time_window*/
642 smp_mb__before_atomic();
643 clear_bit(_PDEVB_op_active
, &pdev
->flags
);
644 smp_mb__after_atomic();
646 schedule_pcifront_aer_op(pdev
);
650 static irqreturn_t
pcifront_handler_aer(int irq
, void *dev
)
652 struct pcifront_device
*pdev
= dev
;
654 schedule_pcifront_aer_op(pdev
);
657 static int pcifront_connect_and_init_dma(struct pcifront_device
*pdev
)
661 spin_lock(&pcifront_dev_lock
);
664 dev_info(&pdev
->xdev
->dev
, "Installing PCI frontend\n");
669 spin_unlock(&pcifront_dev_lock
);
674 static void pcifront_disconnect(struct pcifront_device
*pdev
)
676 spin_lock(&pcifront_dev_lock
);
678 if (pdev
== pcifront_dev
) {
679 dev_info(&pdev
->xdev
->dev
,
680 "Disconnecting PCI Frontend Buses\n");
684 spin_unlock(&pcifront_dev_lock
);
686 static struct pcifront_device
*alloc_pdev(struct xenbus_device
*xdev
)
688 struct pcifront_device
*pdev
;
690 pdev
= kzalloc(sizeof(struct pcifront_device
), GFP_KERNEL
);
694 if (xenbus_setup_ring(xdev
, GFP_KERNEL
, (void **)&pdev
->sh_info
, 1,
700 pdev
->sh_info
->flags
= 0;
702 /*Flag for registering PV AER handler*/
703 set_bit(_XEN_PCIB_AERHANDLER
, (void *)&pdev
->sh_info
->flags
);
705 dev_set_drvdata(&xdev
->dev
, pdev
);
708 INIT_LIST_HEAD(&pdev
->root_buses
);
710 spin_lock_init(&pdev
->sh_info_lock
);
712 pdev
->evtchn
= INVALID_EVTCHN
;
715 INIT_WORK(&pdev
->op_work
, pcifront_do_aer
);
717 dev_dbg(&xdev
->dev
, "Allocated pdev @ 0x%p pdev->sh_info @ 0x%p\n",
718 pdev
, pdev
->sh_info
);
723 static void free_pdev(struct pcifront_device
*pdev
)
725 dev_dbg(&pdev
->xdev
->dev
, "freeing pdev @ 0x%p\n", pdev
);
727 pcifront_free_roots(pdev
);
729 cancel_work_sync(&pdev
->op_work
);
732 unbind_from_irqhandler(pdev
->irq
, pdev
);
734 if (pdev
->evtchn
!= INVALID_EVTCHN
)
735 xenbus_free_evtchn(pdev
->xdev
, pdev
->evtchn
);
737 xenbus_teardown_ring((void **)&pdev
->sh_info
, 1, &pdev
->gnt_ref
);
739 dev_set_drvdata(&pdev
->xdev
->dev
, NULL
);
744 static int pcifront_publish_info(struct pcifront_device
*pdev
)
747 struct xenbus_transaction trans
;
749 err
= xenbus_alloc_evtchn(pdev
->xdev
, &pdev
->evtchn
);
753 err
= bind_evtchn_to_irqhandler(pdev
->evtchn
, pcifront_handler_aer
,
754 0, "pcifront", pdev
);
762 err
= xenbus_transaction_start(&trans
);
764 xenbus_dev_fatal(pdev
->xdev
, err
,
765 "Error writing configuration for backend "
766 "(start transaction)");
770 err
= xenbus_printf(trans
, pdev
->xdev
->nodename
,
771 "pci-op-ref", "%u", pdev
->gnt_ref
);
773 err
= xenbus_printf(trans
, pdev
->xdev
->nodename
,
774 "event-channel", "%u", pdev
->evtchn
);
776 err
= xenbus_printf(trans
, pdev
->xdev
->nodename
,
777 "magic", XEN_PCI_MAGIC
);
780 xenbus_transaction_end(trans
, 1);
781 xenbus_dev_fatal(pdev
->xdev
, err
,
782 "Error writing configuration for backend");
785 err
= xenbus_transaction_end(trans
, 0);
789 xenbus_dev_fatal(pdev
->xdev
, err
,
790 "Error completing transaction "
796 xenbus_switch_state(pdev
->xdev
, XenbusStateInitialised
);
798 dev_dbg(&pdev
->xdev
->dev
, "publishing successful!\n");
804 static void pcifront_connect(struct pcifront_device
*pdev
)
807 int i
, num_roots
, len
;
809 unsigned int domain
, bus
;
811 err
= xenbus_scanf(XBT_NIL
, pdev
->xdev
->otherend
,
812 "root_num", "%d", &num_roots
);
813 if (err
== -ENOENT
) {
814 xenbus_dev_error(pdev
->xdev
, err
,
815 "No PCI Roots found, trying 0000:00");
816 err
= pcifront_rescan_root(pdev
, 0, 0);
818 xenbus_dev_fatal(pdev
->xdev
, err
,
819 "Error scanning PCI root 0000:00");
823 } else if (err
!= 1) {
824 xenbus_dev_fatal(pdev
->xdev
, err
>= 0 ? -EINVAL
: err
,
825 "Error reading number of PCI roots");
829 for (i
= 0; i
< num_roots
; i
++) {
830 len
= snprintf(str
, sizeof(str
), "root-%d", i
);
831 if (unlikely(len
>= (sizeof(str
) - 1)))
834 err
= xenbus_scanf(XBT_NIL
, pdev
->xdev
->otherend
, str
,
835 "%x:%x", &domain
, &bus
);
837 xenbus_dev_fatal(pdev
->xdev
, err
>= 0 ? -EINVAL
: err
,
838 "Error reading PCI root %d", i
);
842 err
= pcifront_rescan_root(pdev
, domain
, bus
);
844 xenbus_dev_fatal(pdev
->xdev
, err
,
845 "Error scanning PCI root %04x:%02x",
851 xenbus_switch_state(pdev
->xdev
, XenbusStateConnected
);
854 static void pcifront_try_connect(struct pcifront_device
*pdev
)
858 /* Only connect once */
859 if (xenbus_read_driver_state(pdev
->xdev
->nodename
) !=
860 XenbusStateInitialised
)
863 err
= pcifront_connect_and_init_dma(pdev
);
864 if (err
&& err
!= -EEXIST
) {
865 xenbus_dev_fatal(pdev
->xdev
, err
,
866 "Error setting up PCI Frontend");
870 pcifront_connect(pdev
);
873 static int pcifront_try_disconnect(struct pcifront_device
*pdev
)
876 enum xenbus_state prev_state
;
879 prev_state
= xenbus_read_driver_state(pdev
->xdev
->nodename
);
881 if (prev_state
>= XenbusStateClosing
)
884 if (prev_state
== XenbusStateConnected
) {
885 pcifront_free_roots(pdev
);
886 pcifront_disconnect(pdev
);
889 err
= xenbus_switch_state(pdev
->xdev
, XenbusStateClosed
);
896 static void pcifront_attach_devices(struct pcifront_device
*pdev
)
898 if (xenbus_read_driver_state(pdev
->xdev
->nodename
) ==
899 XenbusStateReconfiguring
)
900 pcifront_connect(pdev
);
903 static int pcifront_detach_devices(struct pcifront_device
*pdev
)
907 enum xenbus_state state
;
908 unsigned int domain
, bus
, slot
, func
;
909 struct pci_dev
*pci_dev
;
912 state
= xenbus_read_driver_state(pdev
->xdev
->nodename
);
913 if (state
== XenbusStateInitialised
) {
914 dev_dbg(&pdev
->xdev
->dev
, "Handle skipped connect.\n");
915 /* We missed Connected and need to initialize. */
916 err
= pcifront_connect_and_init_dma(pdev
);
917 if (err
&& err
!= -EEXIST
) {
918 xenbus_dev_fatal(pdev
->xdev
, err
,
919 "Error setting up PCI Frontend");
923 goto out_switch_state
;
924 } else if (state
!= XenbusStateConnected
) {
928 err
= xenbus_scanf(XBT_NIL
, pdev
->xdev
->otherend
, "num_devs", "%d",
933 xenbus_dev_fatal(pdev
->xdev
, err
,
934 "Error reading number of PCI devices");
938 /* Find devices being detached and remove them. */
939 for (i
= 0; i
< num_devs
; i
++) {
942 l
= snprintf(str
, sizeof(str
), "state-%d", i
);
943 if (unlikely(l
>= (sizeof(str
) - 1))) {
947 state
= xenbus_read_unsigned(pdev
->xdev
->otherend
, str
,
950 if (state
!= XenbusStateClosing
)
954 l
= snprintf(str
, sizeof(str
), "vdev-%d", i
);
955 if (unlikely(l
>= (sizeof(str
) - 1))) {
959 err
= xenbus_scanf(XBT_NIL
, pdev
->xdev
->otherend
, str
,
960 "%x:%x:%x.%x", &domain
, &bus
, &slot
, &func
);
964 xenbus_dev_fatal(pdev
->xdev
, err
,
965 "Error reading PCI device %d", i
);
969 pci_dev
= pci_get_domain_bus_and_slot(domain
, bus
,
970 PCI_DEVFN(slot
, func
));
972 dev_dbg(&pdev
->xdev
->dev
,
973 "Cannot get PCI device %04x:%02x:%02x.%d\n",
974 domain
, bus
, slot
, func
);
977 pci_lock_rescan_remove();
978 pci_stop_and_remove_bus_device(pci_dev
);
979 pci_dev_put(pci_dev
);
980 pci_unlock_rescan_remove();
982 dev_dbg(&pdev
->xdev
->dev
,
983 "PCI device %04x:%02x:%02x.%d removed.\n",
984 domain
, bus
, slot
, func
);
988 err
= xenbus_switch_state(pdev
->xdev
, XenbusStateReconfiguring
);
994 static void pcifront_backend_changed(struct xenbus_device
*xdev
,
995 enum xenbus_state be_state
)
997 struct pcifront_device
*pdev
= dev_get_drvdata(&xdev
->dev
);
1000 case XenbusStateUnknown
:
1001 case XenbusStateInitialising
:
1002 case XenbusStateInitWait
:
1003 case XenbusStateInitialised
:
1006 case XenbusStateConnected
:
1007 pcifront_try_connect(pdev
);
1010 case XenbusStateClosed
:
1011 if (xdev
->state
== XenbusStateClosed
)
1013 fallthrough
; /* Missed the backend's CLOSING state */
1014 case XenbusStateClosing
:
1015 dev_warn(&xdev
->dev
, "backend going away!\n");
1016 pcifront_try_disconnect(pdev
);
1019 case XenbusStateReconfiguring
:
1020 pcifront_detach_devices(pdev
);
1023 case XenbusStateReconfigured
:
1024 pcifront_attach_devices(pdev
);
1029 static int pcifront_xenbus_probe(struct xenbus_device
*xdev
,
1030 const struct xenbus_device_id
*id
)
1033 struct pcifront_device
*pdev
= alloc_pdev(xdev
);
1037 xenbus_dev_fatal(xdev
, err
,
1038 "Error allocating pcifront_device struct");
1042 err
= pcifront_publish_info(pdev
);
1050 static void pcifront_xenbus_remove(struct xenbus_device
*xdev
)
1052 struct pcifront_device
*pdev
= dev_get_drvdata(&xdev
->dev
);
1058 static const struct xenbus_device_id xenpci_ids
[] = {
1063 static struct xenbus_driver xenpci_driver
= {
1066 .probe
= pcifront_xenbus_probe
,
1067 .remove
= pcifront_xenbus_remove
,
1068 .otherend_changed
= pcifront_backend_changed
,
1071 static int __init
pcifront_init(void)
1073 if (!xen_pv_domain() || xen_initial_domain())
1076 if (!xen_has_pv_devices())
1079 pci_frontend_registrar(1 /* enable */);
1081 return xenbus_register_frontend(&xenpci_driver
);
1084 static void __exit
pcifront_cleanup(void)
1086 xenbus_unregister_driver(&xenpci_driver
);
1087 pci_frontend_registrar(0 /* disable */);
1089 module_init(pcifront_init
);
1090 module_exit(pcifront_cleanup
);
1092 MODULE_DESCRIPTION("Xen PCI passthrough frontend.");
1093 MODULE_LICENSE("GPL");
1094 MODULE_ALIAS("xen:pci");