4 * Copyright 2014 IBM Corp.
5 * Author(s): Frank Blaschka <frank.blaschka@de.ibm.com>
6 * Hong Bo Li <lihbbj@cn.ibm.com>
7 * Yi Min Zhao <zyimin@cn.ibm.com>
9 * This work is licensed under the terms of the GNU GPL, version 2 or (at
10 * your option) any later version. See the COPYING file in the top-level
14 #include "qemu/osdep.h"
15 #include "qapi/error.h"
16 #include "qapi/visitor.h"
18 #include "hw/s390x/s390-pci-bus.h"
19 #include "hw/s390x/s390-pci-inst.h"
20 #include "hw/s390x/s390-pci-vfio.h"
21 #include "hw/pci/pci_bus.h"
22 #include "hw/qdev-properties.h"
23 #include "hw/pci/pci_bridge.h"
24 #include "hw/pci/msi.h"
25 #include "qemu/error-report.h"
26 #include "qemu/module.h"
28 #ifndef DEBUG_S390PCI_BUS
29 #define DEBUG_S390PCI_BUS 0
32 #define DPRINTF(fmt, ...) \
34 if (DEBUG_S390PCI_BUS) { \
35 fprintf(stderr, "S390pci-bus: " fmt, ## __VA_ARGS__); \
39 S390pciState
*s390_get_phb(void)
41 static S390pciState
*phb
;
44 phb
= S390_PCI_HOST_BRIDGE(
45 object_resolve_path(TYPE_S390_PCI_HOST_BRIDGE
, NULL
));
52 int pci_chsc_sei_nt2_get_event(void *res
)
54 ChscSeiNt2Res
*nt2_res
= (ChscSeiNt2Res
*)res
;
58 SeiContainer
*sei_cont
;
59 S390pciState
*s
= s390_get_phb();
61 sei_cont
= QTAILQ_FIRST(&s
->pending_sei
);
63 QTAILQ_REMOVE(&s
->pending_sei
, sei_cont
, link
);
65 nt2_res
->cc
= sei_cont
->cc
;
66 nt2_res
->length
= cpu_to_be16(sizeof(ChscSeiNt2Res
));
67 switch (sei_cont
->cc
) {
68 case 1: /* error event */
69 eccdf
= (PciCcdfErr
*)nt2_res
->ccdf
;
70 eccdf
->fid
= cpu_to_be32(sei_cont
->fid
);
71 eccdf
->fh
= cpu_to_be32(sei_cont
->fh
);
72 eccdf
->e
= cpu_to_be32(sei_cont
->e
);
73 eccdf
->faddr
= cpu_to_be64(sei_cont
->faddr
);
74 eccdf
->pec
= cpu_to_be16(sei_cont
->pec
);
76 case 2: /* availability event */
77 accdf
= (PciCcdfAvail
*)nt2_res
->ccdf
;
78 accdf
->fid
= cpu_to_be32(sei_cont
->fid
);
79 accdf
->fh
= cpu_to_be32(sei_cont
->fh
);
80 accdf
->pec
= cpu_to_be16(sei_cont
->pec
);
92 int pci_chsc_sei_nt2_have_event(void)
94 S390pciState
*s
= s390_get_phb();
96 return !QTAILQ_EMPTY(&s
->pending_sei
);
99 S390PCIBusDevice
*s390_pci_find_next_avail_dev(S390pciState
*s
,
100 S390PCIBusDevice
*pbdev
)
102 S390PCIBusDevice
*ret
= pbdev
? QTAILQ_NEXT(pbdev
, link
) :
103 QTAILQ_FIRST(&s
->zpci_devs
);
105 while (ret
&& ret
->state
== ZPCI_FS_RESERVED
) {
106 ret
= QTAILQ_NEXT(ret
, link
);
112 S390PCIBusDevice
*s390_pci_find_dev_by_fid(S390pciState
*s
, uint32_t fid
)
114 S390PCIBusDevice
*pbdev
;
116 QTAILQ_FOREACH(pbdev
, &s
->zpci_devs
, link
) {
117 if (pbdev
->fid
== fid
) {
125 void s390_pci_sclp_configure(SCCB
*sccb
)
127 IoaCfgSccb
*psccb
= (IoaCfgSccb
*)sccb
;
128 S390PCIBusDevice
*pbdev
= s390_pci_find_dev_by_fid(s390_get_phb(),
129 be32_to_cpu(psccb
->aid
));
133 DPRINTF("sclp config no dev found\n");
134 rc
= SCLP_RC_ADAPTER_ID_NOT_RECOGNIZED
;
138 switch (pbdev
->state
) {
139 case ZPCI_FS_RESERVED
:
140 rc
= SCLP_RC_ADAPTER_IN_RESERVED_STATE
;
142 case ZPCI_FS_STANDBY
:
143 pbdev
->state
= ZPCI_FS_DISABLED
;
144 rc
= SCLP_RC_NORMAL_COMPLETION
;
147 rc
= SCLP_RC_NO_ACTION_REQUIRED
;
150 psccb
->header
.response_code
= cpu_to_be16(rc
);
153 static void s390_pci_perform_unplug(S390PCIBusDevice
*pbdev
)
155 HotplugHandler
*hotplug_ctrl
;
157 /* Unplug the PCI device */
159 DeviceState
*pdev
= DEVICE(pbdev
->pdev
);
161 hotplug_ctrl
= qdev_get_hotplug_handler(pdev
);
162 hotplug_handler_unplug(hotplug_ctrl
, pdev
, &error_abort
);
163 object_unparent(OBJECT(pdev
));
166 /* Unplug the zPCI device */
167 hotplug_ctrl
= qdev_get_hotplug_handler(DEVICE(pbdev
));
168 hotplug_handler_unplug(hotplug_ctrl
, DEVICE(pbdev
), &error_abort
);
169 object_unparent(OBJECT(pbdev
));
172 void s390_pci_sclp_deconfigure(SCCB
*sccb
)
174 IoaCfgSccb
*psccb
= (IoaCfgSccb
*)sccb
;
175 S390PCIBusDevice
*pbdev
= s390_pci_find_dev_by_fid(s390_get_phb(),
176 be32_to_cpu(psccb
->aid
));
180 DPRINTF("sclp deconfig no dev found\n");
181 rc
= SCLP_RC_ADAPTER_ID_NOT_RECOGNIZED
;
185 switch (pbdev
->state
) {
186 case ZPCI_FS_RESERVED
:
187 rc
= SCLP_RC_ADAPTER_IN_RESERVED_STATE
;
189 case ZPCI_FS_STANDBY
:
190 rc
= SCLP_RC_NO_ACTION_REQUIRED
;
193 if (pbdev
->summary_ind
) {
194 pci_dereg_irqs(pbdev
);
196 if (pbdev
->iommu
->enabled
) {
197 pci_dereg_ioat(pbdev
->iommu
);
199 pbdev
->state
= ZPCI_FS_STANDBY
;
200 rc
= SCLP_RC_NORMAL_COMPLETION
;
202 if (pbdev
->unplug_requested
) {
203 s390_pci_perform_unplug(pbdev
);
207 psccb
->header
.response_code
= cpu_to_be16(rc
);
210 static S390PCIBusDevice
*s390_pci_find_dev_by_uid(S390pciState
*s
, uint16_t uid
)
212 S390PCIBusDevice
*pbdev
;
214 QTAILQ_FOREACH(pbdev
, &s
->zpci_devs
, link
) {
215 if (pbdev
->uid
== uid
) {
223 S390PCIBusDevice
*s390_pci_find_dev_by_target(S390pciState
*s
,
226 S390PCIBusDevice
*pbdev
;
232 QTAILQ_FOREACH(pbdev
, &s
->zpci_devs
, link
) {
233 if (!strcmp(pbdev
->target
, target
)) {
241 static S390PCIBusDevice
*s390_pci_find_dev_by_pci(S390pciState
*s
,
244 S390PCIBusDevice
*pbdev
;
250 QTAILQ_FOREACH(pbdev
, &s
->zpci_devs
, link
) {
251 if (pbdev
->pdev
== pci_dev
) {
259 S390PCIBusDevice
*s390_pci_find_dev_by_idx(S390pciState
*s
, uint32_t idx
)
261 return g_hash_table_lookup(s
->zpci_table
, &idx
);
264 S390PCIBusDevice
*s390_pci_find_dev_by_fh(S390pciState
*s
, uint32_t fh
)
266 uint32_t idx
= FH_MASK_INDEX
& fh
;
267 S390PCIBusDevice
*pbdev
= s390_pci_find_dev_by_idx(s
, idx
);
269 if (pbdev
&& pbdev
->fh
== fh
) {
276 static void s390_pci_generate_event(uint8_t cc
, uint16_t pec
, uint32_t fh
,
277 uint32_t fid
, uint64_t faddr
, uint32_t e
)
279 SeiContainer
*sei_cont
;
280 S390pciState
*s
= s390_get_phb();
282 sei_cont
= g_new0(SeiContainer
, 1);
287 sei_cont
->faddr
= faddr
;
290 QTAILQ_INSERT_TAIL(&s
->pending_sei
, sei_cont
, link
);
291 css_generate_css_crws(0);
294 static void s390_pci_generate_plug_event(uint16_t pec
, uint32_t fh
,
297 s390_pci_generate_event(2, pec
, fh
, fid
, 0, 0);
/*
 * Queue an error event for the guest.
 *
 * @pec:   event code forwarded to the generic event generator
 * @fh:    function handle of the affected device
 * @fid:   function id of the affected device
 * @faddr: failing address reported with the event
 * @e:     additional error word forwarded unchanged
 *
 * Thin wrapper around s390_pci_generate_event() that fixes the event
 * class to 1, the value handled as "error event" when events are read
 * back in pci_chsc_sei_nt2_get_event().
 */
void s390_pci_generate_error_event(uint16_t pec, uint32_t fh, uint32_t fid,
                                   uint64_t faddr, uint32_t e)
{
    const uint8_t cc_error = 1;

    s390_pci_generate_event(cc_error, pec, fh, fid, faddr, e);
}
306 static void s390_pci_set_irq(void *opaque
, int irq
, int level
)
311 static int s390_pci_map_irq(PCIDevice
*pci_dev
, int irq_num
)
317 static uint64_t s390_pci_get_table_origin(uint64_t iota
)
319 return iota
& ~ZPCI_IOTA_RTTO_FLAG
;
322 static unsigned int calc_rtx(dma_addr_t ptr
)
324 return ((unsigned long) ptr
>> ZPCI_RT_SHIFT
) & ZPCI_INDEX_MASK
;
327 static unsigned int calc_sx(dma_addr_t ptr
)
329 return ((unsigned long) ptr
>> ZPCI_ST_SHIFT
) & ZPCI_INDEX_MASK
;
332 static unsigned int calc_px(dma_addr_t ptr
)
334 return ((unsigned long) ptr
>> PAGE_SHIFT
) & ZPCI_PT_MASK
;
337 static uint64_t get_rt_sto(uint64_t entry
)
339 return ((entry
& ZPCI_TABLE_TYPE_MASK
) == ZPCI_TABLE_TYPE_RTX
)
340 ? (entry
& ZPCI_RTE_ADDR_MASK
)
344 static uint64_t get_st_pto(uint64_t entry
)
346 return ((entry
& ZPCI_TABLE_TYPE_MASK
) == ZPCI_TABLE_TYPE_SX
)
347 ? (entry
& ZPCI_STE_ADDR_MASK
)
351 static bool rt_entry_isvalid(uint64_t entry
)
353 return (entry
& ZPCI_TABLE_VALID_MASK
) == ZPCI_TABLE_VALID
;
356 static bool pt_entry_isvalid(uint64_t entry
)
358 return (entry
& ZPCI_PTE_VALID_MASK
) == ZPCI_PTE_VALID
;
361 static bool entry_isprotected(uint64_t entry
)
363 return (entry
& ZPCI_TABLE_PROT_MASK
) == ZPCI_TABLE_PROTECTED
;
366 /* ett is expected table type, -1 page table, 0 segment table, 1 region table */
367 static uint64_t get_table_index(uint64_t iova
, int8_t ett
)
371 return calc_px(iova
);
373 return calc_sx(iova
);
375 return calc_rtx(iova
);
381 static bool entry_isvalid(uint64_t entry
, int8_t ett
)
385 return pt_entry_isvalid(entry
);
388 return rt_entry_isvalid(entry
);
394 /* Return true if address translation is done */
395 static bool translate_iscomplete(uint64_t entry
, int8_t ett
)
399 return (entry
& ZPCI_TABLE_FC
) ? true : false;
407 static uint64_t get_frame_size(int8_t ett
)
421 static uint64_t get_next_table_origin(uint64_t entry
, int8_t ett
)
425 return entry
& ZPCI_PTE_ADDR_MASK
;
427 return get_st_pto(entry
);
429 return get_rt_sto(entry
);
436 * table_translate: do translation within one table and return the following
439 * @entry: the entry being translated, the result is stored in this.
440 * @to: the address of table origin.
441 * @ett: expected table type, 1 region table, 0 segment table and -1 page table.
444 static uint64_t table_translate(S390IOTLBEntry
*entry
, uint64_t to
, int8_t ett
,
447 uint64_t tx
, te
, nto
= 0;
450 tx
= get_table_index(entry
->iova
, ett
);
451 te
= address_space_ldq(&address_space_memory
, to
+ tx
* sizeof(uint64_t),
452 MEMTXATTRS_UNSPECIFIED
, NULL
);
455 err
= ERR_EVENT_INVALTE
;
459 if (!entry_isvalid(te
, ett
)) {
460 entry
->perm
&= IOMMU_NONE
;
464 if (ett
== ZPCI_ETT_RT
&& ((te
& ZPCI_TABLE_LEN_RTX
) != ZPCI_TABLE_LEN_RTX
465 || te
& ZPCI_TABLE_OFFSET_MASK
)) {
466 err
= ERR_EVENT_INVALTL
;
470 nto
= get_next_table_origin(te
, ett
);
476 if (entry_isprotected(te
)) {
477 entry
->perm
&= IOMMU_RO
;
479 entry
->perm
&= IOMMU_RW
;
482 if (translate_iscomplete(te
, ett
)) {
485 entry
->translated_addr
= te
& ZPCI_PTE_ADDR_MASK
;
488 entry
->translated_addr
= (te
& ZPCI_SFAA_MASK
) |
489 (entry
->iova
& ~ZPCI_SFAA_MASK
);
496 entry
->perm
= IOMMU_NONE
;
499 entry
->len
= get_frame_size(ett
);
503 uint16_t s390_guest_io_table_walk(uint64_t g_iota
, hwaddr addr
,
504 S390IOTLBEntry
*entry
)
506 uint64_t to
= s390_pci_get_table_origin(g_iota
);
510 entry
->iova
= addr
& PAGE_MASK
;
511 entry
->translated_addr
= 0;
512 entry
->perm
= IOMMU_RW
;
514 if (entry_isprotected(g_iota
)) {
515 entry
->perm
&= IOMMU_RO
;
519 to
= table_translate(entry
, to
, ett
--, &error
);
525 static IOMMUTLBEntry
s390_translate_iommu(IOMMUMemoryRegion
*mr
, hwaddr addr
,
526 IOMMUAccessFlags flag
, int iommu_idx
)
528 S390PCIIOMMU
*iommu
= container_of(mr
, S390PCIIOMMU
, iommu_mr
);
529 S390IOTLBEntry
*entry
;
530 uint64_t iova
= addr
& PAGE_MASK
;
532 IOMMUTLBEntry ret
= {
533 .target_as
= &address_space_memory
,
535 .translated_addr
= 0,
536 .addr_mask
= ~(hwaddr
)0,
540 switch (iommu
->pbdev
->state
) {
541 case ZPCI_FS_ENABLED
:
542 case ZPCI_FS_BLOCKED
:
543 if (!iommu
->enabled
) {
551 DPRINTF("iommu trans addr 0x%" PRIx64
"\n", addr
);
553 if (addr
< iommu
->pba
|| addr
> iommu
->pal
) {
554 error
= ERR_EVENT_OORANGE
;
558 entry
= g_hash_table_lookup(iommu
->iotlb
, &iova
);
560 ret
.iova
= entry
->iova
;
561 ret
.translated_addr
= entry
->translated_addr
;
562 ret
.addr_mask
= entry
->len
- 1;
563 ret
.perm
= entry
->perm
;
566 ret
.addr_mask
= ~PAGE_MASK
;
567 ret
.perm
= IOMMU_NONE
;
570 if (flag
!= IOMMU_NONE
&& !(flag
& ret
.perm
)) {
571 error
= ERR_EVENT_TPROTE
;
575 iommu
->pbdev
->state
= ZPCI_FS_ERROR
;
576 s390_pci_generate_error_event(error
, iommu
->pbdev
->fh
,
577 iommu
->pbdev
->fid
, addr
, 0);
582 static void s390_pci_iommu_replay(IOMMUMemoryRegion
*iommu
,
583 IOMMUNotifier
*notifier
)
585 /* It's impossible to plug a pci device on s390x that already has iommu
586 * mappings which need to be replayed, that is due to the "one iommu per
587 * zpci device" construct. But when we support migration of vfio-pci
588 * devices in future, we need to revisit this.
593 static S390PCIIOMMU
*s390_pci_get_iommu(S390pciState
*s
, PCIBus
*bus
,
596 uint64_t key
= (uintptr_t)bus
;
597 S390PCIIOMMUTable
*table
= g_hash_table_lookup(s
->iommu_table
, &key
);
601 table
= g_new0(S390PCIIOMMUTable
, 1);
603 g_hash_table_insert(s
->iommu_table
, &table
->key
, table
);
606 iommu
= table
->iommu
[PCI_SLOT(devfn
)];
608 iommu
= S390_PCI_IOMMU(object_new(TYPE_S390_PCI_IOMMU
));
610 char *mr_name
= g_strdup_printf("iommu-root-%02x:%02x.%01x",
614 char *as_name
= g_strdup_printf("iommu-pci-%02x:%02x.%01x",
618 memory_region_init(&iommu
->mr
, OBJECT(iommu
), mr_name
, UINT64_MAX
);
619 address_space_init(&iommu
->as
, &iommu
->mr
, as_name
);
620 iommu
->iotlb
= g_hash_table_new_full(g_int64_hash
, g_int64_equal
,
622 table
->iommu
[PCI_SLOT(devfn
)] = iommu
;
631 static AddressSpace
*s390_pci_dma_iommu(PCIBus
*bus
, void *opaque
, int devfn
)
633 S390pciState
*s
= opaque
;
634 S390PCIIOMMU
*iommu
= s390_pci_get_iommu(s
, bus
, devfn
);
639 static uint8_t set_ind_atomic(uint64_t ind_loc
, uint8_t to_be_set
)
641 uint8_t expected
, actual
;
643 /* avoid multiple fetches */
644 uint8_t volatile *ind_addr
;
646 ind_addr
= cpu_physical_memory_map(ind_loc
, &len
, true);
648 s390_pci_generate_error_event(ERR_EVENT_AIRERR
, 0, 0, 0, 0);
654 actual
= qatomic_cmpxchg(ind_addr
, expected
, expected
| to_be_set
);
655 } while (actual
!= expected
);
656 cpu_physical_memory_unmap((void *)ind_addr
, len
, 1, len
);
661 static void s390_msi_ctrl_write(void *opaque
, hwaddr addr
, uint64_t data
,
664 S390PCIBusDevice
*pbdev
= opaque
;
665 uint32_t vec
= data
& ZPCI_MSI_VEC_MASK
;
670 DPRINTF("write_msix data 0x%" PRIx64
" idx %d vec 0x%x\n", data
,
673 if (pbdev
->state
!= ZPCI_FS_ENABLED
) {
677 ind_bit
= pbdev
->routes
.adapter
.ind_offset
;
678 sum_bit
= pbdev
->routes
.adapter
.summary_offset
;
680 set_ind_atomic(pbdev
->routes
.adapter
.ind_addr
+ (ind_bit
+ vec
) / 8,
681 0x80 >> ((ind_bit
+ vec
) % 8));
682 if (!set_ind_atomic(pbdev
->routes
.adapter
.summary_addr
+ sum_bit
/ 8,
683 0x80 >> (sum_bit
% 8))) {
684 css_adapter_interrupt(CSS_IO_ADAPTER_PCI
, pbdev
->isc
);
688 static uint64_t s390_msi_ctrl_read(void *opaque
, hwaddr addr
, unsigned size
)
693 static const MemoryRegionOps s390_msi_ctrl_ops
= {
694 .write
= s390_msi_ctrl_write
,
695 .read
= s390_msi_ctrl_read
,
696 .endianness
= DEVICE_LITTLE_ENDIAN
,
699 void s390_pci_iommu_enable(S390PCIIOMMU
*iommu
)
702 * The iommu region is initialized against a 0-mapped address space,
703 * so the smallest IOMMU region we can define runs from 0 to the end
704 * of the PCI address space.
706 char *name
= g_strdup_printf("iommu-s390-%04x", iommu
->pbdev
->uid
);
707 memory_region_init_iommu(&iommu
->iommu_mr
, sizeof(iommu
->iommu_mr
),
708 TYPE_S390_IOMMU_MEMORY_REGION
, OBJECT(&iommu
->mr
),
709 name
, iommu
->pal
+ 1);
710 iommu
->enabled
= true;
711 memory_region_add_subregion(&iommu
->mr
, 0, MEMORY_REGION(&iommu
->iommu_mr
));
715 void s390_pci_iommu_disable(S390PCIIOMMU
*iommu
)
717 iommu
->enabled
= false;
718 g_hash_table_remove_all(iommu
->iotlb
);
719 memory_region_del_subregion(&iommu
->mr
, MEMORY_REGION(&iommu
->iommu_mr
));
720 object_unparent(OBJECT(&iommu
->iommu_mr
));
723 static void s390_pci_iommu_free(S390pciState
*s
, PCIBus
*bus
, int32_t devfn
)
725 uint64_t key
= (uintptr_t)bus
;
726 S390PCIIOMMUTable
*table
= g_hash_table_lookup(s
->iommu_table
, &key
);
727 S390PCIIOMMU
*iommu
= table
? table
->iommu
[PCI_SLOT(devfn
)] : NULL
;
729 if (!table
|| !iommu
) {
733 table
->iommu
[PCI_SLOT(devfn
)] = NULL
;
734 g_hash_table_destroy(iommu
->iotlb
);
736 * An attached PCI device may have memory listeners, eg. VFIO PCI.
737 * The associated subregion will already have been unmapped in
738 * s390_pci_iommu_disable in response to the guest deconfigure request.
739 * Remove the listeners now before destroying the address space.
741 address_space_remove_listeners(&iommu
->as
);
742 address_space_destroy(&iommu
->as
);
743 object_unparent(OBJECT(&iommu
->mr
));
744 object_unparent(OBJECT(iommu
));
745 object_unref(OBJECT(iommu
));
748 S390PCIGroup
*s390_group_create(int id
)
751 S390pciState
*s
= s390_get_phb();
753 group
= g_new0(S390PCIGroup
, 1);
755 QTAILQ_INSERT_TAIL(&s
->zpci_groups
, group
, link
);
759 S390PCIGroup
*s390_group_find(int id
)
762 S390pciState
*s
= s390_get_phb();
764 QTAILQ_FOREACH(group
, &s
->zpci_groups
, link
) {
765 if (group
->id
== id
) {
772 static void s390_pci_init_default_group(void)
775 ClpRspQueryPciGrp
*resgrp
;
777 group
= s390_group_create(ZPCI_DEFAULT_FN_GRP
);
778 resgrp
= &group
->zpci_group
;
781 resgrp
->msia
= ZPCI_MSI_ADDR
;
782 resgrp
->mui
= DEFAULT_MUI
;
784 resgrp
->maxstbl
= 128;
788 static void set_pbdev_info(S390PCIBusDevice
*pbdev
)
790 pbdev
->zpci_fn
.sdma
= ZPCI_SDMA_ADDR
;
791 pbdev
->zpci_fn
.edma
= ZPCI_EDMA_ADDR
;
792 pbdev
->zpci_fn
.pchid
= 0;
793 pbdev
->zpci_fn
.pfgid
= ZPCI_DEFAULT_FN_GRP
;
794 pbdev
->zpci_fn
.fid
= pbdev
->fid
;
795 pbdev
->zpci_fn
.uid
= pbdev
->uid
;
796 pbdev
->pci_group
= s390_group_find(ZPCI_DEFAULT_FN_GRP
);
799 static void s390_pcihost_realize(DeviceState
*dev
, Error
**errp
)
803 PCIHostState
*phb
= PCI_HOST_BRIDGE(dev
);
804 S390pciState
*s
= S390_PCI_HOST_BRIDGE(dev
);
806 DPRINTF("host_init\n");
808 b
= pci_register_root_bus(dev
, NULL
, s390_pci_set_irq
, s390_pci_map_irq
,
809 NULL
, get_system_memory(), get_system_io(), 0,
811 pci_setup_iommu(b
, s390_pci_dma_iommu
, s
);
814 qbus_set_hotplug_handler(bus
, OBJECT(dev
));
817 s
->bus
= S390_PCI_BUS(qbus_create(TYPE_S390_PCI_BUS
, dev
, NULL
));
818 qbus_set_hotplug_handler(BUS(s
->bus
), OBJECT(dev
));
820 s
->iommu_table
= g_hash_table_new_full(g_int64_hash
, g_int64_equal
,
822 s
->zpci_table
= g_hash_table_new_full(g_int_hash
, g_int_equal
, NULL
, NULL
);
824 QTAILQ_INIT(&s
->pending_sei
);
825 QTAILQ_INIT(&s
->zpci_devs
);
826 QTAILQ_INIT(&s
->zpci_dma_limit
);
827 QTAILQ_INIT(&s
->zpci_groups
);
829 s390_pci_init_default_group();
830 css_register_io_adapters(CSS_IO_ADAPTER_PCI
, true, false,
831 S390_ADAPTER_SUPPRESSIBLE
, errp
);
834 static void s390_pcihost_unrealize(DeviceState
*dev
)
837 S390pciState
*s
= S390_PCI_HOST_BRIDGE(dev
);
839 while (!QTAILQ_EMPTY(&s
->zpci_groups
)) {
840 group
= QTAILQ_FIRST(&s
->zpci_groups
);
841 QTAILQ_REMOVE(&s
->zpci_groups
, group
, link
);
845 static int s390_pci_msix_init(S390PCIBusDevice
*pbdev
)
852 pos
= pci_find_capability(pbdev
->pdev
, PCI_CAP_ID_MSIX
);
857 ctrl
= pci_host_config_read_common(pbdev
->pdev
, pos
+ PCI_MSIX_FLAGS
,
858 pci_config_size(pbdev
->pdev
), sizeof(ctrl
));
859 table
= pci_host_config_read_common(pbdev
->pdev
, pos
+ PCI_MSIX_TABLE
,
860 pci_config_size(pbdev
->pdev
), sizeof(table
));
861 pba
= pci_host_config_read_common(pbdev
->pdev
, pos
+ PCI_MSIX_PBA
,
862 pci_config_size(pbdev
->pdev
), sizeof(pba
));
864 pbdev
->msix
.table_bar
= table
& PCI_MSIX_FLAGS_BIRMASK
;
865 pbdev
->msix
.table_offset
= table
& ~PCI_MSIX_FLAGS_BIRMASK
;
866 pbdev
->msix
.pba_bar
= pba
& PCI_MSIX_FLAGS_BIRMASK
;
867 pbdev
->msix
.pba_offset
= pba
& ~PCI_MSIX_FLAGS_BIRMASK
;
868 pbdev
->msix
.entries
= (ctrl
& PCI_MSIX_FLAGS_QSIZE
) + 1;
870 name
= g_strdup_printf("msix-s390-%04x", pbdev
->uid
);
871 memory_region_init_io(&pbdev
->msix_notify_mr
, OBJECT(pbdev
),
872 &s390_msi_ctrl_ops
, pbdev
, name
, PAGE_SIZE
);
873 memory_region_add_subregion(&pbdev
->iommu
->mr
,
874 pbdev
->pci_group
->zpci_group
.msia
,
875 &pbdev
->msix_notify_mr
);
881 static void s390_pci_msix_free(S390PCIBusDevice
*pbdev
)
883 memory_region_del_subregion(&pbdev
->iommu
->mr
, &pbdev
->msix_notify_mr
);
884 object_unparent(OBJECT(&pbdev
->msix_notify_mr
));
887 static S390PCIBusDevice
*s390_pci_device_new(S390pciState
*s
,
888 const char *target
, Error
**errp
)
890 Error
*local_err
= NULL
;
893 dev
= qdev_try_new(TYPE_S390_PCI_DEVICE
);
895 error_setg(errp
, "zPCI device could not be created");
899 if (!object_property_set_str(OBJECT(dev
), "target", target
, &local_err
)) {
900 object_unparent(OBJECT(dev
));
901 error_propagate_prepend(errp
, local_err
,
902 "zPCI device could not be created: ");
905 if (!qdev_realize_and_unref(dev
, BUS(s
->bus
), &local_err
)) {
906 object_unparent(OBJECT(dev
));
907 error_propagate_prepend(errp
, local_err
,
908 "zPCI device could not be created: ");
912 return S390_PCI_DEVICE(dev
);
915 static bool s390_pci_alloc_idx(S390pciState
*s
, S390PCIBusDevice
*pbdev
)
920 while (s390_pci_find_dev_by_idx(s
, idx
)) {
921 idx
= (idx
+ 1) & FH_MASK_INDEX
;
922 if (idx
== s
->next_idx
) {
931 static void s390_pcihost_pre_plug(HotplugHandler
*hotplug_dev
, DeviceState
*dev
,
934 S390pciState
*s
= S390_PCI_HOST_BRIDGE(hotplug_dev
);
936 if (!s390_has_feat(S390_FEAT_ZPCI
)) {
937 warn_report("Plugging a PCI/zPCI device without the 'zpci' CPU "
938 "feature enabled; the guest will not be able to see/use "
942 if (object_dynamic_cast(OBJECT(dev
), TYPE_PCI_DEVICE
)) {
943 PCIDevice
*pdev
= PCI_DEVICE(dev
);
945 if (pdev
->cap_present
& QEMU_PCI_CAP_MULTIFUNCTION
) {
946 error_setg(errp
, "multifunction not supported in s390");
949 } else if (object_dynamic_cast(OBJECT(dev
), TYPE_S390_PCI_DEVICE
)) {
950 S390PCIBusDevice
*pbdev
= S390_PCI_DEVICE(dev
);
952 if (!s390_pci_alloc_idx(s
, pbdev
)) {
953 error_setg(errp
, "no slot for plugging zpci device");
959 static void s390_pci_update_subordinate(PCIDevice
*dev
, uint32_t nr
)
963 pci_default_write_config(dev
, PCI_SUBORDINATE_BUS
, nr
, 1);
964 while (!pci_bus_is_root(pci_get_bus(dev
))) {
965 dev
= pci_get_bus(dev
)->parent_dev
;
967 old_nr
= pci_default_read_config(dev
, PCI_SUBORDINATE_BUS
, 1);
969 pci_default_write_config(dev
, PCI_SUBORDINATE_BUS
, nr
, 1);
974 static void s390_pcihost_plug(HotplugHandler
*hotplug_dev
, DeviceState
*dev
,
977 S390pciState
*s
= S390_PCI_HOST_BRIDGE(hotplug_dev
);
978 PCIDevice
*pdev
= NULL
;
979 S390PCIBusDevice
*pbdev
= NULL
;
981 if (object_dynamic_cast(OBJECT(dev
), TYPE_PCI_BRIDGE
)) {
982 PCIBridge
*pb
= PCI_BRIDGE(dev
);
984 pdev
= PCI_DEVICE(dev
);
985 pci_bridge_map_irq(pb
, dev
->id
, s390_pci_map_irq
);
986 pci_setup_iommu(&pb
->sec_bus
, s390_pci_dma_iommu
, s
);
988 qbus_set_hotplug_handler(BUS(&pb
->sec_bus
), OBJECT(s
));
990 if (dev
->hotplugged
) {
991 pci_default_write_config(pdev
, PCI_PRIMARY_BUS
,
992 pci_dev_bus_num(pdev
), 1);
994 pci_default_write_config(pdev
, PCI_SECONDARY_BUS
, s
->bus_no
, 1);
996 s390_pci_update_subordinate(pdev
, s
->bus_no
);
998 } else if (object_dynamic_cast(OBJECT(dev
), TYPE_PCI_DEVICE
)) {
999 pdev
= PCI_DEVICE(dev
);
1002 /* In the case the PCI device does not define an id */
1003 /* we generate one based on the PCI address */
1004 dev
->id
= g_strdup_printf("auto_%02x:%02x.%01x",
1005 pci_dev_bus_num(pdev
),
1006 PCI_SLOT(pdev
->devfn
),
1007 PCI_FUNC(pdev
->devfn
));
1010 pbdev
= s390_pci_find_dev_by_target(s
, dev
->id
);
1012 pbdev
= s390_pci_device_new(s
, dev
->id
, errp
);
1019 pbdev
->iommu
= s390_pci_get_iommu(s
, pci_get_bus(pdev
), pdev
->devfn
);
1020 pbdev
->iommu
->pbdev
= pbdev
;
1021 pbdev
->state
= ZPCI_FS_DISABLED
;
1022 set_pbdev_info(pbdev
);
1024 if (object_dynamic_cast(OBJECT(dev
), "vfio-pci")) {
1025 pbdev
->fh
|= FH_SHM_VFIO
;
1026 pbdev
->iommu
->dma_limit
= s390_pci_start_dma_count(s
, pbdev
);
1027 /* Fill in CLP information passed via the vfio region */
1028 s390_pci_get_clp_info(pbdev
);
1030 pbdev
->fh
|= FH_SHM_EMUL
;
1033 if (s390_pci_msix_init(pbdev
)) {
1034 error_setg(errp
, "MSI-X support is mandatory "
1035 "in the S390 architecture");
1039 if (dev
->hotplugged
) {
1040 s390_pci_generate_plug_event(HP_EVENT_TO_CONFIGURED
,
1041 pbdev
->fh
, pbdev
->fid
);
1043 } else if (object_dynamic_cast(OBJECT(dev
), TYPE_S390_PCI_DEVICE
)) {
1044 pbdev
= S390_PCI_DEVICE(dev
);
1046 /* the allocated idx is actually getting used */
1047 s
->next_idx
= (pbdev
->idx
+ 1) & FH_MASK_INDEX
;
1048 pbdev
->fh
= pbdev
->idx
;
1049 QTAILQ_INSERT_TAIL(&s
->zpci_devs
, pbdev
, link
);
1050 g_hash_table_insert(s
->zpci_table
, &pbdev
->idx
, pbdev
);
1052 g_assert_not_reached();
1056 static void s390_pcihost_unplug(HotplugHandler
*hotplug_dev
, DeviceState
*dev
,
1059 S390pciState
*s
= S390_PCI_HOST_BRIDGE(hotplug_dev
);
1060 S390PCIBusDevice
*pbdev
= NULL
;
1062 if (object_dynamic_cast(OBJECT(dev
), TYPE_PCI_DEVICE
)) {
1063 PCIDevice
*pci_dev
= PCI_DEVICE(dev
);
1067 pbdev
= s390_pci_find_dev_by_pci(s
, PCI_DEVICE(dev
));
1070 s390_pci_generate_plug_event(HP_EVENT_STANDBY_TO_RESERVED
,
1071 pbdev
->fh
, pbdev
->fid
);
1072 bus
= pci_get_bus(pci_dev
);
1073 devfn
= pci_dev
->devfn
;
1074 qdev_unrealize(dev
);
1076 s390_pci_msix_free(pbdev
);
1077 s390_pci_iommu_free(s
, bus
, devfn
);
1079 pbdev
->state
= ZPCI_FS_RESERVED
;
1080 } else if (object_dynamic_cast(OBJECT(dev
), TYPE_S390_PCI_DEVICE
)) {
1081 pbdev
= S390_PCI_DEVICE(dev
);
1083 QTAILQ_REMOVE(&s
->zpci_devs
, pbdev
, link
);
1084 g_hash_table_remove(s
->zpci_table
, &pbdev
->idx
);
1085 if (pbdev
->iommu
->dma_limit
) {
1086 s390_pci_end_dma_count(s
, pbdev
->iommu
->dma_limit
);
1088 qdev_unrealize(dev
);
1092 static void s390_pcihost_unplug_request(HotplugHandler
*hotplug_dev
,
1096 S390pciState
*s
= S390_PCI_HOST_BRIDGE(hotplug_dev
);
1097 S390PCIBusDevice
*pbdev
;
1099 if (object_dynamic_cast(OBJECT(dev
), TYPE_PCI_BRIDGE
)) {
1100 error_setg(errp
, "PCI bridge hot unplug currently not supported");
1101 } else if (object_dynamic_cast(OBJECT(dev
), TYPE_PCI_DEVICE
)) {
1103 * Redirect the unplug request to the zPCI device and remember that
1104 * we've checked the PCI device already (to prevent endless recursion).
1106 pbdev
= s390_pci_find_dev_by_pci(s
, PCI_DEVICE(dev
));
1108 pbdev
->pci_unplug_request_processed
= true;
1109 qdev_unplug(DEVICE(pbdev
), errp
);
1110 } else if (object_dynamic_cast(OBJECT(dev
), TYPE_S390_PCI_DEVICE
)) {
1111 pbdev
= S390_PCI_DEVICE(dev
);
1114 * If unplug was initially requested for the zPCI device, we
1115 * first have to redirect to the PCI device, which will in return
1116 * redirect back to us after performing its checks (if the request
1117 * is not blocked, e.g. because it's a PCI bridge).
1119 if (pbdev
->pdev
&& !pbdev
->pci_unplug_request_processed
) {
1120 qdev_unplug(DEVICE(pbdev
->pdev
), errp
);
1123 pbdev
->pci_unplug_request_processed
= false;
1125 switch (pbdev
->state
) {
1126 case ZPCI_FS_STANDBY
:
1127 case ZPCI_FS_RESERVED
:
1128 s390_pci_perform_unplug(pbdev
);
1132 * Allow to send multiple requests, e.g. if the guest crashed
1133 * before releasing the device, we would not be able to send
1134 * another request to the same VM (e.g. fresh OS).
1136 pbdev
->unplug_requested
= true;
1137 s390_pci_generate_plug_event(HP_EVENT_DECONFIGURE_REQUEST
,
1138 pbdev
->fh
, pbdev
->fid
);
1141 g_assert_not_reached();
1145 static void s390_pci_enumerate_bridge(PCIBus
*bus
, PCIDevice
*pdev
,
1148 S390pciState
*s
= opaque
;
1149 PCIBus
*sec_bus
= NULL
;
1151 if ((pci_default_read_config(pdev
, PCI_HEADER_TYPE
, 1) !=
1152 PCI_HEADER_TYPE_BRIDGE
)) {
1157 pci_default_write_config(pdev
, PCI_PRIMARY_BUS
, pci_dev_bus_num(pdev
), 1);
1158 pci_default_write_config(pdev
, PCI_SECONDARY_BUS
, s
->bus_no
, 1);
1159 pci_default_write_config(pdev
, PCI_SUBORDINATE_BUS
, s
->bus_no
, 1);
1161 sec_bus
= pci_bridge_get_sec_bus(PCI_BRIDGE(pdev
));
1166 /* Assign numbers to all child bridges. The last is the highest number. */
1167 pci_for_each_device(sec_bus
, pci_bus_num(sec_bus
),
1168 s390_pci_enumerate_bridge
, s
);
1169 pci_default_write_config(pdev
, PCI_SUBORDINATE_BUS
, s
->bus_no
, 1);
1172 static void s390_pcihost_reset(DeviceState
*dev
)
1174 S390pciState
*s
= S390_PCI_HOST_BRIDGE(dev
);
1175 PCIBus
*bus
= s
->parent_obj
.bus
;
1176 S390PCIBusDevice
*pbdev
, *next
;
1178 /* Process all pending unplug requests */
1179 QTAILQ_FOREACH_SAFE(pbdev
, &s
->zpci_devs
, link
, next
) {
1180 if (pbdev
->unplug_requested
) {
1181 if (pbdev
->summary_ind
) {
1182 pci_dereg_irqs(pbdev
);
1184 if (pbdev
->iommu
->enabled
) {
1185 pci_dereg_ioat(pbdev
->iommu
);
1187 pbdev
->state
= ZPCI_FS_STANDBY
;
1188 s390_pci_perform_unplug(pbdev
);
1193 * When resetting a PCI bridge, the assigned numbers are set to 0. So
1194 * on every system reset, we also have to reassign numbers.
1197 pci_for_each_device(bus
, pci_bus_num(bus
), s390_pci_enumerate_bridge
, s
);
1200 static void s390_pcihost_class_init(ObjectClass
*klass
, void *data
)
1202 DeviceClass
*dc
= DEVICE_CLASS(klass
);
1203 HotplugHandlerClass
*hc
= HOTPLUG_HANDLER_CLASS(klass
);
1205 dc
->reset
= s390_pcihost_reset
;
1206 dc
->realize
= s390_pcihost_realize
;
1207 dc
->unrealize
= s390_pcihost_unrealize
;
1208 hc
->pre_plug
= s390_pcihost_pre_plug
;
1209 hc
->plug
= s390_pcihost_plug
;
1210 hc
->unplug_request
= s390_pcihost_unplug_request
;
1211 hc
->unplug
= s390_pcihost_unplug
;
1212 msi_nonbroken
= true;
1215 static const TypeInfo s390_pcihost_info
= {
1216 .name
= TYPE_S390_PCI_HOST_BRIDGE
,
1217 .parent
= TYPE_PCI_HOST_BRIDGE
,
1218 .instance_size
= sizeof(S390pciState
),
1219 .class_init
= s390_pcihost_class_init
,
1220 .interfaces
= (InterfaceInfo
[]) {
1221 { TYPE_HOTPLUG_HANDLER
},
1226 static const TypeInfo s390_pcibus_info
= {
1227 .name
= TYPE_S390_PCI_BUS
,
1229 .instance_size
= sizeof(S390PCIBus
),
1232 static uint16_t s390_pci_generate_uid(S390pciState
*s
)
1238 if (!s390_pci_find_dev_by_uid(s
, uid
)) {
1241 } while (uid
< ZPCI_MAX_UID
);
1243 return UID_UNDEFINED
;
1246 static uint32_t s390_pci_generate_fid(S390pciState
*s
, Error
**errp
)
1251 if (!s390_pci_find_dev_by_fid(s
, fid
)) {
1254 } while (fid
++ != ZPCI_MAX_FID
);
1256 error_setg(errp
, "no free fid could be found");
1260 static void s390_pci_device_realize(DeviceState
*dev
, Error
**errp
)
1262 S390PCIBusDevice
*zpci
= S390_PCI_DEVICE(dev
);
1263 S390pciState
*s
= s390_get_phb();
1265 if (!zpci
->target
) {
1266 error_setg(errp
, "target must be defined");
1270 if (s390_pci_find_dev_by_target(s
, zpci
->target
)) {
1271 error_setg(errp
, "target %s already has an associated zpci device",
1276 if (zpci
->uid
== UID_UNDEFINED
) {
1277 zpci
->uid
= s390_pci_generate_uid(s
);
1279 error_setg(errp
, "no free uid could be found");
1282 } else if (s390_pci_find_dev_by_uid(s
, zpci
->uid
)) {
1283 error_setg(errp
, "uid %u already in use", zpci
->uid
);
1287 if (!zpci
->fid_defined
) {
1288 Error
*local_error
= NULL
;
1290 zpci
->fid
= s390_pci_generate_fid(s
, &local_error
);
1292 error_propagate(errp
, local_error
);
1295 } else if (s390_pci_find_dev_by_fid(s
, zpci
->fid
)) {
1296 error_setg(errp
, "fid %u already in use", zpci
->fid
);
1300 zpci
->state
= ZPCI_FS_RESERVED
;
1301 zpci
->fmb
.format
= ZPCI_FMB_FORMAT
;
1304 static void s390_pci_device_reset(DeviceState
*dev
)
1306 S390PCIBusDevice
*pbdev
= S390_PCI_DEVICE(dev
);
1308 switch (pbdev
->state
) {
1309 case ZPCI_FS_RESERVED
:
1311 case ZPCI_FS_STANDBY
:
1314 pbdev
->fh
&= ~FH_MASK_ENABLE
;
1315 pbdev
->state
= ZPCI_FS_DISABLED
;
1319 if (pbdev
->summary_ind
) {
1320 pci_dereg_irqs(pbdev
);
1322 if (pbdev
->iommu
->enabled
) {
1323 pci_dereg_ioat(pbdev
->iommu
);
1326 fmb_timer_free(pbdev
);
1329 static void s390_pci_get_fid(Object
*obj
, Visitor
*v
, const char *name
,
1330 void *opaque
, Error
**errp
)
1332 Property
*prop
= opaque
;
1333 uint32_t *ptr
= qdev_get_prop_ptr(DEVICE(obj
), prop
);
1335 visit_type_uint32(v
, name
, ptr
, errp
);
1338 static void s390_pci_set_fid(Object
*obj
, Visitor
*v
, const char *name
,
1339 void *opaque
, Error
**errp
)
1341 DeviceState
*dev
= DEVICE(obj
);
1342 S390PCIBusDevice
*zpci
= S390_PCI_DEVICE(obj
);
1343 Property
*prop
= opaque
;
1344 uint32_t *ptr
= qdev_get_prop_ptr(dev
, prop
);
1346 if (dev
->realized
) {
1347 qdev_prop_set_after_realize(dev
, name
, errp
);
1351 if (!visit_type_uint32(v
, name
, ptr
, errp
)) {
1354 zpci
->fid_defined
= true;
1357 static const PropertyInfo s390_pci_fid_propinfo
= {
1359 .get
= s390_pci_get_fid
,
1360 .set
= s390_pci_set_fid
,
1363 #define DEFINE_PROP_S390_PCI_FID(_n, _s, _f) \
1364 DEFINE_PROP(_n, _s, _f, s390_pci_fid_propinfo, uint32_t)
1366 static Property s390_pci_device_properties
[] = {
1367 DEFINE_PROP_UINT16("uid", S390PCIBusDevice
, uid
, UID_UNDEFINED
),
1368 DEFINE_PROP_S390_PCI_FID("fid", S390PCIBusDevice
, fid
),
1369 DEFINE_PROP_STRING("target", S390PCIBusDevice
, target
),
1370 DEFINE_PROP_END_OF_LIST(),
1373 static const VMStateDescription s390_pci_device_vmstate
= {
1374 .name
= TYPE_S390_PCI_DEVICE
,
1376 * TODO: add state handling here, so migration works at least with
1377 * emulated pci devices on s390x
1382 static void s390_pci_device_class_init(ObjectClass
*klass
, void *data
)
1384 DeviceClass
*dc
= DEVICE_CLASS(klass
);
1386 dc
->desc
= "zpci device";
1387 set_bit(DEVICE_CATEGORY_MISC
, dc
->categories
);
1388 dc
->reset
= s390_pci_device_reset
;
1389 dc
->bus_type
= TYPE_S390_PCI_BUS
;
1390 dc
->realize
= s390_pci_device_realize
;
1391 device_class_set_props(dc
, s390_pci_device_properties
);
1392 dc
->vmsd
= &s390_pci_device_vmstate
;
1395 static const TypeInfo s390_pci_device_info
= {
1396 .name
= TYPE_S390_PCI_DEVICE
,
1397 .parent
= TYPE_DEVICE
,
1398 .instance_size
= sizeof(S390PCIBusDevice
),
1399 .class_init
= s390_pci_device_class_init
,
1402 static TypeInfo s390_pci_iommu_info
= {
1403 .name
= TYPE_S390_PCI_IOMMU
,
1404 .parent
= TYPE_OBJECT
,
1405 .instance_size
= sizeof(S390PCIIOMMU
),
1408 static void s390_iommu_memory_region_class_init(ObjectClass
*klass
, void *data
)
1410 IOMMUMemoryRegionClass
*imrc
= IOMMU_MEMORY_REGION_CLASS(klass
);
1412 imrc
->translate
= s390_translate_iommu
;
1413 imrc
->replay
= s390_pci_iommu_replay
;
1416 static const TypeInfo s390_iommu_memory_region_info
= {
1417 .parent
= TYPE_IOMMU_MEMORY_REGION
,
1418 .name
= TYPE_S390_IOMMU_MEMORY_REGION
,
1419 .class_init
= s390_iommu_memory_region_class_init
,
1422 static void s390_pci_register_types(void)
1424 type_register_static(&s390_pcihost_info
);
1425 type_register_static(&s390_pcibus_info
);
1426 type_register_static(&s390_pci_device_info
);
1427 type_register_static(&s390_pci_iommu_info
);
1428 type_register_static(&s390_iommu_memory_region_info
);
1431 type_init(s390_pci_register_types
)