/*
 * virtio-iommu device
 *
 * Copyright (c) 2020 Red Hat, Inc.
 *
 * This program is free software; you can redistribute it and/or modify it
 * under the terms and conditions of the GNU General Public License,
 * version 2 or later, as published by the Free Software Foundation.
 *
 * This program is distributed in the hope it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License for
 * more details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program.  If not, see <http://www.gnu.org/licenses/>.
 */

#include "qemu/osdep.h"
#include "qemu/log.h"
#include "qemu/iov.h"
#include "qemu-common.h"
#include "hw/qdev-properties.h"
#include "hw/virtio/virtio.h"
#include "sysemu/kvm.h"
#include "qapi/error.h"
#include "qemu/error-report.h"
#include "trace.h"

#include "standard-headers/linux/virtio_ids.h"

#include "hw/virtio/virtio-bus.h"
#include "hw/virtio/virtio-access.h"
#include "hw/virtio/virtio-iommu.h"
#include "hw/pci/pci_bus.h"
#include "hw/pci/pci.h"

#define VIOMMU_DEFAULT_QUEUE_SIZE 256
#define VIOMMU_PROBE_SIZE 512

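/*
 * Bookkeeping structures: domains and endpoints live in GTrees keyed by
 * ID; each domain owns a GTree of [low, high] virtual address intervals
 * mapped to (phys_addr, flags) pairs, plus its list of attached endpoints.
 */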
typedef struct VirtIOIOMMUDomain {
    uint32_t id;
    GTree *mappings;
    QLIST_HEAD(, VirtIOIOMMUEndpoint) endpoint_list;
} VirtIOIOMMUDomain;

typedef struct VirtIOIOMMUEndpoint {
    uint32_t id;
    VirtIOIOMMUDomain *domain;
    QLIST_ENTRY(VirtIOIOMMUEndpoint) next;
} VirtIOIOMMUEndpoint;

typedef struct VirtIOIOMMUInterval {
    uint64_t low;
    uint64_t high;
} VirtIOIOMMUInterval;

typedef struct VirtIOIOMMUMapping {
    uint64_t phys_addr;
    uint32_t flags;
} VirtIOIOMMUMapping;

static inline uint16_t virtio_iommu_get_bdf(IOMMUDevice *dev)
{
    return PCI_BUILD_BDF(pci_bus_num(dev->bus), dev->devfn);
}

/**
 * The bus number is used for lookup when SID based operations occur.
 * In that case we lazily populate the IOMMUPciBus array from the bus hash
 * table. At the time the IOMMUPciBus is created (iommu_find_add_as), the bus
 * number may not be initialized yet.
 */
static IOMMUPciBus *iommu_find_iommu_pcibus(VirtIOIOMMU *s, uint8_t bus_num)
{
    IOMMUPciBus *iommu_pci_bus = s->iommu_pcibus_by_bus_num[bus_num];

    if (!iommu_pci_bus) {
        GHashTableIter iter;

        g_hash_table_iter_init(&iter, s->as_by_busptr);
        while (g_hash_table_iter_next(&iter, NULL, (void **)&iommu_pci_bus)) {
            if (pci_bus_num(iommu_pci_bus->bus) == bus_num) {
                s->iommu_pcibus_by_bus_num[bus_num] = iommu_pci_bus;
                return iommu_pci_bus;
            }
        }
        return NULL;
    }
    return iommu_pci_bus;
}

static IOMMUMemoryRegion *virtio_iommu_mr(VirtIOIOMMU *s, uint32_t sid)
{
    uint8_t bus_n, devfn;
    IOMMUPciBus *iommu_pci_bus;
    IOMMUDevice *dev;

    bus_n = PCI_BUS_NUM(sid);
    iommu_pci_bus = iommu_find_iommu_pcibus(s, bus_n);
    if (iommu_pci_bus) {
        devfn = sid & (PCI_DEVFN_MAX - 1); /* devfn is the low 8 bits of the SID */
        dev = iommu_pci_bus->pbdev[devfn];
        if (dev) {
            return &dev->iommu_mr;
        }
    }
    return NULL;
}

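/*
 * GTree comparator for the mapping trees: intervals that overlap compare
 * equal, so looking up any address inside a mapped range finds the mapping.
 */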
static gint interval_cmp(gconstpointer a, gconstpointer b, gpointer user_data)
{
    VirtIOIOMMUInterval *inta = (VirtIOIOMMUInterval *)a;
    VirtIOIOMMUInterval *intb = (VirtIOIOMMUInterval *)b;

    if (inta->high < intb->low) {
        return -1;
    } else if (intb->high < inta->low) {
        return 1;
    } else {
        return 0;
    }
}

static void virtio_iommu_detach_endpoint_from_domain(VirtIOIOMMUEndpoint *ep)
{
    if (!ep->domain) {
        return;
    }
    QLIST_REMOVE(ep, next);
    ep->domain = NULL;
}

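/* Return the endpoint for this SID, creating it if the SID maps to a device */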
static VirtIOIOMMUEndpoint *virtio_iommu_get_endpoint(VirtIOIOMMU *s,
                                                      uint32_t ep_id)
{
    VirtIOIOMMUEndpoint *ep;

    ep = g_tree_lookup(s->endpoints, GUINT_TO_POINTER(ep_id));
    if (ep) {
        return ep;
    }
    if (!virtio_iommu_mr(s, ep_id)) {
        return NULL;
    }
    ep = g_malloc0(sizeof(*ep));
    ep->id = ep_id;
    trace_virtio_iommu_get_endpoint(ep_id);
    g_tree_insert(s->endpoints, GUINT_TO_POINTER(ep_id), ep);
    return ep;
}

static void virtio_iommu_put_endpoint(gpointer data)
{
    VirtIOIOMMUEndpoint *ep = (VirtIOIOMMUEndpoint *)data;

    if (ep->domain) {
        virtio_iommu_detach_endpoint_from_domain(ep);
    }

    trace_virtio_iommu_put_endpoint(ep->id);
    g_free(ep);
}

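/* Return the domain for this ID, allocating it and its mapping tree on demand */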
static VirtIOIOMMUDomain *virtio_iommu_get_domain(VirtIOIOMMU *s,
                                                  uint32_t domain_id)
{
    VirtIOIOMMUDomain *domain;

    domain = g_tree_lookup(s->domains, GUINT_TO_POINTER(domain_id));
    if (domain) {
        return domain;
    }
    domain = g_malloc0(sizeof(*domain));
    domain->id = domain_id;
    domain->mappings = g_tree_new_full((GCompareDataFunc)interval_cmp,
                                       NULL, (GDestroyNotify)g_free,
                                       (GDestroyNotify)g_free);
    g_tree_insert(s->domains, GUINT_TO_POINTER(domain_id), domain);
    QLIST_INIT(&domain->endpoint_list);
    trace_virtio_iommu_get_domain(domain_id);
    return domain;
}

static void virtio_iommu_put_domain(gpointer data)
{
    VirtIOIOMMUDomain *domain = (VirtIOIOMMUDomain *)data;
    VirtIOIOMMUEndpoint *iter, *tmp;

    QLIST_FOREACH_SAFE(iter, &domain->endpoint_list, next, tmp) {
        virtio_iommu_detach_endpoint_from_domain(iter);
    }
    g_tree_destroy(domain->mappings);
    trace_virtio_iommu_put_domain(domain->id);
    g_free(domain);
}

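/*
 * pci_setup_iommu() callback: return (and create on first use) the
 * IOMMU address space for a given PCI device.
 */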
static AddressSpace *virtio_iommu_find_add_as(PCIBus *bus, void *opaque,
                                              int devfn)
{
    VirtIOIOMMU *s = opaque;
    IOMMUPciBus *sbus = g_hash_table_lookup(s->as_by_busptr, bus);
    static uint32_t mr_index;
    IOMMUDevice *sdev;

    if (!sbus) {
        sbus = g_malloc0(sizeof(IOMMUPciBus) +
                         sizeof(IOMMUDevice *) * PCI_DEVFN_MAX);
        sbus->bus = bus;
        g_hash_table_insert(s->as_by_busptr, bus, sbus);
    }

    sdev = sbus->pbdev[devfn];
    if (!sdev) {
        char *name = g_strdup_printf("%s-%d-%d",
                                     TYPE_VIRTIO_IOMMU_MEMORY_REGION,
                                     mr_index++, devfn);
        sdev = sbus->pbdev[devfn] = g_malloc0(sizeof(IOMMUDevice));

        sdev->viommu = s;
        sdev->bus = bus;
        sdev->devfn = devfn;

        trace_virtio_iommu_init_iommu_mr(name);

        memory_region_init_iommu(&sdev->iommu_mr, sizeof(sdev->iommu_mr),
                                 TYPE_VIRTIO_IOMMU_MEMORY_REGION,
                                 OBJECT(s), name,
                                 UINT64_MAX);
        address_space_init(&sdev->as,
                           MEMORY_REGION(&sdev->iommu_mr), TYPE_VIRTIO_IOMMU);
        g_free(name);
    }
    return &sdev->as;
}

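/*
 * VIRTIO_IOMMU_T_ATTACH: attach an endpoint to a domain; if it is already
 * attached somewhere else, detach it from its previous domain first.
 */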
static int virtio_iommu_attach(VirtIOIOMMU *s,
                               struct virtio_iommu_req_attach *req)
{
    uint32_t domain_id = le32_to_cpu(req->domain);
    uint32_t ep_id = le32_to_cpu(req->endpoint);
    VirtIOIOMMUDomain *domain;
    VirtIOIOMMUEndpoint *ep;

    trace_virtio_iommu_attach(domain_id, ep_id);

    ep = virtio_iommu_get_endpoint(s, ep_id);
    if (!ep) {
        return VIRTIO_IOMMU_S_NOENT;
    }

    if (ep->domain) {
        VirtIOIOMMUDomain *previous_domain = ep->domain;
        /*
         * the device is already attached to a domain,
         * detach it first
         */
        virtio_iommu_detach_endpoint_from_domain(ep);
        if (QLIST_EMPTY(&previous_domain->endpoint_list)) {
            g_tree_remove(s->domains, GUINT_TO_POINTER(previous_domain->id));
        }
    }

    domain = virtio_iommu_get_domain(s, domain_id);
    QLIST_INSERT_HEAD(&domain->endpoint_list, ep, next);

    ep->domain = domain;

    return VIRTIO_IOMMU_S_OK;
}

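/* VIRTIO_IOMMU_T_DETACH: detach an endpoint from its domain */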
static int virtio_iommu_detach(VirtIOIOMMU *s,
                               struct virtio_iommu_req_detach *req)
{
    uint32_t domain_id = le32_to_cpu(req->domain);
    uint32_t ep_id = le32_to_cpu(req->endpoint);
    VirtIOIOMMUDomain *domain;
    VirtIOIOMMUEndpoint *ep;

    trace_virtio_iommu_detach(domain_id, ep_id);

    ep = g_tree_lookup(s->endpoints, GUINT_TO_POINTER(ep_id));
    if (!ep) {
        return VIRTIO_IOMMU_S_NOENT;
    }

    domain = ep->domain;

    if (!domain || domain->id != domain_id) {
        return VIRTIO_IOMMU_S_INVAL;
    }

    virtio_iommu_detach_endpoint_from_domain(ep);

    if (QLIST_EMPTY(&domain->endpoint_list)) {
        g_tree_remove(s->domains, GUINT_TO_POINTER(domain->id));
    }
    return VIRTIO_IOMMU_S_OK;
}

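/*
 * VIRTIO_IOMMU_T_MAP: insert a [virt_start, virt_end] -> phys_start mapping
 * into the domain's tree; a request overlapping an existing mapping fails.
 */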
static int virtio_iommu_map(VirtIOIOMMU *s,
                            struct virtio_iommu_req_map *req)
{
    uint32_t domain_id = le32_to_cpu(req->domain);
    uint64_t phys_start = le64_to_cpu(req->phys_start);
    uint64_t virt_start = le64_to_cpu(req->virt_start);
    uint64_t virt_end = le64_to_cpu(req->virt_end);
    uint32_t flags = le32_to_cpu(req->flags);
    VirtIOIOMMUDomain *domain;
    VirtIOIOMMUInterval *interval;
    VirtIOIOMMUMapping *mapping;

    if (flags & ~VIRTIO_IOMMU_MAP_F_MASK) {
        return VIRTIO_IOMMU_S_INVAL;
    }

    domain = g_tree_lookup(s->domains, GUINT_TO_POINTER(domain_id));
    if (!domain) {
        return VIRTIO_IOMMU_S_NOENT;
    }

    interval = g_malloc0(sizeof(*interval));

    interval->low = virt_start;
    interval->high = virt_end;

    mapping = g_tree_lookup(domain->mappings, (gpointer)interval);
    if (mapping) {
        g_free(interval);
        return VIRTIO_IOMMU_S_INVAL;
    }

    trace_virtio_iommu_map(domain_id, virt_start, virt_end, phys_start, flags);

    mapping = g_malloc0(sizeof(*mapping));
    mapping->phys_addr = phys_start;
    mapping->flags = flags;

    g_tree_insert(domain->mappings, interval, mapping);

    return VIRTIO_IOMMU_S_OK;
}

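/*
 * VIRTIO_IOMMU_T_UNMAP: remove every mapping fully contained in the range;
 * a mapping that only partially overlaps the range yields S_RANGE.
 */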
static int virtio_iommu_unmap(VirtIOIOMMU *s,
                              struct virtio_iommu_req_unmap *req)
{
    uint32_t domain_id = le32_to_cpu(req->domain);
    uint64_t virt_start = le64_to_cpu(req->virt_start);
    uint64_t virt_end = le64_to_cpu(req->virt_end);
    VirtIOIOMMUMapping *iter_val;
    VirtIOIOMMUInterval interval, *iter_key;
    VirtIOIOMMUDomain *domain;
    int ret = VIRTIO_IOMMU_S_OK;

    trace_virtio_iommu_unmap(domain_id, virt_start, virt_end);

    domain = g_tree_lookup(s->domains, GUINT_TO_POINTER(domain_id));
    if (!domain) {
        return VIRTIO_IOMMU_S_NOENT;
    }
    interval.low = virt_start;
    interval.high = virt_end;

    while (g_tree_lookup_extended(domain->mappings, &interval,
                                  (void **)&iter_key, (void**)&iter_val)) {
        uint64_t current_low = iter_key->low;
        uint64_t current_high = iter_key->high;

        if (interval.low <= current_low && interval.high >= current_high) {
            g_tree_remove(domain->mappings, iter_key);
            trace_virtio_iommu_unmap_done(domain_id, current_low, current_high);
        } else {
            ret = VIRTIO_IOMMU_S_RANGE;
            break;
        }
    }
    return ret;
}

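/*
 * Serialize the reserved memory regions as RESV_MEM probe properties
 * into buf; returns the number of bytes filled or -ENOSPC.
 */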
static ssize_t virtio_iommu_fill_resv_mem_prop(VirtIOIOMMU *s, uint32_t ep,
                                               uint8_t *buf, size_t free)
{
    struct virtio_iommu_probe_resv_mem prop = {};
    size_t size = sizeof(prop), length = size - sizeof(prop.head), total;
    int i;

    total = size * s->nb_reserved_regions;

    if (total > free) {
        return -ENOSPC;
    }

    for (i = 0; i < s->nb_reserved_regions; i++) {
        unsigned subtype = s->reserved_regions[i].type;

        assert(subtype == VIRTIO_IOMMU_RESV_MEM_T_RESERVED ||
               subtype == VIRTIO_IOMMU_RESV_MEM_T_MSI);
        prop.head.type = cpu_to_le16(VIRTIO_IOMMU_PROBE_T_RESV_MEM);
        prop.head.length = cpu_to_le16(length);
        prop.subtype = subtype;
        prop.start = cpu_to_le64(s->reserved_regions[i].low);
        prop.end = cpu_to_le64(s->reserved_regions[i].high);

        memcpy(buf, &prop, size);

        trace_virtio_iommu_fill_resv_property(ep, prop.subtype,
                                              prop.start, prop.end);
        buf += size;
    }
    return total;
}

/**
 * virtio_iommu_probe - Fill the probe request buffer with
 * the properties the device is able to return
 */
static int virtio_iommu_probe(VirtIOIOMMU *s,
                              struct virtio_iommu_req_probe *req,
                              uint8_t *buf)
{
    uint32_t ep_id = le32_to_cpu(req->endpoint);
    size_t free = VIOMMU_PROBE_SIZE;
    ssize_t count;

    if (!virtio_iommu_mr(s, ep_id)) {
        return VIRTIO_IOMMU_S_NOENT;
    }

    count = virtio_iommu_fill_resv_mem_prop(s, ep_id, buf, free);
    if (count < 0) {
        return VIRTIO_IOMMU_S_INVAL;
    }
    buf += count;
    free -= count;

    return VIRTIO_IOMMU_S_OK;
}

static int virtio_iommu_iov_to_req(struct iovec *iov,
                                   unsigned int iov_cnt,
                                   void *req, size_t req_sz)
{
    size_t sz, payload_sz = req_sz - sizeof(struct virtio_iommu_req_tail);

    sz = iov_to_buf(iov, iov_cnt, 0, req, payload_sz);
    if (unlikely(sz != payload_sz)) {
        return VIRTIO_IOMMU_S_INVAL;
    }
    return 0;
}

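/*
 * Generate one handler per request type: copy the fixed-size payload out
 * of the iovec, then dispatch to the corresponding virtio_iommu_<req>().
 */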
#define virtio_iommu_handle_req(__req)                                  \
static int virtio_iommu_handle_ ## __req(VirtIOIOMMU *s,                \
                                         struct iovec *iov,             \
                                         unsigned int iov_cnt)          \
{                                                                       \
    struct virtio_iommu_req_ ## __req req;                              \
    int ret = virtio_iommu_iov_to_req(iov, iov_cnt, &req, sizeof(req)); \
                                                                        \
    return ret ? ret : virtio_iommu_ ## __req(s, &req);                 \
}

virtio_iommu_handle_req(attach)
virtio_iommu_handle_req(detach)
virtio_iommu_handle_req(map)
virtio_iommu_handle_req(unmap)

static int virtio_iommu_handle_probe(VirtIOIOMMU *s,
                                     struct iovec *iov,
                                     unsigned int iov_cnt,
                                     uint8_t *buf)
{
    struct virtio_iommu_req_probe req;
    int ret = virtio_iommu_iov_to_req(iov, iov_cnt, &req, sizeof(req));

    return ret ? ret : virtio_iommu_probe(s, &req, buf);
}

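/*
 * Request virtqueue handler: pop each element, read the request head,
 * dispatch on its type under s->mutex and push back a tail status,
 * preceded by the probe output buffer for VIRTIO_IOMMU_T_PROBE.
 */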
static void virtio_iommu_handle_command(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIOIOMMU *s = VIRTIO_IOMMU(vdev);
    struct virtio_iommu_req_head head;
    struct virtio_iommu_req_tail tail = {};
    size_t output_size = sizeof(tail), sz;
    VirtQueueElement *elem;
    unsigned int iov_cnt;
    struct iovec *iov;
    void *buf = NULL;

    for (;;) {
        elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
        if (!elem) {
            return;
        }

        if (iov_size(elem->in_sg, elem->in_num) < sizeof(tail) ||
            iov_size(elem->out_sg, elem->out_num) < sizeof(head)) {
            virtio_error(vdev, "virtio-iommu bad head/tail size");
            virtqueue_detach_element(vq, elem, 0);
            g_free(elem);
            break;
        }

        iov_cnt = elem->out_num;
        iov = elem->out_sg;
        sz = iov_to_buf(iov, iov_cnt, 0, &head, sizeof(head));
        if (unlikely(sz != sizeof(head))) {
            tail.status = VIRTIO_IOMMU_S_DEVERR;
            goto out;
        }
        qemu_mutex_lock(&s->mutex);
        switch (head.type) {
        case VIRTIO_IOMMU_T_ATTACH:
            tail.status = virtio_iommu_handle_attach(s, iov, iov_cnt);
            break;
        case VIRTIO_IOMMU_T_DETACH:
            tail.status = virtio_iommu_handle_detach(s, iov, iov_cnt);
            break;
        case VIRTIO_IOMMU_T_MAP:
            tail.status = virtio_iommu_handle_map(s, iov, iov_cnt);
            break;
        case VIRTIO_IOMMU_T_UNMAP:
            tail.status = virtio_iommu_handle_unmap(s, iov, iov_cnt);
            break;
        case VIRTIO_IOMMU_T_PROBE:
        {
            struct virtio_iommu_req_tail *ptail;

            output_size = s->config.probe_size + sizeof(tail);
            buf = g_malloc0(output_size);

            ptail = (struct virtio_iommu_req_tail *)
                        (buf + s->config.probe_size);
            ptail->status = virtio_iommu_handle_probe(s, iov, iov_cnt, buf);
            break;
        }
        default:
            tail.status = VIRTIO_IOMMU_S_UNSUPP;
        }
        qemu_mutex_unlock(&s->mutex);

out:
        sz = iov_from_buf(elem->in_sg, elem->in_num, 0,
                          buf ? buf : &tail, output_size);
        assert(sz == output_size);

        virtqueue_push(vq, elem, sz);
        virtio_notify(vdev, vq);
        g_free(elem);
        g_free(buf);
        /* do not let the probe buffer or its size leak into the next request */
        buf = NULL;
        output_size = sizeof(tail);
    }
}

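/*
 * Report a fault to the guest by queuing a virtio_iommu_fault event
 * on the event virtqueue, if a buffer is available.
 */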
static void virtio_iommu_report_fault(VirtIOIOMMU *viommu, uint8_t reason,
                                      int flags, uint32_t endpoint,
                                      uint64_t address)
{
    VirtIODevice *vdev = &viommu->parent_obj;
    VirtQueue *vq = viommu->event_vq;
    struct virtio_iommu_fault fault;
    VirtQueueElement *elem;
    size_t sz;

    memset(&fault, 0, sizeof(fault));
    fault.reason = reason;
    fault.flags = cpu_to_le32(flags);
    fault.endpoint = cpu_to_le32(endpoint);
    fault.address = cpu_to_le64(address);

    elem = virtqueue_pop(vq, sizeof(VirtQueueElement));

    if (!elem) {
        error_report_once(
            "no buffer available in event queue to report event");
        return;
    }

    if (iov_size(elem->in_sg, elem->in_num) < sizeof(fault)) {
        virtio_error(vdev, "error buffer of wrong size");
        virtqueue_detach_element(vq, elem, 0);
        g_free(elem);
        return;
    }

    sz = iov_from_buf(elem->in_sg, elem->in_num, 0,
                      &fault, sizeof(fault));
    assert(sz == sizeof(fault));

    trace_virtio_iommu_report_fault(reason, flags, endpoint, address);
    virtqueue_push(vq, elem, sz);
    virtio_notify(vdev, vq);
    g_free(elem);
}

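/*
 * IOMMUMemoryRegion translate callback: resolve addr against the
 * endpoint's domain mappings, honoring bypass mode, reserved regions
 * and permission flags; faults are reported on the event queue.
 */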
static IOMMUTLBEntry virtio_iommu_translate(IOMMUMemoryRegion *mr, hwaddr addr,
                                            IOMMUAccessFlags flag,
                                            int iommu_idx)
{
    IOMMUDevice *sdev = container_of(mr, IOMMUDevice, iommu_mr);
    VirtIOIOMMUInterval interval, *mapping_key;
    VirtIOIOMMUMapping *mapping_value;
    VirtIOIOMMU *s = sdev->viommu;
    bool read_fault, write_fault;
    VirtIOIOMMUEndpoint *ep;
    uint32_t sid, flags;
    bool bypass_allowed;
    bool found;
    int i;

    interval.low = addr;
    interval.high = addr + 1;

    IOMMUTLBEntry entry = {
        .target_as = &address_space_memory,
        .iova = addr,
        .translated_addr = addr,
        .addr_mask = (1 << ctz32(s->config.page_size_mask)) - 1,
        .perm = IOMMU_NONE,
    };

    bypass_allowed = virtio_vdev_has_feature(&s->parent_obj,
                                             VIRTIO_IOMMU_F_BYPASS);

    sid = virtio_iommu_get_bdf(sdev);

    trace_virtio_iommu_translate(mr->parent_obj.name, sid, addr, flag);
    qemu_mutex_lock(&s->mutex);

    ep = g_tree_lookup(s->endpoints, GUINT_TO_POINTER(sid));
    if (!ep) {
        if (!bypass_allowed) {
            error_report_once("%s sid=%d is not known!!", __func__, sid);
            virtio_iommu_report_fault(s, VIRTIO_IOMMU_FAULT_R_UNKNOWN,
                                      VIRTIO_IOMMU_FAULT_F_ADDRESS,
                                      sid, addr);
        } else {
            entry.perm = flag;
        }
        goto unlock;
    }

    for (i = 0; i < s->nb_reserved_regions; i++) {
        ReservedRegion *reg = &s->reserved_regions[i];

        if (addr >= reg->low && addr <= reg->high) {
            switch (reg->type) {
            case VIRTIO_IOMMU_RESV_MEM_T_MSI:
                entry.perm = flag;
                break;
            case VIRTIO_IOMMU_RESV_MEM_T_RESERVED:
            default:
                virtio_iommu_report_fault(s, VIRTIO_IOMMU_FAULT_R_MAPPING,
                                          VIRTIO_IOMMU_FAULT_F_ADDRESS,
                                          sid, addr);
                break;
            }
            goto unlock;
        }
    }

    if (!ep->domain) {
        if (!bypass_allowed) {
            error_report_once("%s %02x:%02x.%01x not attached to any domain",
                              __func__, PCI_BUS_NUM(sid),
                              PCI_SLOT(sid), PCI_FUNC(sid));
            virtio_iommu_report_fault(s, VIRTIO_IOMMU_FAULT_R_DOMAIN,
                                      VIRTIO_IOMMU_FAULT_F_ADDRESS,
                                      sid, addr);
        } else {
            entry.perm = flag;
        }
        goto unlock;
    }

    found = g_tree_lookup_extended(ep->domain->mappings, (gpointer)(&interval),
                                   (void **)&mapping_key,
                                   (void **)&mapping_value);
    if (!found) {
        error_report_once("%s no mapping for 0x%"PRIx64" for sid=%d",
                          __func__, addr, sid);
        virtio_iommu_report_fault(s, VIRTIO_IOMMU_FAULT_R_MAPPING,
                                  VIRTIO_IOMMU_FAULT_F_ADDRESS,
                                  sid, addr);
        goto unlock;
    }

    read_fault = (flag & IOMMU_RO) &&
                    !(mapping_value->flags & VIRTIO_IOMMU_MAP_F_READ);
    write_fault = (flag & IOMMU_WO) &&
                    !(mapping_value->flags & VIRTIO_IOMMU_MAP_F_WRITE);

    flags = read_fault ? VIRTIO_IOMMU_FAULT_F_READ : 0;
    flags |= write_fault ? VIRTIO_IOMMU_FAULT_F_WRITE : 0;
    if (flags) {
        error_report_once("%s permission error on 0x%"PRIx64"(%d): allowed=%d",
                          __func__, addr, flag, mapping_value->flags);
        flags |= VIRTIO_IOMMU_FAULT_F_ADDRESS;
        virtio_iommu_report_fault(s, VIRTIO_IOMMU_FAULT_R_MAPPING,
                                  flags | VIRTIO_IOMMU_FAULT_F_ADDRESS,
                                  sid, addr);
        goto unlock;
    }
    entry.translated_addr = addr - mapping_key->low + mapping_value->phys_addr;
    entry.perm = flag;
    trace_virtio_iommu_translate_out(addr, entry.translated_addr, sid);

unlock:
    qemu_mutex_unlock(&s->mutex);
    return entry;
}

static void virtio_iommu_get_config(VirtIODevice *vdev, uint8_t *config_data)
{
    VirtIOIOMMU *dev = VIRTIO_IOMMU(vdev);
    struct virtio_iommu_config *config = &dev->config;

    trace_virtio_iommu_get_config(config->page_size_mask,
                                  config->input_range.start,
                                  config->input_range.end,
                                  config->domain_range.end,
                                  config->probe_size);
    memcpy(config_data, &dev->config, sizeof(struct virtio_iommu_config));
}

static void virtio_iommu_set_config(VirtIODevice *vdev,
                                    const uint8_t *config_data)
{
    struct virtio_iommu_config config;

    memcpy(&config, config_data, sizeof(struct virtio_iommu_config));
    trace_virtio_iommu_set_config(config.page_size_mask,
                                  config.input_range.start,
                                  config.input_range.end,
                                  config.domain_range.end,
                                  config.probe_size);
}

static uint64_t virtio_iommu_get_features(VirtIODevice *vdev, uint64_t f,
                                          Error **errp)
{
    VirtIOIOMMU *dev = VIRTIO_IOMMU(vdev);

    f |= dev->features;
    trace_virtio_iommu_get_features(f);
    return f;
}

static gint int_cmp(gconstpointer a, gconstpointer b, gpointer user_data)
{
    guint ua = GPOINTER_TO_UINT(a);
    guint ub = GPOINTER_TO_UINT(b);
    return (ua > ub) - (ua < ub);
}

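/* DeviceClass realize: create the virtqueues and advertise config/features */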
static void virtio_iommu_device_realize(DeviceState *dev, Error **errp)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(dev);
    VirtIOIOMMU *s = VIRTIO_IOMMU(dev);

    virtio_init(vdev, "virtio-iommu", VIRTIO_ID_IOMMU,
                sizeof(struct virtio_iommu_config));

    memset(s->iommu_pcibus_by_bus_num, 0, sizeof(s->iommu_pcibus_by_bus_num));

    s->req_vq = virtio_add_queue(vdev, VIOMMU_DEFAULT_QUEUE_SIZE,
                             virtio_iommu_handle_command);
    s->event_vq = virtio_add_queue(vdev, VIOMMU_DEFAULT_QUEUE_SIZE, NULL);

    s->config.page_size_mask = TARGET_PAGE_MASK;
    s->config.input_range.end = -1UL;
    s->config.domain_range.end = 32;
    s->config.probe_size = VIOMMU_PROBE_SIZE;

    virtio_add_feature(&s->features, VIRTIO_RING_F_EVENT_IDX);
    virtio_add_feature(&s->features, VIRTIO_RING_F_INDIRECT_DESC);
    virtio_add_feature(&s->features, VIRTIO_F_VERSION_1);
    virtio_add_feature(&s->features, VIRTIO_IOMMU_F_INPUT_RANGE);
    virtio_add_feature(&s->features, VIRTIO_IOMMU_F_DOMAIN_RANGE);
    virtio_add_feature(&s->features, VIRTIO_IOMMU_F_MAP_UNMAP);
    virtio_add_feature(&s->features, VIRTIO_IOMMU_F_BYPASS);
    virtio_add_feature(&s->features, VIRTIO_IOMMU_F_MMIO);
    virtio_add_feature(&s->features, VIRTIO_IOMMU_F_PROBE);

    qemu_mutex_init(&s->mutex);

    s->as_by_busptr = g_hash_table_new_full(NULL, NULL, NULL, g_free);

    if (s->primary_bus) {
        pci_setup_iommu(s->primary_bus, virtio_iommu_find_add_as, s);
    } else {
        error_setg(errp, "VIRTIO-IOMMU is not attached to any PCI bus!");
    }
}

static void virtio_iommu_device_unrealize(DeviceState *dev)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(dev);
    VirtIOIOMMU *s = VIRTIO_IOMMU(dev);

    g_hash_table_destroy(s->as_by_busptr);
    g_tree_destroy(s->domains);
    g_tree_destroy(s->endpoints);

    virtio_delete_queue(s->req_vq);
    virtio_delete_queue(s->event_vq);
    virtio_cleanup(vdev);
}

static void virtio_iommu_device_reset(VirtIODevice *vdev)
{
    VirtIOIOMMU *s = VIRTIO_IOMMU(vdev);

    trace_virtio_iommu_device_reset();

    if (s->domains) {
        g_tree_destroy(s->domains);
    }
    if (s->endpoints) {
        g_tree_destroy(s->endpoints);
    }
    s->domains = g_tree_new_full((GCompareDataFunc)int_cmp,
                                 NULL, NULL, virtio_iommu_put_domain);
    s->endpoints = g_tree_new_full((GCompareDataFunc)int_cmp,
                                   NULL, NULL, virtio_iommu_put_endpoint);
}

static void virtio_iommu_set_status(VirtIODevice *vdev, uint8_t status)
{
    trace_virtio_iommu_device_status(status);
}

static void virtio_iommu_instance_init(Object *obj)
{
}

#define VMSTATE_INTERVAL                               \
{                                                      \
    .name = "interval",                                \
    .version_id = 1,                                   \
    .minimum_version_id = 1,                           \
    .fields = (VMStateField[]) {                       \
        VMSTATE_UINT64(low, VirtIOIOMMUInterval),      \
        VMSTATE_UINT64(high, VirtIOIOMMUInterval),     \
        VMSTATE_END_OF_LIST()                          \
    }                                                  \
}

#define VMSTATE_MAPPING                               \
{                                                     \
    .name = "mapping",                                \
    .version_id = 1,                                  \
    .minimum_version_id = 1,                          \
    .fields = (VMStateField[]) {                      \
        VMSTATE_UINT64(phys_addr, VirtIOIOMMUMapping),\
        VMSTATE_UINT32(flags, VirtIOIOMMUMapping),    \
        VMSTATE_END_OF_LIST()                         \
    }                                                 \
}

static const VMStateDescription vmstate_interval_mapping[2] = {
    VMSTATE_MAPPING,   /* value */
    VMSTATE_INTERVAL   /* key   */
};

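/* pre_load hook: allocate the mapping GTree that VMSTATE_GTREE_V repopulates */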
static int domain_preload(void *opaque)
{
    VirtIOIOMMUDomain *domain = opaque;

    domain->mappings = g_tree_new_full((GCompareDataFunc)interval_cmp,
                                       NULL, g_free, g_free);
    return 0;
}

static const VMStateDescription vmstate_endpoint = {
    .name = "endpoint",
    .version_id = 1,
    .minimum_version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_UINT32(id, VirtIOIOMMUEndpoint),
        VMSTATE_END_OF_LIST()
    }
};

static const VMStateDescription vmstate_domain = {
    .name = "domain",
    .version_id = 1,
    .minimum_version_id = 1,
    .pre_load = domain_preload,
    .fields = (VMStateField[]) {
        VMSTATE_UINT32(id, VirtIOIOMMUDomain),
        VMSTATE_GTREE_V(mappings, VirtIOIOMMUDomain, 1,
                        vmstate_interval_mapping,
                        VirtIOIOMMUInterval, VirtIOIOMMUMapping),
        VMSTATE_QLIST_V(endpoint_list, VirtIOIOMMUDomain, 1,
                        vmstate_endpoint, VirtIOIOMMUEndpoint, next),
        VMSTATE_END_OF_LIST()
    }
};

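/*
 * Migration only restores the domain tree; rebuild the endpoint tree and
 * each endpoint's domain back-pointer from the per-domain endpoint lists.
 */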
static gboolean reconstruct_endpoints(gpointer key, gpointer value,
                                      gpointer data)
{
    VirtIOIOMMU *s = (VirtIOIOMMU *)data;
    VirtIOIOMMUDomain *d = (VirtIOIOMMUDomain *)value;
    VirtIOIOMMUEndpoint *iter;

    QLIST_FOREACH(iter, &d->endpoint_list, next) {
        iter->domain = d;
        g_tree_insert(s->endpoints, GUINT_TO_POINTER(iter->id), iter);
    }
    return false; /* continue the domain traversal */
}

static int iommu_post_load(void *opaque, int version_id)
{
    VirtIOIOMMU *s = opaque;

    g_tree_foreach(s->domains, reconstruct_endpoints, s);
    return 0;
}

static const VMStateDescription vmstate_virtio_iommu_device = {
    .name = "virtio-iommu-device",
    .minimum_version_id = 1,
    .version_id = 1,
    .post_load = iommu_post_load,
    .fields = (VMStateField[]) {
        VMSTATE_GTREE_DIRECT_KEY_V(domains, VirtIOIOMMU, 1,
                                   &vmstate_domain, VirtIOIOMMUDomain),
        VMSTATE_END_OF_LIST()
    },
};

static const VMStateDescription vmstate_virtio_iommu = {
    .name = "virtio-iommu",
    .minimum_version_id = 1,
    .priority = MIG_PRI_IOMMU,
    .version_id = 1,
    .fields = (VMStateField[]) {
        VMSTATE_VIRTIO_DEVICE,
        VMSTATE_END_OF_LIST()
    },
};

static Property virtio_iommu_properties[] = {
    DEFINE_PROP_LINK("primary-bus", VirtIOIOMMU, primary_bus, "PCI", PCIBus *),
    DEFINE_PROP_END_OF_LIST(),
};

static void virtio_iommu_class_init(ObjectClass *klass, void *data)
{
    DeviceClass *dc = DEVICE_CLASS(klass);
    VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);

    device_class_set_props(dc, virtio_iommu_properties);
    dc->vmsd = &vmstate_virtio_iommu;

    set_bit(DEVICE_CATEGORY_MISC, dc->categories);
    vdc->realize = virtio_iommu_device_realize;
    vdc->unrealize = virtio_iommu_device_unrealize;
    vdc->reset = virtio_iommu_device_reset;
    vdc->get_config = virtio_iommu_get_config;
    vdc->set_config = virtio_iommu_set_config;
    vdc->get_features = virtio_iommu_get_features;
    vdc->set_status = virtio_iommu_set_status;
    vdc->vmsd = &vmstate_virtio_iommu_device;
}

static void virtio_iommu_memory_region_class_init(ObjectClass *klass,
                                                  void *data)
{
    IOMMUMemoryRegionClass *imrc = IOMMU_MEMORY_REGION_CLASS(klass);

    imrc->translate = virtio_iommu_translate;
}

static const TypeInfo virtio_iommu_info = {
    .name = TYPE_VIRTIO_IOMMU,
    .parent = TYPE_VIRTIO_DEVICE,
    .instance_size = sizeof(VirtIOIOMMU),
    .instance_init = virtio_iommu_instance_init,
    .class_init = virtio_iommu_class_init,
};

static const TypeInfo virtio_iommu_memory_region_info = {
    .parent = TYPE_IOMMU_MEMORY_REGION,
    .name = TYPE_VIRTIO_IOMMU_MEMORY_REGION,
    .class_init = virtio_iommu_memory_region_class_init,
};

static void virtio_register_types(void)
{
    type_register_static(&virtio_iommu_info);
    type_register_static(&virtio_iommu_memory_region_info);
}

type_init(virtio_register_types)