Merge branch 'master' of git://git.qemu.org/qemu into next
[qemu/qemu-dev-zwu.git] / hw / virtio-pci.c
blob2f122aad71149cabe789231b2307c88d5462afd5
/*
 * Virtio PCI Bindings
 *
 * Copyright IBM, Corp. 2007
 * Copyright (c) 2009 CodeSourcery
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *  Paul Brook        <paul@codesourcery.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */
16 #include <inttypes.h>
18 #include "virtio.h"
19 #include "virtio-blk.h"
20 #include "virtio-net.h"
21 #include "virtio-serial.h"
22 #include "pci.h"
23 #include "qemu-error.h"
24 #include "msix.h"
25 #include "net.h"
26 #include "loader.h"
27 #include "kvm.h"
28 #include "blockdev.h"
29 #include "virtio-pci.h"
/* from Linux's linux/virtio_pci.h */

/* A 32-bit r/o bitmask of the features supported by the host */
#define VIRTIO_PCI_HOST_FEATURES        0

/* A 32-bit r/w bitmask of features activated by the guest */
#define VIRTIO_PCI_GUEST_FEATURES       4

/* A 32-bit r/w PFN for the currently selected queue */
#define VIRTIO_PCI_QUEUE_PFN            8

/* A 16-bit r/o queue size for the currently selected queue */
#define VIRTIO_PCI_QUEUE_NUM            12

/* A 16-bit r/w queue selector */
#define VIRTIO_PCI_QUEUE_SEL            14

/* A 16-bit r/w queue notifier */
#define VIRTIO_PCI_QUEUE_NOTIFY         16

/* An 8-bit device status register.  */
#define VIRTIO_PCI_STATUS               18

/* An 8-bit r/o interrupt status register.  Reading the value will return the
 * current contents of the ISR and will also clear it.  This is effectively
 * a read-and-acknowledge. */
#define VIRTIO_PCI_ISR                  19

/* MSI-X registers: only enabled if MSI-X is enabled. */
/* A 16-bit vector for configuration changes. */
#define VIRTIO_MSI_CONFIG_VECTOR        20
/* A 16-bit vector for selected queue notifications. */
#define VIRTIO_MSI_QUEUE_VECTOR         22

/* Config space size */
#define VIRTIO_PCI_CONFIG_NOMSI         20
#define VIRTIO_PCI_CONFIG_MSI           24
/* Size of the register header when sizing the I/O region: depends on
 * whether the device has MSI-X at all (msix_present). */
#define VIRTIO_PCI_REGION_SIZE(dev)     (msix_present(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* The remaining space is defined by each driver as the per-driver
 * configuration space.  Note this one keys off msix_enabled, not
 * msix_present. */
#define VIRTIO_PCI_CONFIG(dev)          (msix_enabled(dev) ? \
                                         VIRTIO_PCI_CONFIG_MSI : \
                                         VIRTIO_PCI_CONFIG_NOMSI)

/* How many bits to shift physical queue address written to QUEUE_PFN.
 * 12 is historical, and due to x86 page size. */
#define VIRTIO_PCI_QUEUE_ADDR_SHIFT    12

/* Flags track per-device state like workarounds for quirks in older guests. */
#define VIRTIO_PCI_FLAG_BUS_MASTER_BUG  (1 << 0)

/* Performance improves when virtqueue kick processing is decoupled from the
 * vcpu thread using ioeventfd for some devices. */
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT 1
#define VIRTIO_PCI_FLAG_USE_IOEVENTFD   (1 << VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT)

/* QEMU doesn't strictly need write barriers since everything runs in
 * lock-step.  We'll leave the calls to wmb() in though to make it obvious for
 * KVM or if kqemu gets SMP support.
 */
#define wmb() do { } while (0)
96 /* virtio device */
98 static void virtio_pci_notify(void *opaque, uint16_t vector)
100 VirtIOPCIProxy *proxy = opaque;
101 if (msix_enabled(&proxy->pci_dev))
102 msix_notify(&proxy->pci_dev, vector);
103 else
104 qemu_set_irq(proxy->pci_dev.irq[0], proxy->vdev->isr & 1);
107 static void virtio_pci_save_config(void * opaque, QEMUFile *f)
109 VirtIOPCIProxy *proxy = opaque;
110 pci_device_save(&proxy->pci_dev, f);
111 msix_save(&proxy->pci_dev, f);
112 if (msix_present(&proxy->pci_dev))
113 qemu_put_be16(f, proxy->vdev->config_vector);
116 static void virtio_pci_save_queue(void * opaque, int n, QEMUFile *f)
118 VirtIOPCIProxy *proxy = opaque;
119 if (msix_present(&proxy->pci_dev))
120 qemu_put_be16(f, virtio_queue_vector(proxy->vdev, n));
123 static int virtio_pci_load_config(void * opaque, QEMUFile *f)
125 VirtIOPCIProxy *proxy = opaque;
126 int ret;
127 ret = pci_device_load(&proxy->pci_dev, f);
128 if (ret) {
129 return ret;
131 msix_load(&proxy->pci_dev, f);
132 if (msix_present(&proxy->pci_dev)) {
133 qemu_get_be16s(f, &proxy->vdev->config_vector);
134 } else {
135 proxy->vdev->config_vector = VIRTIO_NO_VECTOR;
137 if (proxy->vdev->config_vector != VIRTIO_NO_VECTOR) {
138 return msix_vector_use(&proxy->pci_dev, proxy->vdev->config_vector);
140 return 0;
143 static int virtio_pci_load_queue(void * opaque, int n, QEMUFile *f)
145 VirtIOPCIProxy *proxy = opaque;
146 uint16_t vector;
147 if (msix_present(&proxy->pci_dev)) {
148 qemu_get_be16s(f, &vector);
149 } else {
150 vector = VIRTIO_NO_VECTOR;
152 virtio_queue_set_vector(proxy->vdev, n, vector);
153 if (vector != VIRTIO_NO_VECTOR) {
154 return msix_vector_use(&proxy->pci_dev, vector);
156 return 0;
159 static int virtio_pci_set_host_notifier_internal(VirtIOPCIProxy *proxy,
160 int n, bool assign)
162 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
163 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
164 int r;
165 if (assign) {
166 r = event_notifier_init(notifier, 1);
167 if (r < 0) {
168 error_report("%s: unable to init event notifier: %d",
169 __func__, r);
170 return r;
172 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
173 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
174 n, assign);
175 if (r < 0) {
176 error_report("%s: unable to map ioeventfd: %d",
177 __func__, r);
178 event_notifier_cleanup(notifier);
180 } else {
181 r = kvm_set_ioeventfd_pio_word(event_notifier_get_fd(notifier),
182 proxy->addr + VIRTIO_PCI_QUEUE_NOTIFY,
183 n, assign);
184 if (r < 0) {
185 error_report("%s: unable to unmap ioeventfd: %d",
186 __func__, r);
187 return r;
190 /* Handle the race condition where the guest kicked and we deassigned
191 * before we got around to handling the kick.
193 if (event_notifier_test_and_clear(notifier)) {
194 virtio_queue_notify_vq(vq);
197 event_notifier_cleanup(notifier);
199 return r;
202 static void virtio_pci_host_notifier_read(void *opaque)
204 VirtQueue *vq = opaque;
205 EventNotifier *n = virtio_queue_get_host_notifier(vq);
206 if (event_notifier_test_and_clear(n)) {
207 virtio_queue_notify_vq(vq);
211 static void virtio_pci_set_host_notifier_fd_handler(VirtIOPCIProxy *proxy,
212 int n, bool assign)
214 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
215 EventNotifier *notifier = virtio_queue_get_host_notifier(vq);
216 if (assign) {
217 qemu_set_fd_handler(event_notifier_get_fd(notifier),
218 virtio_pci_host_notifier_read, NULL, vq);
219 } else {
220 qemu_set_fd_handler(event_notifier_get_fd(notifier),
221 NULL, NULL, NULL);
225 static void virtio_pci_start_ioeventfd(VirtIOPCIProxy *proxy)
227 int n, r;
229 if (!(proxy->flags & VIRTIO_PCI_FLAG_USE_IOEVENTFD) ||
230 proxy->ioeventfd_disabled ||
231 proxy->ioeventfd_started) {
232 return;
235 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
236 if (!virtio_queue_get_num(proxy->vdev, n)) {
237 continue;
240 r = virtio_pci_set_host_notifier_internal(proxy, n, true);
241 if (r < 0) {
242 goto assign_error;
245 virtio_pci_set_host_notifier_fd_handler(proxy, n, true);
247 proxy->ioeventfd_started = true;
248 return;
250 assign_error:
251 while (--n >= 0) {
252 if (!virtio_queue_get_num(proxy->vdev, n)) {
253 continue;
256 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
257 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
258 assert(r >= 0);
260 proxy->ioeventfd_started = false;
261 error_report("%s: failed. Fallback to a userspace (slower).", __func__);
264 static void virtio_pci_stop_ioeventfd(VirtIOPCIProxy *proxy)
266 int r;
267 int n;
269 if (!proxy->ioeventfd_started) {
270 return;
273 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
274 if (!virtio_queue_get_num(proxy->vdev, n)) {
275 continue;
278 virtio_pci_set_host_notifier_fd_handler(proxy, n, false);
279 r = virtio_pci_set_host_notifier_internal(proxy, n, false);
280 assert(r >= 0);
282 proxy->ioeventfd_started = false;
285 static void virtio_pci_reset(DeviceState *d)
287 VirtIOPCIProxy *proxy = container_of(d, VirtIOPCIProxy, pci_dev.qdev);
288 virtio_pci_stop_ioeventfd(proxy);
289 virtio_reset(proxy->vdev);
290 msix_reset(&proxy->pci_dev);
291 proxy->flags &= ~VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
294 static void virtio_ioport_write(void *opaque, uint32_t addr, uint32_t val)
296 VirtIOPCIProxy *proxy = opaque;
297 VirtIODevice *vdev = proxy->vdev;
298 target_phys_addr_t pa;
300 switch (addr) {
301 case VIRTIO_PCI_GUEST_FEATURES:
302 /* Guest does not negotiate properly? We have to assume nothing. */
303 if (val & (1 << VIRTIO_F_BAD_FEATURE)) {
304 if (vdev->bad_features)
305 val = proxy->host_features & vdev->bad_features(vdev);
306 else
307 val = 0;
309 if (vdev->set_features)
310 vdev->set_features(vdev, val);
311 vdev->guest_features = val;
312 break;
313 case VIRTIO_PCI_QUEUE_PFN:
314 pa = (target_phys_addr_t)val << VIRTIO_PCI_QUEUE_ADDR_SHIFT;
315 if (pa == 0) {
316 virtio_pci_stop_ioeventfd(proxy);
317 virtio_reset(proxy->vdev);
318 msix_unuse_all_vectors(&proxy->pci_dev);
320 else
321 virtio_queue_set_addr(vdev, vdev->queue_sel, pa);
322 break;
323 case VIRTIO_PCI_QUEUE_SEL:
324 if (val < VIRTIO_PCI_QUEUE_MAX)
325 vdev->queue_sel = val;
326 break;
327 case VIRTIO_PCI_QUEUE_NOTIFY:
328 if (val < VIRTIO_PCI_QUEUE_MAX) {
329 virtio_queue_notify(vdev, val);
331 break;
332 case VIRTIO_PCI_STATUS:
333 if (!(val & VIRTIO_CONFIG_S_DRIVER_OK)) {
334 virtio_pci_stop_ioeventfd(proxy);
337 virtio_set_status(vdev, val & 0xFF);
339 if (val & VIRTIO_CONFIG_S_DRIVER_OK) {
340 virtio_pci_start_ioeventfd(proxy);
343 if (vdev->status == 0) {
344 virtio_reset(proxy->vdev);
345 msix_unuse_all_vectors(&proxy->pci_dev);
348 /* Linux before 2.6.34 sets the device as OK without enabling
349 the PCI device bus master bit. In this case we need to disable
350 some safety checks. */
351 if ((val & VIRTIO_CONFIG_S_DRIVER_OK) &&
352 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
353 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
355 break;
356 case VIRTIO_MSI_CONFIG_VECTOR:
357 msix_vector_unuse(&proxy->pci_dev, vdev->config_vector);
358 /* Make it possible for guest to discover an error took place. */
359 if (msix_vector_use(&proxy->pci_dev, val) < 0)
360 val = VIRTIO_NO_VECTOR;
361 vdev->config_vector = val;
362 break;
363 case VIRTIO_MSI_QUEUE_VECTOR:
364 msix_vector_unuse(&proxy->pci_dev,
365 virtio_queue_vector(vdev, vdev->queue_sel));
366 /* Make it possible for guest to discover an error took place. */
367 if (msix_vector_use(&proxy->pci_dev, val) < 0)
368 val = VIRTIO_NO_VECTOR;
369 virtio_queue_set_vector(vdev, vdev->queue_sel, val);
370 break;
371 default:
372 error_report("%s: unexpected address 0x%x value 0x%x",
373 __func__, addr, val);
374 break;
378 static uint32_t virtio_ioport_read(VirtIOPCIProxy *proxy, uint32_t addr)
380 VirtIODevice *vdev = proxy->vdev;
381 uint32_t ret = 0xFFFFFFFF;
383 switch (addr) {
384 case VIRTIO_PCI_HOST_FEATURES:
385 ret = proxy->host_features;
386 break;
387 case VIRTIO_PCI_GUEST_FEATURES:
388 ret = vdev->guest_features;
389 break;
390 case VIRTIO_PCI_QUEUE_PFN:
391 ret = virtio_queue_get_addr(vdev, vdev->queue_sel)
392 >> VIRTIO_PCI_QUEUE_ADDR_SHIFT;
393 break;
394 case VIRTIO_PCI_QUEUE_NUM:
395 ret = virtio_queue_get_num(vdev, vdev->queue_sel);
396 break;
397 case VIRTIO_PCI_QUEUE_SEL:
398 ret = vdev->queue_sel;
399 break;
400 case VIRTIO_PCI_STATUS:
401 ret = vdev->status;
402 break;
403 case VIRTIO_PCI_ISR:
404 /* reading from the ISR also clears it. */
405 ret = vdev->isr;
406 vdev->isr = 0;
407 qemu_set_irq(proxy->pci_dev.irq[0], 0);
408 break;
409 case VIRTIO_MSI_CONFIG_VECTOR:
410 ret = vdev->config_vector;
411 break;
412 case VIRTIO_MSI_QUEUE_VECTOR:
413 ret = virtio_queue_vector(vdev, vdev->queue_sel);
414 break;
415 default:
416 break;
419 return ret;
422 static uint32_t virtio_pci_config_readb(void *opaque, uint32_t addr)
424 VirtIOPCIProxy *proxy = opaque;
425 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
426 addr -= proxy->addr;
427 if (addr < config)
428 return virtio_ioport_read(proxy, addr);
429 addr -= config;
430 return virtio_config_readb(proxy->vdev, addr);
433 static uint32_t virtio_pci_config_readw(void *opaque, uint32_t addr)
435 VirtIOPCIProxy *proxy = opaque;
436 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
437 addr -= proxy->addr;
438 if (addr < config)
439 return virtio_ioport_read(proxy, addr);
440 addr -= config;
441 return virtio_config_readw(proxy->vdev, addr);
444 static uint32_t virtio_pci_config_readl(void *opaque, uint32_t addr)
446 VirtIOPCIProxy *proxy = opaque;
447 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
448 addr -= proxy->addr;
449 if (addr < config)
450 return virtio_ioport_read(proxy, addr);
451 addr -= config;
452 return virtio_config_readl(proxy->vdev, addr);
455 static void virtio_pci_config_writeb(void *opaque, uint32_t addr, uint32_t val)
457 VirtIOPCIProxy *proxy = opaque;
458 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
459 addr -= proxy->addr;
460 if (addr < config) {
461 virtio_ioport_write(proxy, addr, val);
462 return;
464 addr -= config;
465 virtio_config_writeb(proxy->vdev, addr, val);
468 static void virtio_pci_config_writew(void *opaque, uint32_t addr, uint32_t val)
470 VirtIOPCIProxy *proxy = opaque;
471 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
472 addr -= proxy->addr;
473 if (addr < config) {
474 virtio_ioport_write(proxy, addr, val);
475 return;
477 addr -= config;
478 virtio_config_writew(proxy->vdev, addr, val);
481 static void virtio_pci_config_writel(void *opaque, uint32_t addr, uint32_t val)
483 VirtIOPCIProxy *proxy = opaque;
484 uint32_t config = VIRTIO_PCI_CONFIG(&proxy->pci_dev);
485 addr -= proxy->addr;
486 if (addr < config) {
487 virtio_ioport_write(proxy, addr, val);
488 return;
490 addr -= config;
491 virtio_config_writel(proxy->vdev, addr, val);
494 static void virtio_map(PCIDevice *pci_dev, int region_num,
495 pcibus_t addr, pcibus_t size, int type)
497 VirtIOPCIProxy *proxy = container_of(pci_dev, VirtIOPCIProxy, pci_dev);
498 VirtIODevice *vdev = proxy->vdev;
499 unsigned config_len = VIRTIO_PCI_REGION_SIZE(pci_dev) + vdev->config_len;
501 proxy->addr = addr;
503 register_ioport_write(addr, config_len, 1, virtio_pci_config_writeb, proxy);
504 register_ioport_write(addr, config_len, 2, virtio_pci_config_writew, proxy);
505 register_ioport_write(addr, config_len, 4, virtio_pci_config_writel, proxy);
506 register_ioport_read(addr, config_len, 1, virtio_pci_config_readb, proxy);
507 register_ioport_read(addr, config_len, 2, virtio_pci_config_readw, proxy);
508 register_ioport_read(addr, config_len, 4, virtio_pci_config_readl, proxy);
510 if (vdev->config_len)
511 vdev->get_config(vdev, vdev->config);
514 static void virtio_write_config(PCIDevice *pci_dev, uint32_t address,
515 uint32_t val, int len)
517 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
519 if (PCI_COMMAND == address) {
520 if (!(val & PCI_COMMAND_MASTER)) {
521 if (!(proxy->flags & VIRTIO_PCI_FLAG_BUS_MASTER_BUG)) {
522 virtio_pci_stop_ioeventfd(proxy);
523 virtio_set_status(proxy->vdev,
524 proxy->vdev->status & ~VIRTIO_CONFIG_S_DRIVER_OK);
529 pci_default_write_config(pci_dev, address, val, len);
530 msix_write_config(pci_dev, address, val, len);
533 static unsigned virtio_pci_get_features(void *opaque)
535 VirtIOPCIProxy *proxy = opaque;
536 return proxy->host_features;
539 static void virtio_pci_guest_notifier_read(void *opaque)
541 VirtQueue *vq = opaque;
542 EventNotifier *n = virtio_queue_get_guest_notifier(vq);
543 if (event_notifier_test_and_clear(n)) {
544 virtio_irq(vq);
548 static int virtio_pci_mask_vq(PCIDevice *dev, unsigned vector,
549 VirtQueue *vq, int masked)
551 EventNotifier *notifier = virtio_queue_get_guest_notifier(vq);
552 int r = kvm_set_irqfd(dev->msix_irq_entries[vector].gsi,
553 event_notifier_get_fd(notifier),
554 !masked);
555 if (r < 0) {
556 return (r == -ENOSYS) ? 0 : r;
558 if (masked) {
559 qemu_set_fd_handler(event_notifier_get_fd(notifier),
560 virtio_pci_guest_notifier_read, NULL, vq);
561 } else {
562 qemu_set_fd_handler(event_notifier_get_fd(notifier),
563 NULL, NULL, NULL);
565 return 0;
568 static int virtio_pci_mask_notifier(PCIDevice *dev, unsigned vector,
569 int masked)
571 VirtIOPCIProxy *proxy = container_of(dev, VirtIOPCIProxy, pci_dev);
572 VirtIODevice *vdev = proxy->vdev;
573 int r, n;
575 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
576 if (!virtio_queue_get_num(vdev, n)) {
577 break;
579 if (virtio_queue_vector(vdev, n) != vector) {
580 continue;
582 r = virtio_pci_mask_vq(dev, vector, virtio_get_queue(vdev, n), masked);
583 if (r < 0) {
584 goto undo;
587 return 0;
588 undo:
589 while (--n >= 0) {
590 if (virtio_queue_vector(vdev, n) != vector) {
591 continue;
593 virtio_pci_mask_vq(dev, vector, virtio_get_queue(vdev, n), !masked);
595 return r;
599 static int virtio_pci_set_guest_notifier(void *opaque, int n, bool assign)
601 VirtIOPCIProxy *proxy = opaque;
602 VirtQueue *vq = virtio_get_queue(proxy->vdev, n);
603 EventNotifier *notifier = virtio_queue_get_guest_notifier(vq);
605 if (assign) {
606 int r = event_notifier_init(notifier, 0);
607 if (r < 0) {
608 return r;
610 qemu_set_fd_handler(event_notifier_get_fd(notifier),
611 virtio_pci_guest_notifier_read, NULL, vq);
612 } else {
613 qemu_set_fd_handler(event_notifier_get_fd(notifier),
614 NULL, NULL, NULL);
615 /* Test and clear notifier before closing it,
616 * in case poll callback didn't have time to run. */
617 virtio_pci_guest_notifier_read(vq);
618 event_notifier_cleanup(notifier);
621 return 0;
624 static bool virtio_pci_query_guest_notifiers(void *opaque)
626 VirtIOPCIProxy *proxy = opaque;
627 return msix_enabled(&proxy->pci_dev);
630 static int virtio_pci_set_guest_notifiers(void *opaque, bool assign)
632 VirtIOPCIProxy *proxy = opaque;
633 VirtIODevice *vdev = proxy->vdev;
634 int r, n;
636 /* Must unset mask notifier while guest notifier
637 * is still assigned */
638 if (!assign) {
639 r = msix_unset_mask_notifier(&proxy->pci_dev);
640 assert(r >= 0);
643 for (n = 0; n < VIRTIO_PCI_QUEUE_MAX; n++) {
644 if (!virtio_queue_get_num(vdev, n)) {
645 break;
648 r = virtio_pci_set_guest_notifier(opaque, n, assign);
649 if (r < 0) {
650 goto assign_error;
654 /* Must set mask notifier after guest notifier
655 * has been assigned */
656 if (assign) {
657 r = msix_set_mask_notifier(&proxy->pci_dev,
658 virtio_pci_mask_notifier);
659 if (r < 0) {
660 goto assign_error;
664 return 0;
666 assign_error:
667 /* We get here on assignment failure. Recover by undoing for VQs 0 .. n. */
668 while (--n >= 0) {
669 virtio_pci_set_guest_notifier(opaque, n, !assign);
672 if (!assign) {
673 msix_set_mask_notifier(&proxy->pci_dev,
674 virtio_pci_mask_notifier);
676 return r;
679 static int virtio_pci_set_host_notifier(void *opaque, int n, bool assign)
681 VirtIOPCIProxy *proxy = opaque;
683 /* Stop using ioeventfd for virtqueue kick if the device starts using host
684 * notifiers. This makes it easy to avoid stepping on each others' toes.
686 proxy->ioeventfd_disabled = assign;
687 if (assign) {
688 virtio_pci_stop_ioeventfd(proxy);
690 /* We don't need to start here: it's not needed because backend
691 * currently only stops on status change away from ok,
692 * reset, vmstop and such. If we do add code to start here,
693 * need to check vmstate, device state etc. */
694 return virtio_pci_set_host_notifier_internal(proxy, n, assign);
697 static void virtio_pci_vmstate_change(void *opaque, bool running)
699 VirtIOPCIProxy *proxy = opaque;
701 if (running) {
702 /* Try to find out if the guest has bus master disabled, but is
703 in ready state. Then we have a buggy guest OS. */
704 if ((proxy->vdev->status & VIRTIO_CONFIG_S_DRIVER_OK) &&
705 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
706 proxy->flags |= VIRTIO_PCI_FLAG_BUS_MASTER_BUG;
708 virtio_pci_start_ioeventfd(proxy);
709 } else {
710 virtio_pci_stop_ioeventfd(proxy);
714 static const VirtIOBindings virtio_pci_bindings = {
715 .notify = virtio_pci_notify,
716 .save_config = virtio_pci_save_config,
717 .load_config = virtio_pci_load_config,
718 .save_queue = virtio_pci_save_queue,
719 .load_queue = virtio_pci_load_queue,
720 .get_features = virtio_pci_get_features,
721 .query_guest_notifiers = virtio_pci_query_guest_notifiers,
722 .set_host_notifier = virtio_pci_set_host_notifier,
723 .set_guest_notifiers = virtio_pci_set_guest_notifiers,
724 .vmstate_change = virtio_pci_vmstate_change,
727 void virtio_init_pci(VirtIOPCIProxy *proxy, VirtIODevice *vdev)
729 uint8_t *config;
730 uint32_t size;
732 proxy->vdev = vdev;
734 config = proxy->pci_dev.config;
736 if (proxy->class_code) {
737 pci_config_set_class(config, proxy->class_code);
739 pci_set_word(config + 0x2c, pci_get_word(config + PCI_VENDOR_ID));
740 pci_set_word(config + 0x2e, vdev->device_id);
741 config[0x3d] = 1;
743 if (vdev->nvectors && !msix_init(&proxy->pci_dev, vdev->nvectors, 1, 0)) {
744 pci_register_bar(&proxy->pci_dev, 1,
745 msix_bar_size(&proxy->pci_dev),
746 PCI_BASE_ADDRESS_SPACE_MEMORY,
747 msix_mmio_map);
748 } else
749 vdev->nvectors = 0;
751 proxy->pci_dev.config_write = virtio_write_config;
753 size = VIRTIO_PCI_REGION_SIZE(&proxy->pci_dev) + vdev->config_len;
754 if (size & (size-1))
755 size = 1 << qemu_fls(size);
757 pci_register_bar(&proxy->pci_dev, 0, size, PCI_BASE_ADDRESS_SPACE_IO,
758 virtio_map);
760 if (!kvm_has_many_ioeventfds()) {
761 proxy->flags &= ~VIRTIO_PCI_FLAG_USE_IOEVENTFD;
764 virtio_bind_device(vdev, &virtio_pci_bindings, proxy);
765 proxy->host_features |= 0x1 << VIRTIO_F_NOTIFY_ON_EMPTY;
766 proxy->host_features |= 0x1 << VIRTIO_F_BAD_FEATURE;
767 proxy->host_features = vdev->get_features(vdev, proxy->host_features);
770 static int virtio_blk_init_pci(PCIDevice *pci_dev)
772 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
773 VirtIODevice *vdev;
775 if (proxy->class_code != PCI_CLASS_STORAGE_SCSI &&
776 proxy->class_code != PCI_CLASS_STORAGE_OTHER)
777 proxy->class_code = PCI_CLASS_STORAGE_SCSI;
779 vdev = virtio_blk_init(&pci_dev->qdev, &proxy->block);
780 if (!vdev) {
781 return -1;
783 vdev->nvectors = proxy->nvectors;
784 virtio_init_pci(proxy, vdev);
785 /* make the actual value visible */
786 proxy->nvectors = vdev->nvectors;
787 return 0;
790 static int virtio_exit_pci(PCIDevice *pci_dev)
792 return msix_uninit(pci_dev);
795 static int virtio_blk_exit_pci(PCIDevice *pci_dev)
797 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
799 virtio_pci_stop_ioeventfd(proxy);
800 virtio_blk_exit(proxy->vdev);
801 blockdev_mark_auto_del(proxy->block.bs);
802 return virtio_exit_pci(pci_dev);
805 static int virtio_serial_init_pci(PCIDevice *pci_dev)
807 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
808 VirtIODevice *vdev;
810 if (proxy->class_code != PCI_CLASS_COMMUNICATION_OTHER &&
811 proxy->class_code != PCI_CLASS_DISPLAY_OTHER && /* qemu 0.10 */
812 proxy->class_code != PCI_CLASS_OTHERS) /* qemu-kvm */
813 proxy->class_code = PCI_CLASS_COMMUNICATION_OTHER;
815 vdev = virtio_serial_init(&pci_dev->qdev, &proxy->serial);
816 if (!vdev) {
817 return -1;
819 vdev->nvectors = proxy->nvectors == DEV_NVECTORS_UNSPECIFIED
820 ? proxy->serial.max_virtserial_ports + 1
821 : proxy->nvectors;
822 virtio_init_pci(proxy, vdev);
823 proxy->nvectors = vdev->nvectors;
824 return 0;
827 static int virtio_serial_exit_pci(PCIDevice *pci_dev)
829 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
831 virtio_pci_stop_ioeventfd(proxy);
832 virtio_serial_exit(proxy->vdev);
833 return virtio_exit_pci(pci_dev);
836 static int virtio_net_init_pci(PCIDevice *pci_dev)
838 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
839 VirtIODevice *vdev;
841 vdev = virtio_net_init(&pci_dev->qdev, &proxy->nic, &proxy->net);
843 vdev->nvectors = proxy->nvectors;
844 virtio_init_pci(proxy, vdev);
846 /* make the actual value visible */
847 proxy->nvectors = vdev->nvectors;
848 return 0;
851 static int virtio_net_exit_pci(PCIDevice *pci_dev)
853 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
855 virtio_pci_stop_ioeventfd(proxy);
856 virtio_net_exit(proxy->vdev);
857 return virtio_exit_pci(pci_dev);
860 static int virtio_balloon_init_pci(PCIDevice *pci_dev)
862 VirtIOPCIProxy *proxy = DO_UPCAST(VirtIOPCIProxy, pci_dev, pci_dev);
863 VirtIODevice *vdev;
865 vdev = virtio_balloon_init(&pci_dev->qdev);
866 virtio_init_pci(proxy, vdev);
867 return 0;
870 static PCIDeviceInfo virtio_info[] = {
872 .qdev.name = "virtio-blk-pci",
873 .qdev.alias = "virtio-blk",
874 .qdev.size = sizeof(VirtIOPCIProxy),
875 .init = virtio_blk_init_pci,
876 .exit = virtio_blk_exit_pci,
877 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
878 .device_id = PCI_DEVICE_ID_VIRTIO_BLOCK,
879 .revision = VIRTIO_PCI_ABI_VERSION,
880 .class_id = PCI_CLASS_STORAGE_SCSI,
881 .qdev.props = (Property[]) {
882 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
883 DEFINE_BLOCK_PROPERTIES(VirtIOPCIProxy, block),
884 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
885 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, true),
886 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 2),
887 DEFINE_VIRTIO_BLK_FEATURES(VirtIOPCIProxy, host_features),
888 DEFINE_PROP_END_OF_LIST(),
890 .qdev.reset = virtio_pci_reset,
892 .qdev.name = "virtio-net-pci",
893 .qdev.alias = "virtio-net",
894 .qdev.size = sizeof(VirtIOPCIProxy),
895 .init = virtio_net_init_pci,
896 .exit = virtio_net_exit_pci,
897 .romfile = "pxe-virtio.rom",
898 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
899 .device_id = PCI_DEVICE_ID_VIRTIO_NET,
900 .revision = VIRTIO_PCI_ABI_VERSION,
901 .class_id = PCI_CLASS_NETWORK_ETHERNET,
902 .qdev.props = (Property[]) {
903 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
904 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, false),
905 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors, 3),
906 DEFINE_VIRTIO_NET_FEATURES(VirtIOPCIProxy, host_features),
907 DEFINE_NIC_PROPERTIES(VirtIOPCIProxy, nic),
908 DEFINE_PROP_UINT32("x-txtimer", VirtIOPCIProxy,
909 net.txtimer, TX_TIMER_INTERVAL),
910 DEFINE_PROP_INT32("x-txburst", VirtIOPCIProxy,
911 net.txburst, TX_BURST),
912 DEFINE_PROP_STRING("tx", VirtIOPCIProxy, net.tx),
913 DEFINE_PROP_END_OF_LIST(),
915 .qdev.reset = virtio_pci_reset,
917 .qdev.name = "virtio-serial-pci",
918 .qdev.alias = "virtio-serial",
919 .qdev.size = sizeof(VirtIOPCIProxy),
920 .init = virtio_serial_init_pci,
921 .exit = virtio_serial_exit_pci,
922 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
923 .device_id = PCI_DEVICE_ID_VIRTIO_CONSOLE,
924 .revision = VIRTIO_PCI_ABI_VERSION,
925 .class_id = PCI_CLASS_COMMUNICATION_OTHER,
926 .qdev.props = (Property[]) {
927 DEFINE_PROP_BIT("ioeventfd", VirtIOPCIProxy, flags,
928 VIRTIO_PCI_FLAG_USE_IOEVENTFD_BIT, true),
929 DEFINE_PROP_UINT32("vectors", VirtIOPCIProxy, nvectors,
930 DEV_NVECTORS_UNSPECIFIED),
931 DEFINE_PROP_HEX32("class", VirtIOPCIProxy, class_code, 0),
932 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
933 DEFINE_PROP_UINT32("max_ports", VirtIOPCIProxy,
934 serial.max_virtserial_ports, 31),
935 DEFINE_PROP_END_OF_LIST(),
937 .qdev.reset = virtio_pci_reset,
939 .qdev.name = "virtio-balloon-pci",
940 .qdev.alias = "virtio-balloon",
941 .qdev.size = sizeof(VirtIOPCIProxy),
942 .init = virtio_balloon_init_pci,
943 .exit = virtio_exit_pci,
944 .vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET,
945 .device_id = PCI_DEVICE_ID_VIRTIO_BALLOON,
946 .revision = VIRTIO_PCI_ABI_VERSION,
947 .class_id = PCI_CLASS_MEMORY_RAM,
948 .qdev.props = (Property[]) {
949 DEFINE_VIRTIO_COMMON_FEATURES(VirtIOPCIProxy, host_features),
950 DEFINE_PROP_END_OF_LIST(),
952 .qdev.reset = virtio_pci_reset,
954 /* end of list */
958 static void virtio_pci_register_devices(void)
960 pci_qdev_register_many(virtio_info);
963 device_init(virtio_pci_register_devices)