/*
 * vhost-user-blk host device
 *
 * Copyright(C) 2017 Intel Corporation.
 *
 * Changpeng Liu <changpeng.liu@intel.com>
 *
 * Largely based on the "vhost-user-scsi.c" and "vhost-scsi.c" implemented by:
 * Felipe Franciosi <felipe@nutanix.com>
 * Stefan Hajnoczi <stefanha@linux.vnet.ibm.com>
 * Nicholas Bellinger <nab@risingtidesystems.com>
 *
 * This work is licensed under the terms of the GNU LGPL, version 2 or later.
 * See the COPYING.LIB file in the top-level directory.
 */
19 #include "qemu/osdep.h"
20 #include "qapi/error.h"
21 #include "qemu/error-report.h"
22 #include "qemu/cutils.h"
23 #include "hw/qdev-core.h"
24 #include "hw/qdev-properties.h"
25 #include "hw/qdev-properties-system.h"
26 #include "hw/virtio/virtio-blk-common.h"
27 #include "hw/virtio/vhost.h"
28 #include "hw/virtio/vhost-user-blk.h"
29 #include "hw/virtio/virtio.h"
30 #include "hw/virtio/virtio-bus.h"
31 #include "hw/virtio/virtio-access.h"
32 #include "sysemu/sysemu.h"
33 #include "sysemu/runstate.h"
/*
 * Number of additional connection attempts vhost_user_blk_device_realize()
 * makes after the first attempt has failed.
 */
#define REALIZE_CONNECTION_RETRIES 3
37 static const int user_feature_bits
[] = {
38 VIRTIO_BLK_F_SIZE_MAX
,
40 VIRTIO_BLK_F_GEOMETRY
,
41 VIRTIO_BLK_F_BLK_SIZE
,
42 VIRTIO_BLK_F_TOPOLOGY
,
46 VIRTIO_BLK_F_CONFIG_WCE
,
48 VIRTIO_BLK_F_WRITE_ZEROES
,
50 VIRTIO_RING_F_INDIRECT_DESC
,
51 VIRTIO_RING_F_EVENT_IDX
,
52 VIRTIO_F_NOTIFY_ON_EMPTY
,
54 VIRTIO_F_IOMMU_PLATFORM
,
56 VHOST_INVALID_FEATURE_BIT
59 static void vhost_user_blk_event(void *opaque
, QEMUChrEvent event
);
61 static void vhost_user_blk_update_config(VirtIODevice
*vdev
, uint8_t *config
)
63 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
65 /* Our num_queues overrides the device backend */
66 virtio_stw_p(vdev
, &s
->blkcfg
.num_queues
, s
->num_queues
);
68 memcpy(config
, &s
->blkcfg
, vdev
->config_len
);
71 static void vhost_user_blk_set_config(VirtIODevice
*vdev
, const uint8_t *config
)
73 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
74 struct virtio_blk_config
*blkcfg
= (struct virtio_blk_config
*)config
;
77 if (blkcfg
->wce
== s
->blkcfg
.wce
) {
81 ret
= vhost_dev_set_config(&s
->dev
, &blkcfg
->wce
,
82 offsetof(struct virtio_blk_config
, wce
),
84 VHOST_SET_CONFIG_TYPE_FRONTEND
);
86 error_report("set device config space failed");
90 s
->blkcfg
.wce
= blkcfg
->wce
;
93 static int vhost_user_blk_handle_config_change(struct vhost_dev
*dev
)
96 struct virtio_blk_config blkcfg
;
97 VirtIODevice
*vdev
= dev
->vdev
;
98 VHostUserBlk
*s
= VHOST_USER_BLK(dev
->vdev
);
99 Error
*local_err
= NULL
;
105 ret
= vhost_dev_get_config(dev
, (uint8_t *)&blkcfg
,
106 vdev
->config_len
, &local_err
);
108 error_report_err(local_err
);
112 /* valid for resize only */
113 if (blkcfg
.capacity
!= s
->blkcfg
.capacity
) {
114 s
->blkcfg
.capacity
= blkcfg
.capacity
;
115 memcpy(dev
->vdev
->config
, &s
->blkcfg
, vdev
->config_len
);
116 virtio_notify_config(dev
->vdev
);
122 const VhostDevConfigOps blk_ops
= {
123 .vhost_dev_config_notifier
= vhost_user_blk_handle_config_change
,
126 static int vhost_user_blk_start(VirtIODevice
*vdev
, Error
**errp
)
128 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
129 BusState
*qbus
= BUS(qdev_get_parent_bus(DEVICE(vdev
)));
130 VirtioBusClass
*k
= VIRTIO_BUS_GET_CLASS(qbus
);
133 if (!k
->set_guest_notifiers
) {
134 error_setg(errp
, "binding does not support guest notifiers");
138 ret
= vhost_dev_enable_notifiers(&s
->dev
, vdev
);
140 error_setg_errno(errp
, -ret
, "Error enabling host notifiers");
144 ret
= k
->set_guest_notifiers(qbus
->parent
, s
->dev
.nvqs
, true);
146 error_setg_errno(errp
, -ret
, "Error binding guest notifier");
147 goto err_host_notifiers
;
150 s
->dev
.acked_features
= vdev
->guest_features
;
152 ret
= vhost_dev_prepare_inflight(&s
->dev
, vdev
);
154 error_setg_errno(errp
, -ret
, "Error setting inflight format");
155 goto err_guest_notifiers
;
158 if (!s
->inflight
->addr
) {
159 ret
= vhost_dev_get_inflight(&s
->dev
, s
->queue_size
, s
->inflight
);
161 error_setg_errno(errp
, -ret
, "Error getting inflight");
162 goto err_guest_notifiers
;
166 ret
= vhost_dev_set_inflight(&s
->dev
, s
->inflight
);
168 error_setg_errno(errp
, -ret
, "Error setting inflight");
169 goto err_guest_notifiers
;
172 /* guest_notifier_mask/pending not used yet, so just unmask
173 * everything here. virtio-pci will do the right thing by
174 * enabling/disabling irqfd.
176 for (i
= 0; i
< s
->dev
.nvqs
; i
++) {
177 vhost_virtqueue_mask(&s
->dev
, vdev
, i
, false);
180 s
->dev
.vq_index_end
= s
->dev
.nvqs
;
181 ret
= vhost_dev_start(&s
->dev
, vdev
, true);
183 error_setg_errno(errp
, -ret
, "Error starting vhost");
184 goto err_guest_notifiers
;
186 s
->started_vu
= true;
191 for (i
= 0; i
< s
->dev
.nvqs
; i
++) {
192 vhost_virtqueue_mask(&s
->dev
, vdev
, i
, true);
194 k
->set_guest_notifiers(qbus
->parent
, s
->dev
.nvqs
, false);
196 vhost_dev_disable_notifiers(&s
->dev
, vdev
);
200 static void vhost_user_blk_stop(VirtIODevice
*vdev
)
202 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
203 BusState
*qbus
= BUS(qdev_get_parent_bus(DEVICE(vdev
)));
204 VirtioBusClass
*k
= VIRTIO_BUS_GET_CLASS(qbus
);
207 if (!s
->started_vu
) {
210 s
->started_vu
= false;
212 if (!k
->set_guest_notifiers
) {
216 vhost_dev_stop(&s
->dev
, vdev
, true);
218 ret
= k
->set_guest_notifiers(qbus
->parent
, s
->dev
.nvqs
, false);
220 error_report("vhost guest notifier cleanup failed: %d", ret
);
224 vhost_dev_disable_notifiers(&s
->dev
, vdev
);
227 static void vhost_user_blk_set_status(VirtIODevice
*vdev
, uint8_t status
)
229 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
230 bool should_start
= virtio_device_should_start(vdev
, status
);
231 Error
*local_err
= NULL
;
238 if (vhost_dev_is_started(&s
->dev
) == should_start
) {
243 ret
= vhost_user_blk_start(vdev
, &local_err
);
245 error_reportf_err(local_err
, "vhost-user-blk: vhost start failed: ");
246 qemu_chr_fe_disconnect(&s
->chardev
);
249 vhost_user_blk_stop(vdev
);
254 static uint64_t vhost_user_blk_get_features(VirtIODevice
*vdev
,
258 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
260 /* Turn on pre-defined features */
261 virtio_add_feature(&features
, VIRTIO_BLK_F_SIZE_MAX
);
262 virtio_add_feature(&features
, VIRTIO_BLK_F_SEG_MAX
);
263 virtio_add_feature(&features
, VIRTIO_BLK_F_GEOMETRY
);
264 virtio_add_feature(&features
, VIRTIO_BLK_F_TOPOLOGY
);
265 virtio_add_feature(&features
, VIRTIO_BLK_F_BLK_SIZE
);
266 virtio_add_feature(&features
, VIRTIO_BLK_F_FLUSH
);
267 virtio_add_feature(&features
, VIRTIO_BLK_F_RO
);
269 if (s
->num_queues
> 1) {
270 virtio_add_feature(&features
, VIRTIO_BLK_F_MQ
);
273 return vhost_get_features(&s
->dev
, user_feature_bits
, features
);
276 static void vhost_user_blk_handle_output(VirtIODevice
*vdev
, VirtQueue
*vq
)
278 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
279 Error
*local_err
= NULL
;
282 if (!vdev
->start_on_kick
) {
290 if (vhost_dev_is_started(&s
->dev
)) {
294 /* Some guests kick before setting VIRTIO_CONFIG_S_DRIVER_OK so start
295 * vhost here instead of waiting for .set_status().
297 ret
= vhost_user_blk_start(vdev
, &local_err
);
299 error_reportf_err(local_err
, "vhost-user-blk: vhost start failed: ");
300 qemu_chr_fe_disconnect(&s
->chardev
);
304 /* Kick right away to begin processing requests already in vring */
305 for (i
= 0; i
< s
->dev
.nvqs
; i
++) {
306 VirtQueue
*kick_vq
= virtio_get_queue(vdev
, i
);
308 if (!virtio_queue_get_desc_addr(vdev
, i
)) {
311 event_notifier_set(virtio_queue_get_host_notifier(kick_vq
));
315 static void vhost_user_blk_reset(VirtIODevice
*vdev
)
317 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
319 vhost_dev_free_inflight(s
->inflight
);
322 static int vhost_user_blk_connect(DeviceState
*dev
, Error
**errp
)
324 VirtIODevice
*vdev
= VIRTIO_DEVICE(dev
);
325 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
333 s
->dev
.num_queues
= s
->num_queues
;
334 s
->dev
.nvqs
= s
->num_queues
;
335 s
->dev
.vqs
= s
->vhost_vqs
;
337 s
->dev
.backend_features
= 0;
339 vhost_dev_set_config_notifier(&s
->dev
, &blk_ops
);
341 s
->vhost_user
.supports_config
= true;
342 ret
= vhost_dev_init(&s
->dev
, &s
->vhost_user
, VHOST_BACKEND_TYPE_USER
, 0,
348 /* restore vhost state */
349 if (virtio_device_started(vdev
, vdev
->status
)) {
350 ret
= vhost_user_blk_start(vdev
, errp
);
359 static void vhost_user_blk_disconnect(DeviceState
*dev
)
361 VirtIODevice
*vdev
= VIRTIO_DEVICE(dev
);
362 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
367 s
->connected
= false;
369 vhost_user_blk_stop(vdev
);
371 vhost_dev_cleanup(&s
->dev
);
373 /* Re-instate the event handler for new connections */
374 qemu_chr_fe_set_handlers(&s
->chardev
, NULL
, NULL
, vhost_user_blk_event
,
375 NULL
, dev
, NULL
, true);
378 static void vhost_user_blk_event(void *opaque
, QEMUChrEvent event
)
380 DeviceState
*dev
= opaque
;
381 VirtIODevice
*vdev
= VIRTIO_DEVICE(dev
);
382 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
383 Error
*local_err
= NULL
;
386 case CHR_EVENT_OPENED
:
387 if (vhost_user_blk_connect(dev
, &local_err
) < 0) {
388 error_report_err(local_err
);
389 qemu_chr_fe_disconnect(&s
->chardev
);
393 case CHR_EVENT_CLOSED
:
394 /* defer close until later to avoid circular close */
395 vhost_user_async_close(dev
, &s
->chardev
, &s
->dev
,
396 vhost_user_blk_disconnect
);
398 case CHR_EVENT_BREAK
:
399 case CHR_EVENT_MUX_IN
:
400 case CHR_EVENT_MUX_OUT
:
406 static int vhost_user_blk_realize_connect(VHostUserBlk
*s
, Error
**errp
)
408 DeviceState
*dev
= &s
->parent_obj
.parent_obj
;
411 s
->connected
= false;
413 ret
= qemu_chr_fe_wait_connected(&s
->chardev
, errp
);
418 ret
= vhost_user_blk_connect(dev
, errp
);
420 qemu_chr_fe_disconnect(&s
->chardev
);
423 assert(s
->connected
);
425 ret
= vhost_dev_get_config(&s
->dev
, (uint8_t *)&s
->blkcfg
,
426 s
->parent_obj
.config_len
, errp
);
428 qemu_chr_fe_disconnect(&s
->chardev
);
429 vhost_dev_cleanup(&s
->dev
);
436 static void vhost_user_blk_device_realize(DeviceState
*dev
, Error
**errp
)
439 VirtIODevice
*vdev
= VIRTIO_DEVICE(dev
);
440 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
445 if (!s
->chardev
.chr
) {
446 error_setg(errp
, "chardev is mandatory");
450 if (s
->num_queues
== VHOST_USER_BLK_AUTO_NUM_QUEUES
) {
453 if (!s
->num_queues
|| s
->num_queues
> VIRTIO_QUEUE_MAX
) {
454 error_setg(errp
, "invalid number of IO queues");
458 if (!s
->queue_size
) {
459 error_setg(errp
, "queue size must be non-zero");
462 if (s
->queue_size
> VIRTQUEUE_MAX_SIZE
) {
463 error_setg(errp
, "queue size must not exceed %d",
468 if (!vhost_user_init(&s
->vhost_user
, &s
->chardev
, errp
)) {
472 config_size
= virtio_get_config_size(&virtio_blk_cfg_size_params
,
473 vdev
->host_features
);
474 virtio_init(vdev
, VIRTIO_ID_BLOCK
, config_size
);
476 s
->virtqs
= g_new(VirtQueue
*, s
->num_queues
);
477 for (i
= 0; i
< s
->num_queues
; i
++) {
478 s
->virtqs
[i
] = virtio_add_queue(vdev
, s
->queue_size
,
479 vhost_user_blk_handle_output
);
482 s
->inflight
= g_new0(struct vhost_inflight
, 1);
483 s
->vhost_vqs
= g_new0(struct vhost_virtqueue
, s
->num_queues
);
485 retries
= REALIZE_CONNECTION_RETRIES
;
489 error_prepend(errp
, "Reconnecting after error: ");
490 error_report_err(*errp
);
493 ret
= vhost_user_blk_realize_connect(s
, errp
);
494 } while (ret
< 0 && retries
--);
500 /* we're fully initialized, now we can operate, so add the handler */
501 qemu_chr_fe_set_handlers(&s
->chardev
, NULL
, NULL
,
502 vhost_user_blk_event
, NULL
, (void *)dev
,
507 g_free(s
->vhost_vqs
);
511 for (i
= 0; i
< s
->num_queues
; i
++) {
512 virtio_delete_queue(s
->virtqs
[i
]);
515 virtio_cleanup(vdev
);
516 vhost_user_cleanup(&s
->vhost_user
);
519 static void vhost_user_blk_device_unrealize(DeviceState
*dev
)
521 VirtIODevice
*vdev
= VIRTIO_DEVICE(dev
);
522 VHostUserBlk
*s
= VHOST_USER_BLK(dev
);
525 virtio_set_status(vdev
, 0);
526 qemu_chr_fe_set_handlers(&s
->chardev
, NULL
, NULL
, NULL
,
527 NULL
, NULL
, NULL
, false);
528 vhost_dev_cleanup(&s
->dev
);
529 vhost_dev_free_inflight(s
->inflight
);
530 g_free(s
->vhost_vqs
);
535 for (i
= 0; i
< s
->num_queues
; i
++) {
536 virtio_delete_queue(s
->virtqs
[i
]);
539 virtio_cleanup(vdev
);
540 vhost_user_cleanup(&s
->vhost_user
);
543 static void vhost_user_blk_instance_init(Object
*obj
)
545 VHostUserBlk
*s
= VHOST_USER_BLK(obj
);
547 device_add_bootindex_property(obj
, &s
->bootindex
, "bootindex",
548 "/disk@0,0", DEVICE(obj
));
551 static struct vhost_dev
*vhost_user_blk_get_vhost(VirtIODevice
*vdev
)
553 VHostUserBlk
*s
= VHOST_USER_BLK(vdev
);
557 static const VMStateDescription vmstate_vhost_user_blk
= {
558 .name
= "vhost-user-blk",
559 .minimum_version_id
= 1,
561 .fields
= (VMStateField
[]) {
562 VMSTATE_VIRTIO_DEVICE
,
563 VMSTATE_END_OF_LIST()
567 static Property vhost_user_blk_properties
[] = {
568 DEFINE_PROP_CHR("chardev", VHostUserBlk
, chardev
),
569 DEFINE_PROP_UINT16("num-queues", VHostUserBlk
, num_queues
,
570 VHOST_USER_BLK_AUTO_NUM_QUEUES
),
571 DEFINE_PROP_UINT32("queue-size", VHostUserBlk
, queue_size
, 128),
572 DEFINE_PROP_BIT64("config-wce", VHostUserBlk
, parent_obj
.host_features
,
573 VIRTIO_BLK_F_CONFIG_WCE
, true),
574 DEFINE_PROP_BIT64("discard", VHostUserBlk
, parent_obj
.host_features
,
575 VIRTIO_BLK_F_DISCARD
, true),
576 DEFINE_PROP_BIT64("write-zeroes", VHostUserBlk
, parent_obj
.host_features
,
577 VIRTIO_BLK_F_WRITE_ZEROES
, true),
578 DEFINE_PROP_END_OF_LIST(),
581 static void vhost_user_blk_class_init(ObjectClass
*klass
, void *data
)
583 DeviceClass
*dc
= DEVICE_CLASS(klass
);
584 VirtioDeviceClass
*vdc
= VIRTIO_DEVICE_CLASS(klass
);
586 device_class_set_props(dc
, vhost_user_blk_properties
);
587 dc
->vmsd
= &vmstate_vhost_user_blk
;
588 set_bit(DEVICE_CATEGORY_STORAGE
, dc
->categories
);
589 vdc
->realize
= vhost_user_blk_device_realize
;
590 vdc
->unrealize
= vhost_user_blk_device_unrealize
;
591 vdc
->get_config
= vhost_user_blk_update_config
;
592 vdc
->set_config
= vhost_user_blk_set_config
;
593 vdc
->get_features
= vhost_user_blk_get_features
;
594 vdc
->set_status
= vhost_user_blk_set_status
;
595 vdc
->reset
= vhost_user_blk_reset
;
596 vdc
->get_vhost
= vhost_user_blk_get_vhost
;
599 static const TypeInfo vhost_user_blk_info
= {
600 .name
= TYPE_VHOST_USER_BLK
,
601 .parent
= TYPE_VIRTIO_DEVICE
,
602 .instance_size
= sizeof(VHostUserBlk
),
603 .instance_init
= vhost_user_blk_instance_init
,
604 .class_init
= vhost_user_blk_class_init
,
607 static void virtio_register_types(void)
609 type_register_static(&vhost_user_blk_info
);
612 type_init(virtio_register_types
)