2 * Virtio Network Device
4 * Copyright IBM, Corp. 2007
7 * Anthony Liguori <aliguori@us.ibm.com>
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
14 #include "qemu/osdep.h"
16 #include "hw/virtio/virtio.h"
18 #include "net/checksum.h"
20 #include "qemu/error-report.h"
21 #include "qemu/timer.h"
22 #include "hw/virtio/virtio-net.h"
23 #include "net/vhost_net.h"
24 #include "hw/virtio/virtio-bus.h"
25 #include "qapi/qmp/qjson.h"
26 #include "qapi-event.h"
27 #include "hw/virtio/virtio-access.h"
29 #define VIRTIO_NET_VM_VERSION 11
31 #define MAC_TABLE_ENTRIES 64
32 #define MAX_VLAN (1 << 12) /* Per 802.1Q definition */
34 /* previously fixed value */
35 #define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
36 /* for now, only allow larger queues; with virtio-1, guest can downsize */
37 #define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
40 * Calculate the number of bytes up to and including the given 'field' of
/* Size in bytes of the leading part of 'container' that ends with 'field'. */
#define endof(container, field) \
    (sizeof(((container *)0)->field) + offsetof(container, field))
46 typedef struct VirtIOFeature
{
51 static VirtIOFeature feature_sizes
[] = {
52 {.flags
= 1 << VIRTIO_NET_F_MAC
,
53 .end
= endof(struct virtio_net_config
, mac
)},
54 {.flags
= 1 << VIRTIO_NET_F_STATUS
,
55 .end
= endof(struct virtio_net_config
, status
)},
56 {.flags
= 1 << VIRTIO_NET_F_MQ
,
57 .end
= endof(struct virtio_net_config
, max_virtqueue_pairs
)},
61 static VirtIONetQueue
*virtio_net_get_subqueue(NetClientState
*nc
)
63 VirtIONet
*n
= qemu_get_nic_opaque(nc
);
65 return &n
->vqs
[nc
->queue_index
];
/*
 * Convert a virtqueue index into a queue-pair index.
 *
 * This is a plain integer division by two, so two consecutive virtqueue
 * indices (2k and 2k + 1) map to the same pair index k.
 */
static int vq2q(int queue_index)
{
    const int vqs_per_pair = 2;

    return queue_index / vqs_per_pair;
}
74 * - we could suppress RX interrupt if we were so inclined.
77 static void virtio_net_get_config(VirtIODevice
*vdev
, uint8_t *config
)
79 VirtIONet
*n
= VIRTIO_NET(vdev
);
80 struct virtio_net_config netcfg
;
82 virtio_stw_p(vdev
, &netcfg
.status
, n
->status
);
83 virtio_stw_p(vdev
, &netcfg
.max_virtqueue_pairs
, n
->max_queues
);
84 memcpy(netcfg
.mac
, n
->mac
, ETH_ALEN
);
85 memcpy(config
, &netcfg
, n
->config_size
);
88 static void virtio_net_set_config(VirtIODevice
*vdev
, const uint8_t *config
)
90 VirtIONet
*n
= VIRTIO_NET(vdev
);
91 struct virtio_net_config netcfg
= {};
93 memcpy(&netcfg
, config
, n
->config_size
);
95 if (!virtio_vdev_has_feature(vdev
, VIRTIO_NET_F_CTRL_MAC_ADDR
) &&
96 !virtio_vdev_has_feature(vdev
, VIRTIO_F_VERSION_1
) &&
97 memcmp(netcfg
.mac
, n
->mac
, ETH_ALEN
)) {
98 memcpy(n
->mac
, netcfg
.mac
, ETH_ALEN
);
99 qemu_format_nic_info_str(qemu_get_queue(n
->nic
), n
->mac
);
103 static bool virtio_net_started(VirtIONet
*n
, uint8_t status
)
105 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
106 return (status
& VIRTIO_CONFIG_S_DRIVER_OK
) &&
107 (n
->status
& VIRTIO_NET_S_LINK_UP
) && vdev
->vm_running
;
110 static void virtio_net_announce_timer(void *opaque
)
112 VirtIONet
*n
= opaque
;
113 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
115 n
->announce_counter
--;
116 n
->status
|= VIRTIO_NET_S_ANNOUNCE
;
117 virtio_notify_config(vdev
);
120 static void virtio_net_vhost_status(VirtIONet
*n
, uint8_t status
)
122 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
123 NetClientState
*nc
= qemu_get_queue(n
->nic
);
124 int queues
= n
->multiqueue
? n
->max_queues
: 1;
126 if (!get_vhost_net(nc
->peer
)) {
130 if ((virtio_net_started(n
, status
) && !nc
->peer
->link_down
) ==
131 !!n
->vhost_started
) {
134 if (!n
->vhost_started
) {
137 if (n
->needs_vnet_hdr_swap
) {
138 error_report("backend does not support %s vnet headers; "
139 "falling back on userspace virtio",
140 virtio_is_big_endian(vdev
) ? "BE" : "LE");
144 /* Any packets outstanding? Purge them to avoid touching rings
145 * when vhost is running.
147 for (i
= 0; i
< queues
; i
++) {
148 NetClientState
*qnc
= qemu_get_subqueue(n
->nic
, i
);
150 /* Purge both directions: TX and RX. */
151 qemu_net_queue_purge(qnc
->peer
->incoming_queue
, qnc
);
152 qemu_net_queue_purge(qnc
->incoming_queue
, qnc
->peer
);
155 n
->vhost_started
= 1;
156 r
= vhost_net_start(vdev
, n
->nic
->ncs
, queues
);
158 error_report("unable to start vhost net: %d: "
159 "falling back on userspace virtio", -r
);
160 n
->vhost_started
= 0;
163 vhost_net_stop(vdev
, n
->nic
->ncs
, queues
);
164 n
->vhost_started
= 0;
168 static int virtio_net_set_vnet_endian_one(VirtIODevice
*vdev
,
169 NetClientState
*peer
,
172 if (virtio_is_big_endian(vdev
)) {
173 return qemu_set_vnet_be(peer
, enable
);
175 return qemu_set_vnet_le(peer
, enable
);
179 static bool virtio_net_set_vnet_endian(VirtIODevice
*vdev
, NetClientState
*ncs
,
180 int queues
, bool enable
)
184 for (i
= 0; i
< queues
; i
++) {
185 if (virtio_net_set_vnet_endian_one(vdev
, ncs
[i
].peer
, enable
) < 0 &&
188 virtio_net_set_vnet_endian_one(vdev
, ncs
[i
].peer
, false);
198 static void virtio_net_vnet_endian_status(VirtIONet
*n
, uint8_t status
)
200 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
201 int queues
= n
->multiqueue
? n
->max_queues
: 1;
203 if (virtio_net_started(n
, status
)) {
204 /* Before using the device, we tell the network backend about the
205 * endianness to use when parsing vnet headers. If the backend
206 * can't do it, we fallback onto fixing the headers in the core
209 n
->needs_vnet_hdr_swap
= virtio_net_set_vnet_endian(vdev
, n
->nic
->ncs
,
211 } else if (virtio_net_started(n
, vdev
->status
)) {
212 /* After using the device, we need to reset the network backend to
213 * the default (guest native endianness), otherwise the guest may
214 * lose network connectivity if it is rebooted into a different
217 virtio_net_set_vnet_endian(vdev
, n
->nic
->ncs
, queues
, false);
221 static void virtio_net_set_status(struct VirtIODevice
*vdev
, uint8_t status
)
223 VirtIONet
*n
= VIRTIO_NET(vdev
);
226 uint8_t queue_status
;
228 virtio_net_vnet_endian_status(n
, status
);
229 virtio_net_vhost_status(n
, status
);
231 for (i
= 0; i
< n
->max_queues
; i
++) {
232 NetClientState
*ncs
= qemu_get_subqueue(n
->nic
, i
);
236 if ((!n
->multiqueue
&& i
!= 0) || i
>= n
->curr_queues
) {
239 queue_status
= status
;
242 virtio_net_started(n
, queue_status
) && !n
->vhost_started
;
245 qemu_flush_queued_packets(ncs
);
248 if (!q
->tx_waiting
) {
254 timer_mod(q
->tx_timer
,
255 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL
) + n
->tx_timeout
);
257 qemu_bh_schedule(q
->tx_bh
);
261 timer_del(q
->tx_timer
);
263 qemu_bh_cancel(q
->tx_bh
);
269 static void virtio_net_set_link_status(NetClientState
*nc
)
271 VirtIONet
*n
= qemu_get_nic_opaque(nc
);
272 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
273 uint16_t old_status
= n
->status
;
276 n
->status
&= ~VIRTIO_NET_S_LINK_UP
;
278 n
->status
|= VIRTIO_NET_S_LINK_UP
;
280 if (n
->status
!= old_status
)
281 virtio_notify_config(vdev
);
283 virtio_net_set_status(vdev
, vdev
->status
);
286 static void rxfilter_notify(NetClientState
*nc
)
288 VirtIONet
*n
= qemu_get_nic_opaque(nc
);
290 if (nc
->rxfilter_notify_enabled
) {
291 gchar
*path
= object_get_canonical_path(OBJECT(n
->qdev
));
292 qapi_event_send_nic_rx_filter_changed(!!n
->netclient_name
,
293 n
->netclient_name
, path
, &error_abort
);
296 /* disable event notification to avoid events flooding */
297 nc
->rxfilter_notify_enabled
= 0;
301 static intList
*get_vlan_table(VirtIONet
*n
)
303 intList
*list
, *entry
;
307 for (i
= 0; i
< MAX_VLAN
>> 5; i
++) {
308 for (j
= 0; n
->vlans
[i
] && j
<= 0x1f; j
++) {
309 if (n
->vlans
[i
] & (1U << j
)) {
310 entry
= g_malloc0(sizeof(*entry
));
311 entry
->value
= (i
<< 5) + j
;
321 static RxFilterInfo
*virtio_net_query_rxfilter(NetClientState
*nc
)
323 VirtIONet
*n
= qemu_get_nic_opaque(nc
);
324 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
326 strList
*str_list
, *entry
;
329 info
= g_malloc0(sizeof(*info
));
330 info
->name
= g_strdup(nc
->name
);
331 info
->promiscuous
= n
->promisc
;
334 info
->unicast
= RX_STATE_NONE
;
335 } else if (n
->alluni
) {
336 info
->unicast
= RX_STATE_ALL
;
338 info
->unicast
= RX_STATE_NORMAL
;
342 info
->multicast
= RX_STATE_NONE
;
343 } else if (n
->allmulti
) {
344 info
->multicast
= RX_STATE_ALL
;
346 info
->multicast
= RX_STATE_NORMAL
;
349 info
->broadcast_allowed
= n
->nobcast
;
350 info
->multicast_overflow
= n
->mac_table
.multi_overflow
;
351 info
->unicast_overflow
= n
->mac_table
.uni_overflow
;
353 info
->main_mac
= qemu_mac_strdup_printf(n
->mac
);
356 for (i
= 0; i
< n
->mac_table
.first_multi
; i
++) {
357 entry
= g_malloc0(sizeof(*entry
));
358 entry
->value
= qemu_mac_strdup_printf(n
->mac_table
.macs
+ i
* ETH_ALEN
);
359 entry
->next
= str_list
;
362 info
->unicast_table
= str_list
;
365 for (i
= n
->mac_table
.first_multi
; i
< n
->mac_table
.in_use
; i
++) {
366 entry
= g_malloc0(sizeof(*entry
));
367 entry
->value
= qemu_mac_strdup_printf(n
->mac_table
.macs
+ i
* ETH_ALEN
);
368 entry
->next
= str_list
;
371 info
->multicast_table
= str_list
;
372 info
->vlan_table
= get_vlan_table(n
);
374 if (!virtio_vdev_has_feature(vdev
, VIRTIO_NET_F_CTRL_VLAN
)) {
375 info
->vlan
= RX_STATE_ALL
;
376 } else if (!info
->vlan_table
) {
377 info
->vlan
= RX_STATE_NONE
;
379 info
->vlan
= RX_STATE_NORMAL
;
382 /* enable event notification after query */
383 nc
->rxfilter_notify_enabled
= 1;
388 static void virtio_net_reset(VirtIODevice
*vdev
)
390 VirtIONet
*n
= VIRTIO_NET(vdev
);
392 /* Reset back to compatibility mode */
399 /* multiqueue is disabled by default */
401 timer_del(n
->announce_timer
);
402 n
->announce_counter
= 0;
403 n
->status
&= ~VIRTIO_NET_S_ANNOUNCE
;
405 /* Flush any MAC and VLAN filter table state */
406 n
->mac_table
.in_use
= 0;
407 n
->mac_table
.first_multi
= 0;
408 n
->mac_table
.multi_overflow
= 0;
409 n
->mac_table
.uni_overflow
= 0;
410 memset(n
->mac_table
.macs
, 0, MAC_TABLE_ENTRIES
* ETH_ALEN
);
411 memcpy(&n
->mac
[0], &n
->nic
->conf
->macaddr
, sizeof(n
->mac
));
412 qemu_format_nic_info_str(qemu_get_queue(n
->nic
), n
->mac
);
413 memset(n
->vlans
, 0, MAX_VLAN
>> 3);
416 static void peer_test_vnet_hdr(VirtIONet
*n
)
418 NetClientState
*nc
= qemu_get_queue(n
->nic
);
423 n
->has_vnet_hdr
= qemu_has_vnet_hdr(nc
->peer
);
426 static int peer_has_vnet_hdr(VirtIONet
*n
)
428 return n
->has_vnet_hdr
;
431 static int peer_has_ufo(VirtIONet
*n
)
433 if (!peer_has_vnet_hdr(n
))
436 n
->has_ufo
= qemu_has_ufo(qemu_get_queue(n
->nic
)->peer
);
441 static void virtio_net_set_mrg_rx_bufs(VirtIONet
*n
, int mergeable_rx_bufs
,
447 n
->mergeable_rx_bufs
= mergeable_rx_bufs
;
450 n
->guest_hdr_len
= sizeof(struct virtio_net_hdr_mrg_rxbuf
);
452 n
->guest_hdr_len
= n
->mergeable_rx_bufs
?
453 sizeof(struct virtio_net_hdr_mrg_rxbuf
) :
454 sizeof(struct virtio_net_hdr
);
457 for (i
= 0; i
< n
->max_queues
; i
++) {
458 nc
= qemu_get_subqueue(n
->nic
, i
);
460 if (peer_has_vnet_hdr(n
) &&
461 qemu_has_vnet_hdr_len(nc
->peer
, n
->guest_hdr_len
)) {
462 qemu_set_vnet_hdr_len(nc
->peer
, n
->guest_hdr_len
);
463 n
->host_hdr_len
= n
->guest_hdr_len
;
468 static int peer_attach(VirtIONet
*n
, int index
)
470 NetClientState
*nc
= qemu_get_subqueue(n
->nic
, index
);
476 if (nc
->peer
->info
->type
== NET_CLIENT_DRIVER_VHOST_USER
) {
477 vhost_set_vring_enable(nc
->peer
, 1);
480 if (nc
->peer
->info
->type
!= NET_CLIENT_DRIVER_TAP
) {
484 return tap_enable(nc
->peer
);
487 static int peer_detach(VirtIONet
*n
, int index
)
489 NetClientState
*nc
= qemu_get_subqueue(n
->nic
, index
);
495 if (nc
->peer
->info
->type
== NET_CLIENT_DRIVER_VHOST_USER
) {
496 vhost_set_vring_enable(nc
->peer
, 0);
499 if (nc
->peer
->info
->type
!= NET_CLIENT_DRIVER_TAP
) {
503 return tap_disable(nc
->peer
);
506 static void virtio_net_set_queues(VirtIONet
*n
)
511 for (i
= 0; i
< n
->max_queues
; i
++) {
512 if (i
< n
->curr_queues
) {
513 r
= peer_attach(n
, i
);
516 r
= peer_detach(n
, i
);
522 static void virtio_net_set_multiqueue(VirtIONet
*n
, int multiqueue
);
524 static uint64_t virtio_net_get_features(VirtIODevice
*vdev
, uint64_t features
,
527 VirtIONet
*n
= VIRTIO_NET(vdev
);
528 NetClientState
*nc
= qemu_get_queue(n
->nic
);
530 /* Firstly sync all virtio-net possible supported features */
531 features
|= n
->host_features
;
533 virtio_add_feature(&features
, VIRTIO_NET_F_MAC
);
535 if (!peer_has_vnet_hdr(n
)) {
536 virtio_clear_feature(&features
, VIRTIO_NET_F_CSUM
);
537 virtio_clear_feature(&features
, VIRTIO_NET_F_HOST_TSO4
);
538 virtio_clear_feature(&features
, VIRTIO_NET_F_HOST_TSO6
);
539 virtio_clear_feature(&features
, VIRTIO_NET_F_HOST_ECN
);
541 virtio_clear_feature(&features
, VIRTIO_NET_F_GUEST_CSUM
);
542 virtio_clear_feature(&features
, VIRTIO_NET_F_GUEST_TSO4
);
543 virtio_clear_feature(&features
, VIRTIO_NET_F_GUEST_TSO6
);
544 virtio_clear_feature(&features
, VIRTIO_NET_F_GUEST_ECN
);
547 if (!peer_has_vnet_hdr(n
) || !peer_has_ufo(n
)) {
548 virtio_clear_feature(&features
, VIRTIO_NET_F_GUEST_UFO
);
549 virtio_clear_feature(&features
, VIRTIO_NET_F_HOST_UFO
);
552 if (!get_vhost_net(nc
->peer
)) {
555 return vhost_net_get_features(get_vhost_net(nc
->peer
), features
);
558 static uint64_t virtio_net_bad_features(VirtIODevice
*vdev
)
560 uint64_t features
= 0;
562 /* Linux kernel 2.6.25. It understood MAC (as everyone must),
564 virtio_add_feature(&features
, VIRTIO_NET_F_MAC
);
565 virtio_add_feature(&features
, VIRTIO_NET_F_CSUM
);
566 virtio_add_feature(&features
, VIRTIO_NET_F_HOST_TSO4
);
567 virtio_add_feature(&features
, VIRTIO_NET_F_HOST_TSO6
);
568 virtio_add_feature(&features
, VIRTIO_NET_F_HOST_ECN
);
573 static void virtio_net_apply_guest_offloads(VirtIONet
*n
)
575 qemu_set_offload(qemu_get_queue(n
->nic
)->peer
,
576 !!(n
->curr_guest_offloads
& (1ULL << VIRTIO_NET_F_GUEST_CSUM
)),
577 !!(n
->curr_guest_offloads
& (1ULL << VIRTIO_NET_F_GUEST_TSO4
)),
578 !!(n
->curr_guest_offloads
& (1ULL << VIRTIO_NET_F_GUEST_TSO6
)),
579 !!(n
->curr_guest_offloads
& (1ULL << VIRTIO_NET_F_GUEST_ECN
)),
580 !!(n
->curr_guest_offloads
& (1ULL << VIRTIO_NET_F_GUEST_UFO
)));
583 static uint64_t virtio_net_guest_offloads_by_features(uint32_t features
)
585 static const uint64_t guest_offloads_mask
=
586 (1ULL << VIRTIO_NET_F_GUEST_CSUM
) |
587 (1ULL << VIRTIO_NET_F_GUEST_TSO4
) |
588 (1ULL << VIRTIO_NET_F_GUEST_TSO6
) |
589 (1ULL << VIRTIO_NET_F_GUEST_ECN
) |
590 (1ULL << VIRTIO_NET_F_GUEST_UFO
);
592 return guest_offloads_mask
& features
;
595 static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet
*n
)
597 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
598 return virtio_net_guest_offloads_by_features(vdev
->guest_features
);
601 static void virtio_net_set_features(VirtIODevice
*vdev
, uint64_t features
)
603 VirtIONet
*n
= VIRTIO_NET(vdev
);
606 virtio_net_set_multiqueue(n
,
607 virtio_has_feature(features
, VIRTIO_NET_F_MQ
));
609 virtio_net_set_mrg_rx_bufs(n
,
610 virtio_has_feature(features
,
611 VIRTIO_NET_F_MRG_RXBUF
),
612 virtio_has_feature(features
,
613 VIRTIO_F_VERSION_1
));
615 if (n
->has_vnet_hdr
) {
616 n
->curr_guest_offloads
=
617 virtio_net_guest_offloads_by_features(features
);
618 virtio_net_apply_guest_offloads(n
);
621 for (i
= 0; i
< n
->max_queues
; i
++) {
622 NetClientState
*nc
= qemu_get_subqueue(n
->nic
, i
);
624 if (!get_vhost_net(nc
->peer
)) {
627 vhost_net_ack_features(get_vhost_net(nc
->peer
), features
);
630 if (virtio_has_feature(features
, VIRTIO_NET_F_CTRL_VLAN
)) {
631 memset(n
->vlans
, 0, MAX_VLAN
>> 3);
633 memset(n
->vlans
, 0xff, MAX_VLAN
>> 3);
637 static int virtio_net_handle_rx_mode(VirtIONet
*n
, uint8_t cmd
,
638 struct iovec
*iov
, unsigned int iov_cnt
)
642 NetClientState
*nc
= qemu_get_queue(n
->nic
);
644 s
= iov_to_buf(iov
, iov_cnt
, 0, &on
, sizeof(on
));
645 if (s
!= sizeof(on
)) {
646 return VIRTIO_NET_ERR
;
649 if (cmd
== VIRTIO_NET_CTRL_RX_PROMISC
) {
651 } else if (cmd
== VIRTIO_NET_CTRL_RX_ALLMULTI
) {
653 } else if (cmd
== VIRTIO_NET_CTRL_RX_ALLUNI
) {
655 } else if (cmd
== VIRTIO_NET_CTRL_RX_NOMULTI
) {
657 } else if (cmd
== VIRTIO_NET_CTRL_RX_NOUNI
) {
659 } else if (cmd
== VIRTIO_NET_CTRL_RX_NOBCAST
) {
662 return VIRTIO_NET_ERR
;
667 return VIRTIO_NET_OK
;
670 static int virtio_net_handle_offloads(VirtIONet
*n
, uint8_t cmd
,
671 struct iovec
*iov
, unsigned int iov_cnt
)
673 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
677 if (!virtio_vdev_has_feature(vdev
, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS
)) {
678 return VIRTIO_NET_ERR
;
681 s
= iov_to_buf(iov
, iov_cnt
, 0, &offloads
, sizeof(offloads
));
682 if (s
!= sizeof(offloads
)) {
683 return VIRTIO_NET_ERR
;
686 if (cmd
== VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET
) {
687 uint64_t supported_offloads
;
689 if (!n
->has_vnet_hdr
) {
690 return VIRTIO_NET_ERR
;
693 supported_offloads
= virtio_net_supported_guest_offloads(n
);
694 if (offloads
& ~supported_offloads
) {
695 return VIRTIO_NET_ERR
;
698 n
->curr_guest_offloads
= offloads
;
699 virtio_net_apply_guest_offloads(n
);
701 return VIRTIO_NET_OK
;
703 return VIRTIO_NET_ERR
;
707 static int virtio_net_handle_mac(VirtIONet
*n
, uint8_t cmd
,
708 struct iovec
*iov
, unsigned int iov_cnt
)
710 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
711 struct virtio_net_ctrl_mac mac_data
;
713 NetClientState
*nc
= qemu_get_queue(n
->nic
);
715 if (cmd
== VIRTIO_NET_CTRL_MAC_ADDR_SET
) {
716 if (iov_size(iov
, iov_cnt
) != sizeof(n
->mac
)) {
717 return VIRTIO_NET_ERR
;
719 s
= iov_to_buf(iov
, iov_cnt
, 0, &n
->mac
, sizeof(n
->mac
));
720 assert(s
== sizeof(n
->mac
));
721 qemu_format_nic_info_str(qemu_get_queue(n
->nic
), n
->mac
);
724 return VIRTIO_NET_OK
;
727 if (cmd
!= VIRTIO_NET_CTRL_MAC_TABLE_SET
) {
728 return VIRTIO_NET_ERR
;
733 uint8_t uni_overflow
= 0;
734 uint8_t multi_overflow
= 0;
735 uint8_t *macs
= g_malloc0(MAC_TABLE_ENTRIES
* ETH_ALEN
);
737 s
= iov_to_buf(iov
, iov_cnt
, 0, &mac_data
.entries
,
738 sizeof(mac_data
.entries
));
739 mac_data
.entries
= virtio_ldl_p(vdev
, &mac_data
.entries
);
740 if (s
!= sizeof(mac_data
.entries
)) {
743 iov_discard_front(&iov
, &iov_cnt
, s
);
745 if (mac_data
.entries
* ETH_ALEN
> iov_size(iov
, iov_cnt
)) {
749 if (mac_data
.entries
<= MAC_TABLE_ENTRIES
) {
750 s
= iov_to_buf(iov
, iov_cnt
, 0, macs
,
751 mac_data
.entries
* ETH_ALEN
);
752 if (s
!= mac_data
.entries
* ETH_ALEN
) {
755 in_use
+= mac_data
.entries
;
760 iov_discard_front(&iov
, &iov_cnt
, mac_data
.entries
* ETH_ALEN
);
762 first_multi
= in_use
;
764 s
= iov_to_buf(iov
, iov_cnt
, 0, &mac_data
.entries
,
765 sizeof(mac_data
.entries
));
766 mac_data
.entries
= virtio_ldl_p(vdev
, &mac_data
.entries
);
767 if (s
!= sizeof(mac_data
.entries
)) {
771 iov_discard_front(&iov
, &iov_cnt
, s
);
773 if (mac_data
.entries
* ETH_ALEN
!= iov_size(iov
, iov_cnt
)) {
777 if (mac_data
.entries
<= MAC_TABLE_ENTRIES
- in_use
) {
778 s
= iov_to_buf(iov
, iov_cnt
, 0, &macs
[in_use
* ETH_ALEN
],
779 mac_data
.entries
* ETH_ALEN
);
780 if (s
!= mac_data
.entries
* ETH_ALEN
) {
783 in_use
+= mac_data
.entries
;
788 n
->mac_table
.in_use
= in_use
;
789 n
->mac_table
.first_multi
= first_multi
;
790 n
->mac_table
.uni_overflow
= uni_overflow
;
791 n
->mac_table
.multi_overflow
= multi_overflow
;
792 memcpy(n
->mac_table
.macs
, macs
, MAC_TABLE_ENTRIES
* ETH_ALEN
);
796 return VIRTIO_NET_OK
;
800 return VIRTIO_NET_ERR
;
803 static int virtio_net_handle_vlan_table(VirtIONet
*n
, uint8_t cmd
,
804 struct iovec
*iov
, unsigned int iov_cnt
)
806 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
809 NetClientState
*nc
= qemu_get_queue(n
->nic
);
811 s
= iov_to_buf(iov
, iov_cnt
, 0, &vid
, sizeof(vid
));
812 vid
= virtio_lduw_p(vdev
, &vid
);
813 if (s
!= sizeof(vid
)) {
814 return VIRTIO_NET_ERR
;
818 return VIRTIO_NET_ERR
;
820 if (cmd
== VIRTIO_NET_CTRL_VLAN_ADD
)
821 n
->vlans
[vid
>> 5] |= (1U << (vid
& 0x1f));
822 else if (cmd
== VIRTIO_NET_CTRL_VLAN_DEL
)
823 n
->vlans
[vid
>> 5] &= ~(1U << (vid
& 0x1f));
825 return VIRTIO_NET_ERR
;
829 return VIRTIO_NET_OK
;
832 static int virtio_net_handle_announce(VirtIONet
*n
, uint8_t cmd
,
833 struct iovec
*iov
, unsigned int iov_cnt
)
835 if (cmd
== VIRTIO_NET_CTRL_ANNOUNCE_ACK
&&
836 n
->status
& VIRTIO_NET_S_ANNOUNCE
) {
837 n
->status
&= ~VIRTIO_NET_S_ANNOUNCE
;
838 if (n
->announce_counter
) {
839 timer_mod(n
->announce_timer
,
840 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL
) +
841 self_announce_delay(n
->announce_counter
));
843 return VIRTIO_NET_OK
;
845 return VIRTIO_NET_ERR
;
849 static int virtio_net_handle_mq(VirtIONet
*n
, uint8_t cmd
,
850 struct iovec
*iov
, unsigned int iov_cnt
)
852 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
853 struct virtio_net_ctrl_mq mq
;
857 s
= iov_to_buf(iov
, iov_cnt
, 0, &mq
, sizeof(mq
));
858 if (s
!= sizeof(mq
)) {
859 return VIRTIO_NET_ERR
;
862 if (cmd
!= VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET
) {
863 return VIRTIO_NET_ERR
;
866 queues
= virtio_lduw_p(vdev
, &mq
.virtqueue_pairs
);
868 if (queues
< VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN
||
869 queues
> VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX
||
870 queues
> n
->max_queues
||
872 return VIRTIO_NET_ERR
;
875 n
->curr_queues
= queues
;
876 /* stop the backend before changing the number of queues to avoid handling a
878 virtio_net_set_status(vdev
, vdev
->status
);
879 virtio_net_set_queues(n
);
881 return VIRTIO_NET_OK
;
883 static void virtio_net_handle_ctrl(VirtIODevice
*vdev
, VirtQueue
*vq
)
885 VirtIONet
*n
= VIRTIO_NET(vdev
);
886 struct virtio_net_ctrl_hdr ctrl
;
887 virtio_net_ctrl_ack status
= VIRTIO_NET_ERR
;
888 VirtQueueElement
*elem
;
890 struct iovec
*iov
, *iov2
;
891 unsigned int iov_cnt
;
894 elem
= virtqueue_pop(vq
, sizeof(VirtQueueElement
));
898 if (iov_size(elem
->in_sg
, elem
->in_num
) < sizeof(status
) ||
899 iov_size(elem
->out_sg
, elem
->out_num
) < sizeof(ctrl
)) {
900 error_report("virtio-net ctrl missing headers");
904 iov_cnt
= elem
->out_num
;
905 iov2
= iov
= g_memdup(elem
->out_sg
, sizeof(struct iovec
) * elem
->out_num
);
906 s
= iov_to_buf(iov
, iov_cnt
, 0, &ctrl
, sizeof(ctrl
));
907 iov_discard_front(&iov
, &iov_cnt
, sizeof(ctrl
));
908 if (s
!= sizeof(ctrl
)) {
909 status
= VIRTIO_NET_ERR
;
910 } else if (ctrl
.class == VIRTIO_NET_CTRL_RX
) {
911 status
= virtio_net_handle_rx_mode(n
, ctrl
.cmd
, iov
, iov_cnt
);
912 } else if (ctrl
.class == VIRTIO_NET_CTRL_MAC
) {
913 status
= virtio_net_handle_mac(n
, ctrl
.cmd
, iov
, iov_cnt
);
914 } else if (ctrl
.class == VIRTIO_NET_CTRL_VLAN
) {
915 status
= virtio_net_handle_vlan_table(n
, ctrl
.cmd
, iov
, iov_cnt
);
916 } else if (ctrl
.class == VIRTIO_NET_CTRL_ANNOUNCE
) {
917 status
= virtio_net_handle_announce(n
, ctrl
.cmd
, iov
, iov_cnt
);
918 } else if (ctrl
.class == VIRTIO_NET_CTRL_MQ
) {
919 status
= virtio_net_handle_mq(n
, ctrl
.cmd
, iov
, iov_cnt
);
920 } else if (ctrl
.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS
) {
921 status
= virtio_net_handle_offloads(n
, ctrl
.cmd
, iov
, iov_cnt
);
924 s
= iov_from_buf(elem
->in_sg
, elem
->in_num
, 0, &status
, sizeof(status
));
925 assert(s
== sizeof(status
));
927 virtqueue_push(vq
, elem
, sizeof(status
));
928 virtio_notify(vdev
, vq
);
936 static void virtio_net_handle_rx(VirtIODevice
*vdev
, VirtQueue
*vq
)
938 VirtIONet
*n
= VIRTIO_NET(vdev
);
939 int queue_index
= vq2q(virtio_get_queue_index(vq
));
941 qemu_flush_queued_packets(qemu_get_subqueue(n
->nic
, queue_index
));
944 static int virtio_net_can_receive(NetClientState
*nc
)
946 VirtIONet
*n
= qemu_get_nic_opaque(nc
);
947 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
948 VirtIONetQueue
*q
= virtio_net_get_subqueue(nc
);
950 if (!vdev
->vm_running
) {
954 if (nc
->queue_index
>= n
->curr_queues
) {
958 if (!virtio_queue_ready(q
->rx_vq
) ||
959 !(vdev
->status
& VIRTIO_CONFIG_S_DRIVER_OK
)) {
966 static int virtio_net_has_buffers(VirtIONetQueue
*q
, int bufsize
)
969 if (virtio_queue_empty(q
->rx_vq
) ||
970 (n
->mergeable_rx_bufs
&&
971 !virtqueue_avail_bytes(q
->rx_vq
, bufsize
, 0))) {
972 virtio_queue_set_notification(q
->rx_vq
, 1);
974 /* To avoid a race condition where the guest has made some buffers
975 * available after the above check but before notification was
976 * enabled, check for available buffers again.
978 if (virtio_queue_empty(q
->rx_vq
) ||
979 (n
->mergeable_rx_bufs
&&
980 !virtqueue_avail_bytes(q
->rx_vq
, bufsize
, 0))) {
985 virtio_queue_set_notification(q
->rx_vq
, 0);
989 static void virtio_net_hdr_swap(VirtIODevice
*vdev
, struct virtio_net_hdr
*hdr
)
991 virtio_tswap16s(vdev
, &hdr
->hdr_len
);
992 virtio_tswap16s(vdev
, &hdr
->gso_size
);
993 virtio_tswap16s(vdev
, &hdr
->csum_start
);
994 virtio_tswap16s(vdev
, &hdr
->csum_offset
);
997 /* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
998 * it never finds out that the packets don't have valid checksums. This
999 * causes dhclient to get upset. Fedora's carried a patch for ages to
1000 * fix this with Xen but it hasn't appeared in an upstream release of
1003 * To avoid breaking existing guests, we catch udp packets and add
1004 * checksums. This is terrible but it's better than hacking the guest
1007 * N.B. if we introduce a zero-copy API, this operation is no longer free so
1008 * we should provide a mechanism to disable it to avoid polluting the host
1011 static void work_around_broken_dhclient(struct virtio_net_hdr
*hdr
,
1012 uint8_t *buf
, size_t size
)
1014 if ((hdr
->flags
& VIRTIO_NET_HDR_F_NEEDS_CSUM
) && /* missing csum */
1015 (size
> 27 && size
< 1500) && /* normal sized MTU */
1016 (buf
[12] == 0x08 && buf
[13] == 0x00) && /* ethertype == IPv4 */
1017 (buf
[23] == 17) && /* ip.protocol == UDP */
1018 (buf
[34] == 0 && buf
[35] == 67)) { /* udp.srcport == bootps */
1019 net_checksum_calculate(buf
, size
);
1020 hdr
->flags
&= ~VIRTIO_NET_HDR_F_NEEDS_CSUM
;
1024 static void receive_header(VirtIONet
*n
, const struct iovec
*iov
, int iov_cnt
,
1025 const void *buf
, size_t size
)
1027 if (n
->has_vnet_hdr
) {
1028 /* FIXME this cast is evil */
1029 void *wbuf
= (void *)buf
;
1030 work_around_broken_dhclient(wbuf
, wbuf
+ n
->host_hdr_len
,
1031 size
- n
->host_hdr_len
);
1033 if (n
->needs_vnet_hdr_swap
) {
1034 virtio_net_hdr_swap(VIRTIO_DEVICE(n
), wbuf
);
1036 iov_from_buf(iov
, iov_cnt
, 0, buf
, sizeof(struct virtio_net_hdr
));
1038 struct virtio_net_hdr hdr
= {
1040 .gso_type
= VIRTIO_NET_HDR_GSO_NONE
1042 iov_from_buf(iov
, iov_cnt
, 0, &hdr
, sizeof hdr
);
1046 static int receive_filter(VirtIONet
*n
, const uint8_t *buf
, int size
)
1048 static const uint8_t bcast
[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
1049 static const uint8_t vlan
[] = {0x81, 0x00};
1050 uint8_t *ptr
= (uint8_t *)buf
;
1056 ptr
+= n
->host_hdr_len
;
1058 if (!memcmp(&ptr
[12], vlan
, sizeof(vlan
))) {
1059 int vid
= lduw_be_p(ptr
+ 14) & 0xfff;
1060 if (!(n
->vlans
[vid
>> 5] & (1U << (vid
& 0x1f))))
1064 if (ptr
[0] & 1) { // multicast
1065 if (!memcmp(ptr
, bcast
, sizeof(bcast
))) {
1067 } else if (n
->nomulti
) {
1069 } else if (n
->allmulti
|| n
->mac_table
.multi_overflow
) {
1073 for (i
= n
->mac_table
.first_multi
; i
< n
->mac_table
.in_use
; i
++) {
1074 if (!memcmp(ptr
, &n
->mac_table
.macs
[i
* ETH_ALEN
], ETH_ALEN
)) {
1081 } else if (n
->alluni
|| n
->mac_table
.uni_overflow
) {
1083 } else if (!memcmp(ptr
, n
->mac
, ETH_ALEN
)) {
1087 for (i
= 0; i
< n
->mac_table
.first_multi
; i
++) {
1088 if (!memcmp(ptr
, &n
->mac_table
.macs
[i
* ETH_ALEN
], ETH_ALEN
)) {
1097 static ssize_t
virtio_net_receive(NetClientState
*nc
, const uint8_t *buf
, size_t size
)
1099 VirtIONet
*n
= qemu_get_nic_opaque(nc
);
1100 VirtIONetQueue
*q
= virtio_net_get_subqueue(nc
);
1101 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1102 struct iovec mhdr_sg
[VIRTQUEUE_MAX_SIZE
];
1103 struct virtio_net_hdr_mrg_rxbuf mhdr
;
1104 unsigned mhdr_cnt
= 0;
1105 size_t offset
, i
, guest_offset
;
1107 if (!virtio_net_can_receive(nc
)) {
1111 /* hdr_len refers to the header we supply to the guest */
1112 if (!virtio_net_has_buffers(q
, size
+ n
->guest_hdr_len
- n
->host_hdr_len
)) {
1116 if (!receive_filter(n
, buf
, size
))
1121 while (offset
< size
) {
1122 VirtQueueElement
*elem
;
1124 const struct iovec
*sg
;
1128 elem
= virtqueue_pop(q
->rx_vq
, sizeof(VirtQueueElement
));
1132 error_report("virtio-net unexpected empty queue: "
1133 "i %zd mergeable %d offset %zd, size %zd, "
1134 "guest hdr len %zd, host hdr len %zd "
1135 "guest features 0x%" PRIx64
,
1136 i
, n
->mergeable_rx_bufs
, offset
, size
,
1137 n
->guest_hdr_len
, n
->host_hdr_len
,
1138 vdev
->guest_features
);
1142 if (elem
->in_num
< 1) {
1143 error_report("virtio-net receive queue contains no in buffers");
1149 assert(offset
== 0);
1150 if (n
->mergeable_rx_bufs
) {
1151 mhdr_cnt
= iov_copy(mhdr_sg
, ARRAY_SIZE(mhdr_sg
),
1153 offsetof(typeof(mhdr
), num_buffers
),
1154 sizeof(mhdr
.num_buffers
));
1157 receive_header(n
, sg
, elem
->in_num
, buf
, size
);
1158 offset
= n
->host_hdr_len
;
1159 total
+= n
->guest_hdr_len
;
1160 guest_offset
= n
->guest_hdr_len
;
1165 /* copy in packet. ugh */
1166 len
= iov_from_buf(sg
, elem
->in_num
, guest_offset
,
1167 buf
+ offset
, size
- offset
);
1170 /* If buffers can't be merged, at this point we
1171 * must have consumed the complete packet.
1172 * Otherwise, drop it. */
1173 if (!n
->mergeable_rx_bufs
&& offset
< size
) {
1174 virtqueue_discard(q
->rx_vq
, elem
, total
);
1179 /* signal other side */
1180 virtqueue_fill(q
->rx_vq
, elem
, total
, i
++);
1185 virtio_stw_p(vdev
, &mhdr
.num_buffers
, i
);
1186 iov_from_buf(mhdr_sg
, mhdr_cnt
,
1188 &mhdr
.num_buffers
, sizeof mhdr
.num_buffers
);
1191 virtqueue_flush(q
->rx_vq
, i
);
1192 virtio_notify(vdev
, q
->rx_vq
);
1197 static int32_t virtio_net_flush_tx(VirtIONetQueue
*q
);
1199 static void virtio_net_tx_complete(NetClientState
*nc
, ssize_t len
)
1201 VirtIONet
*n
= qemu_get_nic_opaque(nc
);
1202 VirtIONetQueue
*q
= virtio_net_get_subqueue(nc
);
1203 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1205 virtqueue_push(q
->tx_vq
, q
->async_tx
.elem
, 0);
1206 virtio_notify(vdev
, q
->tx_vq
);
1208 g_free(q
->async_tx
.elem
);
1209 q
->async_tx
.elem
= NULL
;
1211 virtio_queue_set_notification(q
->tx_vq
, 1);
1212 virtio_net_flush_tx(q
);
1216 static int32_t virtio_net_flush_tx(VirtIONetQueue
*q
)
1218 VirtIONet
*n
= q
->n
;
1219 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1220 VirtQueueElement
*elem
;
1221 int32_t num_packets
= 0;
1222 int queue_index
= vq2q(virtio_get_queue_index(q
->tx_vq
));
1223 if (!(vdev
->status
& VIRTIO_CONFIG_S_DRIVER_OK
)) {
1227 if (q
->async_tx
.elem
) {
1228 virtio_queue_set_notification(q
->tx_vq
, 0);
1234 unsigned int out_num
;
1235 struct iovec sg
[VIRTQUEUE_MAX_SIZE
], sg2
[VIRTQUEUE_MAX_SIZE
+ 1], *out_sg
;
1236 struct virtio_net_hdr_mrg_rxbuf mhdr
;
1238 elem
= virtqueue_pop(q
->tx_vq
, sizeof(VirtQueueElement
));
1243 out_num
= elem
->out_num
;
1244 out_sg
= elem
->out_sg
;
1246 error_report("virtio-net header not in first element");
1250 if (n
->has_vnet_hdr
) {
1251 if (iov_to_buf(out_sg
, out_num
, 0, &mhdr
, n
->guest_hdr_len
) <
1253 error_report("virtio-net header incorrect");
1256 if (n
->needs_vnet_hdr_swap
) {
1257 virtio_net_hdr_swap(vdev
, (void *) &mhdr
);
1258 sg2
[0].iov_base
= &mhdr
;
1259 sg2
[0].iov_len
= n
->guest_hdr_len
;
1260 out_num
= iov_copy(&sg2
[1], ARRAY_SIZE(sg2
) - 1,
1262 n
->guest_hdr_len
, -1);
1263 if (out_num
== VIRTQUEUE_MAX_SIZE
) {
1271 * If host wants to see the guest header as is, we can
1272 * pass it on unchanged. Otherwise, copy just the parts
1273 * that host is interested in.
1275 assert(n
->host_hdr_len
<= n
->guest_hdr_len
);
1276 if (n
->host_hdr_len
!= n
->guest_hdr_len
) {
1277 unsigned sg_num
= iov_copy(sg
, ARRAY_SIZE(sg
),
1279 0, n
->host_hdr_len
);
1280 sg_num
+= iov_copy(sg
+ sg_num
, ARRAY_SIZE(sg
) - sg_num
,
1282 n
->guest_hdr_len
, -1);
1287 ret
= qemu_sendv_packet_async(qemu_get_subqueue(n
->nic
, queue_index
),
1288 out_sg
, out_num
, virtio_net_tx_complete
);
1290 virtio_queue_set_notification(q
->tx_vq
, 0);
1291 q
->async_tx
.elem
= elem
;
1296 virtqueue_push(q
->tx_vq
, elem
, 0);
1297 virtio_notify(vdev
, q
->tx_vq
);
1300 if (++num_packets
>= n
->tx_burst
) {
1307 static void virtio_net_handle_tx_timer(VirtIODevice
*vdev
, VirtQueue
*vq
)
1309 VirtIONet
*n
= VIRTIO_NET(vdev
);
1310 VirtIONetQueue
*q
= &n
->vqs
[vq2q(virtio_get_queue_index(vq
))];
1312 /* This happens when device was stopped but VCPU wasn't. */
1313 if (!vdev
->vm_running
) {
1318 if (q
->tx_waiting
) {
1319 virtio_queue_set_notification(vq
, 1);
1320 timer_del(q
->tx_timer
);
1322 virtio_net_flush_tx(q
);
1324 timer_mod(q
->tx_timer
,
1325 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL
) + n
->tx_timeout
);
1327 virtio_queue_set_notification(vq
, 0);
1331 static void virtio_net_handle_tx_bh(VirtIODevice
*vdev
, VirtQueue
*vq
)
1333 VirtIONet
*n
= VIRTIO_NET(vdev
);
1334 VirtIONetQueue
*q
= &n
->vqs
[vq2q(virtio_get_queue_index(vq
))];
1336 if (unlikely(q
->tx_waiting
)) {
1340 /* This happens when device was stopped but VCPU wasn't. */
1341 if (!vdev
->vm_running
) {
1344 virtio_queue_set_notification(vq
, 0);
1345 qemu_bh_schedule(q
->tx_bh
);
1348 static void virtio_net_tx_timer(void *opaque
)
1350 VirtIONetQueue
*q
= opaque
;
1351 VirtIONet
*n
= q
->n
;
1352 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1353 /* This happens when device was stopped but BH wasn't. */
1354 if (!vdev
->vm_running
) {
1355 /* Make sure tx waiting is set, so we'll run when restarted. */
1356 assert(q
->tx_waiting
);
1362 /* Just in case the driver is not ready any more */
1363 if (!(vdev
->status
& VIRTIO_CONFIG_S_DRIVER_OK
)) {
1367 virtio_queue_set_notification(q
->tx_vq
, 1);
1368 virtio_net_flush_tx(q
);
1371 static void virtio_net_tx_bh(void *opaque
)
1373 VirtIONetQueue
*q
= opaque
;
1374 VirtIONet
*n
= q
->n
;
1375 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1378 /* This happens when device was stopped but BH wasn't. */
1379 if (!vdev
->vm_running
) {
1380 /* Make sure tx waiting is set, so we'll run when restarted. */
1381 assert(q
->tx_waiting
);
1387 /* Just in case the driver is not ready any more */
1388 if (unlikely(!(vdev
->status
& VIRTIO_CONFIG_S_DRIVER_OK
))) {
1392 ret
= virtio_net_flush_tx(q
);
1393 if (ret
== -EBUSY
) {
1394 return; /* Notification re-enable handled by tx_complete */
1397 /* If we flush a full burst of packets, assume there are
1398 * more coming and immediately reschedule */
1399 if (ret
>= n
->tx_burst
) {
1400 qemu_bh_schedule(q
->tx_bh
);
1405 /* If less than a full burst, re-enable notification and flush
1406 * anything that may have come in while we weren't looking. If
1407 * we find something, assume the guest is still active and reschedule */
1408 virtio_queue_set_notification(q
->tx_vq
, 1);
1409 if (virtio_net_flush_tx(q
) > 0) {
1410 virtio_queue_set_notification(q
->tx_vq
, 0);
1411 qemu_bh_schedule(q
->tx_bh
);
1416 static void virtio_net_add_queue(VirtIONet
*n
, int index
)
1418 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1420 n
->vqs
[index
].rx_vq
= virtio_add_queue(vdev
, n
->net_conf
.rx_queue_size
,
1421 virtio_net_handle_rx
);
1422 if (n
->net_conf
.tx
&& !strcmp(n
->net_conf
.tx
, "timer")) {
1423 n
->vqs
[index
].tx_vq
=
1424 virtio_add_queue(vdev
, 256, virtio_net_handle_tx_timer
);
1425 n
->vqs
[index
].tx_timer
= timer_new_ns(QEMU_CLOCK_VIRTUAL
,
1426 virtio_net_tx_timer
,
1429 n
->vqs
[index
].tx_vq
=
1430 virtio_add_queue(vdev
, 256, virtio_net_handle_tx_bh
);
1431 n
->vqs
[index
].tx_bh
= qemu_bh_new(virtio_net_tx_bh
, &n
->vqs
[index
]);
1434 n
->vqs
[index
].tx_waiting
= 0;
1435 n
->vqs
[index
].n
= n
;
1438 static void virtio_net_del_queue(VirtIONet
*n
, int index
)
1440 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1441 VirtIONetQueue
*q
= &n
->vqs
[index
];
1442 NetClientState
*nc
= qemu_get_subqueue(n
->nic
, index
);
1444 qemu_purge_queued_packets(nc
);
1446 virtio_del_queue(vdev
, index
* 2);
1448 timer_del(q
->tx_timer
);
1449 timer_free(q
->tx_timer
);
1451 qemu_bh_delete(q
->tx_bh
);
1453 virtio_del_queue(vdev
, index
* 2 + 1);
1456 static void virtio_net_change_num_queues(VirtIONet
*n
, int new_max_queues
)
1458 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1459 int old_num_queues
= virtio_get_num_queues(vdev
);
1460 int new_num_queues
= new_max_queues
* 2 + 1;
1463 assert(old_num_queues
>= 3);
1464 assert(old_num_queues
% 2 == 1);
1466 if (old_num_queues
== new_num_queues
) {
1471 * We always need to remove and add ctrl vq if
1472 * old_num_queues != new_num_queues. Remove ctrl_vq first,
1473 * and then we only enter one of the following two loops.
1475 virtio_del_queue(vdev
, old_num_queues
- 1);
1477 for (i
= new_num_queues
- 1; i
< old_num_queues
- 1; i
+= 2) {
1478 /* new_num_queues < old_num_queues */
1479 virtio_net_del_queue(n
, i
/ 2);
1482 for (i
= old_num_queues
- 1; i
< new_num_queues
- 1; i
+= 2) {
1483 /* new_num_queues > old_num_queues */
1484 virtio_net_add_queue(n
, i
/ 2);
1487 /* add ctrl_vq last */
1488 n
->ctrl_vq
= virtio_add_queue(vdev
, 64, virtio_net_handle_ctrl
);
1491 static void virtio_net_set_multiqueue(VirtIONet
*n
, int multiqueue
)
1493 int max
= multiqueue
? n
->max_queues
: 1;
1495 n
->multiqueue
= multiqueue
;
1496 virtio_net_change_num_queues(n
, max
);
1498 virtio_net_set_queues(n
);
1501 static void virtio_net_save(QEMUFile
*f
, void *opaque
, size_t size
)
1503 VirtIONet
*n
= opaque
;
1504 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1506 /* At this point, backend must be stopped, otherwise
1507 * it might keep writing to memory. */
1508 assert(!n
->vhost_started
);
1509 virtio_save(vdev
, f
);
1512 static void virtio_net_save_device(VirtIODevice
*vdev
, QEMUFile
*f
)
1514 VirtIONet
*n
= VIRTIO_NET(vdev
);
1517 qemu_put_buffer(f
, n
->mac
, ETH_ALEN
);
1518 qemu_put_be32(f
, n
->vqs
[0].tx_waiting
);
1519 qemu_put_be32(f
, n
->mergeable_rx_bufs
);
1520 qemu_put_be16(f
, n
->status
);
1521 qemu_put_byte(f
, n
->promisc
);
1522 qemu_put_byte(f
, n
->allmulti
);
1523 qemu_put_be32(f
, n
->mac_table
.in_use
);
1524 qemu_put_buffer(f
, n
->mac_table
.macs
, n
->mac_table
.in_use
* ETH_ALEN
);
1525 qemu_put_buffer(f
, (uint8_t *)n
->vlans
, MAX_VLAN
>> 3);
1526 qemu_put_be32(f
, n
->has_vnet_hdr
);
1527 qemu_put_byte(f
, n
->mac_table
.multi_overflow
);
1528 qemu_put_byte(f
, n
->mac_table
.uni_overflow
);
1529 qemu_put_byte(f
, n
->alluni
);
1530 qemu_put_byte(f
, n
->nomulti
);
1531 qemu_put_byte(f
, n
->nouni
);
1532 qemu_put_byte(f
, n
->nobcast
);
1533 qemu_put_byte(f
, n
->has_ufo
);
1534 if (n
->max_queues
> 1) {
1535 qemu_put_be16(f
, n
->max_queues
);
1536 qemu_put_be16(f
, n
->curr_queues
);
1537 for (i
= 1; i
< n
->curr_queues
; i
++) {
1538 qemu_put_be32(f
, n
->vqs
[i
].tx_waiting
);
1542 if (virtio_vdev_has_feature(vdev
, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS
)) {
1543 qemu_put_be64(f
, n
->curr_guest_offloads
);
1547 static int virtio_net_load(QEMUFile
*f
, void *opaque
, size_t size
)
1549 VirtIONet
*n
= opaque
;
1550 VirtIODevice
*vdev
= VIRTIO_DEVICE(n
);
1552 return virtio_load(vdev
, f
, VIRTIO_NET_VM_VERSION
);
1555 static int virtio_net_load_device(VirtIODevice
*vdev
, QEMUFile
*f
,
1558 VirtIONet
*n
= VIRTIO_NET(vdev
);
1561 qemu_get_buffer(f
, n
->mac
, ETH_ALEN
);
1562 n
->vqs
[0].tx_waiting
= qemu_get_be32(f
);
1564 virtio_net_set_mrg_rx_bufs(n
, qemu_get_be32(f
),
1565 virtio_vdev_has_feature(vdev
,
1566 VIRTIO_F_VERSION_1
));
1568 n
->status
= qemu_get_be16(f
);
1570 n
->promisc
= qemu_get_byte(f
);
1571 n
->allmulti
= qemu_get_byte(f
);
1573 n
->mac_table
.in_use
= qemu_get_be32(f
);
1574 /* MAC_TABLE_ENTRIES may be different from the saved image */
1575 if (n
->mac_table
.in_use
<= MAC_TABLE_ENTRIES
) {
1576 qemu_get_buffer(f
, n
->mac_table
.macs
,
1577 n
->mac_table
.in_use
* ETH_ALEN
);
1581 /* Overflow detected - can happen if source has a larger MAC table.
1582 * We simply set overflow flag so there's no need to maintain the
1583 * table of addresses, discard them all.
1584 * Note: 64 bit math to avoid integer overflow.
1586 for (i
= 0; i
< (int64_t)n
->mac_table
.in_use
* ETH_ALEN
; ++i
) {
1589 n
->mac_table
.multi_overflow
= n
->mac_table
.uni_overflow
= 1;
1590 n
->mac_table
.in_use
= 0;
1593 qemu_get_buffer(f
, (uint8_t *)n
->vlans
, MAX_VLAN
>> 3);
1595 if (qemu_get_be32(f
) && !peer_has_vnet_hdr(n
)) {
1596 error_report("virtio-net: saved image requires vnet_hdr=on");
1600 n
->mac_table
.multi_overflow
= qemu_get_byte(f
);
1601 n
->mac_table
.uni_overflow
= qemu_get_byte(f
);
1603 n
->alluni
= qemu_get_byte(f
);
1604 n
->nomulti
= qemu_get_byte(f
);
1605 n
->nouni
= qemu_get_byte(f
);
1606 n
->nobcast
= qemu_get_byte(f
);
1608 if (qemu_get_byte(f
) && !peer_has_ufo(n
)) {
1609 error_report("virtio-net: saved image requires TUN_F_UFO support");
1613 if (n
->max_queues
> 1) {
1614 if (n
->max_queues
!= qemu_get_be16(f
)) {
1615 error_report("virtio-net: different max_queues ");
1619 n
->curr_queues
= qemu_get_be16(f
);
1620 if (n
->curr_queues
> n
->max_queues
) {
1621 error_report("virtio-net: curr_queues %x > max_queues %x",
1622 n
->curr_queues
, n
->max_queues
);
1625 for (i
= 1; i
< n
->curr_queues
; i
++) {
1626 n
->vqs
[i
].tx_waiting
= qemu_get_be32(f
);
1630 if (virtio_vdev_has_feature(vdev
, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS
)) {
1631 n
->curr_guest_offloads
= qemu_get_be64(f
);
1633 n
->curr_guest_offloads
= virtio_net_supported_guest_offloads(n
);
1636 if (peer_has_vnet_hdr(n
)) {
1637 virtio_net_apply_guest_offloads(n
);
1640 virtio_net_set_queues(n
);
1642 /* Find the first multicast entry in the saved MAC filter */
1643 for (i
= 0; i
< n
->mac_table
.in_use
; i
++) {
1644 if (n
->mac_table
.macs
[i
* ETH_ALEN
] & 1) {
1648 n
->mac_table
.first_multi
= i
;
1650 /* nc.link_down can't be migrated, so infer link_down according
1651 * to link status bit in n->status */
1652 link_down
= (n
->status
& VIRTIO_NET_S_LINK_UP
) == 0;
1653 for (i
= 0; i
< n
->max_queues
; i
++) {
1654 qemu_get_subqueue(n
->nic
, i
)->link_down
= link_down
;
1657 if (virtio_vdev_has_feature(vdev
, VIRTIO_NET_F_GUEST_ANNOUNCE
) &&
1658 virtio_vdev_has_feature(vdev
, VIRTIO_NET_F_CTRL_VQ
)) {
1659 n
->announce_counter
= SELF_ANNOUNCE_ROUNDS
;
1660 timer_mod(n
->announce_timer
, qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL
));
1666 static NetClientInfo net_virtio_info
= {
1667 .type
= NET_CLIENT_DRIVER_NIC
,
1668 .size
= sizeof(NICState
),
1669 .can_receive
= virtio_net_can_receive
,
1670 .receive
= virtio_net_receive
,
1671 .link_status_changed
= virtio_net_set_link_status
,
1672 .query_rx_filter
= virtio_net_query_rxfilter
,
1675 static bool virtio_net_guest_notifier_pending(VirtIODevice
*vdev
, int idx
)
1677 VirtIONet
*n
= VIRTIO_NET(vdev
);
1678 NetClientState
*nc
= qemu_get_subqueue(n
->nic
, vq2q(idx
));
1679 assert(n
->vhost_started
);
1680 return vhost_net_virtqueue_pending(get_vhost_net(nc
->peer
), idx
);
1683 static void virtio_net_guest_notifier_mask(VirtIODevice
*vdev
, int idx
,
1686 VirtIONet
*n
= VIRTIO_NET(vdev
);
1687 NetClientState
*nc
= qemu_get_subqueue(n
->nic
, vq2q(idx
));
1688 assert(n
->vhost_started
);
1689 vhost_net_virtqueue_mask(get_vhost_net(nc
->peer
),
1693 static void virtio_net_set_config_size(VirtIONet
*n
, uint64_t host_features
)
1695 int i
, config_size
= 0;
1696 virtio_add_feature(&host_features
, VIRTIO_NET_F_MAC
);
1697 for (i
= 0; feature_sizes
[i
].flags
!= 0; i
++) {
1698 if (host_features
& feature_sizes
[i
].flags
) {
1699 config_size
= MAX(feature_sizes
[i
].end
, config_size
);
1702 n
->config_size
= config_size
;
1705 void virtio_net_set_netclient_name(VirtIONet
*n
, const char *name
,
1709 * The name can be NULL, the netclient name will be type.x.
1711 assert(type
!= NULL
);
1713 g_free(n
->netclient_name
);
1714 g_free(n
->netclient_type
);
1715 n
->netclient_name
= g_strdup(name
);
1716 n
->netclient_type
= g_strdup(type
);
1719 static void virtio_net_device_realize(DeviceState
*dev
, Error
**errp
)
1721 VirtIODevice
*vdev
= VIRTIO_DEVICE(dev
);
1722 VirtIONet
*n
= VIRTIO_NET(dev
);
1726 virtio_net_set_config_size(n
, n
->host_features
);
1727 virtio_init(vdev
, "virtio-net", VIRTIO_ID_NET
, n
->config_size
);
1730 * We set a lower limit on RX queue size to what it always was.
1731 * Guests that want a smaller ring can always resize it without
1732 * help from us (using virtio 1 and up).
1734 if (n
->net_conf
.rx_queue_size
< VIRTIO_NET_RX_QUEUE_MIN_SIZE
||
1735 n
->net_conf
.rx_queue_size
> VIRTQUEUE_MAX_SIZE
||
1736 (n
->net_conf
.rx_queue_size
& (n
->net_conf
.rx_queue_size
- 1))) {
1737 error_setg(errp
, "Invalid rx_queue_size (= %" PRIu16
"), "
1738 "must be a power of 2 between %d and %d.",
1739 n
->net_conf
.rx_queue_size
, VIRTIO_NET_RX_QUEUE_MIN_SIZE
,
1740 VIRTQUEUE_MAX_SIZE
);
1741 virtio_cleanup(vdev
);
1745 n
->max_queues
= MAX(n
->nic_conf
.peers
.queues
, 1);
1746 if (n
->max_queues
* 2 + 1 > VIRTIO_QUEUE_MAX
) {
1747 error_setg(errp
, "Invalid number of queues (= %" PRIu32
"), "
1748 "must be a positive integer less than %d.",
1749 n
->max_queues
, (VIRTIO_QUEUE_MAX
- 1) / 2);
1750 virtio_cleanup(vdev
);
1753 n
->vqs
= g_malloc0(sizeof(VirtIONetQueue
) * n
->max_queues
);
1755 n
->tx_timeout
= n
->net_conf
.txtimer
;
1757 if (n
->net_conf
.tx
&& strcmp(n
->net_conf
.tx
, "timer")
1758 && strcmp(n
->net_conf
.tx
, "bh")) {
1759 error_report("virtio-net: "
1760 "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
1762 error_report("Defaulting to \"bh\"");
1765 for (i
= 0; i
< n
->max_queues
; i
++) {
1766 virtio_net_add_queue(n
, i
);
1769 n
->ctrl_vq
= virtio_add_queue(vdev
, 64, virtio_net_handle_ctrl
);
1770 qemu_macaddr_default_if_unset(&n
->nic_conf
.macaddr
);
1771 memcpy(&n
->mac
[0], &n
->nic_conf
.macaddr
, sizeof(n
->mac
));
1772 n
->status
= VIRTIO_NET_S_LINK_UP
;
1773 n
->announce_timer
= timer_new_ms(QEMU_CLOCK_VIRTUAL
,
1774 virtio_net_announce_timer
, n
);
1776 if (n
->netclient_type
) {
1778 * Happens when virtio_net_set_netclient_name has been called.
1780 n
->nic
= qemu_new_nic(&net_virtio_info
, &n
->nic_conf
,
1781 n
->netclient_type
, n
->netclient_name
, n
);
1783 n
->nic
= qemu_new_nic(&net_virtio_info
, &n
->nic_conf
,
1784 object_get_typename(OBJECT(dev
)), dev
->id
, n
);
1787 peer_test_vnet_hdr(n
);
1788 if (peer_has_vnet_hdr(n
)) {
1789 for (i
= 0; i
< n
->max_queues
; i
++) {
1790 qemu_using_vnet_hdr(qemu_get_subqueue(n
->nic
, i
)->peer
, true);
1792 n
->host_hdr_len
= sizeof(struct virtio_net_hdr
);
1794 n
->host_hdr_len
= 0;
1797 qemu_format_nic_info_str(qemu_get_queue(n
->nic
), n
->nic_conf
.macaddr
.a
);
1799 n
->vqs
[0].tx_waiting
= 0;
1800 n
->tx_burst
= n
->net_conf
.txburst
;
1801 virtio_net_set_mrg_rx_bufs(n
, 0, 0);
1802 n
->promisc
= 1; /* for compatibility */
1804 n
->mac_table
.macs
= g_malloc0(MAC_TABLE_ENTRIES
* ETH_ALEN
);
1806 n
->vlans
= g_malloc0(MAX_VLAN
>> 3);
1808 nc
= qemu_get_queue(n
->nic
);
1809 nc
->rxfilter_notify_enabled
= 1;
1814 static void virtio_net_device_unrealize(DeviceState
*dev
, Error
**errp
)
1816 VirtIODevice
*vdev
= VIRTIO_DEVICE(dev
);
1817 VirtIONet
*n
= VIRTIO_NET(dev
);
1820 /* This will stop vhost backend if appropriate. */
1821 virtio_net_set_status(vdev
, 0);
1823 g_free(n
->netclient_name
);
1824 n
->netclient_name
= NULL
;
1825 g_free(n
->netclient_type
);
1826 n
->netclient_type
= NULL
;
1828 g_free(n
->mac_table
.macs
);
1831 max_queues
= n
->multiqueue
? n
->max_queues
: 1;
1832 for (i
= 0; i
< max_queues
; i
++) {
1833 virtio_net_del_queue(n
, i
);
1836 timer_del(n
->announce_timer
);
1837 timer_free(n
->announce_timer
);
1839 qemu_del_nic(n
->nic
);
1840 virtio_cleanup(vdev
);
1843 static void virtio_net_instance_init(Object
*obj
)
1845 VirtIONet
*n
= VIRTIO_NET(obj
);
1848 * The default config_size is sizeof(struct virtio_net_config).
1849 * Can be overridden with virtio_net_set_config_size.
1851 n
->config_size
= sizeof(struct virtio_net_config
);
1852 device_add_bootindex_property(obj
, &n
->nic_conf
.bootindex
,
1853 "bootindex", "/ethernet-phy@0",
1857 VMSTATE_VIRTIO_DEVICE(net
, VIRTIO_NET_VM_VERSION
, virtio_net_load
,
1860 static Property virtio_net_properties
[] = {
1861 DEFINE_PROP_BIT("csum", VirtIONet
, host_features
, VIRTIO_NET_F_CSUM
, true),
1862 DEFINE_PROP_BIT("guest_csum", VirtIONet
, host_features
,
1863 VIRTIO_NET_F_GUEST_CSUM
, true),
1864 DEFINE_PROP_BIT("gso", VirtIONet
, host_features
, VIRTIO_NET_F_GSO
, true),
1865 DEFINE_PROP_BIT("guest_tso4", VirtIONet
, host_features
,
1866 VIRTIO_NET_F_GUEST_TSO4
, true),
1867 DEFINE_PROP_BIT("guest_tso6", VirtIONet
, host_features
,
1868 VIRTIO_NET_F_GUEST_TSO6
, true),
1869 DEFINE_PROP_BIT("guest_ecn", VirtIONet
, host_features
,
1870 VIRTIO_NET_F_GUEST_ECN
, true),
1871 DEFINE_PROP_BIT("guest_ufo", VirtIONet
, host_features
,
1872 VIRTIO_NET_F_GUEST_UFO
, true),
1873 DEFINE_PROP_BIT("guest_announce", VirtIONet
, host_features
,
1874 VIRTIO_NET_F_GUEST_ANNOUNCE
, true),
1875 DEFINE_PROP_BIT("host_tso4", VirtIONet
, host_features
,
1876 VIRTIO_NET_F_HOST_TSO4
, true),
1877 DEFINE_PROP_BIT("host_tso6", VirtIONet
, host_features
,
1878 VIRTIO_NET_F_HOST_TSO6
, true),
1879 DEFINE_PROP_BIT("host_ecn", VirtIONet
, host_features
,
1880 VIRTIO_NET_F_HOST_ECN
, true),
1881 DEFINE_PROP_BIT("host_ufo", VirtIONet
, host_features
,
1882 VIRTIO_NET_F_HOST_UFO
, true),
1883 DEFINE_PROP_BIT("mrg_rxbuf", VirtIONet
, host_features
,
1884 VIRTIO_NET_F_MRG_RXBUF
, true),
1885 DEFINE_PROP_BIT("status", VirtIONet
, host_features
,
1886 VIRTIO_NET_F_STATUS
, true),
1887 DEFINE_PROP_BIT("ctrl_vq", VirtIONet
, host_features
,
1888 VIRTIO_NET_F_CTRL_VQ
, true),
1889 DEFINE_PROP_BIT("ctrl_rx", VirtIONet
, host_features
,
1890 VIRTIO_NET_F_CTRL_RX
, true),
1891 DEFINE_PROP_BIT("ctrl_vlan", VirtIONet
, host_features
,
1892 VIRTIO_NET_F_CTRL_VLAN
, true),
1893 DEFINE_PROP_BIT("ctrl_rx_extra", VirtIONet
, host_features
,
1894 VIRTIO_NET_F_CTRL_RX_EXTRA
, true),
1895 DEFINE_PROP_BIT("ctrl_mac_addr", VirtIONet
, host_features
,
1896 VIRTIO_NET_F_CTRL_MAC_ADDR
, true),
1897 DEFINE_PROP_BIT("ctrl_guest_offloads", VirtIONet
, host_features
,
1898 VIRTIO_NET_F_CTRL_GUEST_OFFLOADS
, true),
1899 DEFINE_PROP_BIT("mq", VirtIONet
, host_features
, VIRTIO_NET_F_MQ
, false),
1900 DEFINE_NIC_PROPERTIES(VirtIONet
, nic_conf
),
1901 DEFINE_PROP_UINT32("x-txtimer", VirtIONet
, net_conf
.txtimer
,
1903 DEFINE_PROP_INT32("x-txburst", VirtIONet
, net_conf
.txburst
, TX_BURST
),
1904 DEFINE_PROP_STRING("tx", VirtIONet
, net_conf
.tx
),
1905 DEFINE_PROP_UINT16("rx_queue_size", VirtIONet
, net_conf
.rx_queue_size
,
1906 VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
),
1907 DEFINE_PROP_END_OF_LIST(),
1910 static void virtio_net_class_init(ObjectClass
*klass
, void *data
)
1912 DeviceClass
*dc
= DEVICE_CLASS(klass
);
1913 VirtioDeviceClass
*vdc
= VIRTIO_DEVICE_CLASS(klass
);
1915 dc
->props
= virtio_net_properties
;
1916 dc
->vmsd
= &vmstate_virtio_net
;
1917 set_bit(DEVICE_CATEGORY_NETWORK
, dc
->categories
);
1918 vdc
->realize
= virtio_net_device_realize
;
1919 vdc
->unrealize
= virtio_net_device_unrealize
;
1920 vdc
->get_config
= virtio_net_get_config
;
1921 vdc
->set_config
= virtio_net_set_config
;
1922 vdc
->get_features
= virtio_net_get_features
;
1923 vdc
->set_features
= virtio_net_set_features
;
1924 vdc
->bad_features
= virtio_net_bad_features
;
1925 vdc
->reset
= virtio_net_reset
;
1926 vdc
->set_status
= virtio_net_set_status
;
1927 vdc
->guest_notifier_mask
= virtio_net_guest_notifier_mask
;
1928 vdc
->guest_notifier_pending
= virtio_net_guest_notifier_pending
;
1929 vdc
->load
= virtio_net_load_device
;
1930 vdc
->save
= virtio_net_save_device
;
1933 static const TypeInfo virtio_net_info
= {
1934 .name
= TYPE_VIRTIO_NET
,
1935 .parent
= TYPE_VIRTIO_DEVICE
,
1936 .instance_size
= sizeof(VirtIONet
),
1937 .instance_init
= virtio_net_instance_init
,
1938 .class_init
= virtio_net_class_init
,
1941 static void virtio_register_types(void)
1943 type_register_static(&virtio_net_info
);
1946 type_init(virtio_register_types
)