/*
 * Virtio Network Device
 *
 * Copyright IBM, Corp. 2007
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 */

#include "qemu/iov.h"
#include "hw/virtio/virtio.h"
#include "net/net.h"
#include "net/checksum.h"
#include "net/tap.h"
#include "qemu/error-report.h"
#include "qemu/timer.h"
#include "hw/virtio/virtio-net.h"
#include "net/vhost_net.h"
#include "hw/virtio/virtio-bus.h"
#include "qapi/qmp/qjson.h"
#include "monitor/monitor.h"

#define VIRTIO_NET_VM_VERSION    11

#define MAC_TABLE_ENTRIES    64
#define MAX_VLAN    (1 << 12)   /* Per 802.1Q definition */

/*
 * Calculate the number of bytes up to and including the given 'field' of
 * 'container'.
 */
#define endof(container, field) \
    (offsetof(container, field) + sizeof(((container *)0)->field))

typedef struct VirtIOFeature {
    uint32_t flags;
    size_t end;
} VirtIOFeature;

static VirtIOFeature feature_sizes[] = {
    {.flags = 1 << VIRTIO_NET_F_MAC,
     .end = endof(struct virtio_net_config, mac)},
    {.flags = 1 << VIRTIO_NET_F_STATUS,
     .end = endof(struct virtio_net_config, status)},
    {.flags = 1 << VIRTIO_NET_F_MQ,
     .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
    {}
};
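
/* Each feature_sizes entry maps a host feature bit to the number of
 * config-space bytes that become meaningful once that feature is offered;
 * virtio_net_set_config_size() (below) takes the maximum 'end' over all
 * offered features.  For example, offering VIRTIO_NET_F_MQ extends the
 * config space through the max_virtqueue_pairs field. */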

static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
{
    VirtIONet *n = qemu_get_nic_opaque(nc);

    return &n->vqs[nc->queue_index];
}

static int vq2q(int queue_index)
{
    return queue_index / 2;
}
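
/* Virtqueues are laid out in rx/tx pairs: vq index 2*N is the rx queue of
 * queue pair N and 2*N+1 is its tx queue, with the control vq after all
 * pairs, so vq2q() recovers the queue-pair index from a virtqueue index. */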

/* TODO
 * - we could suppress RX interrupt if we were so inclined.
 */

static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    struct virtio_net_config netcfg;

    stw_p(&netcfg.status, n->status);
    stw_p(&netcfg.max_virtqueue_pairs, n->max_queues);
    memcpy(netcfg.mac, n->mac, ETH_ALEN);
    memcpy(config, &netcfg, n->config_size);
}

static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    struct virtio_net_config netcfg = {};

    memcpy(&netcfg, config, n->config_size);

    if (!(vdev->guest_features >> VIRTIO_NET_F_CTRL_MAC_ADDR & 1) &&
        memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
        memcpy(n->mac, netcfg.mac, ETH_ALEN);
        qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
    }
}

static bool virtio_net_started(VirtIONet *n, uint8_t status)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
        (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
}
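
/* Keep the vhost-net backend's state in sync with what
 * virtio_net_started() reports: the backend is brought up only when the
 * driver is ready, the link is up and the VM is running, and is torn down
 * otherwise. */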

static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    NetClientState *nc = qemu_get_queue(n->nic);
    int queues = n->multiqueue ? n->max_queues : 1;

    if (!nc->peer) {
        return;
    }
    if (nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
        return;
    }

    if (!tap_get_vhost_net(nc->peer)) {
        return;
    }

    if (!!n->vhost_started ==
        (virtio_net_started(n, status) && !nc->peer->link_down)) {
        return;
    }
    if (!n->vhost_started) {
        int r;
        if (!vhost_net_query(tap_get_vhost_net(nc->peer), vdev)) {
            return;
        }
        n->vhost_started = 1;
        r = vhost_net_start(vdev, n->nic->ncs, queues);
        if (r < 0) {
            error_report("unable to start vhost net: %d: "
                         "falling back on userspace virtio", -r);
            n->vhost_started = 0;
        }
    } else {
        vhost_net_stop(vdev, n->nic->ncs, queues);
        n->vhost_started = 0;
    }
}

static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    VirtIONetQueue *q;
    int i;
    uint8_t queue_status;

    virtio_net_vhost_status(n, status);

    for (i = 0; i < n->max_queues; i++) {
        q = &n->vqs[i];

        if ((!n->multiqueue && i != 0) || i >= n->curr_queues) {
            queue_status = 0;
        } else {
            queue_status = status;
        }

        if (!q->tx_waiting) {
            continue;
        }

        if (virtio_net_started(n, queue_status) && !n->vhost_started) {
            if (q->tx_timer) {
                timer_mod(q->tx_timer,
                          qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
            } else {
                qemu_bh_schedule(q->tx_bh);
            }
        } else {
            if (q->tx_timer) {
                timer_del(q->tx_timer);
            } else {
                qemu_bh_cancel(q->tx_bh);
            }
        }
    }
}

static void virtio_net_set_link_status(NetClientState *nc)
{
    VirtIONet *n = qemu_get_nic_opaque(nc);
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    uint16_t old_status = n->status;

    if (nc->link_down)
        n->status &= ~VIRTIO_NET_S_LINK_UP;
    else
        n->status |= VIRTIO_NET_S_LINK_UP;

    if (n->status != old_status)
        virtio_notify_config(vdev);

    virtio_net_set_status(vdev, vdev->status);
}

static void rxfilter_notify(NetClientState *nc)
{
    QObject *event_data;
    VirtIONet *n = qemu_get_nic_opaque(nc);

    if (nc->rxfilter_notify_enabled) {
        gchar *path = object_get_canonical_path(OBJECT(n->qdev));
        if (n->netclient_name) {
            event_data = qobject_from_jsonf("{ 'name': %s, 'path': %s }",
                                            n->netclient_name, path);
        } else {
            event_data = qobject_from_jsonf("{ 'path': %s }", path);
        }
        monitor_protocol_event(QEVENT_NIC_RX_FILTER_CHANGED, event_data);
        qobject_decref(event_data);
        g_free(path);

        /* disable event notification to avoid events flooding */
        nc->rxfilter_notify_enabled = 0;
    }
}

static char *mac_strdup_printf(const uint8_t *mac)
{
    return g_strdup_printf("%.2x:%.2x:%.2x:%.2x:%.2x:%.2x", mac[0],
                           mac[1], mac[2], mac[3], mac[4], mac[5]);
}
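
/* Build the RxFilterInfo reply for the QMP query-rx-filter command from
 * the device's current promisc/allmulti/... flags, MAC filter table and
 * VLAN bitmap.  Querying also re-arms the NIC_RX_FILTER_CHANGED event
 * that rxfilter_notify() throttled. */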

static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
{
    VirtIONet *n = qemu_get_nic_opaque(nc);
    RxFilterInfo *info;
    strList *str_list, *entry;
    intList *int_list, *int_entry;
    int i, j;

    info = g_malloc0(sizeof(*info));
    info->name = g_strdup(nc->name);
    info->promiscuous = n->promisc;

    if (n->nouni) {
        info->unicast = RX_STATE_NONE;
    } else if (n->alluni) {
        info->unicast = RX_STATE_ALL;
    } else {
        info->unicast = RX_STATE_NORMAL;
    }

    if (n->nomulti) {
        info->multicast = RX_STATE_NONE;
    } else if (n->allmulti) {
        info->multicast = RX_STATE_ALL;
    } else {
        info->multicast = RX_STATE_NORMAL;
    }

    info->broadcast_allowed = n->nobcast;
    info->multicast_overflow = n->mac_table.multi_overflow;
    info->unicast_overflow = n->mac_table.uni_overflow;

    info->main_mac = mac_strdup_printf(n->mac);

    str_list = NULL;
    for (i = 0; i < n->mac_table.first_multi; i++) {
        entry = g_malloc0(sizeof(*entry));
        entry->value = mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
        entry->next = str_list;
        str_list = entry;
    }
    info->unicast_table = str_list;

    str_list = NULL;
    for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
        entry = g_malloc0(sizeof(*entry));
        entry->value = mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
        entry->next = str_list;
        str_list = entry;
    }
    info->multicast_table = str_list;

    int_list = NULL;
    for (i = 0; i < MAX_VLAN >> 5; i++) {
        for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
            if (n->vlans[i] & (1U << j)) {
                int_entry = g_malloc0(sizeof(*int_entry));
                int_entry->value = (i << 5) + j;
                int_entry->next = int_list;
                int_list = int_entry;
            }
        }
    }
    info->vlan_table = int_list;

    /* enable event notification after query */
    nc->rxfilter_notify_enabled = 1;

    return info;
}

static void virtio_net_reset(VirtIODevice *vdev)
{
    VirtIONet *n = VIRTIO_NET(vdev);

    /* Reset back to compatibility mode */
    n->promisc = 1;
    n->allmulti = 0;
    n->alluni = 0;
    n->nomulti = 0;
    n->nouni = 0;
    n->nobcast = 0;
    /* multiqueue is disabled by default */
    n->curr_queues = 1;

    /* Flush any MAC and VLAN filter table state */
    n->mac_table.in_use = 0;
    n->mac_table.first_multi = 0;
    n->mac_table.multi_overflow = 0;
    n->mac_table.uni_overflow = 0;
    memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
    memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
    qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
    memset(n->vlans, 0, MAX_VLAN >> 3);
}

static void peer_test_vnet_hdr(VirtIONet *n)
{
    NetClientState *nc = qemu_get_queue(n->nic);

    if (!nc->peer) {
        return;
    }

    if (nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
        return;
    }

    n->has_vnet_hdr = tap_has_vnet_hdr(nc->peer);
}

static int peer_has_vnet_hdr(VirtIONet *n)
{
    return n->has_vnet_hdr;
}

static int peer_has_ufo(VirtIONet *n)
{
    if (!peer_has_vnet_hdr(n))
        return 0;

    n->has_ufo = tap_has_ufo(qemu_get_queue(n->nic)->peer);

    return n->has_ufo;
}
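
/* The guest-visible header is virtio_net_hdr_mrg_rxbuf when mergeable rx
 * buffers are negotiated and the plain virtio_net_hdr otherwise; when the
 * tap backend can be told to use the same header length, host and guest
 * headers match and packets can pass through without rebuilding the
 * header. */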

static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs)
{
    int i;
    NetClientState *nc;

    n->mergeable_rx_bufs = mergeable_rx_bufs;

    n->guest_hdr_len = n->mergeable_rx_bufs ?
        sizeof(struct virtio_net_hdr_mrg_rxbuf) : sizeof(struct virtio_net_hdr);

    for (i = 0; i < n->max_queues; i++) {
        nc = qemu_get_subqueue(n->nic, i);

        if (peer_has_vnet_hdr(n) &&
            tap_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
            tap_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
            n->host_hdr_len = n->guest_hdr_len;
        }
    }
}

static int peer_attach(VirtIONet *n, int index)
{
    NetClientState *nc = qemu_get_subqueue(n->nic, index);

    if (!nc->peer) {
        return 0;
    }

    if (nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
        return 0;
    }

    return tap_enable(nc->peer);
}

static int peer_detach(VirtIONet *n, int index)
{
    NetClientState *nc = qemu_get_subqueue(n->nic, index);

    if (!nc->peer) {
        return 0;
    }

    if (nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
        return 0;
    }

    return tap_disable(nc->peer);
}

static void virtio_net_set_queues(VirtIONet *n)
{
    int i;

    for (i = 0; i < n->max_queues; i++) {
        if (i < n->curr_queues) {
            assert(!peer_attach(n, i));
        } else {
            assert(!peer_detach(n, i));
        }
    }
}

static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);

static uint32_t virtio_net_get_features(VirtIODevice *vdev, uint32_t features)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    NetClientState *nc = qemu_get_queue(n->nic);

    features |= (1 << VIRTIO_NET_F_MAC);

    if (!peer_has_vnet_hdr(n)) {
        features &= ~(0x1 << VIRTIO_NET_F_CSUM);
        features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO4);
        features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO6);
        features &= ~(0x1 << VIRTIO_NET_F_HOST_ECN);

        features &= ~(0x1 << VIRTIO_NET_F_GUEST_CSUM);
        features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO4);
        features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO6);
        features &= ~(0x1 << VIRTIO_NET_F_GUEST_ECN);
    }

    if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
        features &= ~(0x1 << VIRTIO_NET_F_GUEST_UFO);
        features &= ~(0x1 << VIRTIO_NET_F_HOST_UFO);
    }

    if (!nc->peer || nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
        return features;
    }
    if (!tap_get_vhost_net(nc->peer)) {
        return features;
    }
    return vhost_net_get_features(tap_get_vhost_net(nc->peer), features);
}

static uint32_t virtio_net_bad_features(VirtIODevice *vdev)
{
    uint32_t features = 0;

    /* Linux kernel 2.6.25.  It understood MAC (as everyone must),
     * but also these: */
    features |= (1 << VIRTIO_NET_F_MAC);
    features |= (1 << VIRTIO_NET_F_CSUM);
    features |= (1 << VIRTIO_NET_F_HOST_TSO4);
    features |= (1 << VIRTIO_NET_F_HOST_TSO6);
    features |= (1 << VIRTIO_NET_F_HOST_ECN);

    return features;
}

static void virtio_net_apply_guest_offloads(VirtIONet *n)
{
    tap_set_offload(qemu_get_subqueue(n->nic, 0)->peer,
            !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
            !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
            !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
            !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
            !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
}

static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
{
    static const uint64_t guest_offloads_mask =
        (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
        (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
        (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
        (1ULL << VIRTIO_NET_F_GUEST_ECN)  |
        (1ULL << VIRTIO_NET_F_GUEST_UFO);

    return guest_offloads_mask & features;
}

static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    return virtio_net_guest_offloads_by_features(vdev->guest_features);
}

static void virtio_net_set_features(VirtIODevice *vdev, uint32_t features)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    int i;

    virtio_net_set_multiqueue(n, !!(features & (1 << VIRTIO_NET_F_MQ)));

    virtio_net_set_mrg_rx_bufs(n, !!(features & (1 << VIRTIO_NET_F_MRG_RXBUF)));

    if (n->has_vnet_hdr) {
        n->curr_guest_offloads =
            virtio_net_guest_offloads_by_features(features);
        virtio_net_apply_guest_offloads(n);
    }

    for (i = 0; i < n->max_queues; i++) {
        NetClientState *nc = qemu_get_subqueue(n->nic, i);

        if (!nc->peer || nc->peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
            continue;
        }
        if (!tap_get_vhost_net(nc->peer)) {
            continue;
        }
        vhost_net_ack_features(tap_get_vhost_net(nc->peer), features);
    }
}

static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
                                     struct iovec *iov, unsigned int iov_cnt)
{
    uint8_t on;
    size_t s;
    NetClientState *nc = qemu_get_queue(n->nic);

    s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
    if (s != sizeof(on)) {
        return VIRTIO_NET_ERR;
    }

    if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
        n->promisc = on;
    } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
        n->allmulti = on;
    } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
        n->alluni = on;
    } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
        n->nomulti = on;
    } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
        n->nouni = on;
    } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
        n->nobcast = on;
    } else {
        return VIRTIO_NET_ERR;
    }

    rxfilter_notify(nc);

    return VIRTIO_NET_OK;
}

static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
                                      struct iovec *iov, unsigned int iov_cnt)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    uint64_t offloads;
    size_t s;

    if (!((1 << VIRTIO_NET_F_CTRL_GUEST_OFFLOADS) & vdev->guest_features)) {
        return VIRTIO_NET_ERR;
    }

    s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
    if (s != sizeof(offloads)) {
        return VIRTIO_NET_ERR;
    }

    if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
        uint64_t supported_offloads;

        if (!n->has_vnet_hdr) {
            return VIRTIO_NET_ERR;
        }

        supported_offloads = virtio_net_supported_guest_offloads(n);
        if (offloads & ~supported_offloads) {
            return VIRTIO_NET_ERR;
        }

        n->curr_guest_offloads = offloads;
        virtio_net_apply_guest_offloads(n);

        return VIRTIO_NET_OK;
    } else {
        return VIRTIO_NET_ERR;
    }
}
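
/* VIRTIO_NET_CTRL_MAC_TABLE_SET carries two virtio_net_ctrl_mac blocks in
 * sequence: a count plus entries for the unicast filter, then a count plus
 * entries for the multicast filter.  A table that does not fit in
 * MAC_TABLE_ENTRIES sets the corresponding overflow flag instead of being
 * stored. */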

static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
                                 struct iovec *iov, unsigned int iov_cnt)
{
    struct virtio_net_ctrl_mac mac_data;
    size_t s;
    NetClientState *nc = qemu_get_queue(n->nic);

    if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
        if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
            return VIRTIO_NET_ERR;
        }
        s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
        assert(s == sizeof(n->mac));
        qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
        rxfilter_notify(nc);

        return VIRTIO_NET_OK;
    }

    if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
        return VIRTIO_NET_ERR;
    }

    n->mac_table.in_use = 0;
    n->mac_table.first_multi = 0;
    n->mac_table.uni_overflow = 0;
    n->mac_table.multi_overflow = 0;
    memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);

    s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
                   sizeof(mac_data.entries));
    mac_data.entries = ldl_p(&mac_data.entries);
    if (s != sizeof(mac_data.entries)) {
        goto error;
    }
    iov_discard_front(&iov, &iov_cnt, s);

    if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
        goto error;
    }

    if (mac_data.entries <= MAC_TABLE_ENTRIES) {
        s = iov_to_buf(iov, iov_cnt, 0, n->mac_table.macs,
                       mac_data.entries * ETH_ALEN);
        if (s != mac_data.entries * ETH_ALEN) {
            goto error;
        }
        n->mac_table.in_use += mac_data.entries;
    } else {
        n->mac_table.uni_overflow = 1;
    }

    iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);

    n->mac_table.first_multi = n->mac_table.in_use;

    s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
                   sizeof(mac_data.entries));
    mac_data.entries = ldl_p(&mac_data.entries);
    if (s != sizeof(mac_data.entries)) {
        goto error;
    }

    iov_discard_front(&iov, &iov_cnt, s);

    if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
        goto error;
    }

    if (n->mac_table.in_use + mac_data.entries <= MAC_TABLE_ENTRIES) {
        s = iov_to_buf(iov, iov_cnt, 0,
                       &n->mac_table.macs[n->mac_table.in_use * ETH_ALEN],
                       mac_data.entries * ETH_ALEN);
        if (s != mac_data.entries * ETH_ALEN) {
            goto error;
        }
        n->mac_table.in_use += mac_data.entries;
    } else {
        n->mac_table.multi_overflow = 1;
    }

    rxfilter_notify(nc);

    return VIRTIO_NET_OK;

error:
    rxfilter_notify(nc);
    return VIRTIO_NET_ERR;
}

static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
                                        struct iovec *iov, unsigned int iov_cnt)
{
    uint16_t vid;
    size_t s;
    NetClientState *nc = qemu_get_queue(n->nic);

    s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
    vid = lduw_p(&vid);
    if (s != sizeof(vid)) {
        return VIRTIO_NET_ERR;
    }

    if (vid >= MAX_VLAN)
        return VIRTIO_NET_ERR;

    if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
        n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
    else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
        n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
    else
        return VIRTIO_NET_ERR;

    rxfilter_notify(nc);

    return VIRTIO_NET_OK;
}

static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
                                struct iovec *iov, unsigned int iov_cnt)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    struct virtio_net_ctrl_mq mq;
    size_t s;
    uint16_t queues;

    s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
    if (s != sizeof(mq)) {
        return VIRTIO_NET_ERR;
    }

    if (cmd != VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
        return VIRTIO_NET_ERR;
    }

    queues = lduw_p(&mq.virtqueue_pairs);

    if (queues < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
        queues > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
        queues > n->max_queues ||
        !n->multiqueue) {
        return VIRTIO_NET_ERR;
    }

    n->curr_queues = queues;
    /* stop the backend before changing the number of queues to avoid handling a
     * disabled queue */
    virtio_net_set_status(vdev, vdev->status);
    virtio_net_set_queues(n);

    return VIRTIO_NET_OK;
}

static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    struct virtio_net_ctrl_hdr ctrl;
    virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
    VirtQueueElement elem;
    size_t s;
    struct iovec *iov;
    unsigned int iov_cnt;

    while (virtqueue_pop(vq, &elem)) {
        if (iov_size(elem.in_sg, elem.in_num) < sizeof(status) ||
            iov_size(elem.out_sg, elem.out_num) < sizeof(ctrl)) {
            error_report("virtio-net ctrl missing headers");
            exit(1);
        }

        iov = elem.out_sg;
        iov_cnt = elem.out_num;
        s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl));
        iov_discard_front(&iov, &iov_cnt, sizeof(ctrl));
        if (s != sizeof(ctrl)) {
            status = VIRTIO_NET_ERR;
        } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
            status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt);
        } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
            status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt);
        } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
            status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt);
        } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
            status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt);
        } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
            status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt);
        }

        s = iov_from_buf(elem.in_sg, elem.in_num, 0, &status, sizeof(status));
        assert(s == sizeof(status));

        virtqueue_push(vq, &elem, sizeof(status));
        virtio_notify(vdev, vq);
    }
}

/* RX */

static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    int queue_index = vq2q(virtio_get_queue_index(vq));

    qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
}

static int virtio_net_can_receive(NetClientState *nc)
{
    VirtIONet *n = qemu_get_nic_opaque(nc);
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    VirtIONetQueue *q = virtio_net_get_subqueue(nc);

    if (!vdev->vm_running) {
        return 0;
    }

    if (nc->queue_index >= n->curr_queues) {
        return 0;
    }

    if (!virtio_queue_ready(q->rx_vq) ||
        !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
        return 0;
    }

    return 1;
}

static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
{
    VirtIONet *n = q->n;
    if (virtio_queue_empty(q->rx_vq) ||
        (n->mergeable_rx_bufs &&
         !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
        virtio_queue_set_notification(q->rx_vq, 1);

        /* To avoid a race condition where the guest has made some buffers
         * available after the above check but before notification was
         * enabled, check for available buffers again.
         */
        if (virtio_queue_empty(q->rx_vq) ||
            (n->mergeable_rx_bufs &&
             !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
            return 0;
        }
    }

    virtio_queue_set_notification(q->rx_vq, 0);
    return 1;
}

/* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
 * it never finds out that the packets don't have valid checksums.  This
 * causes dhclient to get upset.  Fedora's carried a patch for ages to
 * fix this with Xen but it hasn't appeared in an upstream release of
 * dhclient yet.
 *
 * To avoid breaking existing guests, we catch udp packets and add
 * checksums.  This is terrible but it's better than hacking the guest
 * kernels.
 *
 * N.B. if we introduce a zero-copy API, this operation is no longer free so
 * we should provide a mechanism to disable it to avoid polluting the host
 * cache.
 */
static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
                                        uint8_t *buf, size_t size)
{
    if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
        (size > 27 && size < 1500) && /* normal sized MTU */
        (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
        (buf[23] == 17) && /* ip.protocol == UDP */
        (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
        net_checksum_calculate(buf, size);
        hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
    }
}

static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
                           const void *buf, size_t size)
{
    if (n->has_vnet_hdr) {
        /* FIXME this cast is evil */
        void *wbuf = (void *)buf;
        work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
                                    size - n->host_hdr_len);
        iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
    } else {
        struct virtio_net_hdr hdr = {
            .flags = 0,
            .gso_type = VIRTIO_NET_HDR_GSO_NONE
        };
        iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
    }
}

static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
{
    static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
    static const uint8_t vlan[] = {0x81, 0x00};
    uint8_t *ptr = (uint8_t *)buf;
    int i;

    if (n->promisc)
        return 1;

    ptr += n->host_hdr_len;

    if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
        int vid = be16_to_cpup((uint16_t *)(ptr + 14)) & 0xfff;
        if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
            return 0;
    }

    if (ptr[0] & 1) { // multicast
        if (!memcmp(ptr, bcast, sizeof(bcast))) {
            return !n->nobcast;
        } else if (n->nomulti) {
            return 0;
        } else if (n->allmulti || n->mac_table.multi_overflow) {
            return 1;
        }

        for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
            if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
                return 1;
            }
        }
    } else { // unicast
        if (n->nouni) {
            return 0;
        } else if (n->alluni || n->mac_table.uni_overflow) {
            return 1;
        } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
            return 1;
        }

        for (i = 0; i < n->mac_table.first_multi; i++) {
            if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
                return 1;
            }
        }
    }

    return 0;
}
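
/* Receive path: the packet is copied from the backend's flat buffer into
 * guest rx descriptors.  With mergeable rx buffers one packet may span
 * several descriptor chains; the num_buffers field of the header placed in
 * the first chain is patched afterwards (via mhdr_sg) once the final chain
 * count is known. */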

static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, size_t size)
{
    VirtIONet *n = qemu_get_nic_opaque(nc);
    VirtIONetQueue *q = virtio_net_get_subqueue(nc);
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
    struct virtio_net_hdr_mrg_rxbuf mhdr;
    unsigned mhdr_cnt = 0;
    size_t offset, i, guest_offset;

    if (!virtio_net_can_receive(nc)) {
        return -1;
    }

    /* hdr_len refers to the header we supply to the guest */
    if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
        return 0;
    }

    if (!receive_filter(n, buf, size))
        return size;

    offset = i = 0;

    while (offset < size) {
        VirtQueueElement elem;
        int len, total;
        const struct iovec *sg = elem.in_sg;

        total = 0;

        if (virtqueue_pop(q->rx_vq, &elem) == 0) {
            if (i == 0)
                return -1;
            error_report("virtio-net unexpected empty queue: "
                         "i %zd mergeable %d offset %zd, size %zd, "
                         "guest hdr len %zd, host hdr len %zd guest features 0x%x",
                         i, n->mergeable_rx_bufs, offset, size,
                         n->guest_hdr_len, n->host_hdr_len, vdev->guest_features);
            exit(1);
        }

        if (elem.in_num < 1) {
            error_report("virtio-net receive queue contains no in buffers");
            exit(1);
        }

        if (i == 0) {
            assert(offset == 0);
            if (n->mergeable_rx_bufs) {
                mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
                                    sg, elem.in_num,
                                    offsetof(typeof(mhdr), num_buffers),
                                    sizeof(mhdr.num_buffers));
            }

            receive_header(n, sg, elem.in_num, buf, size);
            offset = n->host_hdr_len;
            total += n->guest_hdr_len;
            guest_offset = n->guest_hdr_len;
        } else {
            guest_offset = 0;
        }

        /* copy in packet.  ugh */
        len = iov_from_buf(sg, elem.in_num, guest_offset,
                           buf + offset, size - offset);
        total += len;
        offset += len;
        /* If buffers can't be merged, at this point we
         * must have consumed the complete packet.
         * Otherwise, drop it. */
        if (!n->mergeable_rx_bufs && offset < size) {
#if 0
            error_report("virtio-net truncated non-mergeable packet: "
                         "i %zd mergeable %d offset %zd, size %zd, "
                         "guest hdr len %zd, host hdr len %zd",
                         i, n->mergeable_rx_bufs,
                         offset, size, n->guest_hdr_len, n->host_hdr_len);
#endif
            return size;
        }

        /* signal other side */
        virtqueue_fill(q->rx_vq, &elem, total, i++);
    }

    if (mhdr_cnt) {
        stw_p(&mhdr.num_buffers, i);
        iov_from_buf(mhdr_sg, mhdr_cnt,
                     0,
                     &mhdr.num_buffers, sizeof mhdr.num_buffers);
    }

    virtqueue_flush(q->rx_vq, i);
    virtio_notify(vdev, q->rx_vq);

    return size;
}

static int32_t virtio_net_flush_tx(VirtIONetQueue *q);

static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
{
    VirtIONet *n = qemu_get_nic_opaque(nc);
    VirtIONetQueue *q = virtio_net_get_subqueue(nc);
    VirtIODevice *vdev = VIRTIO_DEVICE(n);

    virtqueue_push(q->tx_vq, &q->async_tx.elem, 0);
    virtio_notify(vdev, q->tx_vq);

    q->async_tx.elem.out_num = q->async_tx.len = 0;

    virtio_queue_set_notification(q->tx_vq, 1);
    virtio_net_flush_tx(q);
}
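
/* Flush pending tx descriptors to the backend.  Returns the number of
 * packets sent, or -EBUSY if an asynchronous send is still in flight; in
 * that case the element is parked in q->async_tx and the flush is resumed
 * from virtio_net_tx_complete(). */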

static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
{
    VirtIONet *n = q->n;
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    VirtQueueElement elem;
    int32_t num_packets = 0;
    int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
    if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
        return num_packets;
    }

    assert(vdev->vm_running);

    if (q->async_tx.elem.out_num) {
        virtio_queue_set_notification(q->tx_vq, 0);
        return num_packets;
    }

    while (virtqueue_pop(q->tx_vq, &elem)) {
        ssize_t ret, len;
        unsigned int out_num = elem.out_num;
        struct iovec *out_sg = &elem.out_sg[0];
        struct iovec sg[VIRTQUEUE_MAX_SIZE];

        if (out_num < 1) {
            error_report("virtio-net header not in first element");
            exit(1);
        }

        /*
         * If host wants to see the guest header as is, we can
         * pass it on unchanged. Otherwise, copy just the parts
         * that host is interested in.
         */
        assert(n->host_hdr_len <= n->guest_hdr_len);
        if (n->host_hdr_len != n->guest_hdr_len) {
            unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
                                       out_sg, out_num,
                                       0, n->host_hdr_len);
            sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
                               out_sg, out_num,
                               n->guest_hdr_len, -1);
            out_num = sg_num;
            out_sg = sg;
        }

        len = n->guest_hdr_len;

        ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
                                      out_sg, out_num, virtio_net_tx_complete);
        if (ret == 0) {
            virtio_queue_set_notification(q->tx_vq, 0);
            q->async_tx.elem = elem;
            q->async_tx.len  = len;
            return -EBUSY;
        }

        len += ret;

        virtqueue_push(q->tx_vq, &elem, 0);
        virtio_notify(vdev, q->tx_vq);

        if (++num_packets >= n->tx_burst) {
            break;
        }
    }
    return num_packets;
}

static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];

    /* This happens when device was stopped but VCPU wasn't. */
    if (!vdev->vm_running) {
        q->tx_waiting = 1;
        return;
    }

    if (q->tx_waiting) {
        virtio_queue_set_notification(vq, 1);
        timer_del(q->tx_timer);
        q->tx_waiting = 0;
        virtio_net_flush_tx(q);
    } else {
        timer_mod(q->tx_timer,
                  qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
        q->tx_waiting = 1;
        virtio_queue_set_notification(vq, 0);
    }
}

static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];

    if (unlikely(q->tx_waiting)) {
        return;
    }
    q->tx_waiting = 1;
    /* This happens when device was stopped but VCPU wasn't. */
    if (!vdev->vm_running) {
        return;
    }
    virtio_queue_set_notification(vq, 0);
    qemu_bh_schedule(q->tx_bh);
}

static void virtio_net_tx_timer(void *opaque)
{
    VirtIONetQueue *q = opaque;
    VirtIONet *n = q->n;
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    assert(vdev->vm_running);

    q->tx_waiting = 0;

    /* Just in case the driver is not ready any more */
    if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
        return;
    }

    virtio_queue_set_notification(q->tx_vq, 1);
    virtio_net_flush_tx(q);
}

static void virtio_net_tx_bh(void *opaque)
{
    VirtIONetQueue *q = opaque;
    VirtIONet *n = q->n;
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    int32_t ret;

    assert(vdev->vm_running);

    q->tx_waiting = 0;

    /* Just in case the driver is not ready any more */
    if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
        return;
    }

    ret = virtio_net_flush_tx(q);
    if (ret == -EBUSY) {
        return; /* Notification re-enable handled by tx_complete */
    }

    /* If we flush a full burst of packets, assume there are
     * more coming and immediately reschedule */
    if (ret >= n->tx_burst) {
        qemu_bh_schedule(q->tx_bh);
        q->tx_waiting = 1;
        return;
    }

    /* If less than a full burst, re-enable notification and flush
     * anything that may have come in while we weren't looking.  If
     * we find something, assume the guest is still active and reschedule */
    virtio_queue_set_notification(q->tx_vq, 1);
    if (virtio_net_flush_tx(q) > 0) {
        virtio_queue_set_notification(q->tx_vq, 0);
        qemu_bh_schedule(q->tx_bh);
        q->tx_waiting = 1;
    }
}
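
/* (Re)build the virtqueue set for the negotiated number of queue pairs:
 * every queue beyond the first pair is deleted and re-added so that the
 * control vq always ends up after the last tx vq, preserving the fixed
 * rx0/tx0/rx1/tx1/.../ctrl index layout assumed by vq2q(). */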

static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    int i, max = multiqueue ? n->max_queues : 1;

    n->multiqueue = multiqueue;

    for (i = 2; i <= n->max_queues * 2 + 1; i++) {
        virtio_del_queue(vdev, i);
    }

    for (i = 1; i < max; i++) {
        n->vqs[i].rx_vq = virtio_add_queue(vdev, 256, virtio_net_handle_rx);
        if (n->vqs[i].tx_timer) {
            n->vqs[i].tx_vq =
                virtio_add_queue(vdev, 256, virtio_net_handle_tx_timer);
            n->vqs[i].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
                                              virtio_net_tx_timer,
                                              &n->vqs[i]);
        } else {
            n->vqs[i].tx_vq =
                virtio_add_queue(vdev, 256, virtio_net_handle_tx_bh);
            n->vqs[i].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[i]);
        }

        n->vqs[i].tx_waiting = 0;
        n->vqs[i].n = n;
    }

    /* Note: Minix guests (version 3.2.1) use the ctrl vq but don't ack
     * VIRTIO_NET_F_CTRL_VQ. Create the ctrl vq unconditionally to avoid
     * breaking them.
     */
    n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);

    virtio_net_set_queues(n);
}

static void virtio_net_save(QEMUFile *f, void *opaque)
{
    int i;
    VirtIONet *n = opaque;
    VirtIODevice *vdev = VIRTIO_DEVICE(n);

    /* At this point, backend must be stopped, otherwise
     * it might keep writing to memory. */
    assert(!n->vhost_started);
    virtio_save(vdev, f);

    qemu_put_buffer(f, n->mac, ETH_ALEN);
    qemu_put_be32(f, n->vqs[0].tx_waiting);
    qemu_put_be32(f, n->mergeable_rx_bufs);
    qemu_put_be16(f, n->status);
    qemu_put_byte(f, n->promisc);
    qemu_put_byte(f, n->allmulti);
    qemu_put_be32(f, n->mac_table.in_use);
    qemu_put_buffer(f, n->mac_table.macs, n->mac_table.in_use * ETH_ALEN);
    qemu_put_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
    qemu_put_be32(f, n->has_vnet_hdr);
    qemu_put_byte(f, n->mac_table.multi_overflow);
    qemu_put_byte(f, n->mac_table.uni_overflow);
    qemu_put_byte(f, n->alluni);
    qemu_put_byte(f, n->nomulti);
    qemu_put_byte(f, n->nouni);
    qemu_put_byte(f, n->nobcast);
    qemu_put_byte(f, n->has_ufo);
    if (n->max_queues > 1) {
        qemu_put_be16(f, n->max_queues);
        qemu_put_be16(f, n->curr_queues);
        for (i = 1; i < n->curr_queues; i++) {
            qemu_put_be32(f, n->vqs[i].tx_waiting);
        }
    }

    if ((1 << VIRTIO_NET_F_CTRL_GUEST_OFFLOADS) & vdev->guest_features) {
        qemu_put_be64(f, n->curr_guest_offloads);
    }
}
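
/* Restore state saved by virtio_net_save(), gated on the stream's
 * version_id so that images from older QEMUs (back to version 2) still
 * load; fields a pre-VIRTIO_NET_VM_VERSION image lacks keep their reset
 * values. */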

static int virtio_net_load(QEMUFile *f, void *opaque, int version_id)
{
    VirtIONet *n = opaque;
    VirtIODevice *vdev = VIRTIO_DEVICE(n);
    int ret, i, link_down;

    if (version_id < 2 || version_id > VIRTIO_NET_VM_VERSION)
        return -EINVAL;

    ret = virtio_load(vdev, f);
    if (ret) {
        return ret;
    }

    qemu_get_buffer(f, n->mac, ETH_ALEN);
    n->vqs[0].tx_waiting = qemu_get_be32(f);

    virtio_net_set_mrg_rx_bufs(n, qemu_get_be32(f));

    if (version_id >= 3)
        n->status = qemu_get_be16(f);

    if (version_id >= 4) {
        if (version_id < 8) {
            n->promisc = qemu_get_be32(f);
            n->allmulti = qemu_get_be32(f);
        } else {
            n->promisc = qemu_get_byte(f);
            n->allmulti = qemu_get_byte(f);
        }
    }

    if (version_id >= 5) {
        n->mac_table.in_use = qemu_get_be32(f);
        /* MAC_TABLE_ENTRIES may be different from the saved image */
        if (n->mac_table.in_use <= MAC_TABLE_ENTRIES) {
            qemu_get_buffer(f, n->mac_table.macs,
                            n->mac_table.in_use * ETH_ALEN);
        } else if (n->mac_table.in_use) {
            /* Discard the oversized table; the scratch buffer must hold all
             * in_use entries of ETH_ALEN bytes each that we read below. */
            uint8_t *buf = g_malloc0(n->mac_table.in_use * ETH_ALEN);
            qemu_get_buffer(f, buf, n->mac_table.in_use * ETH_ALEN);
            g_free(buf);
            n->mac_table.multi_overflow = n->mac_table.uni_overflow = 1;
            n->mac_table.in_use = 0;
        }
    }

    if (version_id >= 6)
        qemu_get_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);

    if (version_id >= 7) {
        if (qemu_get_be32(f) && !peer_has_vnet_hdr(n)) {
            error_report("virtio-net: saved image requires vnet_hdr=on");
            return -1;
        }
    }

    if (version_id >= 9) {
        n->mac_table.multi_overflow = qemu_get_byte(f);
        n->mac_table.uni_overflow = qemu_get_byte(f);
    }

    if (version_id >= 10) {
        n->alluni = qemu_get_byte(f);
        n->nomulti = qemu_get_byte(f);
        n->nouni = qemu_get_byte(f);
        n->nobcast = qemu_get_byte(f);
    }

    if (version_id >= 11) {
        if (qemu_get_byte(f) && !peer_has_ufo(n)) {
            error_report("virtio-net: saved image requires TUN_F_UFO support");
            return -1;
        }
    }

    if (n->max_queues > 1) {
        if (n->max_queues != qemu_get_be16(f)) {
            error_report("virtio-net: different max_queues ");
            return -1;
        }

        n->curr_queues = qemu_get_be16(f);
        for (i = 1; i < n->curr_queues; i++) {
            n->vqs[i].tx_waiting = qemu_get_be32(f);
        }
    }

    if ((1 << VIRTIO_NET_F_CTRL_GUEST_OFFLOADS) & vdev->guest_features) {
        n->curr_guest_offloads = qemu_get_be64(f);
    } else {
        n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
    }

    if (peer_has_vnet_hdr(n)) {
        virtio_net_apply_guest_offloads(n);
    }

    virtio_net_set_queues(n);

    /* Find the first multicast entry in the saved MAC filter */
    for (i = 0; i < n->mac_table.in_use; i++) {
        if (n->mac_table.macs[i * ETH_ALEN] & 1) {
            break;
        }
    }
    n->mac_table.first_multi = i;

    /* nc.link_down can't be migrated, so infer link_down according
     * to link status bit in n->status */
    link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
    for (i = 0; i < n->max_queues; i++) {
        qemu_get_subqueue(n->nic, i)->link_down = link_down;
    }

    return 0;
}

static void virtio_net_cleanup(NetClientState *nc)
{
    VirtIONet *n = qemu_get_nic_opaque(nc);

    n->nic = NULL;
}

static NetClientInfo net_virtio_info = {
    .type = NET_CLIENT_OPTIONS_KIND_NIC,
    .size = sizeof(NICState),
    .can_receive = virtio_net_can_receive,
    .receive = virtio_net_receive,
    .cleanup = virtio_net_cleanup,
    .link_status_changed = virtio_net_set_link_status,
    .query_rx_filter = virtio_net_query_rxfilter,
};

static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
    assert(n->vhost_started);
    return vhost_net_virtqueue_pending(tap_get_vhost_net(nc->peer), idx);
}

static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
                                           bool mask)
{
    VirtIONet *n = VIRTIO_NET(vdev);
    NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
    assert(n->vhost_started);
    vhost_net_virtqueue_mask(tap_get_vhost_net(nc->peer),
                             vdev, idx, mask);
}

void virtio_net_set_config_size(VirtIONet *n, uint32_t host_features)
{
    int i, config_size = 0;
    host_features |= (1 << VIRTIO_NET_F_MAC);
    for (i = 0; feature_sizes[i].flags != 0; i++) {
        if (host_features & feature_sizes[i].flags) {
            config_size = MAX(feature_sizes[i].end, config_size);
        }
    }
    n->config_size = config_size;
}
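
/* A transport (e.g. virtio-net-pci) is expected to call
 * virtio_net_set_config_size() with its host feature bits before realize,
 * so that config_size covers exactly the fields the guest may access;
 * otherwise the default set in virtio_net_instance_init() is used. */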

void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
                                   const char *type)
{
    /*
     * The name can be NULL, the netclient name will be type.x.
     */
    assert(type != NULL);

    if (n->netclient_name) {
        g_free(n->netclient_name);
        n->netclient_name = NULL;
    }
    if (n->netclient_type) {
        g_free(n->netclient_type);
        n->netclient_type = NULL;
    }

    if (name != NULL) {
        n->netclient_name = g_strdup(name);
    }
    n->netclient_type = g_strdup(type);
}

static void virtio_net_device_realize(DeviceState *dev, Error **errp)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(dev);
    VirtIONet *n = VIRTIO_NET(dev);
    NetClientState *nc;
    int i;

    virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size);

    n->max_queues = MAX(n->nic_conf.queues, 1);
    n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queues);
    n->vqs[0].rx_vq = virtio_add_queue(vdev, 256, virtio_net_handle_rx);
    n->curr_queues = 1;
    n->vqs[0].n = n;
    n->tx_timeout = n->net_conf.txtimer;

    if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
                       && strcmp(n->net_conf.tx, "bh")) {
        error_report("virtio-net: "
                     "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
                     n->net_conf.tx);
        error_report("Defaulting to \"bh\"");
    }

    if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
        n->vqs[0].tx_vq = virtio_add_queue(vdev, 256,
                                           virtio_net_handle_tx_timer);
        n->vqs[0].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL, virtio_net_tx_timer,
                                          &n->vqs[0]);
    } else {
        n->vqs[0].tx_vq = virtio_add_queue(vdev, 256,
                                           virtio_net_handle_tx_bh);
        n->vqs[0].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[0]);
    }
    n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
    qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
    memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
    n->status = VIRTIO_NET_S_LINK_UP;

    if (n->netclient_type) {
        /*
         * Happens when virtio_net_set_netclient_name has been called.
         */
        n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
                              n->netclient_type, n->netclient_name, n);
    } else {
        n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
                              object_get_typename(OBJECT(dev)), dev->id, n);
    }

    peer_test_vnet_hdr(n);
    if (peer_has_vnet_hdr(n)) {
        for (i = 0; i < n->max_queues; i++) {
            tap_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
        }
        n->host_hdr_len = sizeof(struct virtio_net_hdr);
    } else {
        n->host_hdr_len = 0;
    }

    qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);

    n->vqs[0].tx_waiting = 0;
    n->tx_burst = n->net_conf.txburst;
    virtio_net_set_mrg_rx_bufs(n, 0);
    n->promisc = 1; /* for compatibility */

    n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);

    n->vlans = g_malloc0(MAX_VLAN >> 3);

    nc = qemu_get_queue(n->nic);
    nc->rxfilter_notify_enabled = 1;

    n->qdev = dev;
    register_savevm(dev, "virtio-net", -1, VIRTIO_NET_VM_VERSION,
                    virtio_net_save, virtio_net_load, n);

    add_boot_device_path(n->nic_conf.bootindex, dev, "/ethernet-phy@0");
}

static void virtio_net_device_unrealize(DeviceState *dev, Error **errp)
{
    VirtIODevice *vdev = VIRTIO_DEVICE(dev);
    VirtIONet *n = VIRTIO_NET(dev);
    int i;

    /* This will stop vhost backend if appropriate. */
    virtio_net_set_status(vdev, 0);

    unregister_savevm(dev, "virtio-net", n);

    if (n->netclient_name) {
        g_free(n->netclient_name);
        n->netclient_name = NULL;
    }
    if (n->netclient_type) {
        g_free(n->netclient_type);
        n->netclient_type = NULL;
    }

    g_free(n->mac_table.macs);
    g_free(n->vlans);

    for (i = 0; i < n->max_queues; i++) {
        VirtIONetQueue *q = &n->vqs[i];
        NetClientState *nc = qemu_get_subqueue(n->nic, i);

        qemu_purge_queued_packets(nc);

        if (q->tx_timer) {
            timer_del(q->tx_timer);
            timer_free(q->tx_timer);
        } else if (q->tx_bh) {
            qemu_bh_delete(q->tx_bh);
        }
    }

    g_free(n->vqs);
    qemu_del_nic(n->nic);
    virtio_cleanup(vdev);
}

static void virtio_net_instance_init(Object *obj)
{
    VirtIONet *n = VIRTIO_NET(obj);

    /*
     * The default config_size is sizeof(struct virtio_net_config).
     * Can be overridden with virtio_net_set_config_size.
     */
    n->config_size = sizeof(struct virtio_net_config);
}

static Property virtio_net_properties[] = {
    DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
    DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
                       TX_TIMER_INTERVAL),
    DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
    DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
    DEFINE_PROP_END_OF_LIST(),
};

static void virtio_net_class_init(ObjectClass *klass, void *data)
{
    DeviceClass *dc = DEVICE_CLASS(klass);
    VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);

    dc->props = virtio_net_properties;
    set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
    vdc->realize = virtio_net_device_realize;
    vdc->unrealize = virtio_net_device_unrealize;
    vdc->get_config = virtio_net_get_config;
    vdc->set_config = virtio_net_set_config;
    vdc->get_features = virtio_net_get_features;
    vdc->set_features = virtio_net_set_features;
    vdc->bad_features = virtio_net_bad_features;
    vdc->reset = virtio_net_reset;
    vdc->set_status = virtio_net_set_status;
    vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
    vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
}

static const TypeInfo virtio_net_info = {
    .name = TYPE_VIRTIO_NET,
    .parent = TYPE_VIRTIO_DEVICE,
    .instance_size = sizeof(VirtIONet),
    .instance_init = virtio_net_instance_init,
    .class_init = virtio_net_class_init,
};

static void virtio_register_types(void)
{
    type_register_static(&virtio_net_info);
}

type_init(virtio_register_types)