]> git.ipfire.org Git - thirdparty/qemu.git/blame - hw/net/virtio-net.c
virtio-net: handle virtio_net_receive() errors
[thirdparty/qemu.git] / hw / net / virtio-net.c
CommitLineData
fbe78f4f
AL
1/*
2 * Virtio Network Device
3 *
4 * Copyright IBM, Corp. 2007
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
12 */
13
9b8bfe21 14#include "qemu/osdep.h"
1de7afc9 15#include "qemu/iov.h"
0d09e41a 16#include "hw/virtio/virtio.h"
1422e32d 17#include "net/net.h"
7200ac3c 18#include "net/checksum.h"
a8ed73f7 19#include "net/tap.h"
1de7afc9
PB
20#include "qemu/error-report.h"
21#include "qemu/timer.h"
0d09e41a
PB
22#include "hw/virtio/virtio-net.h"
23#include "net/vhost_net.h"
17ec5a86 24#include "hw/virtio/virtio-bus.h"
b1be4280 25#include "qapi/qmp/qjson.h"
06150279 26#include "qapi-event.h"
1399c60d 27#include "hw/virtio/virtio-access.h"
fbe78f4f 28
0ce0e8f4 29#define VIRTIO_NET_VM_VERSION 11
b6503ed9 30
4ffb17f5 31#define MAC_TABLE_ENTRIES 64
f21c0ed9 32#define MAX_VLAN (1 << 12) /* Per 802.1Q definition */
9d6271b8 33
1c0fbfa3
MT
34/* previously fixed value */
35#define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
36/* for now, only allow larger queues; with virtio-1, guest can downsize */
37#define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
38
14f9b664
JL
/*
 * endof(container, field): offset of the first byte AFTER 'field' inside
 * 'container', i.e. the number of bytes needed to hold every member up to
 * and including 'field'.
 */
#define endof(container, field)                                         \
    (sizeof(((container *)0)->field) + offsetof(container, field))
45
/* One row of the feature -> config-space-size table (see feature_sizes). */
typedef struct VirtIOFeature {
    uint32_t flags;     /* feature bit mask this row applies to */
    size_t end;         /* config bytes needed, as computed by endof() */
} VirtIOFeature;
50
51static VirtIOFeature feature_sizes[] = {
52 {.flags = 1 << VIRTIO_NET_F_MAC,
53 .end = endof(struct virtio_net_config, mac)},
54 {.flags = 1 << VIRTIO_NET_F_STATUS,
55 .end = endof(struct virtio_net_config, status)},
56 {.flags = 1 << VIRTIO_NET_F_MQ,
57 .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
58 {}
59};
60
fed699f9 61static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
0c87e93e
JW
62{
63 VirtIONet *n = qemu_get_nic_opaque(nc);
64
fed699f9 65 return &n->vqs[nc->queue_index];
0c87e93e 66}
fed699f9
JW
67
/*
 * Map a virtqueue index to the index of the NIC sub-queue it belongs to:
 * two consecutive virtqueue indices share one sub-queue.
 */
static int vq2q(int queue_index)
{
    const int vqs_per_subqueue = 2;

    return queue_index / vqs_per_subqueue;
}
72
fbe78f4f
AL
73/* TODO
74 * - we could suppress RX interrupt if we were so inclined.
75 */
76
0f03eca6 77static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
fbe78f4f 78{
17a0ca55 79 VirtIONet *n = VIRTIO_NET(vdev);
fbe78f4f
AL
80 struct virtio_net_config netcfg;
81
1399c60d
RR
82 virtio_stw_p(vdev, &netcfg.status, n->status);
83 virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queues);
79674068 84 memcpy(netcfg.mac, n->mac, ETH_ALEN);
14f9b664 85 memcpy(config, &netcfg, n->config_size);
fbe78f4f
AL
86}
87
0f03eca6
AL
88static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
89{
17a0ca55 90 VirtIONet *n = VIRTIO_NET(vdev);
14f9b664 91 struct virtio_net_config netcfg = {};
0f03eca6 92
14f9b664 93 memcpy(&netcfg, config, n->config_size);
0f03eca6 94
95129d6f
CH
95 if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
96 !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
c1943a3f 97 memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
79674068 98 memcpy(n->mac, netcfg.mac, ETH_ALEN);
b356f76d 99 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
0f03eca6
AL
100 }
101}
102
783e7706
MT
103static bool virtio_net_started(VirtIONet *n, uint8_t status)
104{
17a0ca55 105 VirtIODevice *vdev = VIRTIO_DEVICE(n);
783e7706 106 return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
17a0ca55 107 (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
783e7706
MT
108}
109
f57fcf70
JW
110static void virtio_net_announce_timer(void *opaque)
111{
112 VirtIONet *n = opaque;
113 VirtIODevice *vdev = VIRTIO_DEVICE(n);
114
115 n->announce_counter--;
116 n->status |= VIRTIO_NET_S_ANNOUNCE;
117 virtio_notify_config(vdev);
118}
119
783e7706 120static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
afbaa7b4 121{
17a0ca55 122 VirtIODevice *vdev = VIRTIO_DEVICE(n);
b356f76d 123 NetClientState *nc = qemu_get_queue(n->nic);
fed699f9 124 int queues = n->multiqueue ? n->max_queues : 1;
b356f76d 125
ed8b4afe 126 if (!get_vhost_net(nc->peer)) {
afbaa7b4
MT
127 return;
128 }
fed699f9 129
8c1ac475
RK
130 if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
131 !!n->vhost_started) {
afbaa7b4
MT
132 return;
133 }
134 if (!n->vhost_started) {
086abc1c
MT
135 int r, i;
136
1bfa316c
GK
137 if (n->needs_vnet_hdr_swap) {
138 error_report("backend does not support %s vnet headers; "
139 "falling back on userspace virtio",
140 virtio_is_big_endian(vdev) ? "BE" : "LE");
141 return;
142 }
143
086abc1c
MT
144 /* Any packets outstanding? Purge them to avoid touching rings
145 * when vhost is running.
146 */
147 for (i = 0; i < queues; i++) {
148 NetClientState *qnc = qemu_get_subqueue(n->nic, i);
149
150 /* Purge both directions: TX and RX. */
151 qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
152 qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
153 }
154
1830b80f 155 n->vhost_started = 1;
17a0ca55 156 r = vhost_net_start(vdev, n->nic->ncs, queues);
afbaa7b4 157 if (r < 0) {
e7b43f7e
SH
158 error_report("unable to start vhost net: %d: "
159 "falling back on userspace virtio", -r);
1830b80f 160 n->vhost_started = 0;
afbaa7b4
MT
161 }
162 } else {
17a0ca55 163 vhost_net_stop(vdev, n->nic->ncs, queues);
afbaa7b4
MT
164 n->vhost_started = 0;
165 }
166}
167
1bfa316c
GK
168static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
169 NetClientState *peer,
170 bool enable)
171{
172 if (virtio_is_big_endian(vdev)) {
173 return qemu_set_vnet_be(peer, enable);
174 } else {
175 return qemu_set_vnet_le(peer, enable);
176 }
177}
178
179static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
180 int queues, bool enable)
181{
182 int i;
183
184 for (i = 0; i < queues; i++) {
185 if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
186 enable) {
187 while (--i >= 0) {
188 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
189 }
190
191 return true;
192 }
193 }
194
195 return false;
196}
197
198static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
199{
200 VirtIODevice *vdev = VIRTIO_DEVICE(n);
201 int queues = n->multiqueue ? n->max_queues : 1;
202
203 if (virtio_net_started(n, status)) {
204 /* Before using the device, we tell the network backend about the
205 * endianness to use when parsing vnet headers. If the backend
206 * can't do it, we fallback onto fixing the headers in the core
207 * virtio-net code.
208 */
209 n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
210 queues, true);
211 } else if (virtio_net_started(n, vdev->status)) {
212 /* After using the device, we need to reset the network backend to
213 * the default (guest native endianness), otherwise the guest may
214 * lose network connectivity if it is rebooted into a different
215 * endianness.
216 */
217 virtio_net_set_vnet_endian(vdev, n->nic->ncs, queues, false);
218 }
219}
220
783e7706
MT
221static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
222{
17a0ca55 223 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9
JW
224 VirtIONetQueue *q;
225 int i;
226 uint8_t queue_status;
783e7706 227
1bfa316c 228 virtio_net_vnet_endian_status(n, status);
783e7706
MT
229 virtio_net_vhost_status(n, status);
230
fed699f9 231 for (i = 0; i < n->max_queues; i++) {
38705bb5
FZ
232 NetClientState *ncs = qemu_get_subqueue(n->nic, i);
233 bool queue_started;
fed699f9 234 q = &n->vqs[i];
783e7706 235
fed699f9
JW
236 if ((!n->multiqueue && i != 0) || i >= n->curr_queues) {
237 queue_status = 0;
783e7706 238 } else {
fed699f9 239 queue_status = status;
783e7706 240 }
38705bb5
FZ
241 queue_started =
242 virtio_net_started(n, queue_status) && !n->vhost_started;
243
244 if (queue_started) {
245 qemu_flush_queued_packets(ncs);
246 }
fed699f9
JW
247
248 if (!q->tx_waiting) {
249 continue;
250 }
251
38705bb5 252 if (queue_started) {
fed699f9 253 if (q->tx_timer) {
bc72ad67
AB
254 timer_mod(q->tx_timer,
255 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
fed699f9
JW
256 } else {
257 qemu_bh_schedule(q->tx_bh);
258 }
783e7706 259 } else {
fed699f9 260 if (q->tx_timer) {
bc72ad67 261 timer_del(q->tx_timer);
fed699f9
JW
262 } else {
263 qemu_bh_cancel(q->tx_bh);
264 }
783e7706
MT
265 }
266 }
267}
268
4e68f7a0 269static void virtio_net_set_link_status(NetClientState *nc)
554c97dd 270{
cc1f0f45 271 VirtIONet *n = qemu_get_nic_opaque(nc);
17a0ca55 272 VirtIODevice *vdev = VIRTIO_DEVICE(n);
554c97dd
AL
273 uint16_t old_status = n->status;
274
eb6b6c12 275 if (nc->link_down)
554c97dd
AL
276 n->status &= ~VIRTIO_NET_S_LINK_UP;
277 else
278 n->status |= VIRTIO_NET_S_LINK_UP;
279
280 if (n->status != old_status)
17a0ca55 281 virtio_notify_config(vdev);
afbaa7b4 282
17a0ca55 283 virtio_net_set_status(vdev, vdev->status);
554c97dd
AL
284}
285
b1be4280
AK
286static void rxfilter_notify(NetClientState *nc)
287{
b1be4280
AK
288 VirtIONet *n = qemu_get_nic_opaque(nc);
289
290 if (nc->rxfilter_notify_enabled) {
96e35046 291 gchar *path = object_get_canonical_path(OBJECT(n->qdev));
06150279
WX
292 qapi_event_send_nic_rx_filter_changed(!!n->netclient_name,
293 n->netclient_name, path, &error_abort);
96e35046 294 g_free(path);
b1be4280
AK
295
296 /* disable event notification to avoid events flooding */
297 nc->rxfilter_notify_enabled = 0;
298 }
299}
300
f7bc8ef8
AK
301static intList *get_vlan_table(VirtIONet *n)
302{
303 intList *list, *entry;
304 int i, j;
305
306 list = NULL;
307 for (i = 0; i < MAX_VLAN >> 5; i++) {
308 for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
309 if (n->vlans[i] & (1U << j)) {
310 entry = g_malloc0(sizeof(*entry));
311 entry->value = (i << 5) + j;
312 entry->next = list;
313 list = entry;
314 }
315 }
316 }
317
318 return list;
319}
320
b1be4280
AK
321static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
322{
323 VirtIONet *n = qemu_get_nic_opaque(nc);
f7bc8ef8 324 VirtIODevice *vdev = VIRTIO_DEVICE(n);
b1be4280
AK
325 RxFilterInfo *info;
326 strList *str_list, *entry;
f7bc8ef8 327 int i;
b1be4280
AK
328
329 info = g_malloc0(sizeof(*info));
330 info->name = g_strdup(nc->name);
331 info->promiscuous = n->promisc;
332
333 if (n->nouni) {
334 info->unicast = RX_STATE_NONE;
335 } else if (n->alluni) {
336 info->unicast = RX_STATE_ALL;
337 } else {
338 info->unicast = RX_STATE_NORMAL;
339 }
340
341 if (n->nomulti) {
342 info->multicast = RX_STATE_NONE;
343 } else if (n->allmulti) {
344 info->multicast = RX_STATE_ALL;
345 } else {
346 info->multicast = RX_STATE_NORMAL;
347 }
348
349 info->broadcast_allowed = n->nobcast;
350 info->multicast_overflow = n->mac_table.multi_overflow;
351 info->unicast_overflow = n->mac_table.uni_overflow;
352
b0575ba4 353 info->main_mac = qemu_mac_strdup_printf(n->mac);
b1be4280
AK
354
355 str_list = NULL;
356 for (i = 0; i < n->mac_table.first_multi; i++) {
357 entry = g_malloc0(sizeof(*entry));
b0575ba4 358 entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
b1be4280
AK
359 entry->next = str_list;
360 str_list = entry;
361 }
362 info->unicast_table = str_list;
363
364 str_list = NULL;
365 for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
366 entry = g_malloc0(sizeof(*entry));
b0575ba4 367 entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
b1be4280
AK
368 entry->next = str_list;
369 str_list = entry;
370 }
371 info->multicast_table = str_list;
f7bc8ef8 372 info->vlan_table = get_vlan_table(n);
b1be4280 373
95129d6f 374 if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
f7bc8ef8
AK
375 info->vlan = RX_STATE_ALL;
376 } else if (!info->vlan_table) {
377 info->vlan = RX_STATE_NONE;
378 } else {
379 info->vlan = RX_STATE_NORMAL;
b1be4280 380 }
b1be4280
AK
381
382 /* enable event notification after query */
383 nc->rxfilter_notify_enabled = 1;
384
385 return info;
386}
387
002437cd
AL
388static void virtio_net_reset(VirtIODevice *vdev)
389{
17a0ca55 390 VirtIONet *n = VIRTIO_NET(vdev);
002437cd
AL
391
392 /* Reset back to compatibility mode */
393 n->promisc = 1;
394 n->allmulti = 0;
015cb166
AW
395 n->alluni = 0;
396 n->nomulti = 0;
397 n->nouni = 0;
398 n->nobcast = 0;
fed699f9
JW
399 /* multiqueue is disabled by default */
400 n->curr_queues = 1;
f57fcf70
JW
401 timer_del(n->announce_timer);
402 n->announce_counter = 0;
403 n->status &= ~VIRTIO_NET_S_ANNOUNCE;
b6503ed9 404
f21c0ed9 405 /* Flush any MAC and VLAN filter table state */
b6503ed9 406 n->mac_table.in_use = 0;
2d9aba39 407 n->mac_table.first_multi = 0;
8fd2a2f1
AW
408 n->mac_table.multi_overflow = 0;
409 n->mac_table.uni_overflow = 0;
b6503ed9 410 memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
41dc8a67 411 memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
702d66a8 412 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
f21c0ed9 413 memset(n->vlans, 0, MAX_VLAN >> 3);
002437cd
AL
414}
415
6e371ab8 416static void peer_test_vnet_hdr(VirtIONet *n)
3a330134 417{
b356f76d
JW
418 NetClientState *nc = qemu_get_queue(n->nic);
419 if (!nc->peer) {
6e371ab8 420 return;
b356f76d 421 }
3a330134 422
d6085e3a 423 n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
6e371ab8 424}
3a330134 425
6e371ab8
MT
426static int peer_has_vnet_hdr(VirtIONet *n)
427{
3a330134
MM
428 return n->has_vnet_hdr;
429}
430
0ce0e8f4
MM
431static int peer_has_ufo(VirtIONet *n)
432{
433 if (!peer_has_vnet_hdr(n))
434 return 0;
435
d6085e3a 436 n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
0ce0e8f4
MM
437
438 return n->has_ufo;
439}
440
bb9d17f8
CH
441static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
442 int version_1)
ff3a8066 443{
fed699f9
JW
444 int i;
445 NetClientState *nc;
446
ff3a8066
MT
447 n->mergeable_rx_bufs = mergeable_rx_bufs;
448
bb9d17f8
CH
449 if (version_1) {
450 n->guest_hdr_len = sizeof(struct virtio_net_hdr_mrg_rxbuf);
451 } else {
452 n->guest_hdr_len = n->mergeable_rx_bufs ?
453 sizeof(struct virtio_net_hdr_mrg_rxbuf) :
454 sizeof(struct virtio_net_hdr);
455 }
ff3a8066 456
fed699f9
JW
457 for (i = 0; i < n->max_queues; i++) {
458 nc = qemu_get_subqueue(n->nic, i);
459
460 if (peer_has_vnet_hdr(n) &&
d6085e3a
SH
461 qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
462 qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
fed699f9
JW
463 n->host_hdr_len = n->guest_hdr_len;
464 }
ff3a8066
MT
465 }
466}
467
fed699f9
JW
468static int peer_attach(VirtIONet *n, int index)
469{
470 NetClientState *nc = qemu_get_subqueue(n->nic, index);
471
472 if (!nc->peer) {
473 return 0;
474 }
475
f394b2e2 476 if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
7263a0ad
CO
477 vhost_set_vring_enable(nc->peer, 1);
478 }
479
f394b2e2 480 if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
fed699f9
JW
481 return 0;
482 }
483
484 return tap_enable(nc->peer);
485}
486
487static int peer_detach(VirtIONet *n, int index)
488{
489 NetClientState *nc = qemu_get_subqueue(n->nic, index);
490
491 if (!nc->peer) {
492 return 0;
493 }
494
f394b2e2 495 if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
7263a0ad
CO
496 vhost_set_vring_enable(nc->peer, 0);
497 }
498
f394b2e2 499 if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
fed699f9
JW
500 return 0;
501 }
502
503 return tap_disable(nc->peer);
504}
505
506static void virtio_net_set_queues(VirtIONet *n)
507{
508 int i;
ddfa83ea 509 int r;
fed699f9
JW
510
511 for (i = 0; i < n->max_queues; i++) {
512 if (i < n->curr_queues) {
ddfa83ea
JS
513 r = peer_attach(n, i);
514 assert(!r);
fed699f9 515 } else {
ddfa83ea
JS
516 r = peer_detach(n, i);
517 assert(!r);
fed699f9
JW
518 }
519 }
520}
521
ec57db16 522static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
fed699f9 523
9d5b731d
JW
524static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
525 Error **errp)
fbe78f4f 526{
17a0ca55 527 VirtIONet *n = VIRTIO_NET(vdev);
b356f76d 528 NetClientState *nc = qemu_get_queue(n->nic);
fbe78f4f 529
da3e8a23
SZ
530 /* Firstly sync all virtio-net possible supported features */
531 features |= n->host_features;
532
0cd09c3a 533 virtio_add_feature(&features, VIRTIO_NET_F_MAC);
c9f79a3f 534
6e371ab8 535 if (!peer_has_vnet_hdr(n)) {
0cd09c3a
CH
536 virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
537 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
538 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
539 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
8172539d 540
0cd09c3a
CH
541 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
542 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
543 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
544 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
8172539d 545 }
3a330134 546
8172539d 547 if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
0cd09c3a
CH
548 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
549 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
3a330134
MM
550 }
551
ed8b4afe 552 if (!get_vhost_net(nc->peer)) {
9bc6304c
MT
553 return features;
554 }
ed8b4afe 555 return vhost_net_get_features(get_vhost_net(nc->peer), features);
fbe78f4f
AL
556}
557
019a3edb 558static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
8eca6b1b 559{
019a3edb 560 uint64_t features = 0;
8eca6b1b
AL
561
562 /* Linux kernel 2.6.25. It understood MAC (as everyone must),
563 * but also these: */
0cd09c3a
CH
564 virtio_add_feature(&features, VIRTIO_NET_F_MAC);
565 virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
566 virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
567 virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
568 virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
8eca6b1b 569
8172539d 570 return features;
8eca6b1b
AL
571}
572
644c9858
DF
573static void virtio_net_apply_guest_offloads(VirtIONet *n)
574{
ad37bb3b 575 qemu_set_offload(qemu_get_queue(n->nic)->peer,
644c9858
DF
576 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
577 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
578 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
579 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
580 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
581}
582
583static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
584{
585 static const uint64_t guest_offloads_mask =
586 (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
587 (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
588 (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
589 (1ULL << VIRTIO_NET_F_GUEST_ECN) |
590 (1ULL << VIRTIO_NET_F_GUEST_UFO);
591
592 return guest_offloads_mask & features;
593}
594
595static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
596{
597 VirtIODevice *vdev = VIRTIO_DEVICE(n);
598 return virtio_net_guest_offloads_by_features(vdev->guest_features);
599}
600
d5aaa1b0 601static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
fbe78f4f 602{
17a0ca55 603 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9
JW
604 int i;
605
ef546f12 606 virtio_net_set_multiqueue(n,
95129d6f 607 virtio_has_feature(features, VIRTIO_NET_F_MQ));
fbe78f4f 608
ef546f12 609 virtio_net_set_mrg_rx_bufs(n,
95129d6f
CH
610 virtio_has_feature(features,
611 VIRTIO_NET_F_MRG_RXBUF),
612 virtio_has_feature(features,
613 VIRTIO_F_VERSION_1));
f5436dd9
MM
614
615 if (n->has_vnet_hdr) {
644c9858
DF
616 n->curr_guest_offloads =
617 virtio_net_guest_offloads_by_features(features);
618 virtio_net_apply_guest_offloads(n);
f5436dd9 619 }
fed699f9
JW
620
621 for (i = 0; i < n->max_queues; i++) {
622 NetClientState *nc = qemu_get_subqueue(n->nic, i);
623
ed8b4afe 624 if (!get_vhost_net(nc->peer)) {
fed699f9
JW
625 continue;
626 }
ed8b4afe 627 vhost_net_ack_features(get_vhost_net(nc->peer), features);
dc14a397 628 }
0b1eaa88 629
95129d6f 630 if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
0b1eaa88
SF
631 memset(n->vlans, 0, MAX_VLAN >> 3);
632 } else {
633 memset(n->vlans, 0xff, MAX_VLAN >> 3);
634 }
fbe78f4f
AL
635}
636
002437cd 637static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
921ac5d0 638 struct iovec *iov, unsigned int iov_cnt)
002437cd
AL
639{
640 uint8_t on;
921ac5d0 641 size_t s;
b1be4280 642 NetClientState *nc = qemu_get_queue(n->nic);
002437cd 643
921ac5d0
MT
644 s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
645 if (s != sizeof(on)) {
646 return VIRTIO_NET_ERR;
002437cd
AL
647 }
648
dd23454b 649 if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
002437cd 650 n->promisc = on;
dd23454b 651 } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
002437cd 652 n->allmulti = on;
dd23454b 653 } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
015cb166 654 n->alluni = on;
dd23454b 655 } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
015cb166 656 n->nomulti = on;
dd23454b 657 } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
015cb166 658 n->nouni = on;
dd23454b 659 } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
015cb166 660 n->nobcast = on;
921ac5d0 661 } else {
002437cd 662 return VIRTIO_NET_ERR;
921ac5d0 663 }
002437cd 664
b1be4280
AK
665 rxfilter_notify(nc);
666
002437cd
AL
667 return VIRTIO_NET_OK;
668}
669
644c9858
DF
670static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
671 struct iovec *iov, unsigned int iov_cnt)
672{
673 VirtIODevice *vdev = VIRTIO_DEVICE(n);
674 uint64_t offloads;
675 size_t s;
676
95129d6f 677 if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
644c9858
DF
678 return VIRTIO_NET_ERR;
679 }
680
681 s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
682 if (s != sizeof(offloads)) {
683 return VIRTIO_NET_ERR;
684 }
685
686 if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
687 uint64_t supported_offloads;
688
689 if (!n->has_vnet_hdr) {
690 return VIRTIO_NET_ERR;
691 }
692
693 supported_offloads = virtio_net_supported_guest_offloads(n);
694 if (offloads & ~supported_offloads) {
695 return VIRTIO_NET_ERR;
696 }
697
698 n->curr_guest_offloads = offloads;
699 virtio_net_apply_guest_offloads(n);
700
701 return VIRTIO_NET_OK;
702 } else {
703 return VIRTIO_NET_ERR;
704 }
705}
706
b6503ed9 707static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
921ac5d0 708 struct iovec *iov, unsigned int iov_cnt)
b6503ed9 709{
1399c60d 710 VirtIODevice *vdev = VIRTIO_DEVICE(n);
b6503ed9 711 struct virtio_net_ctrl_mac mac_data;
921ac5d0 712 size_t s;
b1be4280 713 NetClientState *nc = qemu_get_queue(n->nic);
b6503ed9 714
c1943a3f
AK
715 if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
716 if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
717 return VIRTIO_NET_ERR;
718 }
719 s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
720 assert(s == sizeof(n->mac));
b356f76d 721 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
b1be4280
AK
722 rxfilter_notify(nc);
723
c1943a3f
AK
724 return VIRTIO_NET_OK;
725 }
726
921ac5d0 727 if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
b6503ed9 728 return VIRTIO_NET_ERR;
921ac5d0 729 }
b6503ed9 730
cae2e556
AK
731 int in_use = 0;
732 int first_multi = 0;
733 uint8_t uni_overflow = 0;
734 uint8_t multi_overflow = 0;
735 uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
b6503ed9 736
921ac5d0
MT
737 s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
738 sizeof(mac_data.entries));
1399c60d 739 mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
921ac5d0 740 if (s != sizeof(mac_data.entries)) {
b1be4280 741 goto error;
921ac5d0
MT
742 }
743 iov_discard_front(&iov, &iov_cnt, s);
b6503ed9 744
921ac5d0 745 if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
b1be4280 746 goto error;
921ac5d0 747 }
b6503ed9
AL
748
749 if (mac_data.entries <= MAC_TABLE_ENTRIES) {
cae2e556 750 s = iov_to_buf(iov, iov_cnt, 0, macs,
921ac5d0
MT
751 mac_data.entries * ETH_ALEN);
752 if (s != mac_data.entries * ETH_ALEN) {
b1be4280 753 goto error;
921ac5d0 754 }
cae2e556 755 in_use += mac_data.entries;
b6503ed9 756 } else {
cae2e556 757 uni_overflow = 1;
b6503ed9
AL
758 }
759
921ac5d0
MT
760 iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
761
cae2e556 762 first_multi = in_use;
2d9aba39 763
921ac5d0
MT
764 s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
765 sizeof(mac_data.entries));
1399c60d 766 mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
921ac5d0 767 if (s != sizeof(mac_data.entries)) {
b1be4280 768 goto error;
921ac5d0
MT
769 }
770
771 iov_discard_front(&iov, &iov_cnt, s);
b6503ed9 772
921ac5d0 773 if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
b1be4280 774 goto error;
921ac5d0 775 }
b6503ed9 776
edc24385 777 if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
cae2e556 778 s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
921ac5d0
MT
779 mac_data.entries * ETH_ALEN);
780 if (s != mac_data.entries * ETH_ALEN) {
b1be4280 781 goto error;
8fd2a2f1 782 }
cae2e556 783 in_use += mac_data.entries;
921ac5d0 784 } else {
cae2e556 785 multi_overflow = 1;
b6503ed9
AL
786 }
787
cae2e556
AK
788 n->mac_table.in_use = in_use;
789 n->mac_table.first_multi = first_multi;
790 n->mac_table.uni_overflow = uni_overflow;
791 n->mac_table.multi_overflow = multi_overflow;
792 memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
793 g_free(macs);
b1be4280
AK
794 rxfilter_notify(nc);
795
b6503ed9 796 return VIRTIO_NET_OK;
b1be4280
AK
797
798error:
cae2e556 799 g_free(macs);
b1be4280 800 return VIRTIO_NET_ERR;
b6503ed9
AL
801}
802
f21c0ed9 803static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
921ac5d0 804 struct iovec *iov, unsigned int iov_cnt)
f21c0ed9 805{
1399c60d 806 VirtIODevice *vdev = VIRTIO_DEVICE(n);
f21c0ed9 807 uint16_t vid;
921ac5d0 808 size_t s;
b1be4280 809 NetClientState *nc = qemu_get_queue(n->nic);
f21c0ed9 810
921ac5d0 811 s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
1399c60d 812 vid = virtio_lduw_p(vdev, &vid);
921ac5d0 813 if (s != sizeof(vid)) {
f21c0ed9
AL
814 return VIRTIO_NET_ERR;
815 }
816
f21c0ed9
AL
817 if (vid >= MAX_VLAN)
818 return VIRTIO_NET_ERR;
819
820 if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
821 n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
822 else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
823 n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
824 else
825 return VIRTIO_NET_ERR;
826
b1be4280
AK
827 rxfilter_notify(nc);
828
f21c0ed9
AL
829 return VIRTIO_NET_OK;
830}
831
f57fcf70
JW
832static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
833 struct iovec *iov, unsigned int iov_cnt)
834{
835 if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
836 n->status & VIRTIO_NET_S_ANNOUNCE) {
837 n->status &= ~VIRTIO_NET_S_ANNOUNCE;
838 if (n->announce_counter) {
839 timer_mod(n->announce_timer,
840 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL) +
841 self_announce_delay(n->announce_counter));
842 }
843 return VIRTIO_NET_OK;
844 } else {
845 return VIRTIO_NET_ERR;
846 }
847}
848
fed699f9 849static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
f8f7c533 850 struct iovec *iov, unsigned int iov_cnt)
fed699f9 851{
17a0ca55 852 VirtIODevice *vdev = VIRTIO_DEVICE(n);
f8f7c533
JW
853 struct virtio_net_ctrl_mq mq;
854 size_t s;
855 uint16_t queues;
fed699f9 856
f8f7c533
JW
857 s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
858 if (s != sizeof(mq)) {
fed699f9
JW
859 return VIRTIO_NET_ERR;
860 }
861
862 if (cmd != VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
863 return VIRTIO_NET_ERR;
864 }
865
1399c60d 866 queues = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
fed699f9 867
f8f7c533
JW
868 if (queues < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
869 queues > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
870 queues > n->max_queues ||
fed699f9
JW
871 !n->multiqueue) {
872 return VIRTIO_NET_ERR;
873 }
874
f8f7c533 875 n->curr_queues = queues;
fed699f9
JW
876 /* stop the backend before changing the number of queues to avoid handling a
877 * disabled queue */
17a0ca55 878 virtio_net_set_status(vdev, vdev->status);
fed699f9
JW
879 virtio_net_set_queues(n);
880
881 return VIRTIO_NET_OK;
882}
ba7eadb5 883
3d11d36c
AL
884static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
885{
17a0ca55 886 VirtIONet *n = VIRTIO_NET(vdev);
3d11d36c
AL
887 struct virtio_net_ctrl_hdr ctrl;
888 virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
51b19ebe 889 VirtQueueElement *elem;
921ac5d0 890 size_t s;
771b6ed3 891 struct iovec *iov, *iov2;
921ac5d0 892 unsigned int iov_cnt;
3d11d36c 893
51b19ebe
PB
894 for (;;) {
895 elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
896 if (!elem) {
897 break;
898 }
899 if (iov_size(elem->in_sg, elem->in_num) < sizeof(status) ||
900 iov_size(elem->out_sg, elem->out_num) < sizeof(ctrl)) {
ba7eadb5
GK
901 virtio_error(vdev, "virtio-net ctrl missing headers");
902 virtqueue_detach_element(vq, elem, 0);
903 g_free(elem);
904 break;
3d11d36c
AL
905 }
906
51b19ebe
PB
907 iov_cnt = elem->out_num;
908 iov2 = iov = g_memdup(elem->out_sg, sizeof(struct iovec) * elem->out_num);
921ac5d0
MT
909 s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl));
910 iov_discard_front(&iov, &iov_cnt, sizeof(ctrl));
911 if (s != sizeof(ctrl)) {
912 status = VIRTIO_NET_ERR;
dd23454b 913 } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
921ac5d0
MT
914 status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt);
915 } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
916 status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt);
917 } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
918 status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt);
f57fcf70
JW
919 } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
920 status = virtio_net_handle_announce(n, ctrl.cmd, iov, iov_cnt);
fed699f9 921 } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
f8f7c533 922 status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt);
644c9858
DF
923 } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
924 status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt);
3d11d36c
AL
925 }
926
51b19ebe 927 s = iov_from_buf(elem->in_sg, elem->in_num, 0, &status, sizeof(status));
921ac5d0 928 assert(s == sizeof(status));
3d11d36c 929
51b19ebe 930 virtqueue_push(vq, elem, sizeof(status));
3d11d36c 931 virtio_notify(vdev, vq);
771b6ed3 932 g_free(iov2);
51b19ebe 933 g_free(elem);
3d11d36c
AL
934 }
935}
936
fbe78f4f
AL
937/* RX */
938
939static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
940{
17a0ca55 941 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 942 int queue_index = vq2q(virtio_get_queue_index(vq));
8aeff62d 943
fed699f9 944 qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
fbe78f4f
AL
945}
946
4e68f7a0 947static int virtio_net_can_receive(NetClientState *nc)
fbe78f4f 948{
cc1f0f45 949 VirtIONet *n = qemu_get_nic_opaque(nc);
17a0ca55 950 VirtIODevice *vdev = VIRTIO_DEVICE(n);
fed699f9 951 VirtIONetQueue *q = virtio_net_get_subqueue(nc);
0c87e93e 952
17a0ca55 953 if (!vdev->vm_running) {
95477323
MT
954 return 0;
955 }
cdd5cc12 956
fed699f9
JW
957 if (nc->queue_index >= n->curr_queues) {
958 return 0;
959 }
960
0c87e93e 961 if (!virtio_queue_ready(q->rx_vq) ||
17a0ca55 962 !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
fbe78f4f 963 return 0;
0c87e93e 964 }
fbe78f4f 965
cdd5cc12
MM
966 return 1;
967}
968
0c87e93e 969static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
cdd5cc12 970{
0c87e93e
JW
971 VirtIONet *n = q->n;
972 if (virtio_queue_empty(q->rx_vq) ||
fbe78f4f 973 (n->mergeable_rx_bufs &&
0c87e93e
JW
974 !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
975 virtio_queue_set_notification(q->rx_vq, 1);
06b12970
TL
976
977 /* To avoid a race condition where the guest has made some buffers
978 * available after the above check but before notification was
979 * enabled, check for available buffers again.
980 */
0c87e93e 981 if (virtio_queue_empty(q->rx_vq) ||
06b12970 982 (n->mergeable_rx_bufs &&
0c87e93e 983 !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
06b12970 984 return 0;
0c87e93e 985 }
fbe78f4f
AL
986 }
987
0c87e93e 988 virtio_queue_set_notification(q->rx_vq, 0);
fbe78f4f
AL
989 return 1;
990}
991
1399c60d 992static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
032a74a1 993{
1399c60d
RR
994 virtio_tswap16s(vdev, &hdr->hdr_len);
995 virtio_tswap16s(vdev, &hdr->gso_size);
996 virtio_tswap16s(vdev, &hdr->csum_start);
997 virtio_tswap16s(vdev, &hdr->csum_offset);
032a74a1
CLG
998}
999
1d41b0c1
AL
1000/* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
1001 * it never finds out that the packets don't have valid checksums. This
1002 * causes dhclient to get upset. Fedora's carried a patch for ages to
1003 * fix this with Xen but it hasn't appeared in an upstream release of
1004 * dhclient yet.
1005 *
1006 * To avoid breaking existing guests, we catch udp packets and add
1007 * checksums. This is terrible but it's better than hacking the guest
1008 * kernels.
1009 *
1010 * N.B. if we introduce a zero-copy API, this operation is no longer free so
1011 * we should provide a mechanism to disable it to avoid polluting the host
1012 * cache.
1013 */
1014static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
22cc84db 1015 uint8_t *buf, size_t size)
1d41b0c1
AL
1016{
1017 if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
1018 (size > 27 && size < 1500) && /* normal sized MTU */
1019 (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
1020 (buf[23] == 17) && /* ip.protocol == UDP */
1021 (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
22cc84db 1022 net_checksum_calculate(buf, size);
1d41b0c1
AL
1023 hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
1024 }
1025}
1026
280598b7
MT
1027static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
1028 const void *buf, size_t size)
fbe78f4f 1029{
3a330134 1030 if (n->has_vnet_hdr) {
22cc84db
MT
1031 /* FIXME this cast is evil */
1032 void *wbuf = (void *)buf;
280598b7
MT
1033 work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
1034 size - n->host_hdr_len);
1bfa316c
GK
1035
1036 if (n->needs_vnet_hdr_swap) {
1037 virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
1038 }
280598b7 1039 iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
22cc84db
MT
1040 } else {
1041 struct virtio_net_hdr hdr = {
1042 .flags = 0,
1043 .gso_type = VIRTIO_NET_HDR_GSO_NONE
1044 };
1045 iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
3a330134 1046 }
fbe78f4f
AL
1047}
1048
3831ab20
AL
1049static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
1050{
1051 static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
f21c0ed9 1052 static const uint8_t vlan[] = {0x81, 0x00};
3831ab20 1053 uint8_t *ptr = (uint8_t *)buf;
b6503ed9 1054 int i;
3831ab20
AL
1055
1056 if (n->promisc)
1057 return 1;
1058
e043ebc6 1059 ptr += n->host_hdr_len;
3a330134 1060
f21c0ed9 1061 if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
7542d3e7 1062 int vid = lduw_be_p(ptr + 14) & 0xfff;
f21c0ed9
AL
1063 if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
1064 return 0;
1065 }
1066
bbe2f399
AW
1067 if (ptr[0] & 1) { // multicast
1068 if (!memcmp(ptr, bcast, sizeof(bcast))) {
015cb166
AW
1069 return !n->nobcast;
1070 } else if (n->nomulti) {
1071 return 0;
8fd2a2f1 1072 } else if (n->allmulti || n->mac_table.multi_overflow) {
bbe2f399
AW
1073 return 1;
1074 }
2d9aba39
AW
1075
1076 for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
1077 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
1078 return 1;
1079 }
1080 }
bbe2f399 1081 } else { // unicast
015cb166
AW
1082 if (n->nouni) {
1083 return 0;
1084 } else if (n->alluni || n->mac_table.uni_overflow) {
8fd2a2f1
AW
1085 return 1;
1086 } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
bbe2f399
AW
1087 return 1;
1088 }
3831ab20 1089
2d9aba39
AW
1090 for (i = 0; i < n->mac_table.first_multi; i++) {
1091 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
1092 return 1;
1093 }
1094 }
b6503ed9
AL
1095 }
1096
3831ab20
AL
1097 return 0;
1098}
1099
4e68f7a0 1100static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, size_t size)
fbe78f4f 1101{
cc1f0f45 1102 VirtIONet *n = qemu_get_nic_opaque(nc);
fed699f9 1103 VirtIONetQueue *q = virtio_net_get_subqueue(nc);
17a0ca55 1104 VirtIODevice *vdev = VIRTIO_DEVICE(n);
63c58728
MT
1105 struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
1106 struct virtio_net_hdr_mrg_rxbuf mhdr;
1107 unsigned mhdr_cnt = 0;
22cc84db 1108 size_t offset, i, guest_offset;
fbe78f4f 1109
fed699f9 1110 if (!virtio_net_can_receive(nc)) {
cdd5cc12 1111 return -1;
b356f76d 1112 }
cdd5cc12 1113
940cda94 1114 /* hdr_len refers to the header we supply to the guest */
0c87e93e 1115 if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
8aeff62d 1116 return 0;
0c87e93e 1117 }
fbe78f4f 1118
3831ab20 1119 if (!receive_filter(n, buf, size))
4f1c942b 1120 return size;
3831ab20 1121
fbe78f4f
AL
1122 offset = i = 0;
1123
1124 while (offset < size) {
51b19ebe 1125 VirtQueueElement *elem;
fbe78f4f 1126 int len, total;
51b19ebe 1127 const struct iovec *sg;
fbe78f4f 1128
22c253d9 1129 total = 0;
fbe78f4f 1130
51b19ebe
PB
1131 elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
1132 if (!elem) {
ba10b9c0
GK
1133 if (i) {
1134 virtio_error(vdev, "virtio-net unexpected empty queue: "
1135 "i %zd mergeable %d offset %zd, size %zd, "
1136 "guest hdr len %zd, host hdr len %zd "
1137 "guest features 0x%" PRIx64,
1138 i, n->mergeable_rx_bufs, offset, size,
1139 n->guest_hdr_len, n->host_hdr_len,
1140 vdev->guest_features);
1141 }
1142 return -1;
fbe78f4f
AL
1143 }
1144
51b19ebe 1145 if (elem->in_num < 1) {
ba10b9c0
GK
1146 virtio_error(vdev,
1147 "virtio-net receive queue contains no in buffers");
1148 virtqueue_detach_element(q->rx_vq, elem, 0);
1149 g_free(elem);
1150 return -1;
fbe78f4f
AL
1151 }
1152
51b19ebe 1153 sg = elem->in_sg;
fbe78f4f 1154 if (i == 0) {
c8d28e7e 1155 assert(offset == 0);
63c58728
MT
1156 if (n->mergeable_rx_bufs) {
1157 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
51b19ebe 1158 sg, elem->in_num,
63c58728
MT
1159 offsetof(typeof(mhdr), num_buffers),
1160 sizeof(mhdr.num_buffers));
1161 }
fbe78f4f 1162
51b19ebe 1163 receive_header(n, sg, elem->in_num, buf, size);
c8d28e7e 1164 offset = n->host_hdr_len;
e35e23f6 1165 total += n->guest_hdr_len;
22cc84db
MT
1166 guest_offset = n->guest_hdr_len;
1167 } else {
1168 guest_offset = 0;
fbe78f4f
AL
1169 }
1170
1171 /* copy in packet. ugh */
51b19ebe 1172 len = iov_from_buf(sg, elem->in_num, guest_offset,
dcf6f5e1 1173 buf + offset, size - offset);
fbe78f4f 1174 total += len;
279a4253
MT
1175 offset += len;
1176 /* If buffers can't be merged, at this point we
1177 * must have consumed the complete packet.
1178 * Otherwise, drop it. */
1179 if (!n->mergeable_rx_bufs && offset < size) {
51b19ebe
PB
1180 virtqueue_discard(q->rx_vq, elem, total);
1181 g_free(elem);
279a4253
MT
1182 return size;
1183 }
fbe78f4f
AL
1184
1185 /* signal other side */
51b19ebe
PB
1186 virtqueue_fill(q->rx_vq, elem, total, i++);
1187 g_free(elem);
fbe78f4f
AL
1188 }
1189
63c58728 1190 if (mhdr_cnt) {
1399c60d 1191 virtio_stw_p(vdev, &mhdr.num_buffers, i);
63c58728
MT
1192 iov_from_buf(mhdr_sg, mhdr_cnt,
1193 0,
1194 &mhdr.num_buffers, sizeof mhdr.num_buffers);
44b15bc5 1195 }
fbe78f4f 1196
0c87e93e 1197 virtqueue_flush(q->rx_vq, i);
17a0ca55 1198 virtio_notify(vdev, q->rx_vq);
4f1c942b
MM
1199
1200 return size;
fbe78f4f
AL
1201}
1202
0c87e93e 1203static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
6243375f 1204
4e68f7a0 1205static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
6243375f 1206{
cc1f0f45 1207 VirtIONet *n = qemu_get_nic_opaque(nc);
fed699f9 1208 VirtIONetQueue *q = virtio_net_get_subqueue(nc);
17a0ca55 1209 VirtIODevice *vdev = VIRTIO_DEVICE(n);
6243375f 1210
51b19ebe 1211 virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
17a0ca55 1212 virtio_notify(vdev, q->tx_vq);
6243375f 1213
51b19ebe
PB
1214 g_free(q->async_tx.elem);
1215 q->async_tx.elem = NULL;
6243375f 1216
0c87e93e
JW
1217 virtio_queue_set_notification(q->tx_vq, 1);
1218 virtio_net_flush_tx(q);
6243375f
MM
1219}
1220
fbe78f4f 1221/* TX */
0c87e93e 1222static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
fbe78f4f 1223{
0c87e93e 1224 VirtIONet *n = q->n;
17a0ca55 1225 VirtIODevice *vdev = VIRTIO_DEVICE(n);
51b19ebe 1226 VirtQueueElement *elem;
e3f30488 1227 int32_t num_packets = 0;
fed699f9 1228 int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
17a0ca55 1229 if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
e3f30488
AW
1230 return num_packets;
1231 }
fbe78f4f 1232
51b19ebe 1233 if (q->async_tx.elem) {
0c87e93e 1234 virtio_queue_set_notification(q->tx_vq, 0);
e3f30488 1235 return num_packets;
6243375f
MM
1236 }
1237
51b19ebe 1238 for (;;) {
bd89dd98 1239 ssize_t ret;
51b19ebe
PB
1240 unsigned int out_num;
1241 struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
feb93f36 1242 struct virtio_net_hdr_mrg_rxbuf mhdr;
fbe78f4f 1243
51b19ebe
PB
1244 elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
1245 if (!elem) {
1246 break;
1247 }
1248
1249 out_num = elem->out_num;
1250 out_sg = elem->out_sg;
7b80d08e 1251 if (out_num < 1) {
e7b43f7e 1252 error_report("virtio-net header not in first element");
fbe78f4f
AL
1253 exit(1);
1254 }
1255
032a74a1 1256 if (n->has_vnet_hdr) {
feb93f36
JW
1257 if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
1258 n->guest_hdr_len) {
032a74a1
CLG
1259 error_report("virtio-net header incorrect");
1260 exit(1);
1261 }
1bfa316c 1262 if (n->needs_vnet_hdr_swap) {
feb93f36
JW
1263 virtio_net_hdr_swap(vdev, (void *) &mhdr);
1264 sg2[0].iov_base = &mhdr;
1265 sg2[0].iov_len = n->guest_hdr_len;
1266 out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
1267 out_sg, out_num,
1268 n->guest_hdr_len, -1);
1269 if (out_num == VIRTQUEUE_MAX_SIZE) {
1270 goto drop;
1271 }
1272 out_num += 1;
1273 out_sg = sg2;
1274 }
032a74a1 1275 }
14761f9c
MT
1276 /*
1277 * If host wants to see the guest header as is, we can
1278 * pass it on unchanged. Otherwise, copy just the parts
1279 * that host is interested in.
1280 */
1281 assert(n->host_hdr_len <= n->guest_hdr_len);
1282 if (n->host_hdr_len != n->guest_hdr_len) {
1283 unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
1284 out_sg, out_num,
1285 0, n->host_hdr_len);
1286 sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
1287 out_sg, out_num,
1288 n->guest_hdr_len, -1);
1289 out_num = sg_num;
1290 out_sg = sg;
fbe78f4f
AL
1291 }
1292
fed699f9
JW
1293 ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
1294 out_sg, out_num, virtio_net_tx_complete);
6243375f 1295 if (ret == 0) {
0c87e93e
JW
1296 virtio_queue_set_notification(q->tx_vq, 0);
1297 q->async_tx.elem = elem;
e3f30488 1298 return -EBUSY;
6243375f
MM
1299 }
1300
feb93f36 1301drop:
51b19ebe 1302 virtqueue_push(q->tx_vq, elem, 0);
17a0ca55 1303 virtio_notify(vdev, q->tx_vq);
51b19ebe 1304 g_free(elem);
e3f30488
AW
1305
1306 if (++num_packets >= n->tx_burst) {
1307 break;
1308 }
fbe78f4f 1309 }
e3f30488 1310 return num_packets;
fbe78f4f
AL
1311}
1312
a697a334 1313static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
fbe78f4f 1314{
17a0ca55 1315 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1316 VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
fbe78f4f 1317
783e7706 1318 /* This happens when device was stopped but VCPU wasn't. */
17a0ca55 1319 if (!vdev->vm_running) {
0c87e93e 1320 q->tx_waiting = 1;
783e7706
MT
1321 return;
1322 }
1323
0c87e93e 1324 if (q->tx_waiting) {
fbe78f4f 1325 virtio_queue_set_notification(vq, 1);
bc72ad67 1326 timer_del(q->tx_timer);
0c87e93e
JW
1327 q->tx_waiting = 0;
1328 virtio_net_flush_tx(q);
fbe78f4f 1329 } else {
bc72ad67
AB
1330 timer_mod(q->tx_timer,
1331 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
0c87e93e 1332 q->tx_waiting = 1;
fbe78f4f
AL
1333 virtio_queue_set_notification(vq, 0);
1334 }
1335}
1336
a697a334
AW
1337static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
1338{
17a0ca55 1339 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1340 VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
a697a334 1341
0c87e93e 1342 if (unlikely(q->tx_waiting)) {
a697a334
AW
1343 return;
1344 }
0c87e93e 1345 q->tx_waiting = 1;
783e7706 1346 /* This happens when device was stopped but VCPU wasn't. */
17a0ca55 1347 if (!vdev->vm_running) {
783e7706
MT
1348 return;
1349 }
a697a334 1350 virtio_queue_set_notification(vq, 0);
0c87e93e 1351 qemu_bh_schedule(q->tx_bh);
a697a334
AW
1352}
1353
fbe78f4f
AL
1354static void virtio_net_tx_timer(void *opaque)
1355{
0c87e93e
JW
1356 VirtIONetQueue *q = opaque;
1357 VirtIONet *n = q->n;
17a0ca55 1358 VirtIODevice *vdev = VIRTIO_DEVICE(n);
e8bcf842
MT
1359 /* This happens when device was stopped but BH wasn't. */
1360 if (!vdev->vm_running) {
1361 /* Make sure tx waiting is set, so we'll run when restarted. */
1362 assert(q->tx_waiting);
1363 return;
1364 }
fbe78f4f 1365
0c87e93e 1366 q->tx_waiting = 0;
fbe78f4f
AL
1367
1368 /* Just in case the driver is not ready on more */
17a0ca55 1369 if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
fbe78f4f 1370 return;
17a0ca55 1371 }
fbe78f4f 1372
0c87e93e
JW
1373 virtio_queue_set_notification(q->tx_vq, 1);
1374 virtio_net_flush_tx(q);
fbe78f4f
AL
1375}
1376
a697a334
AW
1377static void virtio_net_tx_bh(void *opaque)
1378{
0c87e93e
JW
1379 VirtIONetQueue *q = opaque;
1380 VirtIONet *n = q->n;
17a0ca55 1381 VirtIODevice *vdev = VIRTIO_DEVICE(n);
a697a334
AW
1382 int32_t ret;
1383
e8bcf842
MT
1384 /* This happens when device was stopped but BH wasn't. */
1385 if (!vdev->vm_running) {
1386 /* Make sure tx waiting is set, so we'll run when restarted. */
1387 assert(q->tx_waiting);
1388 return;
1389 }
783e7706 1390
0c87e93e 1391 q->tx_waiting = 0;
a697a334
AW
1392
1393 /* Just in case the driver is not ready on more */
17a0ca55 1394 if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
a697a334 1395 return;
17a0ca55 1396 }
a697a334 1397
0c87e93e 1398 ret = virtio_net_flush_tx(q);
a697a334
AW
1399 if (ret == -EBUSY) {
1400 return; /* Notification re-enable handled by tx_complete */
1401 }
1402
1403 /* If we flush a full burst of packets, assume there are
1404 * more coming and immediately reschedule */
1405 if (ret >= n->tx_burst) {
0c87e93e
JW
1406 qemu_bh_schedule(q->tx_bh);
1407 q->tx_waiting = 1;
a697a334
AW
1408 return;
1409 }
1410
1411 /* If less than a full burst, re-enable notification and flush
1412 * anything that may have come in while we weren't looking. If
1413 * we find something, assume the guest is still active and reschedule */
0c87e93e
JW
1414 virtio_queue_set_notification(q->tx_vq, 1);
1415 if (virtio_net_flush_tx(q) > 0) {
1416 virtio_queue_set_notification(q->tx_vq, 0);
1417 qemu_bh_schedule(q->tx_bh);
1418 q->tx_waiting = 1;
a697a334
AW
1419 }
1420}
1421
f9d6dbf0
WC
1422static void virtio_net_add_queue(VirtIONet *n, int index)
1423{
1424 VirtIODevice *vdev = VIRTIO_DEVICE(n);
1425
1c0fbfa3
MT
1426 n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
1427 virtio_net_handle_rx);
f9d6dbf0
WC
1428 if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
1429 n->vqs[index].tx_vq =
1430 virtio_add_queue(vdev, 256, virtio_net_handle_tx_timer);
1431 n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
1432 virtio_net_tx_timer,
1433 &n->vqs[index]);
1434 } else {
1435 n->vqs[index].tx_vq =
1436 virtio_add_queue(vdev, 256, virtio_net_handle_tx_bh);
1437 n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
1438 }
1439
1440 n->vqs[index].tx_waiting = 0;
1441 n->vqs[index].n = n;
1442}
1443
1444static void virtio_net_del_queue(VirtIONet *n, int index)
1445{
1446 VirtIODevice *vdev = VIRTIO_DEVICE(n);
1447 VirtIONetQueue *q = &n->vqs[index];
1448 NetClientState *nc = qemu_get_subqueue(n->nic, index);
1449
1450 qemu_purge_queued_packets(nc);
1451
1452 virtio_del_queue(vdev, index * 2);
1453 if (q->tx_timer) {
1454 timer_del(q->tx_timer);
1455 timer_free(q->tx_timer);
1456 } else {
1457 qemu_bh_delete(q->tx_bh);
1458 }
1459 virtio_del_queue(vdev, index * 2 + 1);
1460}
1461
1462static void virtio_net_change_num_queues(VirtIONet *n, int new_max_queues)
1463{
1464 VirtIODevice *vdev = VIRTIO_DEVICE(n);
1465 int old_num_queues = virtio_get_num_queues(vdev);
1466 int new_num_queues = new_max_queues * 2 + 1;
1467 int i;
1468
1469 assert(old_num_queues >= 3);
1470 assert(old_num_queues % 2 == 1);
1471
1472 if (old_num_queues == new_num_queues) {
1473 return;
1474 }
1475
1476 /*
1477 * We always need to remove and add ctrl vq if
1478 * old_num_queues != new_num_queues. Remove ctrl_vq first,
1479 * and then we only enter one of the following too loops.
1480 */
1481 virtio_del_queue(vdev, old_num_queues - 1);
1482
1483 for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
1484 /* new_num_queues < old_num_queues */
1485 virtio_net_del_queue(n, i / 2);
1486 }
1487
1488 for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
1489 /* new_num_queues > old_num_queues */
1490 virtio_net_add_queue(n, i / 2);
1491 }
1492
1493 /* add ctrl_vq last */
1494 n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
1495}
1496
ec57db16 1497static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
fed699f9 1498{
f9d6dbf0
WC
1499 int max = multiqueue ? n->max_queues : 1;
1500
fed699f9 1501 n->multiqueue = multiqueue;
f9d6dbf0 1502 virtio_net_change_num_queues(n, max);
fed699f9 1503
fed699f9
JW
1504 virtio_net_set_queues(n);
1505}
1506
290c2428 1507static void virtio_net_save(QEMUFile *f, void *opaque, size_t size)
fbe78f4f
AL
1508{
1509 VirtIONet *n = opaque;
17a0ca55 1510 VirtIODevice *vdev = VIRTIO_DEVICE(n);
fbe78f4f 1511
afbaa7b4
MT
1512 /* At this point, backend must be stopped, otherwise
1513 * it might keep writing to memory. */
1514 assert(!n->vhost_started);
17a0ca55 1515 virtio_save(vdev, f);
037dab2f
GK
1516}
1517
1518static void virtio_net_save_device(VirtIODevice *vdev, QEMUFile *f)
1519{
1520 VirtIONet *n = VIRTIO_NET(vdev);
1521 int i;
fbe78f4f 1522
79674068 1523 qemu_put_buffer(f, n->mac, ETH_ALEN);
5f800801 1524 qemu_put_be32(f, n->vqs[0].tx_waiting);
e46cb38f 1525 qemu_put_be32(f, n->mergeable_rx_bufs);
9d6271b8 1526 qemu_put_be16(f, n->status);
f10c592e
AW
1527 qemu_put_byte(f, n->promisc);
1528 qemu_put_byte(f, n->allmulti);
b6503ed9
AL
1529 qemu_put_be32(f, n->mac_table.in_use);
1530 qemu_put_buffer(f, n->mac_table.macs, n->mac_table.in_use * ETH_ALEN);
f21c0ed9 1531 qemu_put_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
3a330134 1532 qemu_put_be32(f, n->has_vnet_hdr);
8fd2a2f1
AW
1533 qemu_put_byte(f, n->mac_table.multi_overflow);
1534 qemu_put_byte(f, n->mac_table.uni_overflow);
015cb166
AW
1535 qemu_put_byte(f, n->alluni);
1536 qemu_put_byte(f, n->nomulti);
1537 qemu_put_byte(f, n->nouni);
1538 qemu_put_byte(f, n->nobcast);
0ce0e8f4 1539 qemu_put_byte(f, n->has_ufo);
5f800801
JW
1540 if (n->max_queues > 1) {
1541 qemu_put_be16(f, n->max_queues);
1542 qemu_put_be16(f, n->curr_queues);
1543 for (i = 1; i < n->curr_queues; i++) {
1544 qemu_put_be32(f, n->vqs[i].tx_waiting);
1545 }
1546 }
644c9858 1547
95129d6f 1548 if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
644c9858
DF
1549 qemu_put_be64(f, n->curr_guest_offloads);
1550 }
fbe78f4f
AL
1551}
1552
290c2428 1553static int virtio_net_load(QEMUFile *f, void *opaque, size_t size)
fbe78f4f
AL
1554{
1555 VirtIONet *n = opaque;
17a0ca55 1556 VirtIODevice *vdev = VIRTIO_DEVICE(n);
fbe78f4f 1557
290c2428 1558 return virtio_load(vdev, f, VIRTIO_NET_VM_VERSION);
037dab2f
GK
1559}
1560
1561static int virtio_net_load_device(VirtIODevice *vdev, QEMUFile *f,
1562 int version_id)
1563{
1564 VirtIONet *n = VIRTIO_NET(vdev);
1565 int i, link_down;
fbe78f4f 1566
79674068 1567 qemu_get_buffer(f, n->mac, ETH_ALEN);
5f800801 1568 n->vqs[0].tx_waiting = qemu_get_be32(f);
ff3a8066 1569
bb9d17f8 1570 virtio_net_set_mrg_rx_bufs(n, qemu_get_be32(f),
95129d6f
CH
1571 virtio_vdev_has_feature(vdev,
1572 VIRTIO_F_VERSION_1));
fbe78f4f 1573
76010cb3 1574 n->status = qemu_get_be16(f);
9d6271b8 1575
76010cb3
DDAG
1576 n->promisc = qemu_get_byte(f);
1577 n->allmulti = qemu_get_byte(f);
002437cd 1578
76010cb3
DDAG
1579 n->mac_table.in_use = qemu_get_be32(f);
1580 /* MAC_TABLE_ENTRIES may be different from the saved image */
1581 if (n->mac_table.in_use <= MAC_TABLE_ENTRIES) {
1582 qemu_get_buffer(f, n->mac_table.macs,
1583 n->mac_table.in_use * ETH_ALEN);
1584 } else {
1585 int64_t i;
1586
1587 /* Overflow detected - can happen if source has a larger MAC table.
1588 * We simply set overflow flag so there's no need to maintain the
1589 * table of addresses, discard them all.
1590 * Note: 64 bit math to avoid integer overflow.
1591 */
1592 for (i = 0; i < (int64_t)n->mac_table.in_use * ETH_ALEN; ++i) {
1593 qemu_get_byte(f);
b6503ed9 1594 }
76010cb3
DDAG
1595 n->mac_table.multi_overflow = n->mac_table.uni_overflow = 1;
1596 n->mac_table.in_use = 0;
b6503ed9
AL
1597 }
1598
76010cb3 1599 qemu_get_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
f21c0ed9 1600
76010cb3
DDAG
1601 if (qemu_get_be32(f) && !peer_has_vnet_hdr(n)) {
1602 error_report("virtio-net: saved image requires vnet_hdr=on");
1603 return -1;
6c042c16
AW
1604 }
1605
76010cb3
DDAG
1606 n->mac_table.multi_overflow = qemu_get_byte(f);
1607 n->mac_table.uni_overflow = qemu_get_byte(f);
8fd2a2f1 1608
76010cb3
DDAG
1609 n->alluni = qemu_get_byte(f);
1610 n->nomulti = qemu_get_byte(f);
1611 n->nouni = qemu_get_byte(f);
1612 n->nobcast = qemu_get_byte(f);
015cb166 1613
76010cb3
DDAG
1614 if (qemu_get_byte(f) && !peer_has_ufo(n)) {
1615 error_report("virtio-net: saved image requires TUN_F_UFO support");
1616 return -1;
0ce0e8f4
MM
1617 }
1618
5f800801
JW
1619 if (n->max_queues > 1) {
1620 if (n->max_queues != qemu_get_be16(f)) {
1621 error_report("virtio-net: different max_queues ");
1622 return -1;
1623 }
1624
1625 n->curr_queues = qemu_get_be16(f);
eea750a5
MT
1626 if (n->curr_queues > n->max_queues) {
1627 error_report("virtio-net: curr_queues %x > max_queues %x",
1628 n->curr_queues, n->max_queues);
1629 return -1;
1630 }
5f800801
JW
1631 for (i = 1; i < n->curr_queues; i++) {
1632 n->vqs[i].tx_waiting = qemu_get_be32(f);
1633 }
1634 }
1635
6c666823
MT
1636 if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
1637 n->curr_guest_offloads = qemu_get_be64(f);
1638 } else {
1639 n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
1640 }
1641
1642 if (peer_has_vnet_hdr(n)) {
1643 virtio_net_apply_guest_offloads(n);
1644 }
1645
5f800801
JW
1646 virtio_net_set_queues(n);
1647
2d9aba39
AW
1648 /* Find the first multicast entry in the saved MAC filter */
1649 for (i = 0; i < n->mac_table.in_use; i++) {
1650 if (n->mac_table.macs[i * ETH_ALEN] & 1) {
1651 break;
1652 }
1653 }
1654 n->mac_table.first_multi = i;
98991481
AK
1655
1656 /* nc.link_down can't be migrated, so infer link_down according
1657 * to link status bit in n->status */
5f800801
JW
1658 link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
1659 for (i = 0; i < n->max_queues; i++) {
1660 qemu_get_subqueue(n->nic, i)->link_down = link_down;
1661 }
98991481 1662
6c666823
MT
1663 if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
1664 virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
1665 n->announce_counter = SELF_ANNOUNCE_ROUNDS;
1666 timer_mod(n->announce_timer, qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL));
1667 }
1668
fbe78f4f
AL
1669 return 0;
1670}
1671
eb6b6c12 1672static NetClientInfo net_virtio_info = {
f394b2e2 1673 .type = NET_CLIENT_DRIVER_NIC,
eb6b6c12
MM
1674 .size = sizeof(NICState),
1675 .can_receive = virtio_net_can_receive,
1676 .receive = virtio_net_receive,
eb6b6c12 1677 .link_status_changed = virtio_net_set_link_status,
b1be4280 1678 .query_rx_filter = virtio_net_query_rxfilter,
eb6b6c12
MM
1679};
1680
f56a1247
MT
1681static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
1682{
17a0ca55 1683 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1684 NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
f56a1247 1685 assert(n->vhost_started);
ed8b4afe 1686 return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
f56a1247
MT
1687}
1688
1689static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
1690 bool mask)
1691{
17a0ca55 1692 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1693 NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
f56a1247 1694 assert(n->vhost_started);
ed8b4afe 1695 vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
f56a1247
MT
1696 vdev, idx, mask);
1697}
1698
019a3edb 1699static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
fbe78f4f 1700{
14f9b664 1701 int i, config_size = 0;
0cd09c3a 1702 virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
14f9b664
JL
1703 for (i = 0; feature_sizes[i].flags != 0; i++) {
1704 if (host_features & feature_sizes[i].flags) {
1705 config_size = MAX(feature_sizes[i].end, config_size);
1706 }
1707 }
17ec5a86
FK
1708 n->config_size = config_size;
1709}
1710
8a253ec2
FK
1711void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
1712 const char *type)
1713{
1714 /*
1715 * The name can be NULL, the netclient name will be type.x.
1716 */
1717 assert(type != NULL);
1718
9e288406 1719 g_free(n->netclient_name);
9e288406 1720 g_free(n->netclient_type);
80e0090a 1721 n->netclient_name = g_strdup(name);
8a253ec2
FK
1722 n->netclient_type = g_strdup(type);
1723}
1724
e6f746b3 1725static void virtio_net_device_realize(DeviceState *dev, Error **errp)
17ec5a86 1726{
e6f746b3 1727 VirtIODevice *vdev = VIRTIO_DEVICE(dev);
284a32f0 1728 VirtIONet *n = VIRTIO_NET(dev);
b1be4280 1729 NetClientState *nc;
284a32f0 1730 int i;
1773d9ee 1731
da3e8a23 1732 virtio_net_set_config_size(n, n->host_features);
284a32f0 1733 virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size);
fbe78f4f 1734
1c0fbfa3
MT
1735 /*
1736 * We set a lower limit on RX queue size to what it always was.
1737 * Guests that want a smaller ring can always resize it without
1738 * help from us (using virtio 1 and up).
1739 */
1740 if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
1741 n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
1742 (n->net_conf.rx_queue_size & (n->net_conf.rx_queue_size - 1))) {
1743 error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
1744 "must be a power of 2 between %d and %d.",
1745 n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
1746 VIRTQUEUE_MAX_SIZE);
1747 virtio_cleanup(vdev);
1748 return;
1749 }
1750
575a1c0e 1751 n->max_queues = MAX(n->nic_conf.peers.queues, 1);
87b3bd1c 1752 if (n->max_queues * 2 + 1 > VIRTIO_QUEUE_MAX) {
7e0e736e 1753 error_setg(errp, "Invalid number of queues (= %" PRIu32 "), "
631b22ea 1754 "must be a positive integer less than %d.",
87b3bd1c 1755 n->max_queues, (VIRTIO_QUEUE_MAX - 1) / 2);
7e0e736e
JW
1756 virtio_cleanup(vdev);
1757 return;
1758 }
f6b26cf2 1759 n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queues);
fed699f9 1760 n->curr_queues = 1;
1773d9ee 1761 n->tx_timeout = n->net_conf.txtimer;
a697a334 1762
1773d9ee
FK
1763 if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
1764 && strcmp(n->net_conf.tx, "bh")) {
e7b43f7e
SH
1765 error_report("virtio-net: "
1766 "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
1773d9ee 1767 n->net_conf.tx);
e7b43f7e 1768 error_report("Defaulting to \"bh\"");
a697a334
AW
1769 }
1770
da51a335 1771 for (i = 0; i < n->max_queues; i++) {
f9d6dbf0 1772 virtio_net_add_queue(n, i);
a697a334 1773 }
da51a335 1774
17a0ca55 1775 n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
1773d9ee
FK
1776 qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
1777 memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
554c97dd 1778 n->status = VIRTIO_NET_S_LINK_UP;
f57fcf70
JW
1779 n->announce_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL,
1780 virtio_net_announce_timer, n);
fbe78f4f 1781
8a253ec2
FK
1782 if (n->netclient_type) {
1783 /*
1784 * Happen when virtio_net_set_netclient_name has been called.
1785 */
1786 n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
1787 n->netclient_type, n->netclient_name, n);
1788 } else {
1789 n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
284a32f0 1790 object_get_typename(OBJECT(dev)), dev->id, n);
8a253ec2
FK
1791 }
1792
6e371ab8
MT
1793 peer_test_vnet_hdr(n);
1794 if (peer_has_vnet_hdr(n)) {
fed699f9 1795 for (i = 0; i < n->max_queues; i++) {
d6085e3a 1796 qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
fed699f9 1797 }
6e371ab8
MT
1798 n->host_hdr_len = sizeof(struct virtio_net_hdr);
1799 } else {
1800 n->host_hdr_len = 0;
1801 }
eb6b6c12 1802
1773d9ee 1803 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
96d5e201 1804
fed699f9 1805 n->vqs[0].tx_waiting = 0;
1773d9ee 1806 n->tx_burst = n->net_conf.txburst;
bb9d17f8 1807 virtio_net_set_mrg_rx_bufs(n, 0, 0);
002437cd 1808 n->promisc = 1; /* for compatibility */
fbe78f4f 1809
7267c094 1810 n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
b6503ed9 1811
7267c094 1812 n->vlans = g_malloc0(MAX_VLAN >> 3);
f21c0ed9 1813
b1be4280
AK
1814 nc = qemu_get_queue(n->nic);
1815 nc->rxfilter_notify_enabled = 1;
1816
284a32f0 1817 n->qdev = dev;
17ec5a86
FK
1818}
1819
306ec6c3 1820static void virtio_net_device_unrealize(DeviceState *dev, Error **errp)
17ec5a86 1821{
306ec6c3
AF
1822 VirtIODevice *vdev = VIRTIO_DEVICE(dev);
1823 VirtIONet *n = VIRTIO_NET(dev);
f9d6dbf0 1824 int i, max_queues;
17ec5a86
FK
1825
1826 /* This will stop vhost backend if appropriate. */
1827 virtio_net_set_status(vdev, 0);
1828
9e288406
MA
1829 g_free(n->netclient_name);
1830 n->netclient_name = NULL;
1831 g_free(n->netclient_type);
1832 n->netclient_type = NULL;
8a253ec2 1833
17ec5a86
FK
1834 g_free(n->mac_table.macs);
1835 g_free(n->vlans);
1836
f9d6dbf0
WC
1837 max_queues = n->multiqueue ? n->max_queues : 1;
1838 for (i = 0; i < max_queues; i++) {
1839 virtio_net_del_queue(n, i);
17ec5a86
FK
1840 }
1841
f57fcf70
JW
1842 timer_del(n->announce_timer);
1843 timer_free(n->announce_timer);
17ec5a86
FK
1844 g_free(n->vqs);
1845 qemu_del_nic(n->nic);
6a1a8cc7 1846 virtio_cleanup(vdev);
17ec5a86
FK
1847}
1848
1849static void virtio_net_instance_init(Object *obj)
1850{
1851 VirtIONet *n = VIRTIO_NET(obj);
1852
1853 /*
1854 * The default config_size is sizeof(struct virtio_net_config).
1855 * Can be overriden with virtio_net_set_config_size.
1856 */
1857 n->config_size = sizeof(struct virtio_net_config);
aa4197c3
GA
1858 device_add_bootindex_property(obj, &n->nic_conf.bootindex,
1859 "bootindex", "/ethernet-phy@0",
1860 DEVICE(n), NULL);
17ec5a86
FK
1861}
1862
290c2428
DDAG
/*
 * Migration state declaration for the device, naming virtio_net_load() and
 * virtio_net_save() as the load/save entry points for stream version
 * VIRTIO_NET_VM_VERSION.
 * NOTE(review): presumably this macro defines the vmstate_virtio_net object
 * that virtio_net_class_init() assigns to dc->vmsd - confirm against the
 * macro definition.
 */
1863VMSTATE_VIRTIO_DEVICE(net, VIRTIO_NET_VM_VERSION, virtio_net_load,
1864 virtio_net_save);
1865
/*
 * Device properties, installed as dc->props by virtio_net_class_init().
 *
 * Each DEFINE_PROP_BIT entry maps a property name to one feature bit in
 * VirtIONet.host_features; every bit defaults to true except "mq", which
 * defaults to false.  The remaining entries cover the generic NIC
 * configuration (nic_conf), the TX tuning knobs "x-txtimer", "x-txburst"
 * and "tx", and "rx_queue_size".  The table ends with
 * DEFINE_PROP_END_OF_LIST().
 */
17ec5a86 1866static Property virtio_net_properties[] = {
87108bb2
SZ
1867 DEFINE_PROP_BIT("csum", VirtIONet, host_features, VIRTIO_NET_F_CSUM, true),
1868 DEFINE_PROP_BIT("guest_csum", VirtIONet, host_features,
1869 VIRTIO_NET_F_GUEST_CSUM, true),
1870 DEFINE_PROP_BIT("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
1871 DEFINE_PROP_BIT("guest_tso4", VirtIONet, host_features,
1872 VIRTIO_NET_F_GUEST_TSO4, true),
1873 DEFINE_PROP_BIT("guest_tso6", VirtIONet, host_features,
1874 VIRTIO_NET_F_GUEST_TSO6, true),
1875 DEFINE_PROP_BIT("guest_ecn", VirtIONet, host_features,
1876 VIRTIO_NET_F_GUEST_ECN, true),
1877 DEFINE_PROP_BIT("guest_ufo", VirtIONet, host_features,
1878 VIRTIO_NET_F_GUEST_UFO, true),
1879 DEFINE_PROP_BIT("guest_announce", VirtIONet, host_features,
1880 VIRTIO_NET_F_GUEST_ANNOUNCE, true),
1881 DEFINE_PROP_BIT("host_tso4", VirtIONet, host_features,
1882 VIRTIO_NET_F_HOST_TSO4, true),
1883 DEFINE_PROP_BIT("host_tso6", VirtIONet, host_features,
1884 VIRTIO_NET_F_HOST_TSO6, true),
1885 DEFINE_PROP_BIT("host_ecn", VirtIONet, host_features,
1886 VIRTIO_NET_F_HOST_ECN, true),
1887 DEFINE_PROP_BIT("host_ufo", VirtIONet, host_features,
1888 VIRTIO_NET_F_HOST_UFO, true),
1889 DEFINE_PROP_BIT("mrg_rxbuf", VirtIONet, host_features,
1890 VIRTIO_NET_F_MRG_RXBUF, true),
1891 DEFINE_PROP_BIT("status", VirtIONet, host_features,
1892 VIRTIO_NET_F_STATUS, true),
1893 DEFINE_PROP_BIT("ctrl_vq", VirtIONet, host_features,
1894 VIRTIO_NET_F_CTRL_VQ, true),
1895 DEFINE_PROP_BIT("ctrl_rx", VirtIONet, host_features,
1896 VIRTIO_NET_F_CTRL_RX, true),
1897 DEFINE_PROP_BIT("ctrl_vlan", VirtIONet, host_features,
1898 VIRTIO_NET_F_CTRL_VLAN, true),
1899 DEFINE_PROP_BIT("ctrl_rx_extra", VirtIONet, host_features,
1900 VIRTIO_NET_F_CTRL_RX_EXTRA, true),
1901 DEFINE_PROP_BIT("ctrl_mac_addr", VirtIONet, host_features,
1902 VIRTIO_NET_F_CTRL_MAC_ADDR, true),
1903 DEFINE_PROP_BIT("ctrl_guest_offloads", VirtIONet, host_features,
1904 VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
1905 DEFINE_PROP_BIT("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
17ec5a86
FK
1906 DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
1907 DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
87108bb2 1908 TX_TIMER_INTERVAL),
17ec5a86
FK
1909 DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
1910 DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
1c0fbfa3
MT
1911 DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
1912 VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
17ec5a86
FK
1913 DEFINE_PROP_END_OF_LIST(),
1914};
1915
1916static void virtio_net_class_init(ObjectClass *klass, void *data)
1917{
1918 DeviceClass *dc = DEVICE_CLASS(klass);
1919 VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
e6f746b3 1920
17ec5a86 1921 dc->props = virtio_net_properties;
290c2428 1922 dc->vmsd = &vmstate_virtio_net;
125ee0ed 1923 set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
e6f746b3 1924 vdc->realize = virtio_net_device_realize;
306ec6c3 1925 vdc->unrealize = virtio_net_device_unrealize;
17ec5a86
FK
1926 vdc->get_config = virtio_net_get_config;
1927 vdc->set_config = virtio_net_set_config;
1928 vdc->get_features = virtio_net_get_features;
1929 vdc->set_features = virtio_net_set_features;
1930 vdc->bad_features = virtio_net_bad_features;
1931 vdc->reset = virtio_net_reset;
1932 vdc->set_status = virtio_net_set_status;
1933 vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
1934 vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
037dab2f
GK
1935 vdc->load = virtio_net_load_device;
1936 vdc->save = virtio_net_save_device;
17ec5a86
FK
1937}
1938
1939static const TypeInfo virtio_net_info = {
1940 .name = TYPE_VIRTIO_NET,
1941 .parent = TYPE_VIRTIO_DEVICE,
1942 .instance_size = sizeof(VirtIONet),
1943 .instance_init = virtio_net_instance_init,
1944 .class_init = virtio_net_class_init,
1945};
1946
1947static void virtio_register_types(void)
1948{
1949 type_register_static(&virtio_net_info);
1950}
1951
1952type_init(virtio_register_types)