]> git.ipfire.org Git - thirdparty/qemu.git/blame - hw/net/virtio-net.c
intel_iommu: fixing source id during IOTLB hash key calculation
[thirdparty/qemu.git] / hw / net / virtio-net.c
CommitLineData
fbe78f4f
AL
1/*
2 * Virtio Network Device
3 *
4 * Copyright IBM, Corp. 2007
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
12 */
13
9b8bfe21 14#include "qemu/osdep.h"
1de7afc9 15#include "qemu/iov.h"
0d09e41a 16#include "hw/virtio/virtio.h"
1422e32d 17#include "net/net.h"
7200ac3c 18#include "net/checksum.h"
a8ed73f7 19#include "net/tap.h"
1de7afc9
PB
20#include "qemu/error-report.h"
21#include "qemu/timer.h"
0d09e41a
PB
22#include "hw/virtio/virtio-net.h"
23#include "net/vhost_net.h"
17ec5a86 24#include "hw/virtio/virtio-bus.h"
b1be4280 25#include "qapi/qmp/qjson.h"
06150279 26#include "qapi-event.h"
1399c60d 27#include "hw/virtio/virtio-access.h"
fbe78f4f 28
/* Version number of the device's saved VM state */
#define VIRTIO_NET_VM_VERSION    11

/* Capacity of the MAC filter table, in entries */
#define MAC_TABLE_ENTRIES    64
/* Number of distinct VLAN ids (per 802.1Q definition) */
#define MAX_VLAN    (1 << 12)

/* RX queue size that used to be hard-coded */
#define VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE 256
/* for now, only allow larger queues; with virtio-1, guest can downsize */
#define VIRTIO_NET_RX_QUEUE_MIN_SIZE VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE
38
14f9b664
JL
/*
 * endof(container, field): offset of the first byte past 'field' inside
 * 'container', i.e. the size of the leading part of 'container' that ends
 * with (and includes) 'field'.
 */
#define endof(container, field) \
    (sizeof(((container *)0)->field) + offsetof(container, field))
45
/*
 * One row of a feature table: 'flags' holds feature bit(s) and 'end' holds a
 * byte count into the device config structure (see feature_sizes).
 */
struct VirtIOFeature {
    uint32_t flags;
    size_t end;
};
typedef struct VirtIOFeature VirtIOFeature;
50
51static VirtIOFeature feature_sizes[] = {
52 {.flags = 1 << VIRTIO_NET_F_MAC,
53 .end = endof(struct virtio_net_config, mac)},
54 {.flags = 1 << VIRTIO_NET_F_STATUS,
55 .end = endof(struct virtio_net_config, status)},
56 {.flags = 1 << VIRTIO_NET_F_MQ,
57 .end = endof(struct virtio_net_config, max_virtqueue_pairs)},
58 {}
59};
60
fed699f9 61static VirtIONetQueue *virtio_net_get_subqueue(NetClientState *nc)
0c87e93e
JW
62{
63 VirtIONet *n = qemu_get_nic_opaque(nc);
64
fed699f9 65 return &n->vqs[nc->queue_index];
0c87e93e 66}
fed699f9
JW
67
/*
 * Convert a virtqueue index into a queue index: every two consecutive
 * virtqueue indexes map onto the same queue index.
 */
static int vq2q(int queue_index)
{
    const int vqs_per_queue = 2;

    return queue_index / vqs_per_queue;
}
72
fbe78f4f
AL
73/* TODO
74 * - we could suppress RX interrupt if we were so inclined.
75 */
76
0f03eca6 77static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
fbe78f4f 78{
17a0ca55 79 VirtIONet *n = VIRTIO_NET(vdev);
fbe78f4f
AL
80 struct virtio_net_config netcfg;
81
1399c60d
RR
82 virtio_stw_p(vdev, &netcfg.status, n->status);
83 virtio_stw_p(vdev, &netcfg.max_virtqueue_pairs, n->max_queues);
79674068 84 memcpy(netcfg.mac, n->mac, ETH_ALEN);
14f9b664 85 memcpy(config, &netcfg, n->config_size);
fbe78f4f
AL
86}
87
0f03eca6
AL
88static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
89{
17a0ca55 90 VirtIONet *n = VIRTIO_NET(vdev);
14f9b664 91 struct virtio_net_config netcfg = {};
0f03eca6 92
14f9b664 93 memcpy(&netcfg, config, n->config_size);
0f03eca6 94
95129d6f
CH
95 if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_MAC_ADDR) &&
96 !virtio_vdev_has_feature(vdev, VIRTIO_F_VERSION_1) &&
c1943a3f 97 memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
79674068 98 memcpy(n->mac, netcfg.mac, ETH_ALEN);
b356f76d 99 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
0f03eca6
AL
100 }
101}
102
783e7706
MT
103static bool virtio_net_started(VirtIONet *n, uint8_t status)
104{
17a0ca55 105 VirtIODevice *vdev = VIRTIO_DEVICE(n);
783e7706 106 return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
17a0ca55 107 (n->status & VIRTIO_NET_S_LINK_UP) && vdev->vm_running;
783e7706
MT
108}
109
f57fcf70
JW
110static void virtio_net_announce_timer(void *opaque)
111{
112 VirtIONet *n = opaque;
113 VirtIODevice *vdev = VIRTIO_DEVICE(n);
114
115 n->announce_counter--;
116 n->status |= VIRTIO_NET_S_ANNOUNCE;
117 virtio_notify_config(vdev);
118}
119
783e7706 120static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
afbaa7b4 121{
17a0ca55 122 VirtIODevice *vdev = VIRTIO_DEVICE(n);
b356f76d 123 NetClientState *nc = qemu_get_queue(n->nic);
fed699f9 124 int queues = n->multiqueue ? n->max_queues : 1;
b356f76d 125
ed8b4afe 126 if (!get_vhost_net(nc->peer)) {
afbaa7b4
MT
127 return;
128 }
fed699f9 129
8c1ac475
RK
130 if ((virtio_net_started(n, status) && !nc->peer->link_down) ==
131 !!n->vhost_started) {
afbaa7b4
MT
132 return;
133 }
134 if (!n->vhost_started) {
086abc1c
MT
135 int r, i;
136
1bfa316c
GK
137 if (n->needs_vnet_hdr_swap) {
138 error_report("backend does not support %s vnet headers; "
139 "falling back on userspace virtio",
140 virtio_is_big_endian(vdev) ? "BE" : "LE");
141 return;
142 }
143
086abc1c
MT
144 /* Any packets outstanding? Purge them to avoid touching rings
145 * when vhost is running.
146 */
147 for (i = 0; i < queues; i++) {
148 NetClientState *qnc = qemu_get_subqueue(n->nic, i);
149
150 /* Purge both directions: TX and RX. */
151 qemu_net_queue_purge(qnc->peer->incoming_queue, qnc);
152 qemu_net_queue_purge(qnc->incoming_queue, qnc->peer);
153 }
154
1830b80f 155 n->vhost_started = 1;
17a0ca55 156 r = vhost_net_start(vdev, n->nic->ncs, queues);
afbaa7b4 157 if (r < 0) {
e7b43f7e
SH
158 error_report("unable to start vhost net: %d: "
159 "falling back on userspace virtio", -r);
1830b80f 160 n->vhost_started = 0;
afbaa7b4
MT
161 }
162 } else {
17a0ca55 163 vhost_net_stop(vdev, n->nic->ncs, queues);
afbaa7b4
MT
164 n->vhost_started = 0;
165 }
166}
167
1bfa316c
GK
168static int virtio_net_set_vnet_endian_one(VirtIODevice *vdev,
169 NetClientState *peer,
170 bool enable)
171{
172 if (virtio_is_big_endian(vdev)) {
173 return qemu_set_vnet_be(peer, enable);
174 } else {
175 return qemu_set_vnet_le(peer, enable);
176 }
177}
178
179static bool virtio_net_set_vnet_endian(VirtIODevice *vdev, NetClientState *ncs,
180 int queues, bool enable)
181{
182 int i;
183
184 for (i = 0; i < queues; i++) {
185 if (virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, enable) < 0 &&
186 enable) {
187 while (--i >= 0) {
188 virtio_net_set_vnet_endian_one(vdev, ncs[i].peer, false);
189 }
190
191 return true;
192 }
193 }
194
195 return false;
196}
197
198static void virtio_net_vnet_endian_status(VirtIONet *n, uint8_t status)
199{
200 VirtIODevice *vdev = VIRTIO_DEVICE(n);
201 int queues = n->multiqueue ? n->max_queues : 1;
202
203 if (virtio_net_started(n, status)) {
204 /* Before using the device, we tell the network backend about the
205 * endianness to use when parsing vnet headers. If the backend
206 * can't do it, we fallback onto fixing the headers in the core
207 * virtio-net code.
208 */
209 n->needs_vnet_hdr_swap = virtio_net_set_vnet_endian(vdev, n->nic->ncs,
210 queues, true);
211 } else if (virtio_net_started(n, vdev->status)) {
212 /* After using the device, we need to reset the network backend to
213 * the default (guest native endianness), otherwise the guest may
214 * lose network connectivity if it is rebooted into a different
215 * endianness.
216 */
217 virtio_net_set_vnet_endian(vdev, n->nic->ncs, queues, false);
218 }
219}
220
783e7706
MT
221static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
222{
17a0ca55 223 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9
JW
224 VirtIONetQueue *q;
225 int i;
226 uint8_t queue_status;
783e7706 227
1bfa316c 228 virtio_net_vnet_endian_status(n, status);
783e7706
MT
229 virtio_net_vhost_status(n, status);
230
fed699f9 231 for (i = 0; i < n->max_queues; i++) {
38705bb5
FZ
232 NetClientState *ncs = qemu_get_subqueue(n->nic, i);
233 bool queue_started;
fed699f9 234 q = &n->vqs[i];
783e7706 235
fed699f9
JW
236 if ((!n->multiqueue && i != 0) || i >= n->curr_queues) {
237 queue_status = 0;
783e7706 238 } else {
fed699f9 239 queue_status = status;
783e7706 240 }
38705bb5
FZ
241 queue_started =
242 virtio_net_started(n, queue_status) && !n->vhost_started;
243
244 if (queue_started) {
245 qemu_flush_queued_packets(ncs);
246 }
fed699f9
JW
247
248 if (!q->tx_waiting) {
249 continue;
250 }
251
38705bb5 252 if (queue_started) {
fed699f9 253 if (q->tx_timer) {
bc72ad67
AB
254 timer_mod(q->tx_timer,
255 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
fed699f9
JW
256 } else {
257 qemu_bh_schedule(q->tx_bh);
258 }
783e7706 259 } else {
fed699f9 260 if (q->tx_timer) {
bc72ad67 261 timer_del(q->tx_timer);
fed699f9
JW
262 } else {
263 qemu_bh_cancel(q->tx_bh);
264 }
783e7706
MT
265 }
266 }
267}
268
4e68f7a0 269static void virtio_net_set_link_status(NetClientState *nc)
554c97dd 270{
cc1f0f45 271 VirtIONet *n = qemu_get_nic_opaque(nc);
17a0ca55 272 VirtIODevice *vdev = VIRTIO_DEVICE(n);
554c97dd
AL
273 uint16_t old_status = n->status;
274
eb6b6c12 275 if (nc->link_down)
554c97dd
AL
276 n->status &= ~VIRTIO_NET_S_LINK_UP;
277 else
278 n->status |= VIRTIO_NET_S_LINK_UP;
279
280 if (n->status != old_status)
17a0ca55 281 virtio_notify_config(vdev);
afbaa7b4 282
17a0ca55 283 virtio_net_set_status(vdev, vdev->status);
554c97dd
AL
284}
285
b1be4280
AK
286static void rxfilter_notify(NetClientState *nc)
287{
b1be4280
AK
288 VirtIONet *n = qemu_get_nic_opaque(nc);
289
290 if (nc->rxfilter_notify_enabled) {
96e35046 291 gchar *path = object_get_canonical_path(OBJECT(n->qdev));
06150279
WX
292 qapi_event_send_nic_rx_filter_changed(!!n->netclient_name,
293 n->netclient_name, path, &error_abort);
96e35046 294 g_free(path);
b1be4280
AK
295
296 /* disable event notification to avoid events flooding */
297 nc->rxfilter_notify_enabled = 0;
298 }
299}
300
f7bc8ef8
AK
301static intList *get_vlan_table(VirtIONet *n)
302{
303 intList *list, *entry;
304 int i, j;
305
306 list = NULL;
307 for (i = 0; i < MAX_VLAN >> 5; i++) {
308 for (j = 0; n->vlans[i] && j <= 0x1f; j++) {
309 if (n->vlans[i] & (1U << j)) {
310 entry = g_malloc0(sizeof(*entry));
311 entry->value = (i << 5) + j;
312 entry->next = list;
313 list = entry;
314 }
315 }
316 }
317
318 return list;
319}
320
b1be4280
AK
321static RxFilterInfo *virtio_net_query_rxfilter(NetClientState *nc)
322{
323 VirtIONet *n = qemu_get_nic_opaque(nc);
f7bc8ef8 324 VirtIODevice *vdev = VIRTIO_DEVICE(n);
b1be4280
AK
325 RxFilterInfo *info;
326 strList *str_list, *entry;
f7bc8ef8 327 int i;
b1be4280
AK
328
329 info = g_malloc0(sizeof(*info));
330 info->name = g_strdup(nc->name);
331 info->promiscuous = n->promisc;
332
333 if (n->nouni) {
334 info->unicast = RX_STATE_NONE;
335 } else if (n->alluni) {
336 info->unicast = RX_STATE_ALL;
337 } else {
338 info->unicast = RX_STATE_NORMAL;
339 }
340
341 if (n->nomulti) {
342 info->multicast = RX_STATE_NONE;
343 } else if (n->allmulti) {
344 info->multicast = RX_STATE_ALL;
345 } else {
346 info->multicast = RX_STATE_NORMAL;
347 }
348
349 info->broadcast_allowed = n->nobcast;
350 info->multicast_overflow = n->mac_table.multi_overflow;
351 info->unicast_overflow = n->mac_table.uni_overflow;
352
b0575ba4 353 info->main_mac = qemu_mac_strdup_printf(n->mac);
b1be4280
AK
354
355 str_list = NULL;
356 for (i = 0; i < n->mac_table.first_multi; i++) {
357 entry = g_malloc0(sizeof(*entry));
b0575ba4 358 entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
b1be4280
AK
359 entry->next = str_list;
360 str_list = entry;
361 }
362 info->unicast_table = str_list;
363
364 str_list = NULL;
365 for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
366 entry = g_malloc0(sizeof(*entry));
b0575ba4 367 entry->value = qemu_mac_strdup_printf(n->mac_table.macs + i * ETH_ALEN);
b1be4280
AK
368 entry->next = str_list;
369 str_list = entry;
370 }
371 info->multicast_table = str_list;
f7bc8ef8 372 info->vlan_table = get_vlan_table(n);
b1be4280 373
95129d6f 374 if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VLAN)) {
f7bc8ef8
AK
375 info->vlan = RX_STATE_ALL;
376 } else if (!info->vlan_table) {
377 info->vlan = RX_STATE_NONE;
378 } else {
379 info->vlan = RX_STATE_NORMAL;
b1be4280 380 }
b1be4280
AK
381
382 /* enable event notification after query */
383 nc->rxfilter_notify_enabled = 1;
384
385 return info;
386}
387
002437cd
AL
388static void virtio_net_reset(VirtIODevice *vdev)
389{
17a0ca55 390 VirtIONet *n = VIRTIO_NET(vdev);
002437cd
AL
391
392 /* Reset back to compatibility mode */
393 n->promisc = 1;
394 n->allmulti = 0;
015cb166
AW
395 n->alluni = 0;
396 n->nomulti = 0;
397 n->nouni = 0;
398 n->nobcast = 0;
fed699f9
JW
399 /* multiqueue is disabled by default */
400 n->curr_queues = 1;
f57fcf70
JW
401 timer_del(n->announce_timer);
402 n->announce_counter = 0;
403 n->status &= ~VIRTIO_NET_S_ANNOUNCE;
b6503ed9 404
f21c0ed9 405 /* Flush any MAC and VLAN filter table state */
b6503ed9 406 n->mac_table.in_use = 0;
2d9aba39 407 n->mac_table.first_multi = 0;
8fd2a2f1
AW
408 n->mac_table.multi_overflow = 0;
409 n->mac_table.uni_overflow = 0;
b6503ed9 410 memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
41dc8a67 411 memcpy(&n->mac[0], &n->nic->conf->macaddr, sizeof(n->mac));
702d66a8 412 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
f21c0ed9 413 memset(n->vlans, 0, MAX_VLAN >> 3);
002437cd
AL
414}
415
6e371ab8 416static void peer_test_vnet_hdr(VirtIONet *n)
3a330134 417{
b356f76d
JW
418 NetClientState *nc = qemu_get_queue(n->nic);
419 if (!nc->peer) {
6e371ab8 420 return;
b356f76d 421 }
3a330134 422
d6085e3a 423 n->has_vnet_hdr = qemu_has_vnet_hdr(nc->peer);
6e371ab8 424}
3a330134 425
6e371ab8
MT
426static int peer_has_vnet_hdr(VirtIONet *n)
427{
3a330134
MM
428 return n->has_vnet_hdr;
429}
430
0ce0e8f4
MM
431static int peer_has_ufo(VirtIONet *n)
432{
433 if (!peer_has_vnet_hdr(n))
434 return 0;
435
d6085e3a 436 n->has_ufo = qemu_has_ufo(qemu_get_queue(n->nic)->peer);
0ce0e8f4
MM
437
438 return n->has_ufo;
439}
440
bb9d17f8
CH
441static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs,
442 int version_1)
ff3a8066 443{
fed699f9
JW
444 int i;
445 NetClientState *nc;
446
ff3a8066
MT
447 n->mergeable_rx_bufs = mergeable_rx_bufs;
448
bb9d17f8
CH
449 if (version_1) {
450 n->guest_hdr_len = sizeof(struct virtio_net_hdr_mrg_rxbuf);
451 } else {
452 n->guest_hdr_len = n->mergeable_rx_bufs ?
453 sizeof(struct virtio_net_hdr_mrg_rxbuf) :
454 sizeof(struct virtio_net_hdr);
455 }
ff3a8066 456
fed699f9
JW
457 for (i = 0; i < n->max_queues; i++) {
458 nc = qemu_get_subqueue(n->nic, i);
459
460 if (peer_has_vnet_hdr(n) &&
d6085e3a
SH
461 qemu_has_vnet_hdr_len(nc->peer, n->guest_hdr_len)) {
462 qemu_set_vnet_hdr_len(nc->peer, n->guest_hdr_len);
fed699f9
JW
463 n->host_hdr_len = n->guest_hdr_len;
464 }
ff3a8066
MT
465 }
466}
467
fed699f9
JW
468static int peer_attach(VirtIONet *n, int index)
469{
470 NetClientState *nc = qemu_get_subqueue(n->nic, index);
471
472 if (!nc->peer) {
473 return 0;
474 }
475
f394b2e2 476 if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
7263a0ad
CO
477 vhost_set_vring_enable(nc->peer, 1);
478 }
479
f394b2e2 480 if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
fed699f9
JW
481 return 0;
482 }
483
484 return tap_enable(nc->peer);
485}
486
487static int peer_detach(VirtIONet *n, int index)
488{
489 NetClientState *nc = qemu_get_subqueue(n->nic, index);
490
491 if (!nc->peer) {
492 return 0;
493 }
494
f394b2e2 495 if (nc->peer->info->type == NET_CLIENT_DRIVER_VHOST_USER) {
7263a0ad
CO
496 vhost_set_vring_enable(nc->peer, 0);
497 }
498
f394b2e2 499 if (nc->peer->info->type != NET_CLIENT_DRIVER_TAP) {
fed699f9
JW
500 return 0;
501 }
502
503 return tap_disable(nc->peer);
504}
505
506static void virtio_net_set_queues(VirtIONet *n)
507{
508 int i;
ddfa83ea 509 int r;
fed699f9
JW
510
511 for (i = 0; i < n->max_queues; i++) {
512 if (i < n->curr_queues) {
ddfa83ea
JS
513 r = peer_attach(n, i);
514 assert(!r);
fed699f9 515 } else {
ddfa83ea
JS
516 r = peer_detach(n, i);
517 assert(!r);
fed699f9
JW
518 }
519 }
520}
521
ec57db16 522static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue);
fed699f9 523
9d5b731d
JW
524static uint64_t virtio_net_get_features(VirtIODevice *vdev, uint64_t features,
525 Error **errp)
fbe78f4f 526{
17a0ca55 527 VirtIONet *n = VIRTIO_NET(vdev);
b356f76d 528 NetClientState *nc = qemu_get_queue(n->nic);
fbe78f4f 529
da3e8a23
SZ
530 /* Firstly sync all virtio-net possible supported features */
531 features |= n->host_features;
532
0cd09c3a 533 virtio_add_feature(&features, VIRTIO_NET_F_MAC);
c9f79a3f 534
6e371ab8 535 if (!peer_has_vnet_hdr(n)) {
0cd09c3a
CH
536 virtio_clear_feature(&features, VIRTIO_NET_F_CSUM);
537 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO4);
538 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_TSO6);
539 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_ECN);
8172539d 540
0cd09c3a
CH
541 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_CSUM);
542 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO4);
543 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_TSO6);
544 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_ECN);
8172539d 545 }
3a330134 546
8172539d 547 if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
0cd09c3a
CH
548 virtio_clear_feature(&features, VIRTIO_NET_F_GUEST_UFO);
549 virtio_clear_feature(&features, VIRTIO_NET_F_HOST_UFO);
3a330134
MM
550 }
551
ed8b4afe 552 if (!get_vhost_net(nc->peer)) {
9bc6304c
MT
553 return features;
554 }
ed8b4afe 555 return vhost_net_get_features(get_vhost_net(nc->peer), features);
fbe78f4f
AL
556}
557
019a3edb 558static uint64_t virtio_net_bad_features(VirtIODevice *vdev)
8eca6b1b 559{
019a3edb 560 uint64_t features = 0;
8eca6b1b
AL
561
562 /* Linux kernel 2.6.25. It understood MAC (as everyone must),
563 * but also these: */
0cd09c3a
CH
564 virtio_add_feature(&features, VIRTIO_NET_F_MAC);
565 virtio_add_feature(&features, VIRTIO_NET_F_CSUM);
566 virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO4);
567 virtio_add_feature(&features, VIRTIO_NET_F_HOST_TSO6);
568 virtio_add_feature(&features, VIRTIO_NET_F_HOST_ECN);
8eca6b1b 569
8172539d 570 return features;
8eca6b1b
AL
571}
572
644c9858
DF
573static void virtio_net_apply_guest_offloads(VirtIONet *n)
574{
ad37bb3b 575 qemu_set_offload(qemu_get_queue(n->nic)->peer,
644c9858
DF
576 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_CSUM)),
577 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO4)),
578 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_TSO6)),
579 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_ECN)),
580 !!(n->curr_guest_offloads & (1ULL << VIRTIO_NET_F_GUEST_UFO)));
581}
582
583static uint64_t virtio_net_guest_offloads_by_features(uint32_t features)
584{
585 static const uint64_t guest_offloads_mask =
586 (1ULL << VIRTIO_NET_F_GUEST_CSUM) |
587 (1ULL << VIRTIO_NET_F_GUEST_TSO4) |
588 (1ULL << VIRTIO_NET_F_GUEST_TSO6) |
589 (1ULL << VIRTIO_NET_F_GUEST_ECN) |
590 (1ULL << VIRTIO_NET_F_GUEST_UFO);
591
592 return guest_offloads_mask & features;
593}
594
595static inline uint64_t virtio_net_supported_guest_offloads(VirtIONet *n)
596{
597 VirtIODevice *vdev = VIRTIO_DEVICE(n);
598 return virtio_net_guest_offloads_by_features(vdev->guest_features);
599}
600
d5aaa1b0 601static void virtio_net_set_features(VirtIODevice *vdev, uint64_t features)
fbe78f4f 602{
17a0ca55 603 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9
JW
604 int i;
605
ef546f12 606 virtio_net_set_multiqueue(n,
95129d6f 607 virtio_has_feature(features, VIRTIO_NET_F_MQ));
fbe78f4f 608
ef546f12 609 virtio_net_set_mrg_rx_bufs(n,
95129d6f
CH
610 virtio_has_feature(features,
611 VIRTIO_NET_F_MRG_RXBUF),
612 virtio_has_feature(features,
613 VIRTIO_F_VERSION_1));
f5436dd9
MM
614
615 if (n->has_vnet_hdr) {
644c9858
DF
616 n->curr_guest_offloads =
617 virtio_net_guest_offloads_by_features(features);
618 virtio_net_apply_guest_offloads(n);
f5436dd9 619 }
fed699f9
JW
620
621 for (i = 0; i < n->max_queues; i++) {
622 NetClientState *nc = qemu_get_subqueue(n->nic, i);
623
ed8b4afe 624 if (!get_vhost_net(nc->peer)) {
fed699f9
JW
625 continue;
626 }
ed8b4afe 627 vhost_net_ack_features(get_vhost_net(nc->peer), features);
dc14a397 628 }
0b1eaa88 629
95129d6f 630 if (virtio_has_feature(features, VIRTIO_NET_F_CTRL_VLAN)) {
0b1eaa88
SF
631 memset(n->vlans, 0, MAX_VLAN >> 3);
632 } else {
633 memset(n->vlans, 0xff, MAX_VLAN >> 3);
634 }
fbe78f4f
AL
635}
636
002437cd 637static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
921ac5d0 638 struct iovec *iov, unsigned int iov_cnt)
002437cd
AL
639{
640 uint8_t on;
921ac5d0 641 size_t s;
b1be4280 642 NetClientState *nc = qemu_get_queue(n->nic);
002437cd 643
921ac5d0
MT
644 s = iov_to_buf(iov, iov_cnt, 0, &on, sizeof(on));
645 if (s != sizeof(on)) {
646 return VIRTIO_NET_ERR;
002437cd
AL
647 }
648
dd23454b 649 if (cmd == VIRTIO_NET_CTRL_RX_PROMISC) {
002437cd 650 n->promisc = on;
dd23454b 651 } else if (cmd == VIRTIO_NET_CTRL_RX_ALLMULTI) {
002437cd 652 n->allmulti = on;
dd23454b 653 } else if (cmd == VIRTIO_NET_CTRL_RX_ALLUNI) {
015cb166 654 n->alluni = on;
dd23454b 655 } else if (cmd == VIRTIO_NET_CTRL_RX_NOMULTI) {
015cb166 656 n->nomulti = on;
dd23454b 657 } else if (cmd == VIRTIO_NET_CTRL_RX_NOUNI) {
015cb166 658 n->nouni = on;
dd23454b 659 } else if (cmd == VIRTIO_NET_CTRL_RX_NOBCAST) {
015cb166 660 n->nobcast = on;
921ac5d0 661 } else {
002437cd 662 return VIRTIO_NET_ERR;
921ac5d0 663 }
002437cd 664
b1be4280
AK
665 rxfilter_notify(nc);
666
002437cd
AL
667 return VIRTIO_NET_OK;
668}
669
644c9858
DF
670static int virtio_net_handle_offloads(VirtIONet *n, uint8_t cmd,
671 struct iovec *iov, unsigned int iov_cnt)
672{
673 VirtIODevice *vdev = VIRTIO_DEVICE(n);
674 uint64_t offloads;
675 size_t s;
676
95129d6f 677 if (!virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
644c9858
DF
678 return VIRTIO_NET_ERR;
679 }
680
681 s = iov_to_buf(iov, iov_cnt, 0, &offloads, sizeof(offloads));
682 if (s != sizeof(offloads)) {
683 return VIRTIO_NET_ERR;
684 }
685
686 if (cmd == VIRTIO_NET_CTRL_GUEST_OFFLOADS_SET) {
687 uint64_t supported_offloads;
688
689 if (!n->has_vnet_hdr) {
690 return VIRTIO_NET_ERR;
691 }
692
693 supported_offloads = virtio_net_supported_guest_offloads(n);
694 if (offloads & ~supported_offloads) {
695 return VIRTIO_NET_ERR;
696 }
697
698 n->curr_guest_offloads = offloads;
699 virtio_net_apply_guest_offloads(n);
700
701 return VIRTIO_NET_OK;
702 } else {
703 return VIRTIO_NET_ERR;
704 }
705}
706
b6503ed9 707static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
921ac5d0 708 struct iovec *iov, unsigned int iov_cnt)
b6503ed9 709{
1399c60d 710 VirtIODevice *vdev = VIRTIO_DEVICE(n);
b6503ed9 711 struct virtio_net_ctrl_mac mac_data;
921ac5d0 712 size_t s;
b1be4280 713 NetClientState *nc = qemu_get_queue(n->nic);
b6503ed9 714
c1943a3f
AK
715 if (cmd == VIRTIO_NET_CTRL_MAC_ADDR_SET) {
716 if (iov_size(iov, iov_cnt) != sizeof(n->mac)) {
717 return VIRTIO_NET_ERR;
718 }
719 s = iov_to_buf(iov, iov_cnt, 0, &n->mac, sizeof(n->mac));
720 assert(s == sizeof(n->mac));
b356f76d 721 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->mac);
b1be4280
AK
722 rxfilter_notify(nc);
723
c1943a3f
AK
724 return VIRTIO_NET_OK;
725 }
726
921ac5d0 727 if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET) {
b6503ed9 728 return VIRTIO_NET_ERR;
921ac5d0 729 }
b6503ed9 730
cae2e556
AK
731 int in_use = 0;
732 int first_multi = 0;
733 uint8_t uni_overflow = 0;
734 uint8_t multi_overflow = 0;
735 uint8_t *macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
b6503ed9 736
921ac5d0
MT
737 s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
738 sizeof(mac_data.entries));
1399c60d 739 mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
921ac5d0 740 if (s != sizeof(mac_data.entries)) {
b1be4280 741 goto error;
921ac5d0
MT
742 }
743 iov_discard_front(&iov, &iov_cnt, s);
b6503ed9 744
921ac5d0 745 if (mac_data.entries * ETH_ALEN > iov_size(iov, iov_cnt)) {
b1be4280 746 goto error;
921ac5d0 747 }
b6503ed9
AL
748
749 if (mac_data.entries <= MAC_TABLE_ENTRIES) {
cae2e556 750 s = iov_to_buf(iov, iov_cnt, 0, macs,
921ac5d0
MT
751 mac_data.entries * ETH_ALEN);
752 if (s != mac_data.entries * ETH_ALEN) {
b1be4280 753 goto error;
921ac5d0 754 }
cae2e556 755 in_use += mac_data.entries;
b6503ed9 756 } else {
cae2e556 757 uni_overflow = 1;
b6503ed9
AL
758 }
759
921ac5d0
MT
760 iov_discard_front(&iov, &iov_cnt, mac_data.entries * ETH_ALEN);
761
cae2e556 762 first_multi = in_use;
2d9aba39 763
921ac5d0
MT
764 s = iov_to_buf(iov, iov_cnt, 0, &mac_data.entries,
765 sizeof(mac_data.entries));
1399c60d 766 mac_data.entries = virtio_ldl_p(vdev, &mac_data.entries);
921ac5d0 767 if (s != sizeof(mac_data.entries)) {
b1be4280 768 goto error;
921ac5d0
MT
769 }
770
771 iov_discard_front(&iov, &iov_cnt, s);
b6503ed9 772
921ac5d0 773 if (mac_data.entries * ETH_ALEN != iov_size(iov, iov_cnt)) {
b1be4280 774 goto error;
921ac5d0 775 }
b6503ed9 776
edc24385 777 if (mac_data.entries <= MAC_TABLE_ENTRIES - in_use) {
cae2e556 778 s = iov_to_buf(iov, iov_cnt, 0, &macs[in_use * ETH_ALEN],
921ac5d0
MT
779 mac_data.entries * ETH_ALEN);
780 if (s != mac_data.entries * ETH_ALEN) {
b1be4280 781 goto error;
8fd2a2f1 782 }
cae2e556 783 in_use += mac_data.entries;
921ac5d0 784 } else {
cae2e556 785 multi_overflow = 1;
b6503ed9
AL
786 }
787
cae2e556
AK
788 n->mac_table.in_use = in_use;
789 n->mac_table.first_multi = first_multi;
790 n->mac_table.uni_overflow = uni_overflow;
791 n->mac_table.multi_overflow = multi_overflow;
792 memcpy(n->mac_table.macs, macs, MAC_TABLE_ENTRIES * ETH_ALEN);
793 g_free(macs);
b1be4280
AK
794 rxfilter_notify(nc);
795
b6503ed9 796 return VIRTIO_NET_OK;
b1be4280
AK
797
798error:
cae2e556 799 g_free(macs);
b1be4280 800 return VIRTIO_NET_ERR;
b6503ed9
AL
801}
802
f21c0ed9 803static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
921ac5d0 804 struct iovec *iov, unsigned int iov_cnt)
f21c0ed9 805{
1399c60d 806 VirtIODevice *vdev = VIRTIO_DEVICE(n);
f21c0ed9 807 uint16_t vid;
921ac5d0 808 size_t s;
b1be4280 809 NetClientState *nc = qemu_get_queue(n->nic);
f21c0ed9 810
921ac5d0 811 s = iov_to_buf(iov, iov_cnt, 0, &vid, sizeof(vid));
1399c60d 812 vid = virtio_lduw_p(vdev, &vid);
921ac5d0 813 if (s != sizeof(vid)) {
f21c0ed9
AL
814 return VIRTIO_NET_ERR;
815 }
816
f21c0ed9
AL
817 if (vid >= MAX_VLAN)
818 return VIRTIO_NET_ERR;
819
820 if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
821 n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
822 else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
823 n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
824 else
825 return VIRTIO_NET_ERR;
826
b1be4280
AK
827 rxfilter_notify(nc);
828
f21c0ed9
AL
829 return VIRTIO_NET_OK;
830}
831
f57fcf70
JW
832static int virtio_net_handle_announce(VirtIONet *n, uint8_t cmd,
833 struct iovec *iov, unsigned int iov_cnt)
834{
835 if (cmd == VIRTIO_NET_CTRL_ANNOUNCE_ACK &&
836 n->status & VIRTIO_NET_S_ANNOUNCE) {
837 n->status &= ~VIRTIO_NET_S_ANNOUNCE;
838 if (n->announce_counter) {
839 timer_mod(n->announce_timer,
840 qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL) +
841 self_announce_delay(n->announce_counter));
842 }
843 return VIRTIO_NET_OK;
844 } else {
845 return VIRTIO_NET_ERR;
846 }
847}
848
fed699f9 849static int virtio_net_handle_mq(VirtIONet *n, uint8_t cmd,
f8f7c533 850 struct iovec *iov, unsigned int iov_cnt)
fed699f9 851{
17a0ca55 852 VirtIODevice *vdev = VIRTIO_DEVICE(n);
f8f7c533
JW
853 struct virtio_net_ctrl_mq mq;
854 size_t s;
855 uint16_t queues;
fed699f9 856
f8f7c533
JW
857 s = iov_to_buf(iov, iov_cnt, 0, &mq, sizeof(mq));
858 if (s != sizeof(mq)) {
fed699f9
JW
859 return VIRTIO_NET_ERR;
860 }
861
862 if (cmd != VIRTIO_NET_CTRL_MQ_VQ_PAIRS_SET) {
863 return VIRTIO_NET_ERR;
864 }
865
1399c60d 866 queues = virtio_lduw_p(vdev, &mq.virtqueue_pairs);
fed699f9 867
f8f7c533
JW
868 if (queues < VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MIN ||
869 queues > VIRTIO_NET_CTRL_MQ_VQ_PAIRS_MAX ||
870 queues > n->max_queues ||
fed699f9
JW
871 !n->multiqueue) {
872 return VIRTIO_NET_ERR;
873 }
874
f8f7c533 875 n->curr_queues = queues;
fed699f9
JW
876 /* stop the backend before changing the number of queues to avoid handling a
877 * disabled queue */
17a0ca55 878 virtio_net_set_status(vdev, vdev->status);
fed699f9
JW
879 virtio_net_set_queues(n);
880
881 return VIRTIO_NET_OK;
882}
ba7eadb5 883
3d11d36c
AL
884static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
885{
17a0ca55 886 VirtIONet *n = VIRTIO_NET(vdev);
3d11d36c
AL
887 struct virtio_net_ctrl_hdr ctrl;
888 virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
51b19ebe 889 VirtQueueElement *elem;
921ac5d0 890 size_t s;
771b6ed3 891 struct iovec *iov, *iov2;
921ac5d0 892 unsigned int iov_cnt;
3d11d36c 893
51b19ebe
PB
894 for (;;) {
895 elem = virtqueue_pop(vq, sizeof(VirtQueueElement));
896 if (!elem) {
897 break;
898 }
899 if (iov_size(elem->in_sg, elem->in_num) < sizeof(status) ||
900 iov_size(elem->out_sg, elem->out_num) < sizeof(ctrl)) {
ba7eadb5
GK
901 virtio_error(vdev, "virtio-net ctrl missing headers");
902 virtqueue_detach_element(vq, elem, 0);
903 g_free(elem);
904 break;
3d11d36c
AL
905 }
906
51b19ebe
PB
907 iov_cnt = elem->out_num;
908 iov2 = iov = g_memdup(elem->out_sg, sizeof(struct iovec) * elem->out_num);
921ac5d0
MT
909 s = iov_to_buf(iov, iov_cnt, 0, &ctrl, sizeof(ctrl));
910 iov_discard_front(&iov, &iov_cnt, sizeof(ctrl));
911 if (s != sizeof(ctrl)) {
912 status = VIRTIO_NET_ERR;
dd23454b 913 } else if (ctrl.class == VIRTIO_NET_CTRL_RX) {
921ac5d0
MT
914 status = virtio_net_handle_rx_mode(n, ctrl.cmd, iov, iov_cnt);
915 } else if (ctrl.class == VIRTIO_NET_CTRL_MAC) {
916 status = virtio_net_handle_mac(n, ctrl.cmd, iov, iov_cnt);
917 } else if (ctrl.class == VIRTIO_NET_CTRL_VLAN) {
918 status = virtio_net_handle_vlan_table(n, ctrl.cmd, iov, iov_cnt);
f57fcf70
JW
919 } else if (ctrl.class == VIRTIO_NET_CTRL_ANNOUNCE) {
920 status = virtio_net_handle_announce(n, ctrl.cmd, iov, iov_cnt);
fed699f9 921 } else if (ctrl.class == VIRTIO_NET_CTRL_MQ) {
f8f7c533 922 status = virtio_net_handle_mq(n, ctrl.cmd, iov, iov_cnt);
644c9858
DF
923 } else if (ctrl.class == VIRTIO_NET_CTRL_GUEST_OFFLOADS) {
924 status = virtio_net_handle_offloads(n, ctrl.cmd, iov, iov_cnt);
3d11d36c
AL
925 }
926
51b19ebe 927 s = iov_from_buf(elem->in_sg, elem->in_num, 0, &status, sizeof(status));
921ac5d0 928 assert(s == sizeof(status));
3d11d36c 929
51b19ebe 930 virtqueue_push(vq, elem, sizeof(status));
3d11d36c 931 virtio_notify(vdev, vq);
771b6ed3 932 g_free(iov2);
51b19ebe 933 g_free(elem);
3d11d36c
AL
934 }
935}
936
fbe78f4f
AL
937/* RX */
938
939static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
940{
17a0ca55 941 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 942 int queue_index = vq2q(virtio_get_queue_index(vq));
8aeff62d 943
fed699f9 944 qemu_flush_queued_packets(qemu_get_subqueue(n->nic, queue_index));
fbe78f4f
AL
945}
946
4e68f7a0 947static int virtio_net_can_receive(NetClientState *nc)
fbe78f4f 948{
cc1f0f45 949 VirtIONet *n = qemu_get_nic_opaque(nc);
17a0ca55 950 VirtIODevice *vdev = VIRTIO_DEVICE(n);
fed699f9 951 VirtIONetQueue *q = virtio_net_get_subqueue(nc);
0c87e93e 952
17a0ca55 953 if (!vdev->vm_running) {
95477323
MT
954 return 0;
955 }
cdd5cc12 956
fed699f9
JW
957 if (nc->queue_index >= n->curr_queues) {
958 return 0;
959 }
960
0c87e93e 961 if (!virtio_queue_ready(q->rx_vq) ||
17a0ca55 962 !(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
fbe78f4f 963 return 0;
0c87e93e 964 }
fbe78f4f 965
cdd5cc12
MM
966 return 1;
967}
968
0c87e93e 969static int virtio_net_has_buffers(VirtIONetQueue *q, int bufsize)
cdd5cc12 970{
0c87e93e
JW
971 VirtIONet *n = q->n;
972 if (virtio_queue_empty(q->rx_vq) ||
fbe78f4f 973 (n->mergeable_rx_bufs &&
0c87e93e
JW
974 !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
975 virtio_queue_set_notification(q->rx_vq, 1);
06b12970
TL
976
977 /* To avoid a race condition where the guest has made some buffers
978 * available after the above check but before notification was
979 * enabled, check for available buffers again.
980 */
0c87e93e 981 if (virtio_queue_empty(q->rx_vq) ||
06b12970 982 (n->mergeable_rx_bufs &&
0c87e93e 983 !virtqueue_avail_bytes(q->rx_vq, bufsize, 0))) {
06b12970 984 return 0;
0c87e93e 985 }
fbe78f4f
AL
986 }
987
0c87e93e 988 virtio_queue_set_notification(q->rx_vq, 0);
fbe78f4f
AL
989 return 1;
990}
991
1399c60d 992static void virtio_net_hdr_swap(VirtIODevice *vdev, struct virtio_net_hdr *hdr)
032a74a1 993{
1399c60d
RR
994 virtio_tswap16s(vdev, &hdr->hdr_len);
995 virtio_tswap16s(vdev, &hdr->gso_size);
996 virtio_tswap16s(vdev, &hdr->csum_start);
997 virtio_tswap16s(vdev, &hdr->csum_offset);
032a74a1
CLG
998}
999
1d41b0c1
AL
1000/* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
1001 * it never finds out that the packets don't have valid checksums. This
1002 * causes dhclient to get upset. Fedora's carried a patch for ages to
1003 * fix this with Xen but it hasn't appeared in an upstream release of
1004 * dhclient yet.
1005 *
1006 * To avoid breaking existing guests, we catch udp packets and add
1007 * checksums. This is terrible but it's better than hacking the guest
1008 * kernels.
1009 *
1010 * N.B. if we introduce a zero-copy API, this operation is no longer free so
1011 * we should provide a mechanism to disable it to avoid polluting the host
1012 * cache.
1013 */
1014static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
22cc84db 1015 uint8_t *buf, size_t size)
1d41b0c1
AL
1016{
1017 if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
1018 (size > 27 && size < 1500) && /* normal sized MTU */
1019 (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
1020 (buf[23] == 17) && /* ip.protocol == UDP */
1021 (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
22cc84db 1022 net_checksum_calculate(buf, size);
1d41b0c1
AL
1023 hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
1024 }
1025}
1026
280598b7
MT
1027static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
1028 const void *buf, size_t size)
fbe78f4f 1029{
3a330134 1030 if (n->has_vnet_hdr) {
22cc84db
MT
1031 /* FIXME this cast is evil */
1032 void *wbuf = (void *)buf;
280598b7
MT
1033 work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
1034 size - n->host_hdr_len);
1bfa316c
GK
1035
1036 if (n->needs_vnet_hdr_swap) {
1037 virtio_net_hdr_swap(VIRTIO_DEVICE(n), wbuf);
1038 }
280598b7 1039 iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
22cc84db
MT
1040 } else {
1041 struct virtio_net_hdr hdr = {
1042 .flags = 0,
1043 .gso_type = VIRTIO_NET_HDR_GSO_NONE
1044 };
1045 iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
3a330134 1046 }
fbe78f4f
AL
1047}
1048
3831ab20
AL
1049static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
1050{
1051 static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
f21c0ed9 1052 static const uint8_t vlan[] = {0x81, 0x00};
3831ab20 1053 uint8_t *ptr = (uint8_t *)buf;
b6503ed9 1054 int i;
3831ab20
AL
1055
1056 if (n->promisc)
1057 return 1;
1058
e043ebc6 1059 ptr += n->host_hdr_len;
3a330134 1060
f21c0ed9 1061 if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
7542d3e7 1062 int vid = lduw_be_p(ptr + 14) & 0xfff;
f21c0ed9
AL
1063 if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
1064 return 0;
1065 }
1066
bbe2f399
AW
1067 if (ptr[0] & 1) { // multicast
1068 if (!memcmp(ptr, bcast, sizeof(bcast))) {
015cb166
AW
1069 return !n->nobcast;
1070 } else if (n->nomulti) {
1071 return 0;
8fd2a2f1 1072 } else if (n->allmulti || n->mac_table.multi_overflow) {
bbe2f399
AW
1073 return 1;
1074 }
2d9aba39
AW
1075
1076 for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
1077 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
1078 return 1;
1079 }
1080 }
bbe2f399 1081 } else { // unicast
015cb166
AW
1082 if (n->nouni) {
1083 return 0;
1084 } else if (n->alluni || n->mac_table.uni_overflow) {
8fd2a2f1
AW
1085 return 1;
1086 } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
bbe2f399
AW
1087 return 1;
1088 }
3831ab20 1089
2d9aba39
AW
1090 for (i = 0; i < n->mac_table.first_multi; i++) {
1091 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
1092 return 1;
1093 }
1094 }
b6503ed9
AL
1095 }
1096
3831ab20
AL
1097 return 0;
1098}
1099
4e68f7a0 1100static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, size_t size)
fbe78f4f 1101{
cc1f0f45 1102 VirtIONet *n = qemu_get_nic_opaque(nc);
fed699f9 1103 VirtIONetQueue *q = virtio_net_get_subqueue(nc);
17a0ca55 1104 VirtIODevice *vdev = VIRTIO_DEVICE(n);
63c58728
MT
1105 struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
1106 struct virtio_net_hdr_mrg_rxbuf mhdr;
1107 unsigned mhdr_cnt = 0;
22cc84db 1108 size_t offset, i, guest_offset;
fbe78f4f 1109
fed699f9 1110 if (!virtio_net_can_receive(nc)) {
cdd5cc12 1111 return -1;
b356f76d 1112 }
cdd5cc12 1113
940cda94 1114 /* hdr_len refers to the header we supply to the guest */
0c87e93e 1115 if (!virtio_net_has_buffers(q, size + n->guest_hdr_len - n->host_hdr_len)) {
8aeff62d 1116 return 0;
0c87e93e 1117 }
fbe78f4f 1118
3831ab20 1119 if (!receive_filter(n, buf, size))
4f1c942b 1120 return size;
3831ab20 1121
fbe78f4f
AL
1122 offset = i = 0;
1123
1124 while (offset < size) {
51b19ebe 1125 VirtQueueElement *elem;
fbe78f4f 1126 int len, total;
51b19ebe 1127 const struct iovec *sg;
fbe78f4f 1128
22c253d9 1129 total = 0;
fbe78f4f 1130
51b19ebe
PB
1131 elem = virtqueue_pop(q->rx_vq, sizeof(VirtQueueElement));
1132 if (!elem) {
ba10b9c0
GK
1133 if (i) {
1134 virtio_error(vdev, "virtio-net unexpected empty queue: "
1135 "i %zd mergeable %d offset %zd, size %zd, "
1136 "guest hdr len %zd, host hdr len %zd "
1137 "guest features 0x%" PRIx64,
1138 i, n->mergeable_rx_bufs, offset, size,
1139 n->guest_hdr_len, n->host_hdr_len,
1140 vdev->guest_features);
1141 }
1142 return -1;
fbe78f4f
AL
1143 }
1144
51b19ebe 1145 if (elem->in_num < 1) {
ba10b9c0
GK
1146 virtio_error(vdev,
1147 "virtio-net receive queue contains no in buffers");
1148 virtqueue_detach_element(q->rx_vq, elem, 0);
1149 g_free(elem);
1150 return -1;
fbe78f4f
AL
1151 }
1152
51b19ebe 1153 sg = elem->in_sg;
fbe78f4f 1154 if (i == 0) {
c8d28e7e 1155 assert(offset == 0);
63c58728
MT
1156 if (n->mergeable_rx_bufs) {
1157 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
51b19ebe 1158 sg, elem->in_num,
63c58728
MT
1159 offsetof(typeof(mhdr), num_buffers),
1160 sizeof(mhdr.num_buffers));
1161 }
fbe78f4f 1162
51b19ebe 1163 receive_header(n, sg, elem->in_num, buf, size);
c8d28e7e 1164 offset = n->host_hdr_len;
e35e23f6 1165 total += n->guest_hdr_len;
22cc84db
MT
1166 guest_offset = n->guest_hdr_len;
1167 } else {
1168 guest_offset = 0;
fbe78f4f
AL
1169 }
1170
1171 /* copy in packet. ugh */
51b19ebe 1172 len = iov_from_buf(sg, elem->in_num, guest_offset,
dcf6f5e1 1173 buf + offset, size - offset);
fbe78f4f 1174 total += len;
279a4253
MT
1175 offset += len;
1176 /* If buffers can't be merged, at this point we
1177 * must have consumed the complete packet.
1178 * Otherwise, drop it. */
1179 if (!n->mergeable_rx_bufs && offset < size) {
51b19ebe
PB
1180 virtqueue_discard(q->rx_vq, elem, total);
1181 g_free(elem);
279a4253
MT
1182 return size;
1183 }
fbe78f4f
AL
1184
1185 /* signal other side */
51b19ebe
PB
1186 virtqueue_fill(q->rx_vq, elem, total, i++);
1187 g_free(elem);
fbe78f4f
AL
1188 }
1189
63c58728 1190 if (mhdr_cnt) {
1399c60d 1191 virtio_stw_p(vdev, &mhdr.num_buffers, i);
63c58728
MT
1192 iov_from_buf(mhdr_sg, mhdr_cnt,
1193 0,
1194 &mhdr.num_buffers, sizeof mhdr.num_buffers);
44b15bc5 1195 }
fbe78f4f 1196
0c87e93e 1197 virtqueue_flush(q->rx_vq, i);
17a0ca55 1198 virtio_notify(vdev, q->rx_vq);
4f1c942b
MM
1199
1200 return size;
fbe78f4f
AL
1201}
1202
0c87e93e 1203static int32_t virtio_net_flush_tx(VirtIONetQueue *q);
6243375f 1204
4e68f7a0 1205static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
6243375f 1206{
cc1f0f45 1207 VirtIONet *n = qemu_get_nic_opaque(nc);
fed699f9 1208 VirtIONetQueue *q = virtio_net_get_subqueue(nc);
17a0ca55 1209 VirtIODevice *vdev = VIRTIO_DEVICE(n);
6243375f 1210
51b19ebe 1211 virtqueue_push(q->tx_vq, q->async_tx.elem, 0);
17a0ca55 1212 virtio_notify(vdev, q->tx_vq);
6243375f 1213
51b19ebe
PB
1214 g_free(q->async_tx.elem);
1215 q->async_tx.elem = NULL;
6243375f 1216
0c87e93e
JW
1217 virtio_queue_set_notification(q->tx_vq, 1);
1218 virtio_net_flush_tx(q);
6243375f
MM
1219}
1220
fbe78f4f 1221/* TX */
0c87e93e 1222static int32_t virtio_net_flush_tx(VirtIONetQueue *q)
fbe78f4f 1223{
0c87e93e 1224 VirtIONet *n = q->n;
17a0ca55 1225 VirtIODevice *vdev = VIRTIO_DEVICE(n);
51b19ebe 1226 VirtQueueElement *elem;
e3f30488 1227 int32_t num_packets = 0;
fed699f9 1228 int queue_index = vq2q(virtio_get_queue_index(q->tx_vq));
17a0ca55 1229 if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
e3f30488
AW
1230 return num_packets;
1231 }
fbe78f4f 1232
51b19ebe 1233 if (q->async_tx.elem) {
0c87e93e 1234 virtio_queue_set_notification(q->tx_vq, 0);
e3f30488 1235 return num_packets;
6243375f
MM
1236 }
1237
51b19ebe 1238 for (;;) {
bd89dd98 1239 ssize_t ret;
51b19ebe
PB
1240 unsigned int out_num;
1241 struct iovec sg[VIRTQUEUE_MAX_SIZE], sg2[VIRTQUEUE_MAX_SIZE + 1], *out_sg;
feb93f36 1242 struct virtio_net_hdr_mrg_rxbuf mhdr;
fbe78f4f 1243
51b19ebe
PB
1244 elem = virtqueue_pop(q->tx_vq, sizeof(VirtQueueElement));
1245 if (!elem) {
1246 break;
1247 }
1248
1249 out_num = elem->out_num;
1250 out_sg = elem->out_sg;
7b80d08e 1251 if (out_num < 1) {
fa5e56c2
GK
1252 virtio_error(vdev, "virtio-net header not in first element");
1253 virtqueue_detach_element(q->tx_vq, elem, 0);
1254 g_free(elem);
1255 return -EINVAL;
fbe78f4f
AL
1256 }
1257
032a74a1 1258 if (n->has_vnet_hdr) {
feb93f36
JW
1259 if (iov_to_buf(out_sg, out_num, 0, &mhdr, n->guest_hdr_len) <
1260 n->guest_hdr_len) {
fa5e56c2
GK
1261 virtio_error(vdev, "virtio-net header incorrect");
1262 virtqueue_detach_element(q->tx_vq, elem, 0);
1263 g_free(elem);
1264 return -EINVAL;
032a74a1 1265 }
1bfa316c 1266 if (n->needs_vnet_hdr_swap) {
feb93f36
JW
1267 virtio_net_hdr_swap(vdev, (void *) &mhdr);
1268 sg2[0].iov_base = &mhdr;
1269 sg2[0].iov_len = n->guest_hdr_len;
1270 out_num = iov_copy(&sg2[1], ARRAY_SIZE(sg2) - 1,
1271 out_sg, out_num,
1272 n->guest_hdr_len, -1);
1273 if (out_num == VIRTQUEUE_MAX_SIZE) {
1274 goto drop;
1275 }
1276 out_num += 1;
1277 out_sg = sg2;
1278 }
032a74a1 1279 }
14761f9c
MT
1280 /*
1281 * If host wants to see the guest header as is, we can
1282 * pass it on unchanged. Otherwise, copy just the parts
1283 * that host is interested in.
1284 */
1285 assert(n->host_hdr_len <= n->guest_hdr_len);
1286 if (n->host_hdr_len != n->guest_hdr_len) {
1287 unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
1288 out_sg, out_num,
1289 0, n->host_hdr_len);
1290 sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
1291 out_sg, out_num,
1292 n->guest_hdr_len, -1);
1293 out_num = sg_num;
1294 out_sg = sg;
fbe78f4f
AL
1295 }
1296
fed699f9
JW
1297 ret = qemu_sendv_packet_async(qemu_get_subqueue(n->nic, queue_index),
1298 out_sg, out_num, virtio_net_tx_complete);
6243375f 1299 if (ret == 0) {
0c87e93e
JW
1300 virtio_queue_set_notification(q->tx_vq, 0);
1301 q->async_tx.elem = elem;
e3f30488 1302 return -EBUSY;
6243375f
MM
1303 }
1304
feb93f36 1305drop:
51b19ebe 1306 virtqueue_push(q->tx_vq, elem, 0);
17a0ca55 1307 virtio_notify(vdev, q->tx_vq);
51b19ebe 1308 g_free(elem);
e3f30488
AW
1309
1310 if (++num_packets >= n->tx_burst) {
1311 break;
1312 }
fbe78f4f 1313 }
e3f30488 1314 return num_packets;
fbe78f4f
AL
1315}
1316
a697a334 1317static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
fbe78f4f 1318{
17a0ca55 1319 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1320 VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
fbe78f4f 1321
783e7706 1322 /* This happens when device was stopped but VCPU wasn't. */
17a0ca55 1323 if (!vdev->vm_running) {
0c87e93e 1324 q->tx_waiting = 1;
783e7706
MT
1325 return;
1326 }
1327
0c87e93e 1328 if (q->tx_waiting) {
fbe78f4f 1329 virtio_queue_set_notification(vq, 1);
bc72ad67 1330 timer_del(q->tx_timer);
0c87e93e 1331 q->tx_waiting = 0;
fa5e56c2
GK
1332 if (virtio_net_flush_tx(q) == -EINVAL) {
1333 return;
1334 }
fbe78f4f 1335 } else {
bc72ad67
AB
1336 timer_mod(q->tx_timer,
1337 qemu_clock_get_ns(QEMU_CLOCK_VIRTUAL) + n->tx_timeout);
0c87e93e 1338 q->tx_waiting = 1;
fbe78f4f
AL
1339 virtio_queue_set_notification(vq, 0);
1340 }
1341}
1342
a697a334
AW
1343static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
1344{
17a0ca55 1345 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1346 VirtIONetQueue *q = &n->vqs[vq2q(virtio_get_queue_index(vq))];
a697a334 1347
0c87e93e 1348 if (unlikely(q->tx_waiting)) {
a697a334
AW
1349 return;
1350 }
0c87e93e 1351 q->tx_waiting = 1;
783e7706 1352 /* This happens when device was stopped but VCPU wasn't. */
17a0ca55 1353 if (!vdev->vm_running) {
783e7706
MT
1354 return;
1355 }
a697a334 1356 virtio_queue_set_notification(vq, 0);
0c87e93e 1357 qemu_bh_schedule(q->tx_bh);
a697a334
AW
1358}
1359
fbe78f4f
AL
1360static void virtio_net_tx_timer(void *opaque)
1361{
0c87e93e
JW
1362 VirtIONetQueue *q = opaque;
1363 VirtIONet *n = q->n;
17a0ca55 1364 VirtIODevice *vdev = VIRTIO_DEVICE(n);
e8bcf842
MT
1365 /* This happens when device was stopped but BH wasn't. */
1366 if (!vdev->vm_running) {
1367 /* Make sure tx waiting is set, so we'll run when restarted. */
1368 assert(q->tx_waiting);
1369 return;
1370 }
fbe78f4f 1371
0c87e93e 1372 q->tx_waiting = 0;
fbe78f4f
AL
1373
1374 /* Just in case the driver is not ready on more */
17a0ca55 1375 if (!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK)) {
fbe78f4f 1376 return;
17a0ca55 1377 }
fbe78f4f 1378
0c87e93e
JW
1379 virtio_queue_set_notification(q->tx_vq, 1);
1380 virtio_net_flush_tx(q);
fbe78f4f
AL
1381}
1382
a697a334
AW
1383static void virtio_net_tx_bh(void *opaque)
1384{
0c87e93e
JW
1385 VirtIONetQueue *q = opaque;
1386 VirtIONet *n = q->n;
17a0ca55 1387 VirtIODevice *vdev = VIRTIO_DEVICE(n);
a697a334
AW
1388 int32_t ret;
1389
e8bcf842
MT
1390 /* This happens when device was stopped but BH wasn't. */
1391 if (!vdev->vm_running) {
1392 /* Make sure tx waiting is set, so we'll run when restarted. */
1393 assert(q->tx_waiting);
1394 return;
1395 }
783e7706 1396
0c87e93e 1397 q->tx_waiting = 0;
a697a334
AW
1398
1399 /* Just in case the driver is not ready on more */
17a0ca55 1400 if (unlikely(!(vdev->status & VIRTIO_CONFIG_S_DRIVER_OK))) {
a697a334 1401 return;
17a0ca55 1402 }
a697a334 1403
0c87e93e 1404 ret = virtio_net_flush_tx(q);
fa5e56c2
GK
1405 if (ret == -EBUSY || ret == -EINVAL) {
1406 return; /* Notification re-enable handled by tx_complete or device
1407 * broken */
a697a334
AW
1408 }
1409
1410 /* If we flush a full burst of packets, assume there are
1411 * more coming and immediately reschedule */
1412 if (ret >= n->tx_burst) {
0c87e93e
JW
1413 qemu_bh_schedule(q->tx_bh);
1414 q->tx_waiting = 1;
a697a334
AW
1415 return;
1416 }
1417
1418 /* If less than a full burst, re-enable notification and flush
1419 * anything that may have come in while we weren't looking. If
1420 * we find something, assume the guest is still active and reschedule */
0c87e93e 1421 virtio_queue_set_notification(q->tx_vq, 1);
fa5e56c2
GK
1422 ret = virtio_net_flush_tx(q);
1423 if (ret == -EINVAL) {
1424 return;
1425 } else if (ret > 0) {
0c87e93e
JW
1426 virtio_queue_set_notification(q->tx_vq, 0);
1427 qemu_bh_schedule(q->tx_bh);
1428 q->tx_waiting = 1;
a697a334
AW
1429 }
1430}
1431
f9d6dbf0
WC
1432static void virtio_net_add_queue(VirtIONet *n, int index)
1433{
1434 VirtIODevice *vdev = VIRTIO_DEVICE(n);
1435
1c0fbfa3
MT
1436 n->vqs[index].rx_vq = virtio_add_queue(vdev, n->net_conf.rx_queue_size,
1437 virtio_net_handle_rx);
f9d6dbf0
WC
1438 if (n->net_conf.tx && !strcmp(n->net_conf.tx, "timer")) {
1439 n->vqs[index].tx_vq =
1440 virtio_add_queue(vdev, 256, virtio_net_handle_tx_timer);
1441 n->vqs[index].tx_timer = timer_new_ns(QEMU_CLOCK_VIRTUAL,
1442 virtio_net_tx_timer,
1443 &n->vqs[index]);
1444 } else {
1445 n->vqs[index].tx_vq =
1446 virtio_add_queue(vdev, 256, virtio_net_handle_tx_bh);
1447 n->vqs[index].tx_bh = qemu_bh_new(virtio_net_tx_bh, &n->vqs[index]);
1448 }
1449
1450 n->vqs[index].tx_waiting = 0;
1451 n->vqs[index].n = n;
1452}
1453
1454static void virtio_net_del_queue(VirtIONet *n, int index)
1455{
1456 VirtIODevice *vdev = VIRTIO_DEVICE(n);
1457 VirtIONetQueue *q = &n->vqs[index];
1458 NetClientState *nc = qemu_get_subqueue(n->nic, index);
1459
1460 qemu_purge_queued_packets(nc);
1461
1462 virtio_del_queue(vdev, index * 2);
1463 if (q->tx_timer) {
1464 timer_del(q->tx_timer);
1465 timer_free(q->tx_timer);
1466 } else {
1467 qemu_bh_delete(q->tx_bh);
1468 }
1469 virtio_del_queue(vdev, index * 2 + 1);
1470}
1471
1472static void virtio_net_change_num_queues(VirtIONet *n, int new_max_queues)
1473{
1474 VirtIODevice *vdev = VIRTIO_DEVICE(n);
1475 int old_num_queues = virtio_get_num_queues(vdev);
1476 int new_num_queues = new_max_queues * 2 + 1;
1477 int i;
1478
1479 assert(old_num_queues >= 3);
1480 assert(old_num_queues % 2 == 1);
1481
1482 if (old_num_queues == new_num_queues) {
1483 return;
1484 }
1485
1486 /*
1487 * We always need to remove and add ctrl vq if
1488 * old_num_queues != new_num_queues. Remove ctrl_vq first,
1489 * and then we only enter one of the following too loops.
1490 */
1491 virtio_del_queue(vdev, old_num_queues - 1);
1492
1493 for (i = new_num_queues - 1; i < old_num_queues - 1; i += 2) {
1494 /* new_num_queues < old_num_queues */
1495 virtio_net_del_queue(n, i / 2);
1496 }
1497
1498 for (i = old_num_queues - 1; i < new_num_queues - 1; i += 2) {
1499 /* new_num_queues > old_num_queues */
1500 virtio_net_add_queue(n, i / 2);
1501 }
1502
1503 /* add ctrl_vq last */
1504 n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
1505}
1506
ec57db16 1507static void virtio_net_set_multiqueue(VirtIONet *n, int multiqueue)
fed699f9 1508{
f9d6dbf0
WC
1509 int max = multiqueue ? n->max_queues : 1;
1510
fed699f9 1511 n->multiqueue = multiqueue;
f9d6dbf0 1512 virtio_net_change_num_queues(n, max);
fed699f9 1513
fed699f9
JW
1514 virtio_net_set_queues(n);
1515}
1516
037dab2f
GK
1517static void virtio_net_save_device(VirtIODevice *vdev, QEMUFile *f)
1518{
1519 VirtIONet *n = VIRTIO_NET(vdev);
1520 int i;
fbe78f4f 1521
79674068 1522 qemu_put_buffer(f, n->mac, ETH_ALEN);
5f800801 1523 qemu_put_be32(f, n->vqs[0].tx_waiting);
e46cb38f 1524 qemu_put_be32(f, n->mergeable_rx_bufs);
9d6271b8 1525 qemu_put_be16(f, n->status);
f10c592e
AW
1526 qemu_put_byte(f, n->promisc);
1527 qemu_put_byte(f, n->allmulti);
b6503ed9
AL
1528 qemu_put_be32(f, n->mac_table.in_use);
1529 qemu_put_buffer(f, n->mac_table.macs, n->mac_table.in_use * ETH_ALEN);
f21c0ed9 1530 qemu_put_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
3a330134 1531 qemu_put_be32(f, n->has_vnet_hdr);
8fd2a2f1
AW
1532 qemu_put_byte(f, n->mac_table.multi_overflow);
1533 qemu_put_byte(f, n->mac_table.uni_overflow);
015cb166
AW
1534 qemu_put_byte(f, n->alluni);
1535 qemu_put_byte(f, n->nomulti);
1536 qemu_put_byte(f, n->nouni);
1537 qemu_put_byte(f, n->nobcast);
0ce0e8f4 1538 qemu_put_byte(f, n->has_ufo);
5f800801
JW
1539 if (n->max_queues > 1) {
1540 qemu_put_be16(f, n->max_queues);
1541 qemu_put_be16(f, n->curr_queues);
1542 for (i = 1; i < n->curr_queues; i++) {
1543 qemu_put_be32(f, n->vqs[i].tx_waiting);
1544 }
1545 }
644c9858 1546
95129d6f 1547 if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
644c9858
DF
1548 qemu_put_be64(f, n->curr_guest_offloads);
1549 }
fbe78f4f
AL
1550}
1551
037dab2f
GK
1552static int virtio_net_load_device(VirtIODevice *vdev, QEMUFile *f,
1553 int version_id)
1554{
1555 VirtIONet *n = VIRTIO_NET(vdev);
1556 int i, link_down;
fbe78f4f 1557
79674068 1558 qemu_get_buffer(f, n->mac, ETH_ALEN);
5f800801 1559 n->vqs[0].tx_waiting = qemu_get_be32(f);
ff3a8066 1560
bb9d17f8 1561 virtio_net_set_mrg_rx_bufs(n, qemu_get_be32(f),
95129d6f
CH
1562 virtio_vdev_has_feature(vdev,
1563 VIRTIO_F_VERSION_1));
fbe78f4f 1564
76010cb3 1565 n->status = qemu_get_be16(f);
9d6271b8 1566
76010cb3
DDAG
1567 n->promisc = qemu_get_byte(f);
1568 n->allmulti = qemu_get_byte(f);
002437cd 1569
76010cb3
DDAG
1570 n->mac_table.in_use = qemu_get_be32(f);
1571 /* MAC_TABLE_ENTRIES may be different from the saved image */
1572 if (n->mac_table.in_use <= MAC_TABLE_ENTRIES) {
1573 qemu_get_buffer(f, n->mac_table.macs,
1574 n->mac_table.in_use * ETH_ALEN);
1575 } else {
1576 int64_t i;
1577
1578 /* Overflow detected - can happen if source has a larger MAC table.
1579 * We simply set overflow flag so there's no need to maintain the
1580 * table of addresses, discard them all.
1581 * Note: 64 bit math to avoid integer overflow.
1582 */
1583 for (i = 0; i < (int64_t)n->mac_table.in_use * ETH_ALEN; ++i) {
1584 qemu_get_byte(f);
b6503ed9 1585 }
76010cb3
DDAG
1586 n->mac_table.multi_overflow = n->mac_table.uni_overflow = 1;
1587 n->mac_table.in_use = 0;
b6503ed9
AL
1588 }
1589
76010cb3 1590 qemu_get_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
f21c0ed9 1591
76010cb3
DDAG
1592 if (qemu_get_be32(f) && !peer_has_vnet_hdr(n)) {
1593 error_report("virtio-net: saved image requires vnet_hdr=on");
1594 return -1;
6c042c16
AW
1595 }
1596
76010cb3
DDAG
1597 n->mac_table.multi_overflow = qemu_get_byte(f);
1598 n->mac_table.uni_overflow = qemu_get_byte(f);
8fd2a2f1 1599
76010cb3
DDAG
1600 n->alluni = qemu_get_byte(f);
1601 n->nomulti = qemu_get_byte(f);
1602 n->nouni = qemu_get_byte(f);
1603 n->nobcast = qemu_get_byte(f);
015cb166 1604
76010cb3
DDAG
1605 if (qemu_get_byte(f) && !peer_has_ufo(n)) {
1606 error_report("virtio-net: saved image requires TUN_F_UFO support");
1607 return -1;
0ce0e8f4
MM
1608 }
1609
5f800801
JW
1610 if (n->max_queues > 1) {
1611 if (n->max_queues != qemu_get_be16(f)) {
1612 error_report("virtio-net: different max_queues ");
1613 return -1;
1614 }
1615
1616 n->curr_queues = qemu_get_be16(f);
eea750a5
MT
1617 if (n->curr_queues > n->max_queues) {
1618 error_report("virtio-net: curr_queues %x > max_queues %x",
1619 n->curr_queues, n->max_queues);
1620 return -1;
1621 }
5f800801
JW
1622 for (i = 1; i < n->curr_queues; i++) {
1623 n->vqs[i].tx_waiting = qemu_get_be32(f);
1624 }
1625 }
1626
6c666823
MT
1627 if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_GUEST_OFFLOADS)) {
1628 n->curr_guest_offloads = qemu_get_be64(f);
1629 } else {
1630 n->curr_guest_offloads = virtio_net_supported_guest_offloads(n);
1631 }
1632
1633 if (peer_has_vnet_hdr(n)) {
1634 virtio_net_apply_guest_offloads(n);
1635 }
1636
5f800801
JW
1637 virtio_net_set_queues(n);
1638
2d9aba39
AW
1639 /* Find the first multicast entry in the saved MAC filter */
1640 for (i = 0; i < n->mac_table.in_use; i++) {
1641 if (n->mac_table.macs[i * ETH_ALEN] & 1) {
1642 break;
1643 }
1644 }
1645 n->mac_table.first_multi = i;
98991481
AK
1646
1647 /* nc.link_down can't be migrated, so infer link_down according
1648 * to link status bit in n->status */
5f800801
JW
1649 link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
1650 for (i = 0; i < n->max_queues; i++) {
1651 qemu_get_subqueue(n->nic, i)->link_down = link_down;
1652 }
98991481 1653
6c666823
MT
1654 if (virtio_vdev_has_feature(vdev, VIRTIO_NET_F_GUEST_ANNOUNCE) &&
1655 virtio_vdev_has_feature(vdev, VIRTIO_NET_F_CTRL_VQ)) {
1656 n->announce_counter = SELF_ANNOUNCE_ROUNDS;
1657 timer_mod(n->announce_timer, qemu_clock_get_ms(QEMU_CLOCK_VIRTUAL));
1658 }
1659
fbe78f4f
AL
1660 return 0;
1661}
1662
eb6b6c12 1663static NetClientInfo net_virtio_info = {
f394b2e2 1664 .type = NET_CLIENT_DRIVER_NIC,
eb6b6c12
MM
1665 .size = sizeof(NICState),
1666 .can_receive = virtio_net_can_receive,
1667 .receive = virtio_net_receive,
eb6b6c12 1668 .link_status_changed = virtio_net_set_link_status,
b1be4280 1669 .query_rx_filter = virtio_net_query_rxfilter,
eb6b6c12
MM
1670};
1671
f56a1247
MT
1672static bool virtio_net_guest_notifier_pending(VirtIODevice *vdev, int idx)
1673{
17a0ca55 1674 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1675 NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
f56a1247 1676 assert(n->vhost_started);
ed8b4afe 1677 return vhost_net_virtqueue_pending(get_vhost_net(nc->peer), idx);
f56a1247
MT
1678}
1679
1680static void virtio_net_guest_notifier_mask(VirtIODevice *vdev, int idx,
1681 bool mask)
1682{
17a0ca55 1683 VirtIONet *n = VIRTIO_NET(vdev);
fed699f9 1684 NetClientState *nc = qemu_get_subqueue(n->nic, vq2q(idx));
f56a1247 1685 assert(n->vhost_started);
ed8b4afe 1686 vhost_net_virtqueue_mask(get_vhost_net(nc->peer),
f56a1247
MT
1687 vdev, idx, mask);
1688}
1689
019a3edb 1690static void virtio_net_set_config_size(VirtIONet *n, uint64_t host_features)
fbe78f4f 1691{
14f9b664 1692 int i, config_size = 0;
0cd09c3a 1693 virtio_add_feature(&host_features, VIRTIO_NET_F_MAC);
14f9b664
JL
1694 for (i = 0; feature_sizes[i].flags != 0; i++) {
1695 if (host_features & feature_sizes[i].flags) {
1696 config_size = MAX(feature_sizes[i].end, config_size);
1697 }
1698 }
17ec5a86
FK
1699 n->config_size = config_size;
1700}
1701
8a253ec2
FK
1702void virtio_net_set_netclient_name(VirtIONet *n, const char *name,
1703 const char *type)
1704{
1705 /*
1706 * The name can be NULL, the netclient name will be type.x.
1707 */
1708 assert(type != NULL);
1709
9e288406 1710 g_free(n->netclient_name);
9e288406 1711 g_free(n->netclient_type);
80e0090a 1712 n->netclient_name = g_strdup(name);
8a253ec2
FK
1713 n->netclient_type = g_strdup(type);
1714}
1715
e6f746b3 1716static void virtio_net_device_realize(DeviceState *dev, Error **errp)
17ec5a86 1717{
e6f746b3 1718 VirtIODevice *vdev = VIRTIO_DEVICE(dev);
284a32f0 1719 VirtIONet *n = VIRTIO_NET(dev);
b1be4280 1720 NetClientState *nc;
284a32f0 1721 int i;
1773d9ee 1722
da3e8a23 1723 virtio_net_set_config_size(n, n->host_features);
284a32f0 1724 virtio_init(vdev, "virtio-net", VIRTIO_ID_NET, n->config_size);
fbe78f4f 1725
1c0fbfa3
MT
1726 /*
1727 * We set a lower limit on RX queue size to what it always was.
1728 * Guests that want a smaller ring can always resize it without
1729 * help from us (using virtio 1 and up).
1730 */
1731 if (n->net_conf.rx_queue_size < VIRTIO_NET_RX_QUEUE_MIN_SIZE ||
1732 n->net_conf.rx_queue_size > VIRTQUEUE_MAX_SIZE ||
1733 (n->net_conf.rx_queue_size & (n->net_conf.rx_queue_size - 1))) {
1734 error_setg(errp, "Invalid rx_queue_size (= %" PRIu16 "), "
1735 "must be a power of 2 between %d and %d.",
1736 n->net_conf.rx_queue_size, VIRTIO_NET_RX_QUEUE_MIN_SIZE,
1737 VIRTQUEUE_MAX_SIZE);
1738 virtio_cleanup(vdev);
1739 return;
1740 }
1741
575a1c0e 1742 n->max_queues = MAX(n->nic_conf.peers.queues, 1);
87b3bd1c 1743 if (n->max_queues * 2 + 1 > VIRTIO_QUEUE_MAX) {
7e0e736e 1744 error_setg(errp, "Invalid number of queues (= %" PRIu32 "), "
631b22ea 1745 "must be a positive integer less than %d.",
87b3bd1c 1746 n->max_queues, (VIRTIO_QUEUE_MAX - 1) / 2);
7e0e736e
JW
1747 virtio_cleanup(vdev);
1748 return;
1749 }
f6b26cf2 1750 n->vqs = g_malloc0(sizeof(VirtIONetQueue) * n->max_queues);
fed699f9 1751 n->curr_queues = 1;
1773d9ee 1752 n->tx_timeout = n->net_conf.txtimer;
a697a334 1753
1773d9ee
FK
1754 if (n->net_conf.tx && strcmp(n->net_conf.tx, "timer")
1755 && strcmp(n->net_conf.tx, "bh")) {
e7b43f7e
SH
1756 error_report("virtio-net: "
1757 "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
1773d9ee 1758 n->net_conf.tx);
e7b43f7e 1759 error_report("Defaulting to \"bh\"");
a697a334
AW
1760 }
1761
da51a335 1762 for (i = 0; i < n->max_queues; i++) {
f9d6dbf0 1763 virtio_net_add_queue(n, i);
a697a334 1764 }
da51a335 1765
17a0ca55 1766 n->ctrl_vq = virtio_add_queue(vdev, 64, virtio_net_handle_ctrl);
1773d9ee
FK
1767 qemu_macaddr_default_if_unset(&n->nic_conf.macaddr);
1768 memcpy(&n->mac[0], &n->nic_conf.macaddr, sizeof(n->mac));
554c97dd 1769 n->status = VIRTIO_NET_S_LINK_UP;
f57fcf70
JW
1770 n->announce_timer = timer_new_ms(QEMU_CLOCK_VIRTUAL,
1771 virtio_net_announce_timer, n);
fbe78f4f 1772
8a253ec2
FK
1773 if (n->netclient_type) {
1774 /*
1775 * Happen when virtio_net_set_netclient_name has been called.
1776 */
1777 n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
1778 n->netclient_type, n->netclient_name, n);
1779 } else {
1780 n->nic = qemu_new_nic(&net_virtio_info, &n->nic_conf,
284a32f0 1781 object_get_typename(OBJECT(dev)), dev->id, n);
8a253ec2
FK
1782 }
1783
6e371ab8
MT
1784 peer_test_vnet_hdr(n);
1785 if (peer_has_vnet_hdr(n)) {
fed699f9 1786 for (i = 0; i < n->max_queues; i++) {
d6085e3a 1787 qemu_using_vnet_hdr(qemu_get_subqueue(n->nic, i)->peer, true);
fed699f9 1788 }
6e371ab8
MT
1789 n->host_hdr_len = sizeof(struct virtio_net_hdr);
1790 } else {
1791 n->host_hdr_len = 0;
1792 }
eb6b6c12 1793
1773d9ee 1794 qemu_format_nic_info_str(qemu_get_queue(n->nic), n->nic_conf.macaddr.a);
96d5e201 1795
fed699f9 1796 n->vqs[0].tx_waiting = 0;
1773d9ee 1797 n->tx_burst = n->net_conf.txburst;
bb9d17f8 1798 virtio_net_set_mrg_rx_bufs(n, 0, 0);
002437cd 1799 n->promisc = 1; /* for compatibility */
fbe78f4f 1800
7267c094 1801 n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
b6503ed9 1802
7267c094 1803 n->vlans = g_malloc0(MAX_VLAN >> 3);
f21c0ed9 1804
b1be4280
AK
1805 nc = qemu_get_queue(n->nic);
1806 nc->rxfilter_notify_enabled = 1;
1807
284a32f0 1808 n->qdev = dev;
17ec5a86
FK
1809}
1810
306ec6c3 1811static void virtio_net_device_unrealize(DeviceState *dev, Error **errp)
17ec5a86 1812{
306ec6c3
AF
1813 VirtIODevice *vdev = VIRTIO_DEVICE(dev);
1814 VirtIONet *n = VIRTIO_NET(dev);
f9d6dbf0 1815 int i, max_queues;
17ec5a86
FK
1816
1817 /* This will stop vhost backend if appropriate. */
1818 virtio_net_set_status(vdev, 0);
1819
9e288406
MA
1820 g_free(n->netclient_name);
1821 n->netclient_name = NULL;
1822 g_free(n->netclient_type);
1823 n->netclient_type = NULL;
8a253ec2 1824
17ec5a86
FK
1825 g_free(n->mac_table.macs);
1826 g_free(n->vlans);
1827
f9d6dbf0
WC
1828 max_queues = n->multiqueue ? n->max_queues : 1;
1829 for (i = 0; i < max_queues; i++) {
1830 virtio_net_del_queue(n, i);
17ec5a86
FK
1831 }
1832
f57fcf70
JW
1833 timer_del(n->announce_timer);
1834 timer_free(n->announce_timer);
17ec5a86
FK
1835 g_free(n->vqs);
1836 qemu_del_nic(n->nic);
6a1a8cc7 1837 virtio_cleanup(vdev);
17ec5a86
FK
1838}
1839
1840static void virtio_net_instance_init(Object *obj)
1841{
1842 VirtIONet *n = VIRTIO_NET(obj);
1843
1844 /*
1845 * The default config_size is sizeof(struct virtio_net_config).
1846 * Can be overriden with virtio_net_set_config_size.
1847 */
1848 n->config_size = sizeof(struct virtio_net_config);
aa4197c3
GA
1849 device_add_bootindex_property(obj, &n->nic_conf.bootindex,
1850 "bootindex", "/ethernet-phy@0",
1851 DEVICE(n), NULL);
17ec5a86
FK
1852}
1853
4d45dcfb
HP
1854static void virtio_net_pre_save(void *opaque)
1855{
1856 VirtIONet *n = opaque;
1857
1858 /* At this point, backend must be stopped, otherwise
1859 * it might keep writing to memory. */
1860 assert(!n->vhost_started);
1861}
1862
1863static const VMStateDescription vmstate_virtio_net = {
1864 .name = "virtio-net",
1865 .minimum_version_id = VIRTIO_NET_VM_VERSION,
1866 .version_id = VIRTIO_NET_VM_VERSION,
1867 .fields = (VMStateField[]) {
1868 VMSTATE_VIRTIO_DEVICE,
1869 VMSTATE_END_OF_LIST()
1870 },
1871 .pre_save = virtio_net_pre_save,
1872};
290c2428 1873
17ec5a86 1874static Property virtio_net_properties[] = {
87108bb2
SZ
1875 DEFINE_PROP_BIT("csum", VirtIONet, host_features, VIRTIO_NET_F_CSUM, true),
1876 DEFINE_PROP_BIT("guest_csum", VirtIONet, host_features,
1877 VIRTIO_NET_F_GUEST_CSUM, true),
1878 DEFINE_PROP_BIT("gso", VirtIONet, host_features, VIRTIO_NET_F_GSO, true),
1879 DEFINE_PROP_BIT("guest_tso4", VirtIONet, host_features,
1880 VIRTIO_NET_F_GUEST_TSO4, true),
1881 DEFINE_PROP_BIT("guest_tso6", VirtIONet, host_features,
1882 VIRTIO_NET_F_GUEST_TSO6, true),
1883 DEFINE_PROP_BIT("guest_ecn", VirtIONet, host_features,
1884 VIRTIO_NET_F_GUEST_ECN, true),
1885 DEFINE_PROP_BIT("guest_ufo", VirtIONet, host_features,
1886 VIRTIO_NET_F_GUEST_UFO, true),
1887 DEFINE_PROP_BIT("guest_announce", VirtIONet, host_features,
1888 VIRTIO_NET_F_GUEST_ANNOUNCE, true),
1889 DEFINE_PROP_BIT("host_tso4", VirtIONet, host_features,
1890 VIRTIO_NET_F_HOST_TSO4, true),
1891 DEFINE_PROP_BIT("host_tso6", VirtIONet, host_features,
1892 VIRTIO_NET_F_HOST_TSO6, true),
1893 DEFINE_PROP_BIT("host_ecn", VirtIONet, host_features,
1894 VIRTIO_NET_F_HOST_ECN, true),
1895 DEFINE_PROP_BIT("host_ufo", VirtIONet, host_features,
1896 VIRTIO_NET_F_HOST_UFO, true),
1897 DEFINE_PROP_BIT("mrg_rxbuf", VirtIONet, host_features,
1898 VIRTIO_NET_F_MRG_RXBUF, true),
1899 DEFINE_PROP_BIT("status", VirtIONet, host_features,
1900 VIRTIO_NET_F_STATUS, true),
1901 DEFINE_PROP_BIT("ctrl_vq", VirtIONet, host_features,
1902 VIRTIO_NET_F_CTRL_VQ, true),
1903 DEFINE_PROP_BIT("ctrl_rx", VirtIONet, host_features,
1904 VIRTIO_NET_F_CTRL_RX, true),
1905 DEFINE_PROP_BIT("ctrl_vlan", VirtIONet, host_features,
1906 VIRTIO_NET_F_CTRL_VLAN, true),
1907 DEFINE_PROP_BIT("ctrl_rx_extra", VirtIONet, host_features,
1908 VIRTIO_NET_F_CTRL_RX_EXTRA, true),
1909 DEFINE_PROP_BIT("ctrl_mac_addr", VirtIONet, host_features,
1910 VIRTIO_NET_F_CTRL_MAC_ADDR, true),
1911 DEFINE_PROP_BIT("ctrl_guest_offloads", VirtIONet, host_features,
1912 VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, true),
1913 DEFINE_PROP_BIT("mq", VirtIONet, host_features, VIRTIO_NET_F_MQ, false),
17ec5a86
FK
1914 DEFINE_NIC_PROPERTIES(VirtIONet, nic_conf),
1915 DEFINE_PROP_UINT32("x-txtimer", VirtIONet, net_conf.txtimer,
87108bb2 1916 TX_TIMER_INTERVAL),
17ec5a86
FK
1917 DEFINE_PROP_INT32("x-txburst", VirtIONet, net_conf.txburst, TX_BURST),
1918 DEFINE_PROP_STRING("tx", VirtIONet, net_conf.tx),
1c0fbfa3
MT
1919 DEFINE_PROP_UINT16("rx_queue_size", VirtIONet, net_conf.rx_queue_size,
1920 VIRTIO_NET_RX_QUEUE_DEFAULT_SIZE),
17ec5a86
FK
1921 DEFINE_PROP_END_OF_LIST(),
1922};
1923
1924static void virtio_net_class_init(ObjectClass *klass, void *data)
1925{
1926 DeviceClass *dc = DEVICE_CLASS(klass);
1927 VirtioDeviceClass *vdc = VIRTIO_DEVICE_CLASS(klass);
e6f746b3 1928
17ec5a86 1929 dc->props = virtio_net_properties;
290c2428 1930 dc->vmsd = &vmstate_virtio_net;
125ee0ed 1931 set_bit(DEVICE_CATEGORY_NETWORK, dc->categories);
e6f746b3 1932 vdc->realize = virtio_net_device_realize;
306ec6c3 1933 vdc->unrealize = virtio_net_device_unrealize;
17ec5a86
FK
1934 vdc->get_config = virtio_net_get_config;
1935 vdc->set_config = virtio_net_set_config;
1936 vdc->get_features = virtio_net_get_features;
1937 vdc->set_features = virtio_net_set_features;
1938 vdc->bad_features = virtio_net_bad_features;
1939 vdc->reset = virtio_net_reset;
1940 vdc->set_status = virtio_net_set_status;
1941 vdc->guest_notifier_mask = virtio_net_guest_notifier_mask;
1942 vdc->guest_notifier_pending = virtio_net_guest_notifier_pending;
037dab2f
GK
1943 vdc->load = virtio_net_load_device;
1944 vdc->save = virtio_net_save_device;
17ec5a86
FK
1945}
1946
1947static const TypeInfo virtio_net_info = {
1948 .name = TYPE_VIRTIO_NET,
1949 .parent = TYPE_VIRTIO_DEVICE,
1950 .instance_size = sizeof(VirtIONet),
1951 .instance_init = virtio_net_instance_init,
1952 .class_init = virtio_net_class_init,
1953};
1954
1955static void virtio_register_types(void)
1956{
1957 type_register_static(&virtio_net_info);
1958}
1959
1960type_init(virtio_register_types)