blob: b756d57b1a768725da47d8672ef04c9d8c2b73bf [file] [log] [blame]
aliguorifbe78f42008-12-17 19:13:11 +00001/*
2 * Virtio Network Device
3 *
4 * Copyright IBM, Corp. 2007
5 *
6 * Authors:
7 * Anthony Liguori <aliguori@us.ibm.com>
8 *
9 * This work is licensed under the terms of the GNU GPL, version 2. See
10 * the COPYING file in the top-level directory.
11 *
12 */
13
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010014#include "qemu/iov.h"
aliguorifbe78f42008-12-17 19:13:11 +000015#include "virtio.h"
Paolo Bonzini1422e322012-10-24 08:43:34 +020016#include "net/net.h"
Mark McLoughlin7200ac32009-10-22 17:49:03 +010017#include "net/checksum.h"
Mark McLoughlina8ed73f2009-10-22 17:49:05 +010018#include "net/tap.h"
Paolo Bonzini1de7afc2012-12-17 18:20:00 +010019#include "qemu/error-report.h"
20#include "qemu/timer.h"
aliguorifbe78f42008-12-17 19:13:11 +000021#include "virtio-net.h"
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +020022#include "vhost_net.h"
aliguorifbe78f42008-12-17 19:13:11 +000023
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +010024#define VIRTIO_NET_VM_VERSION 11
aliguorib6503ed2009-02-05 22:36:28 +000025
Alex Williamson4ffb17f2009-06-05 14:47:23 -060026#define MAC_TABLE_ENTRIES 64
aliguorif21c0ed2009-02-05 22:36:32 +000027#define MAX_VLAN (1 << 12) /* Per 802.1Q definition */
aliguori9d6271b2009-02-05 22:36:04 +000028
aliguorifbe78f42008-12-17 19:13:11 +000029typedef struct VirtIONet
30{
31 VirtIODevice vdev;
aliguori79674062009-02-05 22:36:12 +000032 uint8_t mac[ETH_ALEN];
aliguori554c97d2009-01-08 19:46:33 +000033 uint16_t status;
aliguorifbe78f42008-12-17 19:13:11 +000034 VirtQueue *rx_vq;
35 VirtQueue *tx_vq;
aliguori3d11d362009-02-05 22:36:16 +000036 VirtQueue *ctrl_vq;
Mark McLoughlineb6b6c12009-11-25 18:49:11 +000037 NICState *nic;
aliguorifbe78f42008-12-17 19:13:11 +000038 QEMUTimer *tx_timer;
Alex Williamsona697a332010-09-02 09:01:10 -060039 QEMUBH *tx_bh;
Alex Williamsonf0c07c72010-09-02 09:00:50 -060040 uint32_t tx_timeout;
Alex Williamsone3f30482010-09-02 09:00:57 -060041 int32_t tx_burst;
Alex Williamson4b4b8d32010-09-02 09:01:04 -060042 int tx_waiting;
Mark McLoughlin3a330132009-10-22 17:43:45 +010043 uint32_t has_vnet_hdr;
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +020044 size_t host_hdr_len;
45 size_t guest_hdr_len;
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +010046 uint8_t has_ufo;
Mark McLoughlin62433752009-06-18 18:21:36 +010047 struct {
48 VirtQueueElement elem;
49 ssize_t len;
50 } async_tx;
aliguorifbe78f42008-12-17 19:13:11 +000051 int mergeable_rx_bufs;
Alex Williamsonf10c5922009-06-05 14:46:57 -060052 uint8_t promisc;
53 uint8_t allmulti;
Alex Williamson015cb162009-06-05 14:47:18 -060054 uint8_t alluni;
55 uint8_t nomulti;
56 uint8_t nouni;
57 uint8_t nobcast;
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +020058 uint8_t vhost_started;
aliguorib6503ed2009-02-05 22:36:28 +000059 struct {
60 int in_use;
Alex Williamson2d9aba32009-06-05 14:47:13 -060061 int first_multi;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -060062 uint8_t multi_overflow;
63 uint8_t uni_overflow;
aliguorib6503ed2009-02-05 22:36:28 +000064 uint8_t *macs;
65 } mac_table;
aliguorif21c0ed2009-02-05 22:36:32 +000066 uint32_t *vlans;
Alex Williamson01657c82010-06-25 11:09:28 -060067 DeviceState *qdev;
aliguorifbe78f42008-12-17 19:13:11 +000068} VirtIONet;
69
70/* TODO
71 * - we could suppress RX interrupt if we were so inclined.
72 */
73
74static VirtIONet *to_virtio_net(VirtIODevice *vdev)
75{
76 return (VirtIONet *)vdev;
77}
78
aliguori0f03eca2009-02-05 22:36:08 +000079static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
aliguorifbe78f42008-12-17 19:13:11 +000080{
81 VirtIONet *n = to_virtio_net(vdev);
82 struct virtio_net_config netcfg;
83
Stefan Hajnoczib46d97f2011-03-03 21:42:28 +000084 stw_p(&netcfg.status, n->status);
aliguori79674062009-02-05 22:36:12 +000085 memcpy(netcfg.mac, n->mac, ETH_ALEN);
aliguorifbe78f42008-12-17 19:13:11 +000086 memcpy(config, &netcfg, sizeof(netcfg));
87}
88
aliguori0f03eca2009-02-05 22:36:08 +000089static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
90{
91 VirtIONet *n = to_virtio_net(vdev);
92 struct virtio_net_config netcfg;
93
94 memcpy(&netcfg, config, sizeof(netcfg));
95
aliguori79674062009-02-05 22:36:12 +000096 if (memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
97 memcpy(n->mac, netcfg.mac, ETH_ALEN);
Mark McLoughlineb6b6c12009-11-25 18:49:11 +000098 qemu_format_nic_info_str(&n->nic->nc, n->mac);
aliguori0f03eca2009-02-05 22:36:08 +000099 }
100}
101
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200102static bool virtio_net_started(VirtIONet *n, uint8_t status)
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200103{
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200104 return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200105 (n->status & VIRTIO_NET_S_LINK_UP) && n->vdev.vm_running;
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200106}
107
108static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
109{
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200110 if (!n->nic->nc.peer) {
111 return;
112 }
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200113 if (n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200114 return;
115 }
116
117 if (!tap_get_vhost_net(n->nic->nc.peer)) {
118 return;
119 }
Michael S. Tsirkin32993692011-02-09 18:45:09 +0200120 if (!!n->vhost_started == virtio_net_started(n, status) &&
121 !n->nic->nc.peer->link_down) {
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200122 return;
123 }
124 if (!n->vhost_started) {
mst@redhat.com5430a282011-02-01 22:13:42 +0200125 int r;
126 if (!vhost_net_query(tap_get_vhost_net(n->nic->nc.peer), &n->vdev)) {
127 return;
128 }
Michael S. Tsirkin1830b802012-12-25 17:38:59 +0200129 n->vhost_started = 1;
mst@redhat.com5430a282011-02-01 22:13:42 +0200130 r = vhost_net_start(tap_get_vhost_net(n->nic->nc.peer), &n->vdev);
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200131 if (r < 0) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000132 error_report("unable to start vhost net: %d: "
133 "falling back on userspace virtio", -r);
Michael S. Tsirkin1830b802012-12-25 17:38:59 +0200134 n->vhost_started = 0;
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200135 }
136 } else {
137 vhost_net_stop(tap_get_vhost_net(n->nic->nc.peer), &n->vdev);
138 n->vhost_started = 0;
139 }
140}
141
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200142static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
143{
144 VirtIONet *n = to_virtio_net(vdev);
145
146 virtio_net_vhost_status(n, status);
147
148 if (!n->tx_waiting) {
149 return;
150 }
151
152 if (virtio_net_started(n, status) && !n->vhost_started) {
153 if (n->tx_timer) {
154 qemu_mod_timer(n->tx_timer,
Paolo Bonzini74475452011-03-11 16:47:48 +0100155 qemu_get_clock_ns(vm_clock) + n->tx_timeout);
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200156 } else {
157 qemu_bh_schedule(n->tx_bh);
158 }
159 } else {
160 if (n->tx_timer) {
161 qemu_del_timer(n->tx_timer);
162 } else {
163 qemu_bh_cancel(n->tx_bh);
164 }
165 }
166}
167
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100168static void virtio_net_set_link_status(NetClientState *nc)
aliguori554c97d2009-01-08 19:46:33 +0000169{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000170 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
aliguori554c97d2009-01-08 19:46:33 +0000171 uint16_t old_status = n->status;
172
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000173 if (nc->link_down)
aliguori554c97d2009-01-08 19:46:33 +0000174 n->status &= ~VIRTIO_NET_S_LINK_UP;
175 else
176 n->status |= VIRTIO_NET_S_LINK_UP;
177
178 if (n->status != old_status)
179 virtio_notify_config(&n->vdev);
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200180
181 virtio_net_set_status(&n->vdev, n->vdev.status);
aliguori554c97d2009-01-08 19:46:33 +0000182}
183
aliguori002437c2009-02-05 22:36:20 +0000184static void virtio_net_reset(VirtIODevice *vdev)
185{
186 VirtIONet *n = to_virtio_net(vdev);
187
188 /* Reset back to compatibility mode */
189 n->promisc = 1;
190 n->allmulti = 0;
Alex Williamson015cb162009-06-05 14:47:18 -0600191 n->alluni = 0;
192 n->nomulti = 0;
193 n->nouni = 0;
194 n->nobcast = 0;
aliguorib6503ed2009-02-05 22:36:28 +0000195
aliguorif21c0ed2009-02-05 22:36:32 +0000196 /* Flush any MAC and VLAN filter table state */
aliguorib6503ed2009-02-05 22:36:28 +0000197 n->mac_table.in_use = 0;
Alex Williamson2d9aba32009-06-05 14:47:13 -0600198 n->mac_table.first_multi = 0;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600199 n->mac_table.multi_overflow = 0;
200 n->mac_table.uni_overflow = 0;
aliguorib6503ed2009-02-05 22:36:28 +0000201 memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
aliguorif21c0ed2009-02-05 22:36:32 +0000202 memset(n->vlans, 0, MAX_VLAN >> 3);
aliguori002437c2009-02-05 22:36:20 +0000203}
204
Michael S. Tsirkin6e371ab2012-09-24 17:04:21 +0200205static void peer_test_vnet_hdr(VirtIONet *n)
Mark McLoughlin3a330132009-10-22 17:43:45 +0100206{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000207 if (!n->nic->nc.peer)
Michael S. Tsirkin6e371ab2012-09-24 17:04:21 +0200208 return;
Mark McLoughlin3a330132009-10-22 17:43:45 +0100209
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200210 if (n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP)
Michael S. Tsirkin6e371ab2012-09-24 17:04:21 +0200211 return;
Mark McLoughlin3a330132009-10-22 17:43:45 +0100212
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000213 n->has_vnet_hdr = tap_has_vnet_hdr(n->nic->nc.peer);
Michael S. Tsirkin6e371ab2012-09-24 17:04:21 +0200214}
Mark McLoughlin3a330132009-10-22 17:43:45 +0100215
Michael S. Tsirkin6e371ab2012-09-24 17:04:21 +0200216static int peer_has_vnet_hdr(VirtIONet *n)
217{
Mark McLoughlin3a330132009-10-22 17:43:45 +0100218 return n->has_vnet_hdr;
219}
220
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100221static int peer_has_ufo(VirtIONet *n)
222{
223 if (!peer_has_vnet_hdr(n))
224 return 0;
225
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000226 n->has_ufo = tap_has_ufo(n->nic->nc.peer);
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100227
228 return n->has_ufo;
229}
230
Michael S. Tsirkinff3a8062012-09-24 21:05:03 +0200231static void virtio_net_set_mrg_rx_bufs(VirtIONet *n, int mergeable_rx_bufs)
232{
233 n->mergeable_rx_bufs = mergeable_rx_bufs;
234
235 n->guest_hdr_len = n->mergeable_rx_bufs ?
236 sizeof(struct virtio_net_hdr_mrg_rxbuf) : sizeof(struct virtio_net_hdr);
237
238 if (peer_has_vnet_hdr(n) &&
239 tap_has_vnet_hdr_len(n->nic->nc.peer, n->guest_hdr_len)) {
240 tap_set_vnet_hdr_len(n->nic->nc.peer, n->guest_hdr_len);
241 n->host_hdr_len = n->guest_hdr_len;
242 }
243}
244
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200245static uint32_t virtio_net_get_features(VirtIODevice *vdev, uint32_t features)
aliguorifbe78f42008-12-17 19:13:11 +0000246{
Mark McLoughlin3a330132009-10-22 17:43:45 +0100247 VirtIONet *n = to_virtio_net(vdev);
aliguorifbe78f42008-12-17 19:13:11 +0000248
Michael S. Tsirkinc9f79a32010-01-12 20:50:17 +0200249 features |= (1 << VIRTIO_NET_F_MAC);
250
Michael S. Tsirkin6e371ab2012-09-24 17:04:21 +0200251 if (!peer_has_vnet_hdr(n)) {
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200252 features &= ~(0x1 << VIRTIO_NET_F_CSUM);
253 features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO4);
254 features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO6);
255 features &= ~(0x1 << VIRTIO_NET_F_HOST_ECN);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100256
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200257 features &= ~(0x1 << VIRTIO_NET_F_GUEST_CSUM);
258 features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO4);
259 features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO6);
260 features &= ~(0x1 << VIRTIO_NET_F_GUEST_ECN);
261 }
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100262
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200263 if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
264 features &= ~(0x1 << VIRTIO_NET_F_GUEST_UFO);
265 features &= ~(0x1 << VIRTIO_NET_F_HOST_UFO);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100266 }
267
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +0200268 if (!n->nic->nc.peer ||
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200269 n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +0200270 return features;
271 }
272 if (!tap_get_vhost_net(n->nic->nc.peer)) {
273 return features;
274 }
275 return vhost_net_get_features(tap_get_vhost_net(n->nic->nc.peer), features);
aliguorifbe78f42008-12-17 19:13:11 +0000276}
277
aliguori8eca6b12009-04-05 17:40:08 +0000278static uint32_t virtio_net_bad_features(VirtIODevice *vdev)
279{
280 uint32_t features = 0;
281
282 /* Linux kernel 2.6.25. It understood MAC (as everyone must),
283 * but also these: */
284 features |= (1 << VIRTIO_NET_F_MAC);
Dustin Kirkland184bd042009-10-29 10:34:15 -0500285 features |= (1 << VIRTIO_NET_F_CSUM);
286 features |= (1 << VIRTIO_NET_F_HOST_TSO4);
287 features |= (1 << VIRTIO_NET_F_HOST_TSO6);
288 features |= (1 << VIRTIO_NET_F_HOST_ECN);
aliguori8eca6b12009-04-05 17:40:08 +0000289
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200290 return features;
aliguori8eca6b12009-04-05 17:40:08 +0000291}
292
aliguorifbe78f42008-12-17 19:13:11 +0000293static void virtio_net_set_features(VirtIODevice *vdev, uint32_t features)
294{
295 VirtIONet *n = to_virtio_net(vdev);
296
Michael S. Tsirkinff3a8062012-09-24 21:05:03 +0200297 virtio_net_set_mrg_rx_bufs(n, !!(features & (1 << VIRTIO_NET_F_MRG_RXBUF)));
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100298
299 if (n->has_vnet_hdr) {
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000300 tap_set_offload(n->nic->nc.peer,
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100301 (features >> VIRTIO_NET_F_GUEST_CSUM) & 1,
302 (features >> VIRTIO_NET_F_GUEST_TSO4) & 1,
303 (features >> VIRTIO_NET_F_GUEST_TSO6) & 1,
Sridhar Samudrala6c9f58b2009-10-22 17:43:49 +0100304 (features >> VIRTIO_NET_F_GUEST_ECN) & 1,
305 (features >> VIRTIO_NET_F_GUEST_UFO) & 1);
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100306 }
David L Stevensdc14a392010-03-31 21:20:31 +0300307 if (!n->nic->nc.peer ||
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200308 n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
David L Stevensdc14a392010-03-31 21:20:31 +0300309 return;
310 }
311 if (!tap_get_vhost_net(n->nic->nc.peer)) {
312 return;
313 }
Michael S. Tsirkin57c32292010-05-09 14:35:43 +0300314 vhost_net_ack_features(tap_get_vhost_net(n->nic->nc.peer), features);
aliguorifbe78f42008-12-17 19:13:11 +0000315}
316
aliguori002437c2009-02-05 22:36:20 +0000317static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
318 VirtQueueElement *elem)
319{
320 uint8_t on;
321
322 if (elem->out_num != 2 || elem->out_sg[1].iov_len != sizeof(on)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000323 error_report("virtio-net ctrl invalid rx mode command");
aliguori002437c2009-02-05 22:36:20 +0000324 exit(1);
325 }
326
327 on = ldub_p(elem->out_sg[1].iov_base);
328
329 if (cmd == VIRTIO_NET_CTRL_RX_MODE_PROMISC)
330 n->promisc = on;
331 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_ALLMULTI)
332 n->allmulti = on;
Alex Williamson015cb162009-06-05 14:47:18 -0600333 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_ALLUNI)
334 n->alluni = on;
335 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_NOMULTI)
336 n->nomulti = on;
337 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_NOUNI)
338 n->nouni = on;
339 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_NOBCAST)
340 n->nobcast = on;
aliguori002437c2009-02-05 22:36:20 +0000341 else
342 return VIRTIO_NET_ERR;
343
344 return VIRTIO_NET_OK;
345}
346
aliguorib6503ed2009-02-05 22:36:28 +0000347static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
348 VirtQueueElement *elem)
349{
350 struct virtio_net_ctrl_mac mac_data;
351
352 if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET || elem->out_num != 3 ||
353 elem->out_sg[1].iov_len < sizeof(mac_data) ||
354 elem->out_sg[2].iov_len < sizeof(mac_data))
355 return VIRTIO_NET_ERR;
356
357 n->mac_table.in_use = 0;
Alex Williamson2d9aba32009-06-05 14:47:13 -0600358 n->mac_table.first_multi = 0;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600359 n->mac_table.uni_overflow = 0;
360 n->mac_table.multi_overflow = 0;
aliguorib6503ed2009-02-05 22:36:28 +0000361 memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
362
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100363 mac_data.entries = ldl_p(elem->out_sg[1].iov_base);
aliguorib6503ed2009-02-05 22:36:28 +0000364
365 if (sizeof(mac_data.entries) +
366 (mac_data.entries * ETH_ALEN) > elem->out_sg[1].iov_len)
367 return VIRTIO_NET_ERR;
368
369 if (mac_data.entries <= MAC_TABLE_ENTRIES) {
370 memcpy(n->mac_table.macs, elem->out_sg[1].iov_base + sizeof(mac_data),
371 mac_data.entries * ETH_ALEN);
372 n->mac_table.in_use += mac_data.entries;
373 } else {
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600374 n->mac_table.uni_overflow = 1;
aliguorib6503ed2009-02-05 22:36:28 +0000375 }
376
Alex Williamson2d9aba32009-06-05 14:47:13 -0600377 n->mac_table.first_multi = n->mac_table.in_use;
378
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100379 mac_data.entries = ldl_p(elem->out_sg[2].iov_base);
aliguorib6503ed2009-02-05 22:36:28 +0000380
381 if (sizeof(mac_data.entries) +
382 (mac_data.entries * ETH_ALEN) > elem->out_sg[2].iov_len)
383 return VIRTIO_NET_ERR;
384
385 if (mac_data.entries) {
386 if (n->mac_table.in_use + mac_data.entries <= MAC_TABLE_ENTRIES) {
387 memcpy(n->mac_table.macs + (n->mac_table.in_use * ETH_ALEN),
388 elem->out_sg[2].iov_base + sizeof(mac_data),
389 mac_data.entries * ETH_ALEN);
390 n->mac_table.in_use += mac_data.entries;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600391 } else {
392 n->mac_table.multi_overflow = 1;
393 }
aliguorib6503ed2009-02-05 22:36:28 +0000394 }
395
396 return VIRTIO_NET_OK;
397}
398
aliguorif21c0ed2009-02-05 22:36:32 +0000399static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
400 VirtQueueElement *elem)
401{
402 uint16_t vid;
403
404 if (elem->out_num != 2 || elem->out_sg[1].iov_len != sizeof(vid)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000405 error_report("virtio-net ctrl invalid vlan command");
aliguorif21c0ed2009-02-05 22:36:32 +0000406 return VIRTIO_NET_ERR;
407 }
408
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100409 vid = lduw_p(elem->out_sg[1].iov_base);
aliguorif21c0ed2009-02-05 22:36:32 +0000410
411 if (vid >= MAX_VLAN)
412 return VIRTIO_NET_ERR;
413
414 if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
415 n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
416 else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
417 n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
418 else
419 return VIRTIO_NET_ERR;
420
421 return VIRTIO_NET_OK;
422}
423
aliguori3d11d362009-02-05 22:36:16 +0000424static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
425{
aliguori002437c2009-02-05 22:36:20 +0000426 VirtIONet *n = to_virtio_net(vdev);
aliguori3d11d362009-02-05 22:36:16 +0000427 struct virtio_net_ctrl_hdr ctrl;
428 virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
429 VirtQueueElement elem;
430
431 while (virtqueue_pop(vq, &elem)) {
432 if ((elem.in_num < 1) || (elem.out_num < 1)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000433 error_report("virtio-net ctrl missing headers");
aliguori3d11d362009-02-05 22:36:16 +0000434 exit(1);
435 }
436
437 if (elem.out_sg[0].iov_len < sizeof(ctrl) ||
aliguoric6bb9a32009-03-13 15:04:02 +0000438 elem.in_sg[elem.in_num - 1].iov_len < sizeof(status)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000439 error_report("virtio-net ctrl header not in correct element");
aliguori3d11d362009-02-05 22:36:16 +0000440 exit(1);
441 }
442
443 ctrl.class = ldub_p(elem.out_sg[0].iov_base);
444 ctrl.cmd = ldub_p(elem.out_sg[0].iov_base + sizeof(ctrl.class));
445
aliguori002437c2009-02-05 22:36:20 +0000446 if (ctrl.class == VIRTIO_NET_CTRL_RX_MODE)
447 status = virtio_net_handle_rx_mode(n, ctrl.cmd, &elem);
aliguorib6503ed2009-02-05 22:36:28 +0000448 else if (ctrl.class == VIRTIO_NET_CTRL_MAC)
449 status = virtio_net_handle_mac(n, ctrl.cmd, &elem);
aliguorif21c0ed2009-02-05 22:36:32 +0000450 else if (ctrl.class == VIRTIO_NET_CTRL_VLAN)
451 status = virtio_net_handle_vlan_table(n, ctrl.cmd, &elem);
aliguori002437c2009-02-05 22:36:20 +0000452
aliguori3d11d362009-02-05 22:36:16 +0000453 stb_p(elem.in_sg[elem.in_num - 1].iov_base, status);
454
455 virtqueue_push(vq, &elem, sizeof(status));
456 virtio_notify(vdev, vq);
457 }
458}
459
aliguorifbe78f42008-12-17 19:13:11 +0000460/* RX */
461
462static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
463{
Mark McLoughlin8aeff622009-04-29 13:40:02 +0100464 VirtIONet *n = to_virtio_net(vdev);
465
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000466 qemu_flush_queued_packets(&n->nic->nc);
aliguorifbe78f42008-12-17 19:13:11 +0000467}
468
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100469static int virtio_net_can_receive(NetClientState *nc)
aliguorifbe78f42008-12-17 19:13:11 +0000470{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000471 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200472 if (!n->vdev.vm_running) {
Michael S. Tsirkin95477322010-11-22 19:52:19 +0200473 return 0;
474 }
Mark McLoughlincdd5cc12009-10-27 18:16:38 +0000475
aliguorifbe78f42008-12-17 19:13:11 +0000476 if (!virtio_queue_ready(n->rx_vq) ||
477 !(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK))
478 return 0;
479
Mark McLoughlincdd5cc12009-10-27 18:16:38 +0000480 return 1;
481}
482
483static int virtio_net_has_buffers(VirtIONet *n, int bufsize)
484{
aliguorifbe78f42008-12-17 19:13:11 +0000485 if (virtio_queue_empty(n->rx_vq) ||
486 (n->mergeable_rx_bufs &&
487 !virtqueue_avail_bytes(n->rx_vq, bufsize, 0))) {
488 virtio_queue_set_notification(n->rx_vq, 1);
Tom Lendacky06b12972010-02-08 10:10:01 -0600489
490 /* To avoid a race condition where the guest has made some buffers
491 * available after the above check but before notification was
492 * enabled, check for available buffers again.
493 */
494 if (virtio_queue_empty(n->rx_vq) ||
495 (n->mergeable_rx_bufs &&
496 !virtqueue_avail_bytes(n->rx_vq, bufsize, 0)))
497 return 0;
aliguorifbe78f42008-12-17 19:13:11 +0000498 }
499
500 virtio_queue_set_notification(n->rx_vq, 0);
501 return 1;
502}
503
Anthony Liguori1d41b0c2009-10-22 17:43:48 +0100504/* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
505 * it never finds out that the packets don't have valid checksums. This
506 * causes dhclient to get upset. Fedora's carried a patch for ages to
507 * fix this with Xen but it hasn't appeared in an upstream release of
508 * dhclient yet.
509 *
510 * To avoid breaking existing guests, we catch udp packets and add
511 * checksums. This is terrible but it's better than hacking the guest
512 * kernels.
513 *
514 * N.B. if we introduce a zero-copy API, this operation is no longer free so
515 * we should provide a mechanism to disable it to avoid polluting the host
516 * cache.
517 */
518static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200519 uint8_t *buf, size_t size)
Anthony Liguori1d41b0c2009-10-22 17:43:48 +0100520{
521 if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
522 (size > 27 && size < 1500) && /* normal sized MTU */
523 (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
524 (buf[23] == 17) && /* ip.protocol == UDP */
525 (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200526 net_checksum_calculate(buf, size);
Anthony Liguori1d41b0c2009-10-22 17:43:48 +0100527 hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
528 }
529}
530
Michael S. Tsirkin280598b2012-09-24 13:24:17 +0200531static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
532 const void *buf, size_t size)
aliguorifbe78f42008-12-17 19:13:11 +0000533{
Mark McLoughlin3a330132009-10-22 17:43:45 +0100534 if (n->has_vnet_hdr) {
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200535 /* FIXME this cast is evil */
536 void *wbuf = (void *)buf;
Michael S. Tsirkin280598b2012-09-24 13:24:17 +0200537 work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
538 size - n->host_hdr_len);
539 iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200540 } else {
541 struct virtio_net_hdr hdr = {
542 .flags = 0,
543 .gso_type = VIRTIO_NET_HDR_GSO_NONE
544 };
545 iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100546 }
aliguorifbe78f42008-12-17 19:13:11 +0000547}
548
aliguori3831ab22009-02-05 22:36:24 +0000549static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
550{
551 static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
aliguorif21c0ed2009-02-05 22:36:32 +0000552 static const uint8_t vlan[] = {0x81, 0x00};
aliguori3831ab22009-02-05 22:36:24 +0000553 uint8_t *ptr = (uint8_t *)buf;
aliguorib6503ed2009-02-05 22:36:28 +0000554 int i;
aliguori3831ab22009-02-05 22:36:24 +0000555
556 if (n->promisc)
557 return 1;
558
Michael S. Tsirkine043ebc2012-09-24 16:27:27 +0200559 ptr += n->host_hdr_len;
Mark McLoughlin3a330132009-10-22 17:43:45 +0100560
aliguorif21c0ed2009-02-05 22:36:32 +0000561 if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
562 int vid = be16_to_cpup((uint16_t *)(ptr + 14)) & 0xfff;
563 if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
564 return 0;
565 }
566
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600567 if (ptr[0] & 1) { // multicast
568 if (!memcmp(ptr, bcast, sizeof(bcast))) {
Alex Williamson015cb162009-06-05 14:47:18 -0600569 return !n->nobcast;
570 } else if (n->nomulti) {
571 return 0;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600572 } else if (n->allmulti || n->mac_table.multi_overflow) {
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600573 return 1;
574 }
Alex Williamson2d9aba32009-06-05 14:47:13 -0600575
576 for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
577 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
578 return 1;
579 }
580 }
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600581 } else { // unicast
Alex Williamson015cb162009-06-05 14:47:18 -0600582 if (n->nouni) {
583 return 0;
584 } else if (n->alluni || n->mac_table.uni_overflow) {
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600585 return 1;
586 } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600587 return 1;
588 }
aliguori3831ab22009-02-05 22:36:24 +0000589
Alex Williamson2d9aba32009-06-05 14:47:13 -0600590 for (i = 0; i < n->mac_table.first_multi; i++) {
591 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
592 return 1;
593 }
594 }
aliguorib6503ed2009-02-05 22:36:28 +0000595 }
596
aliguori3831ab22009-02-05 22:36:24 +0000597 return 0;
598}
599
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100600static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, size_t size)
aliguorifbe78f42008-12-17 19:13:11 +0000601{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000602 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
Michael S. Tsirkin63c58722012-09-24 13:17:13 +0200603 struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
604 struct virtio_net_hdr_mrg_rxbuf mhdr;
605 unsigned mhdr_cnt = 0;
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200606 size_t offset, i, guest_offset;
aliguorifbe78f42008-12-17 19:13:11 +0000607
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000608 if (!virtio_net_can_receive(&n->nic->nc))
Mark McLoughlincdd5cc12009-10-27 18:16:38 +0000609 return -1;
610
Michael S. Tsirkin940cda92010-06-06 18:53:10 +0300611 /* hdr_len refers to the header we supply to the guest */
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200612 if (!virtio_net_has_buffers(n, size + n->guest_hdr_len - n->host_hdr_len))
Mark McLoughlin8aeff622009-04-29 13:40:02 +0100613 return 0;
aliguorifbe78f42008-12-17 19:13:11 +0000614
aliguori3831ab22009-02-05 22:36:24 +0000615 if (!receive_filter(n, buf, size))
Mark McLoughlin4f1c9422009-05-18 13:40:55 +0100616 return size;
aliguori3831ab22009-02-05 22:36:24 +0000617
aliguorifbe78f42008-12-17 19:13:11 +0000618 offset = i = 0;
619
620 while (offset < size) {
621 VirtQueueElement elem;
622 int len, total;
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200623 const struct iovec *sg = elem.in_sg;
aliguorifbe78f42008-12-17 19:13:11 +0000624
Amit Shah22c253d2010-01-13 16:24:43 +0530625 total = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000626
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300627 if (virtqueue_pop(n->rx_vq, &elem) == 0) {
aliguorifbe78f42008-12-17 19:13:11 +0000628 if (i == 0)
Mark McLoughlin4f1c9422009-05-18 13:40:55 +0100629 return -1;
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000630 error_report("virtio-net unexpected empty queue: "
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300631 "i %zd mergeable %d offset %zd, size %zd, "
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000632 "guest hdr len %zd, host hdr len %zd guest features 0x%x",
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300633 i, n->mergeable_rx_bufs, offset, size,
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200634 n->guest_hdr_len, n->host_hdr_len, n->vdev.guest_features);
aliguorifbe78f42008-12-17 19:13:11 +0000635 exit(1);
636 }
637
638 if (elem.in_num < 1) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000639 error_report("virtio-net receive queue contains no in buffers");
aliguorifbe78f42008-12-17 19:13:11 +0000640 exit(1);
641 }
642
aliguorifbe78f42008-12-17 19:13:11 +0000643 if (i == 0) {
Michael S. Tsirkinc8d28e72012-09-24 13:26:55 +0200644 assert(offset == 0);
Michael S. Tsirkin63c58722012-09-24 13:17:13 +0200645 if (n->mergeable_rx_bufs) {
646 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
647 sg, elem.in_num,
648 offsetof(typeof(mhdr), num_buffers),
649 sizeof(mhdr.num_buffers));
650 }
aliguorifbe78f42008-12-17 19:13:11 +0000651
Michael S. Tsirkinc8d28e72012-09-24 13:26:55 +0200652 receive_header(n, sg, elem.in_num, buf, size);
653 offset = n->host_hdr_len;
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200654 total += n->guest_hdr_len;
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200655 guest_offset = n->guest_hdr_len;
656 } else {
657 guest_offset = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000658 }
659
660 /* copy in packet. ugh */
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200661 len = iov_from_buf(sg, elem.in_num, guest_offset,
Michael Tokarevdcf6f5e2012-03-11 18:05:12 +0400662 buf + offset, size - offset);
aliguorifbe78f42008-12-17 19:13:11 +0000663 total += len;
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300664 offset += len;
665 /* If buffers can't be merged, at this point we
666 * must have consumed the complete packet.
667 * Otherwise, drop it. */
668 if (!n->mergeable_rx_bufs && offset < size) {
669#if 0
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000670 error_report("virtio-net truncated non-mergeable packet: "
671 "i %zd mergeable %d offset %zd, size %zd, "
672 "guest hdr len %zd, host hdr len %zd",
673 i, n->mergeable_rx_bufs,
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200674 offset, size, n->guest_hdr_len, n->host_hdr_len);
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300675#endif
676 return size;
677 }
aliguorifbe78f42008-12-17 19:13:11 +0000678
679 /* signal other side */
680 virtqueue_fill(n->rx_vq, &elem, total, i++);
aliguorifbe78f42008-12-17 19:13:11 +0000681 }
682
Michael S. Tsirkin63c58722012-09-24 13:17:13 +0200683 if (mhdr_cnt) {
684 stw_p(&mhdr.num_buffers, i);
685 iov_from_buf(mhdr_sg, mhdr_cnt,
686 0,
687 &mhdr.num_buffers, sizeof mhdr.num_buffers);
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100688 }
aliguorifbe78f42008-12-17 19:13:11 +0000689
690 virtqueue_flush(n->rx_vq, i);
691 virtio_notify(&n->vdev, n->rx_vq);
Mark McLoughlin4f1c9422009-05-18 13:40:55 +0100692
693 return size;
aliguorifbe78f42008-12-17 19:13:11 +0000694}
695
Alex Williamsone3f30482010-09-02 09:00:57 -0600696static int32_t virtio_net_flush_tx(VirtIONet *n, VirtQueue *vq);
Mark McLoughlin62433752009-06-18 18:21:36 +0100697
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100698static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
Mark McLoughlin62433752009-06-18 18:21:36 +0100699{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000700 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
Mark McLoughlin62433752009-06-18 18:21:36 +0100701
Michael S. Tsirkin40bad8f2012-09-24 15:15:43 +0200702 virtqueue_push(n->tx_vq, &n->async_tx.elem, 0);
Mark McLoughlin62433752009-06-18 18:21:36 +0100703 virtio_notify(&n->vdev, n->tx_vq);
704
705 n->async_tx.elem.out_num = n->async_tx.len = 0;
706
707 virtio_queue_set_notification(n->tx_vq, 1);
708 virtio_net_flush_tx(n, n->tx_vq);
709}
710
aliguorifbe78f42008-12-17 19:13:11 +0000711/* TX */
Alex Williamsone3f30482010-09-02 09:00:57 -0600712static int32_t virtio_net_flush_tx(VirtIONet *n, VirtQueue *vq)
aliguorifbe78f42008-12-17 19:13:11 +0000713{
714 VirtQueueElement elem;
Alex Williamsone3f30482010-09-02 09:00:57 -0600715 int32_t num_packets = 0;
Alex Williamsone3f30482010-09-02 09:00:57 -0600716 if (!(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK)) {
717 return num_packets;
718 }
aliguorifbe78f42008-12-17 19:13:11 +0000719
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200720 assert(n->vdev.vm_running);
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200721
Mark McLoughlin62433752009-06-18 18:21:36 +0100722 if (n->async_tx.elem.out_num) {
723 virtio_queue_set_notification(n->tx_vq, 0);
Alex Williamsone3f30482010-09-02 09:00:57 -0600724 return num_packets;
Mark McLoughlin62433752009-06-18 18:21:36 +0100725 }
726
aliguorifbe78f42008-12-17 19:13:11 +0000727 while (virtqueue_pop(vq, &elem)) {
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200728 ssize_t ret, len;
aliguorifbe78f42008-12-17 19:13:11 +0000729 unsigned int out_num = elem.out_num;
730 struct iovec *out_sg = &elem.out_sg[0];
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200731 struct iovec sg[VIRTQUEUE_MAX_SIZE];
aliguorifbe78f42008-12-17 19:13:11 +0000732
Michael S. Tsirkin7b80d082012-09-24 14:54:44 +0200733 if (out_num < 1) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000734 error_report("virtio-net header not in first element");
aliguorifbe78f42008-12-17 19:13:11 +0000735 exit(1);
736 }
737
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200738 /*
739 * If host wants to see the guest header as is, we can
740 * pass it on unchanged. Otherwise, copy just the parts
741 * that host is interested in.
742 */
743 assert(n->host_hdr_len <= n->guest_hdr_len);
744 if (n->host_hdr_len != n->guest_hdr_len) {
745 unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
746 out_sg, out_num,
747 0, n->host_hdr_len);
748 sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
749 out_sg, out_num,
750 n->guest_hdr_len, -1);
751 out_num = sg_num;
752 out_sg = sg;
aliguorifbe78f42008-12-17 19:13:11 +0000753 }
754
Michael S. Tsirkin7b80d082012-09-24 14:54:44 +0200755 len = n->guest_hdr_len;
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200756
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000757 ret = qemu_sendv_packet_async(&n->nic->nc, out_sg, out_num,
Mark McLoughlin62433752009-06-18 18:21:36 +0100758 virtio_net_tx_complete);
759 if (ret == 0) {
760 virtio_queue_set_notification(n->tx_vq, 0);
761 n->async_tx.elem = elem;
762 n->async_tx.len = len;
Alex Williamsone3f30482010-09-02 09:00:57 -0600763 return -EBUSY;
Mark McLoughlin62433752009-06-18 18:21:36 +0100764 }
765
766 len += ret;
aliguorifbe78f42008-12-17 19:13:11 +0000767
Michael S. Tsirkin40bad8f2012-09-24 15:15:43 +0200768 virtqueue_push(vq, &elem, 0);
aliguorifbe78f42008-12-17 19:13:11 +0000769 virtio_notify(&n->vdev, vq);
Alex Williamsone3f30482010-09-02 09:00:57 -0600770
771 if (++num_packets >= n->tx_burst) {
772 break;
773 }
aliguorifbe78f42008-12-17 19:13:11 +0000774 }
Alex Williamsone3f30482010-09-02 09:00:57 -0600775 return num_packets;
aliguorifbe78f42008-12-17 19:13:11 +0000776}
777
Alex Williamsona697a332010-09-02 09:01:10 -0600778static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
aliguorifbe78f42008-12-17 19:13:11 +0000779{
780 VirtIONet *n = to_virtio_net(vdev);
781
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200782 /* This happens when device was stopped but VCPU wasn't. */
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200783 if (!n->vdev.vm_running) {
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200784 n->tx_waiting = 1;
785 return;
786 }
787
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600788 if (n->tx_waiting) {
aliguorifbe78f42008-12-17 19:13:11 +0000789 virtio_queue_set_notification(vq, 1);
790 qemu_del_timer(n->tx_timer);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600791 n->tx_waiting = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000792 virtio_net_flush_tx(n, vq);
793 } else {
794 qemu_mod_timer(n->tx_timer,
Paolo Bonzini74475452011-03-11 16:47:48 +0100795 qemu_get_clock_ns(vm_clock) + n->tx_timeout);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600796 n->tx_waiting = 1;
aliguorifbe78f42008-12-17 19:13:11 +0000797 virtio_queue_set_notification(vq, 0);
798 }
799}
800
Alex Williamsona697a332010-09-02 09:01:10 -0600801static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
802{
803 VirtIONet *n = to_virtio_net(vdev);
804
805 if (unlikely(n->tx_waiting)) {
806 return;
807 }
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200808 n->tx_waiting = 1;
809 /* This happens when device was stopped but VCPU wasn't. */
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200810 if (!n->vdev.vm_running) {
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200811 return;
812 }
Alex Williamsona697a332010-09-02 09:01:10 -0600813 virtio_queue_set_notification(vq, 0);
814 qemu_bh_schedule(n->tx_bh);
Alex Williamsona697a332010-09-02 09:01:10 -0600815}
816
aliguorifbe78f42008-12-17 19:13:11 +0000817static void virtio_net_tx_timer(void *opaque)
818{
819 VirtIONet *n = opaque;
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200820 assert(n->vdev.vm_running);
aliguorifbe78f42008-12-17 19:13:11 +0000821
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600822 n->tx_waiting = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000823
824 /* Just in case the driver is not ready on more */
825 if (!(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK))
826 return;
827
828 virtio_queue_set_notification(n->tx_vq, 1);
829 virtio_net_flush_tx(n, n->tx_vq);
830}
831
Alex Williamsona697a332010-09-02 09:01:10 -0600832static void virtio_net_tx_bh(void *opaque)
833{
834 VirtIONet *n = opaque;
835 int32_t ret;
836
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200837 assert(n->vdev.vm_running);
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200838
Alex Williamsona697a332010-09-02 09:01:10 -0600839 n->tx_waiting = 0;
840
841 /* Just in case the driver is not ready on more */
842 if (unlikely(!(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK)))
843 return;
844
845 ret = virtio_net_flush_tx(n, n->tx_vq);
846 if (ret == -EBUSY) {
847 return; /* Notification re-enable handled by tx_complete */
848 }
849
850 /* If we flush a full burst of packets, assume there are
851 * more coming and immediately reschedule */
852 if (ret >= n->tx_burst) {
853 qemu_bh_schedule(n->tx_bh);
854 n->tx_waiting = 1;
855 return;
856 }
857
858 /* If less than a full burst, re-enable notification and flush
859 * anything that may have come in while we weren't looking. If
860 * we find something, assume the guest is still active and reschedule */
861 virtio_queue_set_notification(n->tx_vq, 1);
862 if (virtio_net_flush_tx(n, n->tx_vq) > 0) {
863 virtio_queue_set_notification(n->tx_vq, 0);
864 qemu_bh_schedule(n->tx_bh);
865 n->tx_waiting = 1;
866 }
867}
868
aliguorifbe78f42008-12-17 19:13:11 +0000869static void virtio_net_save(QEMUFile *f, void *opaque)
870{
871 VirtIONet *n = opaque;
872
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200873 /* At this point, backend must be stopped, otherwise
874 * it might keep writing to memory. */
875 assert(!n->vhost_started);
aliguorifbe78f42008-12-17 19:13:11 +0000876 virtio_save(&n->vdev, f);
877
aliguori79674062009-02-05 22:36:12 +0000878 qemu_put_buffer(f, n->mac, ETH_ALEN);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600879 qemu_put_be32(f, n->tx_waiting);
aliguorie46cb382009-01-07 17:50:45 +0000880 qemu_put_be32(f, n->mergeable_rx_bufs);
aliguori9d6271b2009-02-05 22:36:04 +0000881 qemu_put_be16(f, n->status);
Alex Williamsonf10c5922009-06-05 14:46:57 -0600882 qemu_put_byte(f, n->promisc);
883 qemu_put_byte(f, n->allmulti);
aliguorib6503ed2009-02-05 22:36:28 +0000884 qemu_put_be32(f, n->mac_table.in_use);
885 qemu_put_buffer(f, n->mac_table.macs, n->mac_table.in_use * ETH_ALEN);
aliguorif21c0ed2009-02-05 22:36:32 +0000886 qemu_put_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100887 qemu_put_be32(f, n->has_vnet_hdr);
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600888 qemu_put_byte(f, n->mac_table.multi_overflow);
889 qemu_put_byte(f, n->mac_table.uni_overflow);
Alex Williamson015cb162009-06-05 14:47:18 -0600890 qemu_put_byte(f, n->alluni);
891 qemu_put_byte(f, n->nomulti);
892 qemu_put_byte(f, n->nouni);
893 qemu_put_byte(f, n->nobcast);
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100894 qemu_put_byte(f, n->has_ufo);
aliguorifbe78f42008-12-17 19:13:11 +0000895}
896
897static int virtio_net_load(QEMUFile *f, void *opaque, int version_id)
898{
899 VirtIONet *n = opaque;
Alex Williamson2d9aba32009-06-05 14:47:13 -0600900 int i;
Orit Wassermann2a633c42012-05-16 12:21:35 +0200901 int ret;
aliguorifbe78f42008-12-17 19:13:11 +0000902
aliguori9d6271b2009-02-05 22:36:04 +0000903 if (version_id < 2 || version_id > VIRTIO_NET_VM_VERSION)
aliguorifbe78f42008-12-17 19:13:11 +0000904 return -EINVAL;
905
Orit Wassermann2a633c42012-05-16 12:21:35 +0200906 ret = virtio_load(&n->vdev, f);
907 if (ret) {
908 return ret;
909 }
aliguorifbe78f42008-12-17 19:13:11 +0000910
aliguori79674062009-02-05 22:36:12 +0000911 qemu_get_buffer(f, n->mac, ETH_ALEN);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600912 n->tx_waiting = qemu_get_be32(f);
Michael S. Tsirkinff3a8062012-09-24 21:05:03 +0200913
914 virtio_net_set_mrg_rx_bufs(n, qemu_get_be32(f));
aliguorifbe78f42008-12-17 19:13:11 +0000915
aliguori9d6271b2009-02-05 22:36:04 +0000916 if (version_id >= 3)
917 n->status = qemu_get_be16(f);
918
aliguori002437c2009-02-05 22:36:20 +0000919 if (version_id >= 4) {
Alex Williamsonf10c5922009-06-05 14:46:57 -0600920 if (version_id < 8) {
921 n->promisc = qemu_get_be32(f);
922 n->allmulti = qemu_get_be32(f);
923 } else {
924 n->promisc = qemu_get_byte(f);
925 n->allmulti = qemu_get_byte(f);
926 }
aliguori002437c2009-02-05 22:36:20 +0000927 }
928
aliguorib6503ed2009-02-05 22:36:28 +0000929 if (version_id >= 5) {
930 n->mac_table.in_use = qemu_get_be32(f);
931 /* MAC_TABLE_ENTRIES may be different from the saved image */
932 if (n->mac_table.in_use <= MAC_TABLE_ENTRIES) {
933 qemu_get_buffer(f, n->mac_table.macs,
934 n->mac_table.in_use * ETH_ALEN);
935 } else if (n->mac_table.in_use) {
Juan Quintelae398d612012-08-29 19:03:09 +0200936 uint8_t *buf = g_malloc0(n->mac_table.in_use);
937 qemu_get_buffer(f, buf, n->mac_table.in_use * ETH_ALEN);
938 g_free(buf);
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600939 n->mac_table.multi_overflow = n->mac_table.uni_overflow = 1;
aliguorib6503ed2009-02-05 22:36:28 +0000940 n->mac_table.in_use = 0;
941 }
942 }
943
aliguorif21c0ed2009-02-05 22:36:32 +0000944 if (version_id >= 6)
945 qemu_get_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
946
Mark McLoughlin3a330132009-10-22 17:43:45 +0100947 if (version_id >= 7) {
948 if (qemu_get_be32(f) && !peer_has_vnet_hdr(n)) {
Markus Armbruster1ecda022010-02-18 17:25:24 +0100949 error_report("virtio-net: saved image requires vnet_hdr=on");
Mark McLoughlin3a330132009-10-22 17:43:45 +0100950 return -1;
951 }
952
953 if (n->has_vnet_hdr) {
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000954 tap_set_offload(n->nic->nc.peer,
Michael S. Tsirkin704a76f2010-01-10 13:52:47 +0200955 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_CSUM) & 1,
956 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_TSO4) & 1,
957 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_TSO6) & 1,
958 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_ECN) & 1,
959 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_UFO) & 1);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100960 }
Alex Williamson6c042c12009-06-05 14:46:52 -0600961 }
962
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600963 if (version_id >= 9) {
964 n->mac_table.multi_overflow = qemu_get_byte(f);
965 n->mac_table.uni_overflow = qemu_get_byte(f);
966 }
967
Alex Williamson015cb162009-06-05 14:47:18 -0600968 if (version_id >= 10) {
969 n->alluni = qemu_get_byte(f);
970 n->nomulti = qemu_get_byte(f);
971 n->nouni = qemu_get_byte(f);
972 n->nobcast = qemu_get_byte(f);
973 }
974
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100975 if (version_id >= 11) {
976 if (qemu_get_byte(f) && !peer_has_ufo(n)) {
Markus Armbruster1ecda022010-02-18 17:25:24 +0100977 error_report("virtio-net: saved image requires TUN_F_UFO support");
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100978 return -1;
979 }
980 }
981
Alex Williamson2d9aba32009-06-05 14:47:13 -0600982 /* Find the first multicast entry in the saved MAC filter */
983 for (i = 0; i < n->mac_table.in_use; i++) {
984 if (n->mac_table.macs[i * ETH_ALEN] & 1) {
985 break;
986 }
987 }
988 n->mac_table.first_multi = i;
Amos Kong98991482012-09-28 10:06:02 +0800989
990 /* nc.link_down can't be migrated, so infer link_down according
991 * to link status bit in n->status */
992 n->nic->nc.link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
993
aliguorifbe78f42008-12-17 19:13:11 +0000994 return 0;
995}
996
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100997static void virtio_net_cleanup(NetClientState *nc)
aliguorib946a152009-04-17 17:11:08 +0000998{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000999 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
aliguorib946a152009-04-17 17:11:08 +00001000
Mark McLoughlineb6b6c12009-11-25 18:49:11 +00001001 n->nic = NULL;
aliguorib946a152009-04-17 17:11:08 +00001002}
1003
Mark McLoughlineb6b6c12009-11-25 18:49:11 +00001004static NetClientInfo net_virtio_info = {
Laszlo Ersek2be64a62012-07-17 16:17:12 +02001005 .type = NET_CLIENT_OPTIONS_KIND_NIC,
Mark McLoughlineb6b6c12009-11-25 18:49:11 +00001006 .size = sizeof(NICState),
1007 .can_receive = virtio_net_can_receive,
1008 .receive = virtio_net_receive,
1009 .cleanup = virtio_net_cleanup,
1010 .link_status_changed = virtio_net_set_link_status,
1011};
1012
Alex Williamsonf0c07c72010-09-02 09:00:50 -06001013VirtIODevice *virtio_net_init(DeviceState *dev, NICConf *conf,
1014 virtio_net_conf *net)
aliguorifbe78f42008-12-17 19:13:11 +00001015{
1016 VirtIONet *n;
aliguorifbe78f42008-12-17 19:13:11 +00001017
Paul Brook53c25ce2009-05-18 14:51:59 +01001018 n = (VirtIONet *)virtio_common_init("virtio-net", VIRTIO_ID_NET,
1019 sizeof(struct virtio_net_config),
1020 sizeof(VirtIONet));
aliguorifbe78f42008-12-17 19:13:11 +00001021
aliguori0f03eca2009-02-05 22:36:08 +00001022 n->vdev.get_config = virtio_net_get_config;
1023 n->vdev.set_config = virtio_net_set_config;
aliguorifbe78f42008-12-17 19:13:11 +00001024 n->vdev.get_features = virtio_net_get_features;
1025 n->vdev.set_features = virtio_net_set_features;
aliguori8eca6b12009-04-05 17:40:08 +00001026 n->vdev.bad_features = virtio_net_bad_features;
aliguori002437c2009-02-05 22:36:20 +00001027 n->vdev.reset = virtio_net_reset;
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +02001028 n->vdev.set_status = virtio_net_set_status;
aliguorifbe78f42008-12-17 19:13:11 +00001029 n->rx_vq = virtio_add_queue(&n->vdev, 256, virtio_net_handle_rx);
Alex Williamsona697a332010-09-02 09:01:10 -06001030
1031 if (net->tx && strcmp(net->tx, "timer") && strcmp(net->tx, "bh")) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +00001032 error_report("virtio-net: "
1033 "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
1034 net->tx);
1035 error_report("Defaulting to \"bh\"");
Alex Williamsona697a332010-09-02 09:01:10 -06001036 }
1037
1038 if (net->tx && !strcmp(net->tx, "timer")) {
1039 n->tx_vq = virtio_add_queue(&n->vdev, 256, virtio_net_handle_tx_timer);
Paolo Bonzini74475452011-03-11 16:47:48 +01001040 n->tx_timer = qemu_new_timer_ns(vm_clock, virtio_net_tx_timer, n);
Alex Williamsona697a332010-09-02 09:01:10 -06001041 n->tx_timeout = net->txtimer;
1042 } else {
1043 n->tx_vq = virtio_add_queue(&n->vdev, 256, virtio_net_handle_tx_bh);
1044 n->tx_bh = qemu_bh_new(virtio_net_tx_bh, n);
1045 }
Alex Williamson4ffb17f2009-06-05 14:47:23 -06001046 n->ctrl_vq = virtio_add_queue(&n->vdev, 64, virtio_net_handle_ctrl);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001047 qemu_macaddr_default_if_unset(&conf->macaddr);
Mark McLoughlin3cbe04c2009-10-28 14:07:23 +00001048 memcpy(&n->mac[0], &conf->macaddr, sizeof(n->mac));
aliguori554c97d2009-01-08 19:46:33 +00001049 n->status = VIRTIO_NET_S_LINK_UP;
aliguorifbe78f42008-12-17 19:13:11 +00001050
Anthony Liguorif79f2bf2011-12-04 11:17:51 -06001051 n->nic = qemu_new_nic(&net_virtio_info, conf, object_get_typename(OBJECT(dev)), dev->id, n);
Michael S. Tsirkin6e371ab2012-09-24 17:04:21 +02001052 peer_test_vnet_hdr(n);
1053 if (peer_has_vnet_hdr(n)) {
1054 tap_using_vnet_hdr(n->nic->nc.peer, 1);
1055 n->host_hdr_len = sizeof(struct virtio_net_hdr);
1056 } else {
1057 n->host_hdr_len = 0;
1058 }
Mark McLoughlineb6b6c12009-11-25 18:49:11 +00001059
1060 qemu_format_nic_info_str(&n->nic->nc, conf->macaddr.a);
aliguori96d5e202009-01-07 17:47:15 +00001061
Alex Williamson4b4b8d32010-09-02 09:01:04 -06001062 n->tx_waiting = 0;
Alex Williamsone3f30482010-09-02 09:00:57 -06001063 n->tx_burst = net->txburst;
Michael S. Tsirkinff3a8062012-09-24 21:05:03 +02001064 virtio_net_set_mrg_rx_bufs(n, 0);
aliguori002437c2009-02-05 22:36:20 +00001065 n->promisc = 1; /* for compatibility */
aliguorifbe78f42008-12-17 19:13:11 +00001066
Anthony Liguori7267c092011-08-20 22:09:37 -05001067 n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
aliguorib6503ed2009-02-05 22:36:28 +00001068
Anthony Liguori7267c092011-08-20 22:09:37 -05001069 n->vlans = g_malloc0(MAX_VLAN >> 3);
aliguorif21c0ed2009-02-05 22:36:32 +00001070
Alex Williamson01657c82010-06-25 11:09:28 -06001071 n->qdev = dev;
1072 register_savevm(dev, "virtio-net", -1, VIRTIO_NET_VM_VERSION,
aliguorifbe78f42008-12-17 19:13:11 +00001073 virtio_net_save, virtio_net_load, n);
Paul Brookcf21e102009-05-14 22:35:07 +01001074
Gleb Natapov1ca4d092010-12-08 13:35:05 +02001075 add_boot_device_path(conf->bootindex, dev, "/ethernet-phy@0");
1076
Paul Brook53c25ce2009-05-18 14:51:59 +01001077 return &n->vdev;
Paul Brookcf21e102009-05-14 22:35:07 +01001078}
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001079
1080void virtio_net_exit(VirtIODevice *vdev)
1081{
1082 VirtIONet *n = DO_UPCAST(VirtIONet, vdev, vdev);
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +02001083
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +02001084 /* This will stop vhost backend if appropriate. */
1085 virtio_net_set_status(vdev, 0);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001086
Mark McLoughlineb6b6c12009-11-25 18:49:11 +00001087 qemu_purge_queued_packets(&n->nic->nc);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001088
Alex Williamson01657c82010-06-25 11:09:28 -06001089 unregister_savevm(n->qdev, "virtio-net", n);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001090
Anthony Liguori7267c092011-08-20 22:09:37 -05001091 g_free(n->mac_table.macs);
1092 g_free(n->vlans);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001093
Alex Williamsona697a332010-09-02 09:01:10 -06001094 if (n->tx_timer) {
1095 qemu_del_timer(n->tx_timer);
1096 qemu_free_timer(n->tx_timer);
1097 } else {
1098 qemu_bh_delete(n->tx_bh);
1099 }
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001100
Stefan Hajnoczib20c6b92012-07-24 16:35:15 +01001101 qemu_del_net_client(&n->nic->nc);
Amit Shahb52dfd72011-07-27 14:00:31 +05301102 virtio_cleanup(&n->vdev);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001103}