blob: dc4a26cbd62f28f42109ad114449b7b02c4d89c4 [file] [log] [blame]
/*
 * Virtio Network Device
 *
 * Copyright IBM, Corp. 2007
 *
 * Authors:
 *  Anthony Liguori   <aliguori@us.ibm.com>
 *
 * This work is licensed under the terms of the GNU GPL, version 2.  See
 * the COPYING file in the top-level directory.
 *
 */
13
Amit Shahe4d56392010-04-27 18:04:05 +053014#include "iov.h"
aliguorifbe78f42008-12-17 19:13:11 +000015#include "virtio.h"
16#include "net.h"
Mark McLoughlin7200ac32009-10-22 17:49:03 +010017#include "net/checksum.h"
Mark McLoughlina8ed73f2009-10-22 17:49:05 +010018#include "net/tap.h"
Markus Armbruster2f792012010-02-18 16:24:31 +010019#include "qemu-error.h"
aliguorifbe78f42008-12-17 19:13:11 +000020#include "qemu-timer.h"
21#include "virtio-net.h"
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +020022#include "vhost_net.h"
aliguorifbe78f42008-12-17 19:13:11 +000023
/* Version number of this device model.
 * NOTE(review): presumably the saved-state format version; the save/load
 * code is outside this view -- confirm. */
#define VIRTIO_NET_VM_VERSION    11

/* Capacity of mac_table.macs, counted in ETH_ALEN-byte addresses */
#define MAC_TABLE_ENTRIES    64
/* Number of VLAN ids covered by the vlans bitmap; per 802.1Q definition */
#define MAX_VLAN    (1 << 12)
aliguori9d6271b2009-02-05 22:36:04 +000028
aliguorifbe78f42008-12-17 19:13:11 +000029typedef struct VirtIONet
30{
31 VirtIODevice vdev;
aliguori79674062009-02-05 22:36:12 +000032 uint8_t mac[ETH_ALEN];
aliguori554c97d2009-01-08 19:46:33 +000033 uint16_t status;
aliguorifbe78f42008-12-17 19:13:11 +000034 VirtQueue *rx_vq;
35 VirtQueue *tx_vq;
aliguori3d11d362009-02-05 22:36:16 +000036 VirtQueue *ctrl_vq;
Mark McLoughlineb6b6c12009-11-25 18:49:11 +000037 NICState *nic;
aliguorifbe78f42008-12-17 19:13:11 +000038 QEMUTimer *tx_timer;
Alex Williamsona697a332010-09-02 09:01:10 -060039 QEMUBH *tx_bh;
Alex Williamsonf0c07c72010-09-02 09:00:50 -060040 uint32_t tx_timeout;
Alex Williamsone3f30482010-09-02 09:00:57 -060041 int32_t tx_burst;
Alex Williamson4b4b8d32010-09-02 09:01:04 -060042 int tx_waiting;
Mark McLoughlin3a330132009-10-22 17:43:45 +010043 uint32_t has_vnet_hdr;
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +020044 size_t host_hdr_len;
45 size_t guest_hdr_len;
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +010046 uint8_t has_ufo;
Mark McLoughlin62433752009-06-18 18:21:36 +010047 struct {
48 VirtQueueElement elem;
49 ssize_t len;
50 } async_tx;
aliguorifbe78f42008-12-17 19:13:11 +000051 int mergeable_rx_bufs;
Alex Williamsonf10c5922009-06-05 14:46:57 -060052 uint8_t promisc;
53 uint8_t allmulti;
Alex Williamson015cb162009-06-05 14:47:18 -060054 uint8_t alluni;
55 uint8_t nomulti;
56 uint8_t nouni;
57 uint8_t nobcast;
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +020058 uint8_t vhost_started;
aliguorib6503ed2009-02-05 22:36:28 +000059 struct {
60 int in_use;
Alex Williamson2d9aba32009-06-05 14:47:13 -060061 int first_multi;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -060062 uint8_t multi_overflow;
63 uint8_t uni_overflow;
aliguorib6503ed2009-02-05 22:36:28 +000064 uint8_t *macs;
65 } mac_table;
aliguorif21c0ed2009-02-05 22:36:32 +000066 uint32_t *vlans;
Alex Williamson01657c82010-06-25 11:09:28 -060067 DeviceState *qdev;
aliguorifbe78f42008-12-17 19:13:11 +000068} VirtIONet;
69
/* TODO
 * - we could suppress RX interrupt if we were so inclined.
 */
73
74static VirtIONet *to_virtio_net(VirtIODevice *vdev)
75{
76 return (VirtIONet *)vdev;
77}
78
aliguori0f03eca2009-02-05 22:36:08 +000079static void virtio_net_get_config(VirtIODevice *vdev, uint8_t *config)
aliguorifbe78f42008-12-17 19:13:11 +000080{
81 VirtIONet *n = to_virtio_net(vdev);
82 struct virtio_net_config netcfg;
83
Stefan Hajnoczib46d97f2011-03-03 21:42:28 +000084 stw_p(&netcfg.status, n->status);
aliguori79674062009-02-05 22:36:12 +000085 memcpy(netcfg.mac, n->mac, ETH_ALEN);
aliguorifbe78f42008-12-17 19:13:11 +000086 memcpy(config, &netcfg, sizeof(netcfg));
87}
88
aliguori0f03eca2009-02-05 22:36:08 +000089static void virtio_net_set_config(VirtIODevice *vdev, const uint8_t *config)
90{
91 VirtIONet *n = to_virtio_net(vdev);
92 struct virtio_net_config netcfg;
93
94 memcpy(&netcfg, config, sizeof(netcfg));
95
aliguori79674062009-02-05 22:36:12 +000096 if (memcmp(netcfg.mac, n->mac, ETH_ALEN)) {
97 memcpy(n->mac, netcfg.mac, ETH_ALEN);
Mark McLoughlineb6b6c12009-11-25 18:49:11 +000098 qemu_format_nic_info_str(&n->nic->nc, n->mac);
aliguori0f03eca2009-02-05 22:36:08 +000099 }
100}
101
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200102static bool virtio_net_started(VirtIONet *n, uint8_t status)
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200103{
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200104 return (status & VIRTIO_CONFIG_S_DRIVER_OK) &&
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200105 (n->status & VIRTIO_NET_S_LINK_UP) && n->vdev.vm_running;
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200106}
107
108static void virtio_net_vhost_status(VirtIONet *n, uint8_t status)
109{
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200110 if (!n->nic->nc.peer) {
111 return;
112 }
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200113 if (n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200114 return;
115 }
116
117 if (!tap_get_vhost_net(n->nic->nc.peer)) {
118 return;
119 }
Michael S. Tsirkin32993692011-02-09 18:45:09 +0200120 if (!!n->vhost_started == virtio_net_started(n, status) &&
121 !n->nic->nc.peer->link_down) {
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200122 return;
123 }
124 if (!n->vhost_started) {
mst@redhat.com5430a282011-02-01 22:13:42 +0200125 int r;
126 if (!vhost_net_query(tap_get_vhost_net(n->nic->nc.peer), &n->vdev)) {
127 return;
128 }
129 r = vhost_net_start(tap_get_vhost_net(n->nic->nc.peer), &n->vdev);
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200130 if (r < 0) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000131 error_report("unable to start vhost net: %d: "
132 "falling back on userspace virtio", -r);
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200133 } else {
134 n->vhost_started = 1;
135 }
136 } else {
137 vhost_net_stop(tap_get_vhost_net(n->nic->nc.peer), &n->vdev);
138 n->vhost_started = 0;
139 }
140}
141
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200142static void virtio_net_set_status(struct VirtIODevice *vdev, uint8_t status)
143{
144 VirtIONet *n = to_virtio_net(vdev);
145
146 virtio_net_vhost_status(n, status);
147
148 if (!n->tx_waiting) {
149 return;
150 }
151
152 if (virtio_net_started(n, status) && !n->vhost_started) {
153 if (n->tx_timer) {
154 qemu_mod_timer(n->tx_timer,
Paolo Bonzini74475452011-03-11 16:47:48 +0100155 qemu_get_clock_ns(vm_clock) + n->tx_timeout);
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200156 } else {
157 qemu_bh_schedule(n->tx_bh);
158 }
159 } else {
160 if (n->tx_timer) {
161 qemu_del_timer(n->tx_timer);
162 } else {
163 qemu_bh_cancel(n->tx_bh);
164 }
165 }
166}
167
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100168static void virtio_net_set_link_status(NetClientState *nc)
aliguori554c97d2009-01-08 19:46:33 +0000169{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000170 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
aliguori554c97d2009-01-08 19:46:33 +0000171 uint16_t old_status = n->status;
172
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000173 if (nc->link_down)
aliguori554c97d2009-01-08 19:46:33 +0000174 n->status &= ~VIRTIO_NET_S_LINK_UP;
175 else
176 n->status |= VIRTIO_NET_S_LINK_UP;
177
178 if (n->status != old_status)
179 virtio_notify_config(&n->vdev);
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200180
181 virtio_net_set_status(&n->vdev, n->vdev.status);
aliguori554c97d2009-01-08 19:46:33 +0000182}
183
aliguori002437c2009-02-05 22:36:20 +0000184static void virtio_net_reset(VirtIODevice *vdev)
185{
186 VirtIONet *n = to_virtio_net(vdev);
187
188 /* Reset back to compatibility mode */
189 n->promisc = 1;
190 n->allmulti = 0;
Alex Williamson015cb162009-06-05 14:47:18 -0600191 n->alluni = 0;
192 n->nomulti = 0;
193 n->nouni = 0;
194 n->nobcast = 0;
aliguorib6503ed2009-02-05 22:36:28 +0000195
aliguorif21c0ed2009-02-05 22:36:32 +0000196 /* Flush any MAC and VLAN filter table state */
aliguorib6503ed2009-02-05 22:36:28 +0000197 n->mac_table.in_use = 0;
Alex Williamson2d9aba32009-06-05 14:47:13 -0600198 n->mac_table.first_multi = 0;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600199 n->mac_table.multi_overflow = 0;
200 n->mac_table.uni_overflow = 0;
aliguorib6503ed2009-02-05 22:36:28 +0000201 memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
aliguorif21c0ed2009-02-05 22:36:32 +0000202 memset(n->vlans, 0, MAX_VLAN >> 3);
aliguori002437c2009-02-05 22:36:20 +0000203}
204
Mark McLoughlin3a330132009-10-22 17:43:45 +0100205static int peer_has_vnet_hdr(VirtIONet *n)
206{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000207 if (!n->nic->nc.peer)
Mark McLoughlin3a330132009-10-22 17:43:45 +0100208 return 0;
209
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200210 if (n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP)
Mark McLoughlin3a330132009-10-22 17:43:45 +0100211 return 0;
212
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000213 n->has_vnet_hdr = tap_has_vnet_hdr(n->nic->nc.peer);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100214
215 return n->has_vnet_hdr;
216}
217
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100218static int peer_has_ufo(VirtIONet *n)
219{
220 if (!peer_has_vnet_hdr(n))
221 return 0;
222
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000223 n->has_ufo = tap_has_ufo(n->nic->nc.peer);
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100224
225 return n->has_ufo;
226}
227
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200228static uint32_t virtio_net_get_features(VirtIODevice *vdev, uint32_t features)
aliguorifbe78f42008-12-17 19:13:11 +0000229{
Mark McLoughlin3a330132009-10-22 17:43:45 +0100230 VirtIONet *n = to_virtio_net(vdev);
aliguorifbe78f42008-12-17 19:13:11 +0000231
Michael S. Tsirkinc9f79a32010-01-12 20:50:17 +0200232 features |= (1 << VIRTIO_NET_F_MAC);
233
Mark McLoughlin3a330132009-10-22 17:43:45 +0100234 if (peer_has_vnet_hdr(n)) {
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000235 tap_using_vnet_hdr(n->nic->nc.peer, 1);
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200236 n->host_hdr_len = sizeof(struct virtio_net_hdr);
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200237 } else {
238 features &= ~(0x1 << VIRTIO_NET_F_CSUM);
239 features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO4);
240 features &= ~(0x1 << VIRTIO_NET_F_HOST_TSO6);
241 features &= ~(0x1 << VIRTIO_NET_F_HOST_ECN);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100242
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200243 features &= ~(0x1 << VIRTIO_NET_F_GUEST_CSUM);
244 features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO4);
245 features &= ~(0x1 << VIRTIO_NET_F_GUEST_TSO6);
246 features &= ~(0x1 << VIRTIO_NET_F_GUEST_ECN);
247 }
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100248
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200249 if (!peer_has_vnet_hdr(n) || !peer_has_ufo(n)) {
250 features &= ~(0x1 << VIRTIO_NET_F_GUEST_UFO);
251 features &= ~(0x1 << VIRTIO_NET_F_HOST_UFO);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100252 }
253
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +0200254 if (!n->nic->nc.peer ||
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200255 n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +0200256 return features;
257 }
258 if (!tap_get_vhost_net(n->nic->nc.peer)) {
259 return features;
260 }
261 return vhost_net_get_features(tap_get_vhost_net(n->nic->nc.peer), features);
aliguorifbe78f42008-12-17 19:13:11 +0000262}
263
aliguori8eca6b12009-04-05 17:40:08 +0000264static uint32_t virtio_net_bad_features(VirtIODevice *vdev)
265{
266 uint32_t features = 0;
267
268 /* Linux kernel 2.6.25. It understood MAC (as everyone must),
269 * but also these: */
270 features |= (1 << VIRTIO_NET_F_MAC);
Dustin Kirkland184bd042009-10-29 10:34:15 -0500271 features |= (1 << VIRTIO_NET_F_CSUM);
272 features |= (1 << VIRTIO_NET_F_HOST_TSO4);
273 features |= (1 << VIRTIO_NET_F_HOST_TSO6);
274 features |= (1 << VIRTIO_NET_F_HOST_ECN);
aliguori8eca6b12009-04-05 17:40:08 +0000275
Michael S. Tsirkin81725392010-01-10 13:52:53 +0200276 return features;
aliguori8eca6b12009-04-05 17:40:08 +0000277}
278
aliguorifbe78f42008-12-17 19:13:11 +0000279static void virtio_net_set_features(VirtIODevice *vdev, uint32_t features)
280{
281 VirtIONet *n = to_virtio_net(vdev);
282
283 n->mergeable_rx_bufs = !!(features & (1 << VIRTIO_NET_F_MRG_RXBUF));
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200284 n->guest_hdr_len = n->mergeable_rx_bufs ?
285 sizeof(struct virtio_net_hdr_mrg_rxbuf) : sizeof(struct virtio_net_hdr);
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100286
287 if (n->has_vnet_hdr) {
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000288 tap_set_offload(n->nic->nc.peer,
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100289 (features >> VIRTIO_NET_F_GUEST_CSUM) & 1,
290 (features >> VIRTIO_NET_F_GUEST_TSO4) & 1,
291 (features >> VIRTIO_NET_F_GUEST_TSO6) & 1,
Sridhar Samudrala6c9f58b2009-10-22 17:43:49 +0100292 (features >> VIRTIO_NET_F_GUEST_ECN) & 1,
293 (features >> VIRTIO_NET_F_GUEST_UFO) & 1);
Mark McLoughlinf5436dd2009-10-22 17:43:47 +0100294 }
David L Stevensdc14a392010-03-31 21:20:31 +0300295 if (!n->nic->nc.peer ||
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200296 n->nic->nc.peer->info->type != NET_CLIENT_OPTIONS_KIND_TAP) {
David L Stevensdc14a392010-03-31 21:20:31 +0300297 return;
298 }
299 if (!tap_get_vhost_net(n->nic->nc.peer)) {
300 return;
301 }
Michael S. Tsirkin57c32292010-05-09 14:35:43 +0300302 vhost_net_ack_features(tap_get_vhost_net(n->nic->nc.peer), features);
aliguorifbe78f42008-12-17 19:13:11 +0000303}
304
aliguori002437c2009-02-05 22:36:20 +0000305static int virtio_net_handle_rx_mode(VirtIONet *n, uint8_t cmd,
306 VirtQueueElement *elem)
307{
308 uint8_t on;
309
310 if (elem->out_num != 2 || elem->out_sg[1].iov_len != sizeof(on)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000311 error_report("virtio-net ctrl invalid rx mode command");
aliguori002437c2009-02-05 22:36:20 +0000312 exit(1);
313 }
314
315 on = ldub_p(elem->out_sg[1].iov_base);
316
317 if (cmd == VIRTIO_NET_CTRL_RX_MODE_PROMISC)
318 n->promisc = on;
319 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_ALLMULTI)
320 n->allmulti = on;
Alex Williamson015cb162009-06-05 14:47:18 -0600321 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_ALLUNI)
322 n->alluni = on;
323 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_NOMULTI)
324 n->nomulti = on;
325 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_NOUNI)
326 n->nouni = on;
327 else if (cmd == VIRTIO_NET_CTRL_RX_MODE_NOBCAST)
328 n->nobcast = on;
aliguori002437c2009-02-05 22:36:20 +0000329 else
330 return VIRTIO_NET_ERR;
331
332 return VIRTIO_NET_OK;
333}
334
aliguorib6503ed2009-02-05 22:36:28 +0000335static int virtio_net_handle_mac(VirtIONet *n, uint8_t cmd,
336 VirtQueueElement *elem)
337{
338 struct virtio_net_ctrl_mac mac_data;
339
340 if (cmd != VIRTIO_NET_CTRL_MAC_TABLE_SET || elem->out_num != 3 ||
341 elem->out_sg[1].iov_len < sizeof(mac_data) ||
342 elem->out_sg[2].iov_len < sizeof(mac_data))
343 return VIRTIO_NET_ERR;
344
345 n->mac_table.in_use = 0;
Alex Williamson2d9aba32009-06-05 14:47:13 -0600346 n->mac_table.first_multi = 0;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600347 n->mac_table.uni_overflow = 0;
348 n->mac_table.multi_overflow = 0;
aliguorib6503ed2009-02-05 22:36:28 +0000349 memset(n->mac_table.macs, 0, MAC_TABLE_ENTRIES * ETH_ALEN);
350
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100351 mac_data.entries = ldl_p(elem->out_sg[1].iov_base);
aliguorib6503ed2009-02-05 22:36:28 +0000352
353 if (sizeof(mac_data.entries) +
354 (mac_data.entries * ETH_ALEN) > elem->out_sg[1].iov_len)
355 return VIRTIO_NET_ERR;
356
357 if (mac_data.entries <= MAC_TABLE_ENTRIES) {
358 memcpy(n->mac_table.macs, elem->out_sg[1].iov_base + sizeof(mac_data),
359 mac_data.entries * ETH_ALEN);
360 n->mac_table.in_use += mac_data.entries;
361 } else {
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600362 n->mac_table.uni_overflow = 1;
aliguorib6503ed2009-02-05 22:36:28 +0000363 }
364
Alex Williamson2d9aba32009-06-05 14:47:13 -0600365 n->mac_table.first_multi = n->mac_table.in_use;
366
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100367 mac_data.entries = ldl_p(elem->out_sg[2].iov_base);
aliguorib6503ed2009-02-05 22:36:28 +0000368
369 if (sizeof(mac_data.entries) +
370 (mac_data.entries * ETH_ALEN) > elem->out_sg[2].iov_len)
371 return VIRTIO_NET_ERR;
372
373 if (mac_data.entries) {
374 if (n->mac_table.in_use + mac_data.entries <= MAC_TABLE_ENTRIES) {
375 memcpy(n->mac_table.macs + (n->mac_table.in_use * ETH_ALEN),
376 elem->out_sg[2].iov_base + sizeof(mac_data),
377 mac_data.entries * ETH_ALEN);
378 n->mac_table.in_use += mac_data.entries;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600379 } else {
380 n->mac_table.multi_overflow = 1;
381 }
aliguorib6503ed2009-02-05 22:36:28 +0000382 }
383
384 return VIRTIO_NET_OK;
385}
386
aliguorif21c0ed2009-02-05 22:36:32 +0000387static int virtio_net_handle_vlan_table(VirtIONet *n, uint8_t cmd,
388 VirtQueueElement *elem)
389{
390 uint16_t vid;
391
392 if (elem->out_num != 2 || elem->out_sg[1].iov_len != sizeof(vid)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000393 error_report("virtio-net ctrl invalid vlan command");
aliguorif21c0ed2009-02-05 22:36:32 +0000394 return VIRTIO_NET_ERR;
395 }
396
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100397 vid = lduw_p(elem->out_sg[1].iov_base);
aliguorif21c0ed2009-02-05 22:36:32 +0000398
399 if (vid >= MAX_VLAN)
400 return VIRTIO_NET_ERR;
401
402 if (cmd == VIRTIO_NET_CTRL_VLAN_ADD)
403 n->vlans[vid >> 5] |= (1U << (vid & 0x1f));
404 else if (cmd == VIRTIO_NET_CTRL_VLAN_DEL)
405 n->vlans[vid >> 5] &= ~(1U << (vid & 0x1f));
406 else
407 return VIRTIO_NET_ERR;
408
409 return VIRTIO_NET_OK;
410}
411
aliguori3d11d362009-02-05 22:36:16 +0000412static void virtio_net_handle_ctrl(VirtIODevice *vdev, VirtQueue *vq)
413{
aliguori002437c2009-02-05 22:36:20 +0000414 VirtIONet *n = to_virtio_net(vdev);
aliguori3d11d362009-02-05 22:36:16 +0000415 struct virtio_net_ctrl_hdr ctrl;
416 virtio_net_ctrl_ack status = VIRTIO_NET_ERR;
417 VirtQueueElement elem;
418
419 while (virtqueue_pop(vq, &elem)) {
420 if ((elem.in_num < 1) || (elem.out_num < 1)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000421 error_report("virtio-net ctrl missing headers");
aliguori3d11d362009-02-05 22:36:16 +0000422 exit(1);
423 }
424
425 if (elem.out_sg[0].iov_len < sizeof(ctrl) ||
aliguoric6bb9a32009-03-13 15:04:02 +0000426 elem.in_sg[elem.in_num - 1].iov_len < sizeof(status)) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000427 error_report("virtio-net ctrl header not in correct element");
aliguori3d11d362009-02-05 22:36:16 +0000428 exit(1);
429 }
430
431 ctrl.class = ldub_p(elem.out_sg[0].iov_base);
432 ctrl.cmd = ldub_p(elem.out_sg[0].iov_base + sizeof(ctrl.class));
433
aliguori002437c2009-02-05 22:36:20 +0000434 if (ctrl.class == VIRTIO_NET_CTRL_RX_MODE)
435 status = virtio_net_handle_rx_mode(n, ctrl.cmd, &elem);
aliguorib6503ed2009-02-05 22:36:28 +0000436 else if (ctrl.class == VIRTIO_NET_CTRL_MAC)
437 status = virtio_net_handle_mac(n, ctrl.cmd, &elem);
aliguorif21c0ed2009-02-05 22:36:32 +0000438 else if (ctrl.class == VIRTIO_NET_CTRL_VLAN)
439 status = virtio_net_handle_vlan_table(n, ctrl.cmd, &elem);
aliguori002437c2009-02-05 22:36:20 +0000440
aliguori3d11d362009-02-05 22:36:16 +0000441 stb_p(elem.in_sg[elem.in_num - 1].iov_base, status);
442
443 virtqueue_push(vq, &elem, sizeof(status));
444 virtio_notify(vdev, vq);
445 }
446}
447
/* RX */
449
450static void virtio_net_handle_rx(VirtIODevice *vdev, VirtQueue *vq)
451{
Mark McLoughlin8aeff622009-04-29 13:40:02 +0100452 VirtIONet *n = to_virtio_net(vdev);
453
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000454 qemu_flush_queued_packets(&n->nic->nc);
aliguorifbe78f42008-12-17 19:13:11 +0000455}
456
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100457static int virtio_net_can_receive(NetClientState *nc)
aliguorifbe78f42008-12-17 19:13:11 +0000458{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000459 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200460 if (!n->vdev.vm_running) {
Michael S. Tsirkin95477322010-11-22 19:52:19 +0200461 return 0;
462 }
Mark McLoughlincdd5cc12009-10-27 18:16:38 +0000463
aliguorifbe78f42008-12-17 19:13:11 +0000464 if (!virtio_queue_ready(n->rx_vq) ||
465 !(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK))
466 return 0;
467
Mark McLoughlincdd5cc12009-10-27 18:16:38 +0000468 return 1;
469}
470
471static int virtio_net_has_buffers(VirtIONet *n, int bufsize)
472{
aliguorifbe78f42008-12-17 19:13:11 +0000473 if (virtio_queue_empty(n->rx_vq) ||
474 (n->mergeable_rx_bufs &&
475 !virtqueue_avail_bytes(n->rx_vq, bufsize, 0))) {
476 virtio_queue_set_notification(n->rx_vq, 1);
Tom Lendacky06b12972010-02-08 10:10:01 -0600477
478 /* To avoid a race condition where the guest has made some buffers
479 * available after the above check but before notification was
480 * enabled, check for available buffers again.
481 */
482 if (virtio_queue_empty(n->rx_vq) ||
483 (n->mergeable_rx_bufs &&
484 !virtqueue_avail_bytes(n->rx_vq, bufsize, 0)))
485 return 0;
aliguorifbe78f42008-12-17 19:13:11 +0000486 }
487
488 virtio_queue_set_notification(n->rx_vq, 0);
489 return 1;
490}
491
Anthony Liguori1d41b0c2009-10-22 17:43:48 +0100492/* dhclient uses AF_PACKET but doesn't pass auxdata to the kernel so
493 * it never finds out that the packets don't have valid checksums. This
494 * causes dhclient to get upset. Fedora's carried a patch for ages to
495 * fix this with Xen but it hasn't appeared in an upstream release of
496 * dhclient yet.
497 *
498 * To avoid breaking existing guests, we catch udp packets and add
499 * checksums. This is terrible but it's better than hacking the guest
500 * kernels.
501 *
502 * N.B. if we introduce a zero-copy API, this operation is no longer free so
503 * we should provide a mechanism to disable it to avoid polluting the host
504 * cache.
505 */
506static void work_around_broken_dhclient(struct virtio_net_hdr *hdr,
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200507 uint8_t *buf, size_t size)
Anthony Liguori1d41b0c2009-10-22 17:43:48 +0100508{
509 if ((hdr->flags & VIRTIO_NET_HDR_F_NEEDS_CSUM) && /* missing csum */
510 (size > 27 && size < 1500) && /* normal sized MTU */
511 (buf[12] == 0x08 && buf[13] == 0x00) && /* ethertype == IPv4 */
512 (buf[23] == 17) && /* ip.protocol == UDP */
513 (buf[34] == 0 && buf[35] == 67)) { /* udp.srcport == bootps */
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200514 net_checksum_calculate(buf, size);
Anthony Liguori1d41b0c2009-10-22 17:43:48 +0100515 hdr->flags &= ~VIRTIO_NET_HDR_F_NEEDS_CSUM;
516 }
517}
518
Michael S. Tsirkin280598b2012-09-24 13:24:17 +0200519static void receive_header(VirtIONet *n, const struct iovec *iov, int iov_cnt,
520 const void *buf, size_t size)
aliguorifbe78f42008-12-17 19:13:11 +0000521{
Mark McLoughlin3a330132009-10-22 17:43:45 +0100522 if (n->has_vnet_hdr) {
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200523 /* FIXME this cast is evil */
524 void *wbuf = (void *)buf;
Michael S. Tsirkin280598b2012-09-24 13:24:17 +0200525 work_around_broken_dhclient(wbuf, wbuf + n->host_hdr_len,
526 size - n->host_hdr_len);
527 iov_from_buf(iov, iov_cnt, 0, buf, sizeof(struct virtio_net_hdr));
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200528 } else {
529 struct virtio_net_hdr hdr = {
530 .flags = 0,
531 .gso_type = VIRTIO_NET_HDR_GSO_NONE
532 };
533 iov_from_buf(iov, iov_cnt, 0, &hdr, sizeof hdr);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100534 }
aliguorifbe78f42008-12-17 19:13:11 +0000535}
536
aliguori3831ab22009-02-05 22:36:24 +0000537static int receive_filter(VirtIONet *n, const uint8_t *buf, int size)
538{
539 static const uint8_t bcast[] = {0xff, 0xff, 0xff, 0xff, 0xff, 0xff};
aliguorif21c0ed2009-02-05 22:36:32 +0000540 static const uint8_t vlan[] = {0x81, 0x00};
aliguori3831ab22009-02-05 22:36:24 +0000541 uint8_t *ptr = (uint8_t *)buf;
aliguorib6503ed2009-02-05 22:36:28 +0000542 int i;
aliguori3831ab22009-02-05 22:36:24 +0000543
544 if (n->promisc)
545 return 1;
546
Mark McLoughlin3a330132009-10-22 17:43:45 +0100547 if (n->has_vnet_hdr) {
548 ptr += sizeof(struct virtio_net_hdr);
549 }
550
aliguorif21c0ed2009-02-05 22:36:32 +0000551 if (!memcmp(&ptr[12], vlan, sizeof(vlan))) {
552 int vid = be16_to_cpup((uint16_t *)(ptr + 14)) & 0xfff;
553 if (!(n->vlans[vid >> 5] & (1U << (vid & 0x1f))))
554 return 0;
555 }
556
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600557 if (ptr[0] & 1) { // multicast
558 if (!memcmp(ptr, bcast, sizeof(bcast))) {
Alex Williamson015cb162009-06-05 14:47:18 -0600559 return !n->nobcast;
560 } else if (n->nomulti) {
561 return 0;
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600562 } else if (n->allmulti || n->mac_table.multi_overflow) {
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600563 return 1;
564 }
Alex Williamson2d9aba32009-06-05 14:47:13 -0600565
566 for (i = n->mac_table.first_multi; i < n->mac_table.in_use; i++) {
567 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
568 return 1;
569 }
570 }
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600571 } else { // unicast
Alex Williamson015cb162009-06-05 14:47:18 -0600572 if (n->nouni) {
573 return 0;
574 } else if (n->alluni || n->mac_table.uni_overflow) {
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600575 return 1;
576 } else if (!memcmp(ptr, n->mac, ETH_ALEN)) {
Alex Williamsonbbe2f392009-06-05 14:47:02 -0600577 return 1;
578 }
aliguori3831ab22009-02-05 22:36:24 +0000579
Alex Williamson2d9aba32009-06-05 14:47:13 -0600580 for (i = 0; i < n->mac_table.first_multi; i++) {
581 if (!memcmp(ptr, &n->mac_table.macs[i * ETH_ALEN], ETH_ALEN)) {
582 return 1;
583 }
584 }
aliguorib6503ed2009-02-05 22:36:28 +0000585 }
586
aliguori3831ab22009-02-05 22:36:24 +0000587 return 0;
588}
589
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100590static ssize_t virtio_net_receive(NetClientState *nc, const uint8_t *buf, size_t size)
aliguorifbe78f42008-12-17 19:13:11 +0000591{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000592 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
Michael S. Tsirkin63c58722012-09-24 13:17:13 +0200593 struct iovec mhdr_sg[VIRTQUEUE_MAX_SIZE];
594 struct virtio_net_hdr_mrg_rxbuf mhdr;
595 unsigned mhdr_cnt = 0;
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200596 size_t offset, i, guest_offset;
aliguorifbe78f42008-12-17 19:13:11 +0000597
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000598 if (!virtio_net_can_receive(&n->nic->nc))
Mark McLoughlincdd5cc12009-10-27 18:16:38 +0000599 return -1;
600
Michael S. Tsirkin940cda92010-06-06 18:53:10 +0300601 /* hdr_len refers to the header we supply to the guest */
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200602 if (!virtio_net_has_buffers(n, size + n->guest_hdr_len - n->host_hdr_len))
Mark McLoughlin8aeff622009-04-29 13:40:02 +0100603 return 0;
aliguorifbe78f42008-12-17 19:13:11 +0000604
aliguori3831ab22009-02-05 22:36:24 +0000605 if (!receive_filter(n, buf, size))
Mark McLoughlin4f1c9422009-05-18 13:40:55 +0100606 return size;
aliguori3831ab22009-02-05 22:36:24 +0000607
aliguorifbe78f42008-12-17 19:13:11 +0000608 offset = i = 0;
609
610 while (offset < size) {
611 VirtQueueElement elem;
612 int len, total;
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200613 const struct iovec *sg = elem.in_sg;
aliguorifbe78f42008-12-17 19:13:11 +0000614
Amit Shah22c253d2010-01-13 16:24:43 +0530615 total = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000616
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300617 if (virtqueue_pop(n->rx_vq, &elem) == 0) {
aliguorifbe78f42008-12-17 19:13:11 +0000618 if (i == 0)
Mark McLoughlin4f1c9422009-05-18 13:40:55 +0100619 return -1;
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000620 error_report("virtio-net unexpected empty queue: "
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300621 "i %zd mergeable %d offset %zd, size %zd, "
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000622 "guest hdr len %zd, host hdr len %zd guest features 0x%x",
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300623 i, n->mergeable_rx_bufs, offset, size,
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200624 n->guest_hdr_len, n->host_hdr_len, n->vdev.guest_features);
aliguorifbe78f42008-12-17 19:13:11 +0000625 exit(1);
626 }
627
628 if (elem.in_num < 1) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000629 error_report("virtio-net receive queue contains no in buffers");
aliguorifbe78f42008-12-17 19:13:11 +0000630 exit(1);
631 }
632
aliguorifbe78f42008-12-17 19:13:11 +0000633 if (i == 0) {
Michael S. Tsirkinc8d28e72012-09-24 13:26:55 +0200634 assert(offset == 0);
Michael S. Tsirkin63c58722012-09-24 13:17:13 +0200635 if (n->mergeable_rx_bufs) {
636 mhdr_cnt = iov_copy(mhdr_sg, ARRAY_SIZE(mhdr_sg),
637 sg, elem.in_num,
638 offsetof(typeof(mhdr), num_buffers),
639 sizeof(mhdr.num_buffers));
640 }
aliguorifbe78f42008-12-17 19:13:11 +0000641
Michael S. Tsirkinc8d28e72012-09-24 13:26:55 +0200642 receive_header(n, sg, elem.in_num, buf, size);
643 offset = n->host_hdr_len;
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200644 total += n->guest_hdr_len;
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200645 guest_offset = n->guest_hdr_len;
646 } else {
647 guest_offset = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000648 }
649
650 /* copy in packet. ugh */
Michael S. Tsirkin22cc84d2012-09-24 13:14:16 +0200651 len = iov_from_buf(sg, elem.in_num, guest_offset,
Michael Tokarevdcf6f5e2012-03-11 18:05:12 +0400652 buf + offset, size - offset);
aliguorifbe78f42008-12-17 19:13:11 +0000653 total += len;
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300654 offset += len;
655 /* If buffers can't be merged, at this point we
656 * must have consumed the complete packet.
657 * Otherwise, drop it. */
658 if (!n->mergeable_rx_bufs && offset < size) {
659#if 0
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000660 error_report("virtio-net truncated non-mergeable packet: "
661 "i %zd mergeable %d offset %zd, size %zd, "
662 "guest hdr len %zd, host hdr len %zd",
663 i, n->mergeable_rx_bufs,
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200664 offset, size, n->guest_hdr_len, n->host_hdr_len);
Michael S. Tsirkin279a4252010-06-22 16:22:49 +0300665#endif
666 return size;
667 }
aliguorifbe78f42008-12-17 19:13:11 +0000668
669 /* signal other side */
670 virtqueue_fill(n->rx_vq, &elem, total, i++);
aliguorifbe78f42008-12-17 19:13:11 +0000671 }
672
Michael S. Tsirkin63c58722012-09-24 13:17:13 +0200673 if (mhdr_cnt) {
674 stw_p(&mhdr.num_buffers, i);
675 iov_from_buf(mhdr_sg, mhdr_cnt,
676 0,
677 &mhdr.num_buffers, sizeof mhdr.num_buffers);
Aurelien Jarno44b15bc2011-01-25 11:55:14 +0100678 }
aliguorifbe78f42008-12-17 19:13:11 +0000679
680 virtqueue_flush(n->rx_vq, i);
681 virtio_notify(&n->vdev, n->rx_vq);
Mark McLoughlin4f1c9422009-05-18 13:40:55 +0100682
683 return size;
aliguorifbe78f42008-12-17 19:13:11 +0000684}
685
Alex Williamsone3f30482010-09-02 09:00:57 -0600686static int32_t virtio_net_flush_tx(VirtIONet *n, VirtQueue *vq);
Mark McLoughlin62433752009-06-18 18:21:36 +0100687
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100688static void virtio_net_tx_complete(NetClientState *nc, ssize_t len)
Mark McLoughlin62433752009-06-18 18:21:36 +0100689{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000690 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
Mark McLoughlin62433752009-06-18 18:21:36 +0100691
Michael S. Tsirkin40bad8f2012-09-24 15:15:43 +0200692 virtqueue_push(n->tx_vq, &n->async_tx.elem, 0);
Mark McLoughlin62433752009-06-18 18:21:36 +0100693 virtio_notify(&n->vdev, n->tx_vq);
694
695 n->async_tx.elem.out_num = n->async_tx.len = 0;
696
697 virtio_queue_set_notification(n->tx_vq, 1);
698 virtio_net_flush_tx(n, n->tx_vq);
699}
700
/* TX */
Alex Williamsone3f30482010-09-02 09:00:57 -0600702static int32_t virtio_net_flush_tx(VirtIONet *n, VirtQueue *vq)
aliguorifbe78f42008-12-17 19:13:11 +0000703{
704 VirtQueueElement elem;
Alex Williamsone3f30482010-09-02 09:00:57 -0600705 int32_t num_packets = 0;
Alex Williamsone3f30482010-09-02 09:00:57 -0600706 if (!(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK)) {
707 return num_packets;
708 }
aliguorifbe78f42008-12-17 19:13:11 +0000709
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200710 assert(n->vdev.vm_running);
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200711
Mark McLoughlin62433752009-06-18 18:21:36 +0100712 if (n->async_tx.elem.out_num) {
713 virtio_queue_set_notification(n->tx_vq, 0);
Alex Williamsone3f30482010-09-02 09:00:57 -0600714 return num_packets;
Mark McLoughlin62433752009-06-18 18:21:36 +0100715 }
716
aliguorifbe78f42008-12-17 19:13:11 +0000717 while (virtqueue_pop(vq, &elem)) {
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200718 ssize_t ret, len;
aliguorifbe78f42008-12-17 19:13:11 +0000719 unsigned int out_num = elem.out_num;
720 struct iovec *out_sg = &elem.out_sg[0];
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200721 struct iovec sg[VIRTQUEUE_MAX_SIZE];
aliguorifbe78f42008-12-17 19:13:11 +0000722
Michael S. Tsirkin7b80d082012-09-24 14:54:44 +0200723 if (out_num < 1) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +0000724 error_report("virtio-net header not in first element");
aliguorifbe78f42008-12-17 19:13:11 +0000725 exit(1);
726 }
727
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200728 /*
729 * If host wants to see the guest header as is, we can
730 * pass it on unchanged. Otherwise, copy just the parts
731 * that host is interested in.
732 */
733 assert(n->host_hdr_len <= n->guest_hdr_len);
734 if (n->host_hdr_len != n->guest_hdr_len) {
735 unsigned sg_num = iov_copy(sg, ARRAY_SIZE(sg),
736 out_sg, out_num,
737 0, n->host_hdr_len);
738 sg_num += iov_copy(sg + sg_num, ARRAY_SIZE(sg) - sg_num,
739 out_sg, out_num,
740 n->guest_hdr_len, -1);
741 out_num = sg_num;
742 out_sg = sg;
aliguorifbe78f42008-12-17 19:13:11 +0000743 }
744
Michael S. Tsirkin7b80d082012-09-24 14:54:44 +0200745 len = n->guest_hdr_len;
Michael S. Tsirkin14761f92012-09-24 14:52:28 +0200746
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000747 ret = qemu_sendv_packet_async(&n->nic->nc, out_sg, out_num,
Mark McLoughlin62433752009-06-18 18:21:36 +0100748 virtio_net_tx_complete);
749 if (ret == 0) {
750 virtio_queue_set_notification(n->tx_vq, 0);
751 n->async_tx.elem = elem;
752 n->async_tx.len = len;
Alex Williamsone3f30482010-09-02 09:00:57 -0600753 return -EBUSY;
Mark McLoughlin62433752009-06-18 18:21:36 +0100754 }
755
756 len += ret;
aliguorifbe78f42008-12-17 19:13:11 +0000757
Michael S. Tsirkin40bad8f2012-09-24 15:15:43 +0200758 virtqueue_push(vq, &elem, 0);
aliguorifbe78f42008-12-17 19:13:11 +0000759 virtio_notify(&n->vdev, vq);
Alex Williamsone3f30482010-09-02 09:00:57 -0600760
761 if (++num_packets >= n->tx_burst) {
762 break;
763 }
aliguorifbe78f42008-12-17 19:13:11 +0000764 }
Alex Williamsone3f30482010-09-02 09:00:57 -0600765 return num_packets;
aliguorifbe78f42008-12-17 19:13:11 +0000766}
767
Alex Williamsona697a332010-09-02 09:01:10 -0600768static void virtio_net_handle_tx_timer(VirtIODevice *vdev, VirtQueue *vq)
aliguorifbe78f42008-12-17 19:13:11 +0000769{
770 VirtIONet *n = to_virtio_net(vdev);
771
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200772 /* This happens when device was stopped but VCPU wasn't. */
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200773 if (!n->vdev.vm_running) {
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200774 n->tx_waiting = 1;
775 return;
776 }
777
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600778 if (n->tx_waiting) {
aliguorifbe78f42008-12-17 19:13:11 +0000779 virtio_queue_set_notification(vq, 1);
780 qemu_del_timer(n->tx_timer);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600781 n->tx_waiting = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000782 virtio_net_flush_tx(n, vq);
783 } else {
784 qemu_mod_timer(n->tx_timer,
Paolo Bonzini74475452011-03-11 16:47:48 +0100785 qemu_get_clock_ns(vm_clock) + n->tx_timeout);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600786 n->tx_waiting = 1;
aliguorifbe78f42008-12-17 19:13:11 +0000787 virtio_queue_set_notification(vq, 0);
788 }
789}
790
Alex Williamsona697a332010-09-02 09:01:10 -0600791static void virtio_net_handle_tx_bh(VirtIODevice *vdev, VirtQueue *vq)
792{
793 VirtIONet *n = to_virtio_net(vdev);
794
795 if (unlikely(n->tx_waiting)) {
796 return;
797 }
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200798 n->tx_waiting = 1;
799 /* This happens when device was stopped but VCPU wasn't. */
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200800 if (!n->vdev.vm_running) {
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200801 return;
802 }
Alex Williamsona697a332010-09-02 09:01:10 -0600803 virtio_queue_set_notification(vq, 0);
804 qemu_bh_schedule(n->tx_bh);
Alex Williamsona697a332010-09-02 09:01:10 -0600805}
806
aliguorifbe78f42008-12-17 19:13:11 +0000807static void virtio_net_tx_timer(void *opaque)
808{
809 VirtIONet *n = opaque;
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200810 assert(n->vdev.vm_running);
aliguorifbe78f42008-12-17 19:13:11 +0000811
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600812 n->tx_waiting = 0;
aliguorifbe78f42008-12-17 19:13:11 +0000813
814 /* Just in case the driver is not ready on more */
815 if (!(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK))
816 return;
817
818 virtio_queue_set_notification(n->tx_vq, 1);
819 virtio_net_flush_tx(n, n->tx_vq);
820}
821
Alex Williamsona697a332010-09-02 09:01:10 -0600822static void virtio_net_tx_bh(void *opaque)
823{
824 VirtIONet *n = opaque;
825 int32_t ret;
826
Michael S. Tsirkin85cf2a82011-01-10 14:28:40 +0200827 assert(n->vdev.vm_running);
Michael S. Tsirkin783e7702010-11-22 19:52:30 +0200828
Alex Williamsona697a332010-09-02 09:01:10 -0600829 n->tx_waiting = 0;
830
831 /* Just in case the driver is not ready on more */
832 if (unlikely(!(n->vdev.status & VIRTIO_CONFIG_S_DRIVER_OK)))
833 return;
834
835 ret = virtio_net_flush_tx(n, n->tx_vq);
836 if (ret == -EBUSY) {
837 return; /* Notification re-enable handled by tx_complete */
838 }
839
840 /* If we flush a full burst of packets, assume there are
841 * more coming and immediately reschedule */
842 if (ret >= n->tx_burst) {
843 qemu_bh_schedule(n->tx_bh);
844 n->tx_waiting = 1;
845 return;
846 }
847
848 /* If less than a full burst, re-enable notification and flush
849 * anything that may have come in while we weren't looking. If
850 * we find something, assume the guest is still active and reschedule */
851 virtio_queue_set_notification(n->tx_vq, 1);
852 if (virtio_net_flush_tx(n, n->tx_vq) > 0) {
853 virtio_queue_set_notification(n->tx_vq, 0);
854 qemu_bh_schedule(n->tx_bh);
855 n->tx_waiting = 1;
856 }
857}
858
aliguorifbe78f42008-12-17 19:13:11 +0000859static void virtio_net_save(QEMUFile *f, void *opaque)
860{
861 VirtIONet *n = opaque;
862
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +0200863 /* At this point, backend must be stopped, otherwise
864 * it might keep writing to memory. */
865 assert(!n->vhost_started);
aliguorifbe78f42008-12-17 19:13:11 +0000866 virtio_save(&n->vdev, f);
867
aliguori79674062009-02-05 22:36:12 +0000868 qemu_put_buffer(f, n->mac, ETH_ALEN);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600869 qemu_put_be32(f, n->tx_waiting);
aliguorie46cb382009-01-07 17:50:45 +0000870 qemu_put_be32(f, n->mergeable_rx_bufs);
aliguori9d6271b2009-02-05 22:36:04 +0000871 qemu_put_be16(f, n->status);
Alex Williamsonf10c5922009-06-05 14:46:57 -0600872 qemu_put_byte(f, n->promisc);
873 qemu_put_byte(f, n->allmulti);
aliguorib6503ed2009-02-05 22:36:28 +0000874 qemu_put_be32(f, n->mac_table.in_use);
875 qemu_put_buffer(f, n->mac_table.macs, n->mac_table.in_use * ETH_ALEN);
aliguorif21c0ed2009-02-05 22:36:32 +0000876 qemu_put_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100877 qemu_put_be32(f, n->has_vnet_hdr);
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600878 qemu_put_byte(f, n->mac_table.multi_overflow);
879 qemu_put_byte(f, n->mac_table.uni_overflow);
Alex Williamson015cb162009-06-05 14:47:18 -0600880 qemu_put_byte(f, n->alluni);
881 qemu_put_byte(f, n->nomulti);
882 qemu_put_byte(f, n->nouni);
883 qemu_put_byte(f, n->nobcast);
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100884 qemu_put_byte(f, n->has_ufo);
aliguorifbe78f42008-12-17 19:13:11 +0000885}
886
887static int virtio_net_load(QEMUFile *f, void *opaque, int version_id)
888{
889 VirtIONet *n = opaque;
Alex Williamson2d9aba32009-06-05 14:47:13 -0600890 int i;
Orit Wassermann2a633c42012-05-16 12:21:35 +0200891 int ret;
aliguorifbe78f42008-12-17 19:13:11 +0000892
aliguori9d6271b2009-02-05 22:36:04 +0000893 if (version_id < 2 || version_id > VIRTIO_NET_VM_VERSION)
aliguorifbe78f42008-12-17 19:13:11 +0000894 return -EINVAL;
895
Orit Wassermann2a633c42012-05-16 12:21:35 +0200896 ret = virtio_load(&n->vdev, f);
897 if (ret) {
898 return ret;
899 }
aliguorifbe78f42008-12-17 19:13:11 +0000900
aliguori79674062009-02-05 22:36:12 +0000901 qemu_get_buffer(f, n->mac, ETH_ALEN);
Alex Williamson4b4b8d32010-09-02 09:01:04 -0600902 n->tx_waiting = qemu_get_be32(f);
aliguorie46cb382009-01-07 17:50:45 +0000903 n->mergeable_rx_bufs = qemu_get_be32(f);
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200904 n->guest_hdr_len = n->mergeable_rx_bufs ?
905 sizeof(struct virtio_net_hdr_mrg_rxbuf) : sizeof(struct virtio_net_hdr);
aliguorifbe78f42008-12-17 19:13:11 +0000906
aliguori9d6271b2009-02-05 22:36:04 +0000907 if (version_id >= 3)
908 n->status = qemu_get_be16(f);
909
aliguori002437c2009-02-05 22:36:20 +0000910 if (version_id >= 4) {
Alex Williamsonf10c5922009-06-05 14:46:57 -0600911 if (version_id < 8) {
912 n->promisc = qemu_get_be32(f);
913 n->allmulti = qemu_get_be32(f);
914 } else {
915 n->promisc = qemu_get_byte(f);
916 n->allmulti = qemu_get_byte(f);
917 }
aliguori002437c2009-02-05 22:36:20 +0000918 }
919
aliguorib6503ed2009-02-05 22:36:28 +0000920 if (version_id >= 5) {
921 n->mac_table.in_use = qemu_get_be32(f);
922 /* MAC_TABLE_ENTRIES may be different from the saved image */
923 if (n->mac_table.in_use <= MAC_TABLE_ENTRIES) {
924 qemu_get_buffer(f, n->mac_table.macs,
925 n->mac_table.in_use * ETH_ALEN);
926 } else if (n->mac_table.in_use) {
Juan Quintelae398d612012-08-29 19:03:09 +0200927 uint8_t *buf = g_malloc0(n->mac_table.in_use);
928 qemu_get_buffer(f, buf, n->mac_table.in_use * ETH_ALEN);
929 g_free(buf);
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600930 n->mac_table.multi_overflow = n->mac_table.uni_overflow = 1;
aliguorib6503ed2009-02-05 22:36:28 +0000931 n->mac_table.in_use = 0;
932 }
933 }
934
aliguorif21c0ed2009-02-05 22:36:32 +0000935 if (version_id >= 6)
936 qemu_get_buffer(f, (uint8_t *)n->vlans, MAX_VLAN >> 3);
937
Mark McLoughlin3a330132009-10-22 17:43:45 +0100938 if (version_id >= 7) {
939 if (qemu_get_be32(f) && !peer_has_vnet_hdr(n)) {
Markus Armbruster1ecda022010-02-18 17:25:24 +0100940 error_report("virtio-net: saved image requires vnet_hdr=on");
Mark McLoughlin3a330132009-10-22 17:43:45 +0100941 return -1;
942 }
943
944 if (n->has_vnet_hdr) {
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000945 tap_using_vnet_hdr(n->nic->nc.peer, 1);
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +0200946 n->host_hdr_len = sizeof(struct virtio_net_hdr);
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000947 tap_set_offload(n->nic->nc.peer,
Michael S. Tsirkin704a76f2010-01-10 13:52:47 +0200948 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_CSUM) & 1,
949 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_TSO4) & 1,
950 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_TSO6) & 1,
951 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_ECN) & 1,
952 (n->vdev.guest_features >> VIRTIO_NET_F_GUEST_UFO) & 1);
Mark McLoughlin3a330132009-10-22 17:43:45 +0100953 }
Alex Williamson6c042c12009-06-05 14:46:52 -0600954 }
955
Alex Williamson8fd2a2f2009-06-05 14:47:08 -0600956 if (version_id >= 9) {
957 n->mac_table.multi_overflow = qemu_get_byte(f);
958 n->mac_table.uni_overflow = qemu_get_byte(f);
959 }
960
Alex Williamson015cb162009-06-05 14:47:18 -0600961 if (version_id >= 10) {
962 n->alluni = qemu_get_byte(f);
963 n->nomulti = qemu_get_byte(f);
964 n->nouni = qemu_get_byte(f);
965 n->nobcast = qemu_get_byte(f);
966 }
967
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100968 if (version_id >= 11) {
969 if (qemu_get_byte(f) && !peer_has_ufo(n)) {
Markus Armbruster1ecda022010-02-18 17:25:24 +0100970 error_report("virtio-net: saved image requires TUN_F_UFO support");
Mark McLoughlin0ce0e8f2009-10-22 17:43:50 +0100971 return -1;
972 }
973 }
974
Alex Williamson2d9aba32009-06-05 14:47:13 -0600975 /* Find the first multicast entry in the saved MAC filter */
976 for (i = 0; i < n->mac_table.in_use; i++) {
977 if (n->mac_table.macs[i * ETH_ALEN] & 1) {
978 break;
979 }
980 }
981 n->mac_table.first_multi = i;
Amos Kong98991482012-09-28 10:06:02 +0800982
983 /* nc.link_down can't be migrated, so infer link_down according
984 * to link status bit in n->status */
985 n->nic->nc.link_down = (n->status & VIRTIO_NET_S_LINK_UP) == 0;
986
aliguorifbe78f42008-12-17 19:13:11 +0000987 return 0;
988}
989
Stefan Hajnoczi4e68f7a2012-07-24 16:35:13 +0100990static void virtio_net_cleanup(NetClientState *nc)
aliguorib946a152009-04-17 17:11:08 +0000991{
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000992 VirtIONet *n = DO_UPCAST(NICState, nc, nc)->opaque;
aliguorib946a152009-04-17 17:11:08 +0000993
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000994 n->nic = NULL;
aliguorib946a152009-04-17 17:11:08 +0000995}
996
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000997static NetClientInfo net_virtio_info = {
Laszlo Ersek2be64a62012-07-17 16:17:12 +0200998 .type = NET_CLIENT_OPTIONS_KIND_NIC,
Mark McLoughlineb6b6c12009-11-25 18:49:11 +0000999 .size = sizeof(NICState),
1000 .can_receive = virtio_net_can_receive,
1001 .receive = virtio_net_receive,
1002 .cleanup = virtio_net_cleanup,
1003 .link_status_changed = virtio_net_set_link_status,
1004};
1005
Alex Williamsonf0c07c72010-09-02 09:00:50 -06001006VirtIODevice *virtio_net_init(DeviceState *dev, NICConf *conf,
1007 virtio_net_conf *net)
aliguorifbe78f42008-12-17 19:13:11 +00001008{
1009 VirtIONet *n;
aliguorifbe78f42008-12-17 19:13:11 +00001010
Paul Brook53c25ce2009-05-18 14:51:59 +01001011 n = (VirtIONet *)virtio_common_init("virtio-net", VIRTIO_ID_NET,
1012 sizeof(struct virtio_net_config),
1013 sizeof(VirtIONet));
aliguorifbe78f42008-12-17 19:13:11 +00001014
aliguori0f03eca2009-02-05 22:36:08 +00001015 n->vdev.get_config = virtio_net_get_config;
1016 n->vdev.set_config = virtio_net_set_config;
aliguorifbe78f42008-12-17 19:13:11 +00001017 n->vdev.get_features = virtio_net_get_features;
1018 n->vdev.set_features = virtio_net_set_features;
aliguori8eca6b12009-04-05 17:40:08 +00001019 n->vdev.bad_features = virtio_net_bad_features;
aliguori002437c2009-02-05 22:36:20 +00001020 n->vdev.reset = virtio_net_reset;
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +02001021 n->vdev.set_status = virtio_net_set_status;
aliguorifbe78f42008-12-17 19:13:11 +00001022 n->rx_vq = virtio_add_queue(&n->vdev, 256, virtio_net_handle_rx);
Alex Williamsona697a332010-09-02 09:01:10 -06001023
1024 if (net->tx && strcmp(net->tx, "timer") && strcmp(net->tx, "bh")) {
Stefan Hajnoczie7b43f72010-11-15 20:44:37 +00001025 error_report("virtio-net: "
1026 "Unknown option tx=%s, valid options: \"timer\" \"bh\"",
1027 net->tx);
1028 error_report("Defaulting to \"bh\"");
Alex Williamsona697a332010-09-02 09:01:10 -06001029 }
1030
1031 if (net->tx && !strcmp(net->tx, "timer")) {
1032 n->tx_vq = virtio_add_queue(&n->vdev, 256, virtio_net_handle_tx_timer);
Paolo Bonzini74475452011-03-11 16:47:48 +01001033 n->tx_timer = qemu_new_timer_ns(vm_clock, virtio_net_tx_timer, n);
Alex Williamsona697a332010-09-02 09:01:10 -06001034 n->tx_timeout = net->txtimer;
1035 } else {
1036 n->tx_vq = virtio_add_queue(&n->vdev, 256, virtio_net_handle_tx_bh);
1037 n->tx_bh = qemu_bh_new(virtio_net_tx_bh, n);
1038 }
Alex Williamson4ffb17f2009-06-05 14:47:23 -06001039 n->ctrl_vq = virtio_add_queue(&n->vdev, 64, virtio_net_handle_ctrl);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001040 qemu_macaddr_default_if_unset(&conf->macaddr);
Mark McLoughlin3cbe04c2009-10-28 14:07:23 +00001041 memcpy(&n->mac[0], &conf->macaddr, sizeof(n->mac));
aliguori554c97d2009-01-08 19:46:33 +00001042 n->status = VIRTIO_NET_S_LINK_UP;
aliguorifbe78f42008-12-17 19:13:11 +00001043
Anthony Liguorif79f2bf2011-12-04 11:17:51 -06001044 n->nic = qemu_new_nic(&net_virtio_info, conf, object_get_typename(OBJECT(dev)), dev->id, n);
Mark McLoughlineb6b6c12009-11-25 18:49:11 +00001045
1046 qemu_format_nic_info_str(&n->nic->nc, conf->macaddr.a);
aliguori96d5e202009-01-07 17:47:15 +00001047
Alex Williamson4b4b8d32010-09-02 09:01:04 -06001048 n->tx_waiting = 0;
Alex Williamsone3f30482010-09-02 09:00:57 -06001049 n->tx_burst = net->txburst;
aliguorifbe78f42008-12-17 19:13:11 +00001050 n->mergeable_rx_bufs = 0;
Michael S. Tsirkine35e23f2012-09-24 12:12:25 +02001051 n->guest_hdr_len = sizeof(struct virtio_net_hdr);
aliguori002437c2009-02-05 22:36:20 +00001052 n->promisc = 1; /* for compatibility */
aliguorifbe78f42008-12-17 19:13:11 +00001053
Anthony Liguori7267c092011-08-20 22:09:37 -05001054 n->mac_table.macs = g_malloc0(MAC_TABLE_ENTRIES * ETH_ALEN);
aliguorib6503ed2009-02-05 22:36:28 +00001055
Anthony Liguori7267c092011-08-20 22:09:37 -05001056 n->vlans = g_malloc0(MAX_VLAN >> 3);
aliguorif21c0ed2009-02-05 22:36:32 +00001057
Alex Williamson01657c82010-06-25 11:09:28 -06001058 n->qdev = dev;
1059 register_savevm(dev, "virtio-net", -1, VIRTIO_NET_VM_VERSION,
aliguorifbe78f42008-12-17 19:13:11 +00001060 virtio_net_save, virtio_net_load, n);
Paul Brookcf21e102009-05-14 22:35:07 +01001061
Gleb Natapov1ca4d092010-12-08 13:35:05 +02001062 add_boot_device_path(conf->bootindex, dev, "/ethernet-phy@0");
1063
Paul Brook53c25ce2009-05-18 14:51:59 +01001064 return &n->vdev;
Paul Brookcf21e102009-05-14 22:35:07 +01001065}
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001066
1067void virtio_net_exit(VirtIODevice *vdev)
1068{
1069 VirtIONet *n = DO_UPCAST(VirtIONet, vdev, vdev);
Michael S. Tsirkin9bc63042010-03-17 13:08:42 +02001070
Michael S. Tsirkinafbaa7b2010-09-27 18:41:30 +02001071 /* This will stop vhost backend if appropriate. */
1072 virtio_net_set_status(vdev, 0);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001073
Mark McLoughlineb6b6c12009-11-25 18:49:11 +00001074 qemu_purge_queued_packets(&n->nic->nc);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001075
Alex Williamson01657c82010-06-25 11:09:28 -06001076 unregister_savevm(n->qdev, "virtio-net", n);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001077
Anthony Liguori7267c092011-08-20 22:09:37 -05001078 g_free(n->mac_table.macs);
1079 g_free(n->vlans);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001080
Alex Williamsona697a332010-09-02 09:01:10 -06001081 if (n->tx_timer) {
1082 qemu_del_timer(n->tx_timer);
1083 qemu_free_timer(n->tx_timer);
1084 } else {
1085 qemu_bh_delete(n->tx_bh);
1086 }
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001087
Stefan Hajnoczib20c6b92012-07-24 16:35:15 +01001088 qemu_del_net_client(&n->nic->nc);
Amit Shahb52dfd72011-07-27 14:00:31 +05301089 virtio_cleanup(&n->vdev);
Gerd Hoffmann97b15622009-10-21 15:25:35 +02001090}