]>
Commit | Line | Data |
---|---|---|
d5970055 MT |
1 | /* |
2 | * vhost-net support | |
3 | * | |
4 | * Copyright Red Hat, Inc. 2010 | |
5 | * | |
6 | * Authors: | |
7 | * Michael S. Tsirkin <[email protected]> | |
8 | * | |
9 | * This work is licensed under the terms of the GNU GPL, version 2. See | |
10 | * the COPYING file in the top-level directory. | |
6b620ca3 PB |
11 | * |
12 | * Contributions after 2012-01-13 are licensed under the terms of the | |
13 | * GNU GPL, version 2 or (at your option) any later version. | |
d5970055 MT |
14 | */ |
15 | ||
1422e32d | 16 | #include "net/net.h" |
d5970055 | 17 | #include "net/tap.h" |
03ce5744 | 18 | #include "net/vhost-user.h" |
d5970055 | 19 | |
0d09e41a PB |
20 | #include "hw/virtio/virtio-net.h" |
21 | #include "net/vhost_net.h" | |
1de7afc9 | 22 | #include "qemu/error-report.h" |
d5970055 MT |
23 | |
24 | #include "config.h" | |
25 | ||
26 | #ifdef CONFIG_VHOST_NET | |
27 | #include <linux/vhost.h> | |
d5970055 MT |
28 | #include <sys/socket.h> |
29 | #include <linux/kvm.h> | |
30 | #include <fcntl.h> | |
d5970055 MT |
31 | #include <netpacket/packet.h> |
32 | #include <net/ethernet.h> | |
33 | #include <net/if.h> | |
34 | #include <netinet/in.h> | |
35 | ||
36 | #include <stdio.h> | |
37 | ||
4fbe0f32 | 38 | #include "standard-headers/linux/virtio_ring.h" |
0d09e41a | 39 | #include "hw/virtio/vhost.h" |
1c819449 | 40 | #include "hw/virtio/virtio-bus.h" |
d5970055 MT |
41 | |
42 | struct vhost_net { | |
43 | struct vhost_dev dev; | |
44 | struct vhost_virtqueue vqs[2]; | |
45 | int backend; | |
35277d14 | 46 | NetClientState *nc; |
d5970055 MT |
47 | }; |
48 | ||
2e6d46d7 NN |
49 | /* Features supported by host kernel. */ |
50 | static const int kernel_feature_bits[] = { | |
51 | VIRTIO_F_NOTIFY_ON_EMPTY, | |
52 | VIRTIO_RING_F_INDIRECT_DESC, | |
53 | VIRTIO_RING_F_EVENT_IDX, | |
54 | VIRTIO_NET_F_MRG_RXBUF, | |
55 | VHOST_INVALID_FEATURE_BIT | |
56 | }; | |
57 | ||
5f4c01ca NN |
58 | /* Features supported by others. */ |
59 | const int user_feature_bits[] = { | |
60 | VIRTIO_F_NOTIFY_ON_EMPTY, | |
61 | VIRTIO_RING_F_INDIRECT_DESC, | |
62 | VIRTIO_RING_F_EVENT_IDX, | |
63 | ||
64 | VIRTIO_F_ANY_LAYOUT, | |
65 | VIRTIO_NET_F_CSUM, | |
66 | VIRTIO_NET_F_GUEST_CSUM, | |
67 | VIRTIO_NET_F_GSO, | |
68 | VIRTIO_NET_F_GUEST_TSO4, | |
69 | VIRTIO_NET_F_GUEST_TSO6, | |
70 | VIRTIO_NET_F_GUEST_ECN, | |
71 | VIRTIO_NET_F_GUEST_UFO, | |
72 | VIRTIO_NET_F_HOST_TSO4, | |
73 | VIRTIO_NET_F_HOST_TSO6, | |
74 | VIRTIO_NET_F_HOST_ECN, | |
75 | VIRTIO_NET_F_HOST_UFO, | |
76 | VIRTIO_NET_F_MRG_RXBUF, | |
77 | VIRTIO_NET_F_STATUS, | |
78 | VIRTIO_NET_F_CTRL_VQ, | |
79 | VIRTIO_NET_F_CTRL_RX, | |
80 | VIRTIO_NET_F_CTRL_VLAN, | |
81 | VIRTIO_NET_F_CTRL_RX_EXTRA, | |
82 | VIRTIO_NET_F_CTRL_MAC_ADDR, | |
83 | VIRTIO_NET_F_CTRL_GUEST_OFFLOADS, | |
84 | ||
85 | VIRTIO_NET_F_MQ, | |
86 | ||
87 | VHOST_INVALID_FEATURE_BIT | |
88 | }; | |
89 | ||
2e6d46d7 | 90 | static const int *vhost_net_get_feature_bits(struct vhost_net *net) |
d5970055 | 91 | { |
2e6d46d7 NN |
92 | const int *feature_bits = 0; |
93 | ||
94 | switch (net->nc->info->type) { | |
95 | case NET_CLIENT_OPTIONS_KIND_TAP: | |
96 | feature_bits = kernel_feature_bits; | |
97 | break; | |
5f4c01ca NN |
98 | case NET_CLIENT_OPTIONS_KIND_VHOST_USER: |
99 | feature_bits = user_feature_bits; | |
100 | break; | |
2e6d46d7 NN |
101 | default: |
102 | error_report("Feature bits not defined for this type: %d", | |
103 | net->nc->info->type); | |
104 | break; | |
ca736c8e | 105 | } |
2e6d46d7 NN |
106 | |
107 | return feature_bits; | |
108 | } | |
109 | ||
110 | unsigned vhost_net_get_features(struct vhost_net *net, unsigned features) | |
111 | { | |
112 | return vhost_get_features(&net->dev, vhost_net_get_feature_bits(net), | |
113 | features); | |
d5970055 MT |
114 | } |
115 | ||
116 | void vhost_net_ack_features(struct vhost_net *net, unsigned features) | |
117 | { | |
b49ae913 | 118 | net->dev.acked_features = net->dev.backend_features; |
2e6d46d7 | 119 | vhost_ack_features(&net->dev, vhost_net_get_feature_bits(net), features); |
d5970055 MT |
120 | } |
121 | ||
4e68f7a0 | 122 | static int vhost_net_get_fd(NetClientState *backend) |
d5970055 MT |
123 | { |
124 | switch (backend->info->type) { | |
2be64a68 | 125 | case NET_CLIENT_OPTIONS_KIND_TAP: |
d5970055 MT |
126 | return tap_get_fd(backend); |
127 | default: | |
128 | fprintf(stderr, "vhost-net requires tap backend\n"); | |
129 | return -EBADFD; | |
130 | } | |
131 | } | |
132 | ||
81647a65 | 133 | struct vhost_net *vhost_net_init(VhostNetOptions *options) |
d5970055 MT |
134 | { |
135 | int r; | |
1a1bfac9 | 136 | bool backend_kernel = options->backend_type == VHOST_BACKEND_TYPE_KERNEL; |
7267c094 | 137 | struct vhost_net *net = g_malloc(sizeof *net); |
81647a65 NN |
138 | |
139 | if (!options->net_backend) { | |
140 | fprintf(stderr, "vhost-net requires net backend to be setup\n"); | |
d5970055 MT |
141 | goto fail; |
142 | } | |
81647a65 | 143 | |
1a1bfac9 NN |
144 | if (backend_kernel) { |
145 | r = vhost_net_get_fd(options->net_backend); | |
146 | if (r < 0) { | |
147 | goto fail; | |
148 | } | |
149 | net->dev.backend_features = qemu_has_vnet_hdr(options->net_backend) | |
150 | ? 0 : (1 << VHOST_NET_F_VIRTIO_NET_HDR); | |
151 | net->backend = r; | |
152 | } else { | |
153 | net->dev.backend_features = 0; | |
154 | net->backend = -1; | |
d5970055 | 155 | } |
81647a65 | 156 | net->nc = options->net_backend; |
d5970055 | 157 | |
f56a1247 MT |
158 | net->dev.nvqs = 2; |
159 | net->dev.vqs = net->vqs; | |
160 | ||
81647a65 | 161 | r = vhost_dev_init(&net->dev, options->opaque, |
1a1bfac9 | 162 | options->backend_type, options->force); |
d5970055 MT |
163 | if (r < 0) { |
164 | goto fail; | |
165 | } | |
1a1bfac9 | 166 | if (backend_kernel) { |
d8e80ae3 DM |
167 | if (!qemu_has_vnet_hdr_len(options->net_backend, |
168 | sizeof(struct virtio_net_hdr_mrg_rxbuf))) { | |
169 | net->dev.features &= ~(1 << VIRTIO_NET_F_MRG_RXBUF); | |
170 | } | |
1a1bfac9 NN |
171 | if (~net->dev.features & net->dev.backend_features) { |
172 | fprintf(stderr, "vhost lacks feature mask %" PRIu64 | |
173 | " for backend\n", | |
174 | (uint64_t)(~net->dev.features & net->dev.backend_features)); | |
175 | vhost_dev_cleanup(&net->dev); | |
176 | goto fail; | |
177 | } | |
d5970055 | 178 | } |
d5970055 MT |
179 | /* Set sane init value. Override when guest acks. */ |
180 | vhost_net_ack_features(net, 0); | |
181 | return net; | |
182 | fail: | |
7267c094 | 183 | g_free(net); |
d5970055 MT |
184 | return NULL; |
185 | } | |
186 | ||
5430a28f MT |
187 | bool vhost_net_query(VHostNetState *net, VirtIODevice *dev) |
188 | { | |
189 | return vhost_dev_query(&net->dev, dev); | |
190 | } | |
191 | ||
cd7d1d26 JW |
192 | static void vhost_net_set_vq_index(struct vhost_net *net, int vq_index) |
193 | { | |
194 | net->dev.vq_index = vq_index; | |
195 | } | |
196 | ||
a9f98bb5 | 197 | static int vhost_net_start_one(struct vhost_net *net, |
cd7d1d26 | 198 | VirtIODevice *dev) |
d5970055 MT |
199 | { |
200 | struct vhost_vring_file file = { }; | |
201 | int r; | |
b0b3db79 | 202 | |
a9f98bb5 JW |
203 | net->dev.nvqs = 2; |
204 | net->dev.vqs = net->vqs; | |
a9f98bb5 | 205 | |
b0b3db79 MT |
206 | r = vhost_dev_enable_notifiers(&net->dev, dev); |
207 | if (r < 0) { | |
208 | goto fail_notifiers; | |
209 | } | |
d5970055 | 210 | |
d5970055 MT |
211 | r = vhost_dev_start(&net->dev, dev); |
212 | if (r < 0) { | |
b0b3db79 | 213 | goto fail_start; |
d5970055 MT |
214 | } |
215 | ||
212d69f2 NN |
216 | if (net->nc->info->poll) { |
217 | net->nc->info->poll(net->nc, false); | |
218 | } | |
219 | ||
1a1bfac9 NN |
220 | if (net->nc->info->type == NET_CLIENT_OPTIONS_KIND_TAP) { |
221 | qemu_set_fd_handler(net->backend, NULL, NULL, NULL); | |
222 | file.fd = net->backend; | |
223 | for (file.index = 0; file.index < net->dev.nvqs; ++file.index) { | |
224 | const VhostOps *vhost_ops = net->dev.vhost_ops; | |
225 | r = vhost_ops->vhost_call(&net->dev, VHOST_NET_SET_BACKEND, | |
226 | &file); | |
227 | if (r < 0) { | |
228 | r = -errno; | |
229 | goto fail; | |
230 | } | |
d5970055 MT |
231 | } |
232 | } | |
233 | return 0; | |
234 | fail: | |
235 | file.fd = -1; | |
1a1bfac9 NN |
236 | if (net->nc->info->type == NET_CLIENT_OPTIONS_KIND_TAP) { |
237 | while (file.index-- > 0) { | |
238 | const VhostOps *vhost_ops = net->dev.vhost_ops; | |
239 | int r = vhost_ops->vhost_call(&net->dev, VHOST_NET_SET_BACKEND, | |
240 | &file); | |
241 | assert(r >= 0); | |
242 | } | |
d5970055 | 243 | } |
212d69f2 NN |
244 | if (net->nc->info->poll) { |
245 | net->nc->info->poll(net->nc, true); | |
246 | } | |
d5970055 | 247 | vhost_dev_stop(&net->dev, dev); |
b0b3db79 MT |
248 | fail_start: |
249 | vhost_dev_disable_notifiers(&net->dev, dev); | |
250 | fail_notifiers: | |
d5970055 MT |
251 | return r; |
252 | } | |
253 | ||
a9f98bb5 JW |
254 | static void vhost_net_stop_one(struct vhost_net *net, |
255 | VirtIODevice *dev) | |
d5970055 MT |
256 | { |
257 | struct vhost_vring_file file = { .fd = -1 }; | |
258 | ||
1a1bfac9 NN |
259 | if (net->nc->info->type == NET_CLIENT_OPTIONS_KIND_TAP) { |
260 | for (file.index = 0; file.index < net->dev.nvqs; ++file.index) { | |
261 | const VhostOps *vhost_ops = net->dev.vhost_ops; | |
262 | int r = vhost_ops->vhost_call(&net->dev, VHOST_NET_SET_BACKEND, | |
263 | &file); | |
264 | assert(r >= 0); | |
265 | } | |
d5970055 | 266 | } |
212d69f2 NN |
267 | if (net->nc->info->poll) { |
268 | net->nc->info->poll(net->nc, true); | |
269 | } | |
d5970055 | 270 | vhost_dev_stop(&net->dev, dev); |
b0b3db79 | 271 | vhost_dev_disable_notifiers(&net->dev, dev); |
d5970055 MT |
272 | } |
273 | ||
371df9f5 GK |
274 | static bool vhost_net_device_endian_ok(VirtIODevice *vdev) |
275 | { | |
276 | #ifdef TARGET_IS_BIENDIAN | |
277 | #ifdef HOST_WORDS_BIGENDIAN | |
278 | return virtio_is_big_endian(vdev); | |
279 | #else | |
280 | return !virtio_is_big_endian(vdev); | |
281 | #endif | |
282 | #else | |
283 | return true; | |
284 | #endif | |
285 | } | |
286 | ||
a9f98bb5 JW |
287 | int vhost_net_start(VirtIODevice *dev, NetClientState *ncs, |
288 | int total_queues) | |
289 | { | |
1c819449 FK |
290 | BusState *qbus = BUS(qdev_get_parent_bus(DEVICE(dev))); |
291 | VirtioBusState *vbus = VIRTIO_BUS(qbus); | |
292 | VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(vbus); | |
cd7d1d26 | 293 | int r, e, i; |
a9f98bb5 | 294 | |
371df9f5 GK |
295 | if (!vhost_net_device_endian_ok(dev)) { |
296 | error_report("vhost-net does not support cross-endian"); | |
297 | r = -ENOSYS; | |
298 | goto err; | |
299 | } | |
300 | ||
1c819449 | 301 | if (!k->set_guest_notifiers) { |
312fd5f2 | 302 | error_report("binding does not support guest notifiers"); |
a9f98bb5 JW |
303 | r = -ENOSYS; |
304 | goto err; | |
305 | } | |
306 | ||
307 | for (i = 0; i < total_queues; i++) { | |
cd7d1d26 | 308 | vhost_net_set_vq_index(get_vhost_net(ncs[i].peer), i * 2); |
a9f98bb5 JW |
309 | } |
310 | ||
1c819449 | 311 | r = k->set_guest_notifiers(qbus->parent, total_queues * 2, true); |
a9f98bb5 | 312 | if (r < 0) { |
312fd5f2 | 313 | error_report("Error binding guest notifier: %d", -r); |
a9f98bb5 JW |
314 | goto err; |
315 | } | |
316 | ||
cd7d1d26 JW |
317 | for (i = 0; i < total_queues; i++) { |
318 | r = vhost_net_start_one(get_vhost_net(ncs[i].peer), dev); | |
319 | ||
320 | if (r < 0) { | |
321 | goto err_start; | |
322 | } | |
323 | } | |
324 | ||
a9f98bb5 JW |
325 | return 0; |
326 | ||
cd7d1d26 | 327 | err_start: |
a9f98bb5 | 328 | while (--i >= 0) { |
ed8b4afe | 329 | vhost_net_stop_one(get_vhost_net(ncs[i].peer), dev); |
a9f98bb5 | 330 | } |
cd7d1d26 JW |
331 | e = k->set_guest_notifiers(qbus->parent, total_queues * 2, false); |
332 | if (e < 0) { | |
333 | fprintf(stderr, "vhost guest notifier cleanup failed: %d\n", e); | |
334 | fflush(stderr); | |
335 | } | |
336 | err: | |
a9f98bb5 JW |
337 | return r; |
338 | } | |
339 | ||
340 | void vhost_net_stop(VirtIODevice *dev, NetClientState *ncs, | |
341 | int total_queues) | |
342 | { | |
1c819449 FK |
343 | BusState *qbus = BUS(qdev_get_parent_bus(DEVICE(dev))); |
344 | VirtioBusState *vbus = VIRTIO_BUS(qbus); | |
345 | VirtioBusClass *k = VIRTIO_BUS_GET_CLASS(vbus); | |
a9f98bb5 JW |
346 | int i, r; |
347 | ||
cd7d1d26 JW |
348 | for (i = 0; i < total_queues; i++) { |
349 | vhost_net_stop_one(get_vhost_net(ncs[i].peer), dev); | |
350 | } | |
351 | ||
1c819449 | 352 | r = k->set_guest_notifiers(qbus->parent, total_queues * 2, false); |
a9f98bb5 JW |
353 | if (r < 0) { |
354 | fprintf(stderr, "vhost guest notifier cleanup failed: %d\n", r); | |
355 | fflush(stderr); | |
356 | } | |
357 | assert(r >= 0); | |
a9f98bb5 JW |
358 | } |
359 | ||
d5970055 MT |
360 | void vhost_net_cleanup(struct vhost_net *net) |
361 | { | |
362 | vhost_dev_cleanup(&net->dev); | |
7267c094 | 363 | g_free(net); |
d5970055 | 364 | } |
f56a1247 MT |
365 | |
366 | bool vhost_net_virtqueue_pending(VHostNetState *net, int idx) | |
367 | { | |
368 | return vhost_virtqueue_pending(&net->dev, idx); | |
369 | } | |
370 | ||
371 | void vhost_net_virtqueue_mask(VHostNetState *net, VirtIODevice *dev, | |
372 | int idx, bool mask) | |
373 | { | |
374 | vhost_virtqueue_mask(&net->dev, dev, idx, mask); | |
375 | } | |
ed8b4afe NN |
376 | |
377 | VHostNetState *get_vhost_net(NetClientState *nc) | |
378 | { | |
379 | VHostNetState *vhost_net = 0; | |
380 | ||
381 | if (!nc) { | |
382 | return 0; | |
383 | } | |
384 | ||
385 | switch (nc->info->type) { | |
386 | case NET_CLIENT_OPTIONS_KIND_TAP: | |
387 | vhost_net = tap_get_vhost_net(nc); | |
388 | break; | |
03ce5744 NN |
389 | case NET_CLIENT_OPTIONS_KIND_VHOST_USER: |
390 | vhost_net = vhost_user_get_vhost_net(nc); | |
391 | break; | |
ed8b4afe NN |
392 | default: |
393 | break; | |
394 | } | |
395 | ||
396 | return vhost_net; | |
397 | } | |
d5970055 | 398 | #else |
81647a65 | 399 | struct vhost_net *vhost_net_init(VhostNetOptions *options) |
5430a28f | 400 | { |
35f75462 | 401 | error_report("vhost-net support is not compiled in"); |
5430a28f MT |
402 | return NULL; |
403 | } | |
404 | ||
405 | bool vhost_net_query(VHostNetState *net, VirtIODevice *dev) | |
d5970055 | 406 | { |
5430a28f | 407 | return false; |
d5970055 MT |
408 | } |
409 | ||
a9f98bb5 JW |
410 | int vhost_net_start(VirtIODevice *dev, |
411 | NetClientState *ncs, | |
412 | int total_queues) | |
d5970055 | 413 | { |
5430a28f | 414 | return -ENOSYS; |
d5970055 | 415 | } |
a9f98bb5 JW |
416 | void vhost_net_stop(VirtIODevice *dev, |
417 | NetClientState *ncs, | |
418 | int total_queues) | |
d5970055 MT |
419 | { |
420 | } | |
421 | ||
/* Stub used when CONFIG_VHOST_NET is not defined: does nothing. */
void vhost_net_cleanup(struct vhost_net *net)
{
    /* Intentionally empty. */
}
425 | ||
/*
 * Stub used when CONFIG_VHOST_NET is not defined: returns @features
 * unchanged; @net is not used.
 */
unsigned vhost_net_get_features(struct vhost_net *net, unsigned features)
{
    const unsigned unchanged = features;

    return unchanged;
}
/* Stub used when CONFIG_VHOST_NET is not defined: does nothing. */
void vhost_net_ack_features(struct vhost_net *net, unsigned features)
{
    /* Intentionally empty. */
}
f56a1247 MT |
433 | |
434 | bool vhost_net_virtqueue_pending(VHostNetState *net, int idx) | |
435 | { | |
4dd72e04 | 436 | return false; |
f56a1247 MT |
437 | } |
438 | ||
439 | void vhost_net_virtqueue_mask(VHostNetState *net, VirtIODevice *dev, | |
440 | int idx, bool mask) | |
441 | { | |
442 | } | |
ed8b4afe NN |
443 | |
444 | VHostNetState *get_vhost_net(NetClientState *nc) | |
445 | { | |
446 | return 0; | |
447 | } | |
d5970055 | 448 | #endif |