4 * Copyright IBM, Corp. 2007
5 * Copyright (c) 2009 CodeSourcery
11 * This work is licensed under the terms of the GNU GPL, version 2. See
12 * the COPYING file in the top-level directory.
14 * Contributions after 2012-01-13 are licensed under the terms of the
15 * GNU GPL, version 2 or (at your option) any later version.
18 #include "qemu/osdep.h"
20 #include "standard-headers/linux/virtio_pci.h"
21 #include "hw/virtio/virtio.h"
22 #include "hw/pci/pci.h"
23 #include "hw/pci/pci_bus.h"
24 #include "qapi/error.h"
25 #include "qemu/error-report.h"
26 #include "hw/pci/msi.h"
27 #include "hw/pci/msix.h"
28 #include "hw/loader.h"
29 #include "sysemu/kvm.h"
30 #include "virtio-pci.h"
31 #include "qemu/range.h"
32 #include "hw/virtio/virtio-bus.h"
33 #include "qapi/visitor.h"
35 #define VIRTIO_PCI_REGION_SIZE(dev) VIRTIO_PCI_CONFIG_OFF(msix_present(dev))
37 #undef VIRTIO_PCI_CONFIG
39 /* The remaining space is defined by each driver as the per-driver
40 * configuration space */
41 #define VIRTIO_PCI_CONFIG_SIZE(dev) VIRTIO_PCI_CONFIG_OFF(msix_enabled(dev))
43 static void virtio_pci_bus_new(VirtioBusState *bus, size_t bus_size,
45 static void virtio_pci_reset(DeviceState *qdev);
48 /* DeviceState to VirtIOPCIProxy. For use off data-path. TODO: use QOM. */
49 static inline VirtIOPCIProxy *to_virtio_pci_proxy(DeviceState *d)
51 return container_of(d, VirtIOPCIProxy, pci_dev.qdev);
54 /* DeviceState to VirtIOPCIProxy. Note: used on datapath,
55 * be careful and test performance if you change this.
57 static inline VirtIOPCIProxy *to_virtio_pci_proxy_fast(DeviceState *d)
59 return container_of(d, VirtIOPCIProxy, pci_dev.qdev);
62 static void virtio_pci_notify(DeviceState *d, uint16_t vector)
64 VirtIOPCIProxy *proxy = to_virtio_pci_proxy_fast(d);
66 if (msix_enabled(&proxy->pci_dev))
67 msix_notify(&proxy->pci_dev, vector);
69 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
70 pci_set_irq(&proxy->pci_dev, atomic_read(&vdev->isr) & 1);
74 static void virtio_pci_save_config(DeviceState *d, QEMUFile *f)
76 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
77 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
79 pci_device_save(&proxy->pci_dev, f);
80 msix_save(&proxy->pci_dev, f);
81 if (msix_present(&proxy->pci_dev))
82 qemu_put_be16(f, vdev->config_vector);
85 static const VMStateDescription vmstate_virtio_pci_modern_queue_state = {
86 .name = "virtio_pci/modern_queue_state",
88 .minimum_version_id = 1,
89 .fields = (VMStateField[]) {
90 VMSTATE_UINT16(num, VirtIOPCIQueue),
91 VMSTATE_UNUSED(1), /* enabled was stored as be16 */
92 VMSTATE_BOOL(enabled, VirtIOPCIQueue),
93 VMSTATE_UINT32_ARRAY(desc, VirtIOPCIQueue, 2),
94 VMSTATE_UINT32_ARRAY(avail, VirtIOPCIQueue, 2),
95 VMSTATE_UINT32_ARRAY(used, VirtIOPCIQueue, 2),
100 static bool virtio_pci_modern_state_needed(void *opaque)
102 VirtIOPCIProxy *proxy = opaque;
104 return virtio_pci_modern(proxy);
107 static const VMStateDescription vmstate_virtio_pci_modern_state_sub = {
108 .name = "virtio_pci/modern_state",
110 .minimum_version_id = 1,
111 .needed = &virtio_pci_modern_state_needed,
112 .fields = (VMStateField[]) {
113 VMSTATE_UINT32(dfselect, VirtIOPCIProxy),
114 VMSTATE_UINT32(gfselect, VirtIOPCIProxy),
115 VMSTATE_UINT32_ARRAY(guest_features, VirtIOPCIProxy, 2),
116 VMSTATE_STRUCT_ARRAY(vqs, VirtIOPCIProxy, VIRTIO_QUEUE_MAX, 0,
117 vmstate_virtio_pci_modern_queue_state,
119 VMSTATE_END_OF_LIST()
123 static const VMStateDescription vmstate_virtio_pci = {
124 .name = "virtio_pci",
126 .minimum_version_id = 1,
127 .minimum_version_id_old = 1,
128 .fields = (VMStateField[]) {
129 VMSTATE_END_OF_LIST()
131 .subsections = (const VMStateDescription*[]) {
132 &vmstate_virtio_pci_modern_state_sub,
137 static bool virtio_pci_has_extra_state(DeviceState *d)
139 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
141 return proxy->flags & VIRTIO_PCI_FLAG_MIGRATE_EXTRA;
144 static void virtio_pci_save_extra_state(DeviceState *d, QEMUFile *f)
146 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
148 vmstate_save_state(f, &vmstate_virtio_pci, proxy, NULL);
151 static int virtio_pci_load_extra_state(DeviceState *d, QEMUFile *f)
153 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
155 return vmstate_load_state(f, &vmstate_virtio_pci, proxy, 1);
158 static void virtio_pci_save_queue(DeviceState *d, int n, QEMUFile *f)
160 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
161 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
163 if (msix_present(&proxy->pci_dev))
164 qemu_put_be16(f, virtio_queue_vector(vdev, n));
167 static int virtio_pci_load_config(DeviceState *d, QEMUFile *f)
169 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
170 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
173 ret = pci_device_load(&proxy->pci_dev, f);
177 msix_unuse_all_vectors(&proxy->pci_dev);
178 msix_load(&proxy->pci_dev, f);
179 if (msix_present(&proxy->pci_dev)) {
180 qemu_get_be16s(f, &vdev->config_vector);
182 vdev->config_vector = VIRTIO_NO_VECTOR;
184 if (vdev->config_vector != VIRTIO_NO_VECTOR) {
185 return msix_vector_use(&proxy->pci_dev, vdev->config_vector);
190 static int virtio_pci_load_queue(DeviceState *d, int n, QEMUFile *f)
192 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
193 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
196 if (msix_present(&proxy->pci_dev)) {
197 qemu_get_be16s(f, &vector);
199 vector = VIRTIO_NO_VECTOR;
201 virtio_queue_set_vector(vdev, n, vector);
202 if (vector != VIRTIO_NO_VECTOR) {
203 return msix_vector_use(&proxy->pci_dev, vector);
209 static bool virtio_pci_ioeventfd_enabled(DeviceState *d)
211 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
213 return (proxy->flags & VIRTIO_PCI_FLAG_USE_IOEVENTFD) != 0;
216 #define QEMU_VIRTIO_PCI_QUEUE_MEM_MULT 0x1000
218 static inline int virtio_pci_queue_mem_mult(struct VirtIOPCIProxy *proxy)
220 return (proxy->flags & VIRTIO_PCI_FLAG_PAGE_PER_VQ) ?
221 QEMU_VIRTIO_PCI_QUEUE_MEM_MULT : 4;
224 static int virtio_pci_ioeventfd_assign(DeviceState *d, EventNotifier *notifier,
227 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
228 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
229 VirtQueue *vq = virtio_get_queue(vdev, n);
230 bool legacy = virtio_pci_legacy(proxy);
231 bool modern = virtio_pci_modern(proxy);
232 bool fast_mmio = kvm_ioeventfd_any_length_enabled();
233 bool modern_pio = proxy->flags & VIRTIO_PCI_FLAG_MODERN_PIO_NOTIFY;
234 MemoryRegion *modern_mr = &proxy->notify.mr;
235 MemoryRegion *modern_notify_mr = &proxy->notify_pio.mr;
236 MemoryRegion *legacy_mr = &proxy->bar;
237 hwaddr modern_addr = virtio_pci_queue_mem_mult(proxy) *
238 virtio_get_queue_index(vq);
239 hwaddr legacy_addr = VIRTIO_PCI_QUEUE_NOTIFY;
244 memory_region_add_eventfd(modern_mr, modern_addr, 0,
247 memory_region_add_eventfd(modern_mr, modern_addr, 2,
251 memory_region_add_eventfd(modern_notify_mr, 0, 2,
256 memory_region_add_eventfd(legacy_mr, legacy_addr, 2,
262 memory_region_del_eventfd(modern_mr, modern_addr, 0,
265 memory_region_del_eventfd(modern_mr, modern_addr, 2,
269 memory_region_del_eventfd(modern_notify_mr, 0, 2,
274 memory_region_del_eventfd(legacy_mr, legacy_addr, 2,
281 static void virtio_pci_start_ioeventfd(VirtIOPCIProxy *proxy)
283 virtio_bus_start_ioeventfd(&proxy->bus);
286 static void virtio_pci_stop_ioeventfd(VirtIOPCIProxy *proxy)
288 virtio_bus_stop_ioeventfd(&proxy->bus);
291 static void virtio_ioport_write(void *opaque, uint32_t addr, uint32_t val)
293 VirtIOPCIProxy *proxy = opaque;
294 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
298 case VIRTIO_PCI_GUEST_FEATURES:
299 /* Guest does not negotiate properly? We have to assume nothing. */
300 if (val & (1 << VIRTIO_F_BAD_FEATURE)) {
301 val = virtio_bus_get_vdev_bad_features(&proxy->bus);
303 virtio_set_features(vdev, val);
305 case VIRTIO_PCI_QUEUE_PFN:
306 pa = (hwaddr)val << VIRTIO_PCI_QUEUE_ADDR_SHIFT;
308 virtio_pci_reset(DEVICE(proxy));
311 virtio_queue_set_addr(vdev, vdev->queue_sel, pa);
313 case VIRTIO_PCI_QUEUE_SEL:
314 if (val < VIRTIO_QUEUE_MAX)
315 vdev->queue_sel = val;
317 case VIRTIO_PCI_QUEUE_NOTIFY:
318 if (val < VIRTIO_QUEUE_MAX) {
319 virtio_queue_notify(vdev, val);
322 case VIRTIO_PCI_STATUS:
323 if (!(val & VIRTIO_CONFIG_S_DRIVER_OK)) {
324 virtio_pci_stop_ioeventfd(proxy);
327 virtio_set_status(vdev, val & 0xFF);
329 if (val & VIRTIO_CONFIG_S_DRIVER_OK) {
330 virtio_pci_start_ioeventfd(proxy);
333 if (vdev->status == 0) {
334 virtio_pci_reset(DEVICE(proxy));
337 /* Linux before 2.6.34 drives the device without enabling
338 the PCI device bus master bit. Enable it automatically
339 for the guest. This is a PCI spec violation but so is
340 initiating DMA with bus master bit clear. */
341 if (val == (VIRTIO_CONFIG_S_ACKNOWLEDGE | VIRTIO_CONFIG_S_DRIVER)) {
342 pci_default_write_config(&proxy->pci_dev, PCI_COMMAND,
343 proxy->pci_dev.config[PCI_COMMAND] |
344 PCI_COMMAND_MASTER, 1);
347 case VIRTIO_MSI_CONFIG_VECTOR:
348 msix_vector_unuse(&proxy->pci_dev, vdev->config_vector);
349 /* Make it possible for guest to discover an error took place. */
350 if (msix_vector_use(&proxy->pci_dev, val) < 0)
351 val = VIRTIO_NO_VECTOR;
352 vdev->config_vector = val;
354 case VIRTIO_MSI_QUEUE_VECTOR:
355 msix_vector_unuse(&proxy->pci_dev,
356 virtio_queue_vector(vdev, vdev->queue_sel));
357 /* Make it possible for guest to discover an error took place. */
358 if (msix_vector_use(&proxy->pci_dev, val) < 0)
359 val = VIRTIO_NO_VECTOR;
360 virtio_queue_set_vector(vdev, vdev->queue_sel, val);
363 error_report("%s: unexpected address 0x%x value 0x%x",
364 __func__, addr, val);
369 static uint32_t virtio_ioport_read(VirtIOPCIProxy *proxy, uint32_t addr)
371 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
372 uint32_t ret = 0xFFFFFFFF;
375 case VIRTIO_PCI_HOST_FEATURES:
376 ret = vdev->host_features;
378 case VIRTIO_PCI_GUEST_FEATURES:
379 ret = vdev->guest_features;
381 case VIRTIO_PCI_QUEUE_PFN:
382 ret = virtio_queue_get_addr(vdev, vdev->queue_sel)
383 >> VIRTIO_PCI_QUEUE_ADDR_SHIFT;
385 case VIRTIO_PCI_QUEUE_NUM:
386 ret = virtio_queue_get_num(vdev, vdev->queue_sel);
388 case VIRTIO_PCI_QUEUE_SEL:
389 ret = vdev->queue_sel;
391 case VIRTIO_PCI_STATUS:
395 /* reading from the ISR also clears it. */
396 ret = atomic_xchg(&vdev->isr, 0);
397 pci_irq_deassert(&proxy->pci_dev);
399 case VIRTIO_MSI_CONFIG_VECTOR:
400 ret = vdev->config_vector;
402 case VIRTIO_MSI_QUEUE_VECTOR:
403 ret = virtio_queue_vector(vdev, vdev->queue_sel);
412 static uint64_t virtio_pci_config_read(void *opaque, hwaddr addr,
415 VirtIOPCIProxy *proxy = opaque;
416 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
417 uint32_t config = VIRTIO_PCI_CONFIG_SIZE(&proxy->pci_dev);
420 return virtio_ioport_read(proxy, addr);
426 val = virtio_config_readb(vdev, addr);
429 val = virtio_config_readw(vdev, addr);
430 if (virtio_is_big_endian(vdev)) {
435 val = virtio_config_readl(vdev, addr);
436 if (virtio_is_big_endian(vdev)) {
444 static void virtio_pci_config_write(void *opaque, hwaddr addr,
445 uint64_t val, unsigned size)
447 VirtIOPCIProxy *proxy = opaque;
448 uint32_t config = VIRTIO_PCI_CONFIG_SIZE(&proxy->pci_dev);
449 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
451 virtio_ioport_write(proxy, addr, val);
456 * Virtio-PCI is odd. Ioports are LE but config space is target native
461 virtio_config_writeb(vdev, addr, val);
464 if (virtio_is_big_endian(vdev)) {
467 virtio_config_writew(vdev, addr, val);
470 if (virtio_is_big_endian(vdev)) {
473 virtio_config_writel(vdev, addr, val);
478 static const MemoryRegionOps virtio_pci_config_ops = {
479 .read = virtio_pci_config_read,
480 .write = virtio_pci_config_write,
482 .min_access_size = 1,
483 .max_access_size = 4,
485 .endianness = DEVICE_LITTLE_ENDIAN,
488 static MemoryRegion *virtio_address_space_lookup(VirtIOPCIProxy *proxy,
489 hwaddr *off, int len)
492 VirtIOPCIRegion *reg;
494 for (i = 0; i < ARRAY_SIZE(proxy->regs); ++i) {
495 reg = &proxy->regs[i];
496 if (*off >= reg->offset &&
497 *off + len <= reg->offset + reg->size) {
506 /* Below are generic functions to do memcpy from/to an address space,
507 * without byteswaps, with input validation.
509 * As regular address_space_* APIs all do some kind of byteswap at least for
510 * some host/target combinations, we are forced to explicitly convert to a
511 * known-endianness integer value.
512 * It doesn't really matter which endian format to go through, so the code
513 * below selects the endian that causes the least amount of work on the given
516 * Note: host pointer must be aligned.
519 void virtio_address_space_write(VirtIOPCIProxy *proxy, hwaddr addr,
520 const uint8_t *buf, int len)
525 /* address_space_* APIs assume an aligned address.
526 * As address is under guest control, handle illegal values.
530 mr = virtio_address_space_lookup(proxy, &addr, len);
535 /* Make sure caller aligned buf properly */
536 assert(!(((uintptr_t)buf) & (len - 1)));
540 val = pci_get_byte(buf);
543 val = cpu_to_le16(pci_get_word(buf));
546 val = cpu_to_le32(pci_get_long(buf));
549 /* As length is under guest control, handle illegal values. */
552 memory_region_dispatch_write(mr, addr, val, len, MEMTXATTRS_UNSPECIFIED);
556 virtio_address_space_read(VirtIOPCIProxy *proxy, hwaddr addr,
557 uint8_t *buf, int len)
562 /* address_space_* APIs assume an aligned address.
563 * As address is under guest control, handle illegal values.
567 mr = virtio_address_space_lookup(proxy, &addr, len);
572 /* Make sure caller aligned buf properly */
573 assert(!(((uintptr_t)buf) & (len - 1)));
575 memory_region_dispatch_read(mr, addr, &val, len, MEMTXATTRS_UNSPECIFIED);
578 pci_set_byte(buf, val);
581 pci_set_word(buf, le16_to_cpu(val));
584 pci_set_long(buf, le32_to_cpu(val));
587 /* As length is under guest control, handle illegal values. */
592 static void virtio_write_config(PCIDevice *pci_dev, uint32_t address,
593 uint32_t val, int len)
595 VirtIOPCIProxy *proxy = VIRTIO_PCI(pci_dev);
596 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
597 struct virtio_pci_cfg_cap *cfg;
599 pci_default_write_config(pci_dev, address, val, len);
601 if (range_covers_byte(address, len, PCI_COMMAND) &&
602 !(pci_dev->config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
603 virtio_pci_stop_ioeventfd(proxy);
604 virtio_set_status(vdev, vdev->status & ~VIRTIO_CONFIG_S_DRIVER_OK);
607 if (proxy->config_cap &&
608 ranges_overlap(address, len, proxy->config_cap + offsetof(struct virtio_pci_cfg_cap,
610 sizeof cfg->pci_cfg_data)) {
614 cfg = (void *)(proxy->pci_dev.config + proxy->config_cap);
615 off = le32_to_cpu(cfg->cap.offset);
616 len = le32_to_cpu(cfg->cap.length);
618 if (len == 1 || len == 2 || len == 4) {
619 assert(len <= sizeof cfg->pci_cfg_data);
620 virtio_address_space_write(proxy, off, cfg->pci_cfg_data, len);
625 static uint32_t virtio_read_config(PCIDevice *pci_dev,
626 uint32_t address, int len)
628 VirtIOPCIProxy *proxy = VIRTIO_PCI(pci_dev);
629 struct virtio_pci_cfg_cap *cfg;
631 if (proxy->config_cap &&
632 ranges_overlap(address, len, proxy->config_cap + offsetof(struct virtio_pci_cfg_cap,
634 sizeof cfg->pci_cfg_data)) {
638 cfg = (void *)(proxy->pci_dev.config + proxy->config_cap);
639 off = le32_to_cpu(cfg->cap.offset);
640 len = le32_to_cpu(cfg->cap.length);
642 if (len == 1 || len == 2 || len == 4) {
643 assert(len <= sizeof cfg->pci_cfg_data);
644 virtio_address_space_read(proxy, off, cfg->pci_cfg_data, len);
648 return pci_default_read_config(pci_dev, address, len);
651 static int kvm_virtio_pci_vq_vector_use(VirtIOPCIProxy *proxy,
652 unsigned int queue_no,
655 VirtIOIRQFD *irqfd = &proxy->vector_irqfd[vector];
658 if (irqfd->users == 0) {
659 ret = kvm_irqchip_add_msi_route(kvm_state, vector, &proxy->pci_dev);
669 static void kvm_virtio_pci_vq_vector_release(VirtIOPCIProxy *proxy,
672 VirtIOIRQFD *irqfd = &proxy->vector_irqfd[vector];
673 if (--irqfd->users == 0) {
674 kvm_irqchip_release_virq(kvm_state, irqfd->virq);
678 static int kvm_virtio_pci_irqfd_use(VirtIOPCIProxy *proxy,
679 unsigned int queue_no,
682 VirtIOIRQFD *irqfd = &proxy->vector_irqfd[vector];
683 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
684 VirtQueue *vq = virtio_get_queue(vdev, queue_no);
685 EventNotifier *n = virtio_queue_get_guest_notifier(vq);
686 return kvm_irqchip_add_irqfd_notifier_gsi(kvm_state, n, NULL, irqfd->virq);
689 static void kvm_virtio_pci_irqfd_release(VirtIOPCIProxy *proxy,
690 unsigned int queue_no,
693 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
694 VirtQueue *vq = virtio_get_queue(vdev, queue_no);
695 EventNotifier *n = virtio_queue_get_guest_notifier(vq);
696 VirtIOIRQFD *irqfd = &proxy->vector_irqfd[vector];
699 ret = kvm_irqchip_remove_irqfd_notifier_gsi(kvm_state, n, irqfd->virq);
703 static int kvm_virtio_pci_vector_use(VirtIOPCIProxy *proxy, int nvqs)
705 PCIDevice *dev = &proxy->pci_dev;
706 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
707 VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
711 for (queue_no = 0; queue_no < nvqs; queue_no++) {
712 if (!virtio_queue_get_num(vdev, queue_no)) {
715 vector = virtio_queue_vector(vdev, queue_no);
716 if (vector >= msix_nr_vectors_allocated(dev)) {
719 ret = kvm_virtio_pci_vq_vector_use(proxy, queue_no, vector);
723 /* If guest supports masking, set up irqfd now.
724 * Otherwise, delay until unmasked in the frontend.
726 if (vdev->use_guest_notifier_mask && k->guest_notifier_mask) {
727 ret = kvm_virtio_pci_irqfd_use(proxy, queue_no, vector);
729 kvm_virtio_pci_vq_vector_release(proxy, vector);
737 while (--queue_no >= 0) {
738 vector = virtio_queue_vector(vdev, queue_no);
739 if (vector >= msix_nr_vectors_allocated(dev)) {
742 if (vdev->use_guest_notifier_mask && k->guest_notifier_mask) {
743 kvm_virtio_pci_irqfd_release(proxy, queue_no, vector);
745 kvm_virtio_pci_vq_vector_release(proxy, vector);
750 static void kvm_virtio_pci_vector_release(VirtIOPCIProxy *proxy, int nvqs)
752 PCIDevice *dev = &proxy->pci_dev;
753 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
756 VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
758 for (queue_no = 0; queue_no < nvqs; queue_no++) {
759 if (!virtio_queue_get_num(vdev, queue_no)) {
762 vector = virtio_queue_vector(vdev, queue_no);
763 if (vector >= msix_nr_vectors_allocated(dev)) {
766 /* If guest supports masking, clean up irqfd now.
767 * Otherwise, it was cleaned when masked in the frontend.
769 if (vdev->use_guest_notifier_mask && k->guest_notifier_mask) {
770 kvm_virtio_pci_irqfd_release(proxy, queue_no, vector);
772 kvm_virtio_pci_vq_vector_release(proxy, vector);
776 static int virtio_pci_vq_vector_unmask(VirtIOPCIProxy *proxy,
777 unsigned int queue_no,
781 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
782 VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
783 VirtQueue *vq = virtio_get_queue(vdev, queue_no);
784 EventNotifier *n = virtio_queue_get_guest_notifier(vq);
788 if (proxy->vector_irqfd) {
789 irqfd = &proxy->vector_irqfd[vector];
790 if (irqfd->msg.data != msg.data || irqfd->msg.address != msg.address) {
791 ret = kvm_irqchip_update_msi_route(kvm_state, irqfd->virq, msg,
796 kvm_irqchip_commit_routes(kvm_state);
800 /* If guest supports masking, irqfd is already setup, unmask it.
801 * Otherwise, set it up now.
803 if (vdev->use_guest_notifier_mask && k->guest_notifier_mask) {
804 k->guest_notifier_mask(vdev, queue_no, false);
805 /* Test after unmasking to avoid losing events. */
806 if (k->guest_notifier_pending &&
807 k->guest_notifier_pending(vdev, queue_no)) {
808 event_notifier_set(n);
811 ret = kvm_virtio_pci_irqfd_use(proxy, queue_no, vector);
816 static void virtio_pci_vq_vector_mask(VirtIOPCIProxy *proxy,
817 unsigned int queue_no,
820 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
821 VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
823 /* If guest supports masking, keep irqfd but mask it.
824 * Otherwise, clean it up now.
826 if (vdev->use_guest_notifier_mask && k->guest_notifier_mask) {
827 k->guest_notifier_mask(vdev, queue_no, true);
829 kvm_virtio_pci_irqfd_release(proxy, queue_no, vector);
833 static int virtio_pci_vector_unmask(PCIDevice *dev, unsigned vector,
836 VirtIOPCIProxy *proxy = container_of(dev, VirtIOPCIProxy, pci_dev);
837 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
838 VirtQueue *vq = virtio_vector_first_queue(vdev, vector);
839 int ret, index, unmasked = 0;
842 index = virtio_get_queue_index(vq);
843 if (!virtio_queue_get_num(vdev, index)) {
846 if (index < proxy->nvqs_with_notifiers) {
847 ret = virtio_pci_vq_vector_unmask(proxy, index, vector, msg);
853 vq = virtio_vector_next_queue(vq);
859 vq = virtio_vector_first_queue(vdev, vector);
860 while (vq && unmasked >= 0) {
861 index = virtio_get_queue_index(vq);
862 if (index < proxy->nvqs_with_notifiers) {
863 virtio_pci_vq_vector_mask(proxy, index, vector);
866 vq = virtio_vector_next_queue(vq);
871 static void virtio_pci_vector_mask(PCIDevice *dev, unsigned vector)
873 VirtIOPCIProxy *proxy = container_of(dev, VirtIOPCIProxy, pci_dev);
874 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
875 VirtQueue *vq = virtio_vector_first_queue(vdev, vector);
879 index = virtio_get_queue_index(vq);
880 if (!virtio_queue_get_num(vdev, index)) {
883 if (index < proxy->nvqs_with_notifiers) {
884 virtio_pci_vq_vector_mask(proxy, index, vector);
886 vq = virtio_vector_next_queue(vq);
890 static void virtio_pci_vector_poll(PCIDevice *dev,
891 unsigned int vector_start,
892 unsigned int vector_end)
894 VirtIOPCIProxy *proxy = container_of(dev, VirtIOPCIProxy, pci_dev);
895 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
896 VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
899 EventNotifier *notifier;
902 for (queue_no = 0; queue_no < proxy->nvqs_with_notifiers; queue_no++) {
903 if (!virtio_queue_get_num(vdev, queue_no)) {
906 vector = virtio_queue_vector(vdev, queue_no);
907 if (vector < vector_start || vector >= vector_end ||
908 !msix_is_masked(dev, vector)) {
911 vq = virtio_get_queue(vdev, queue_no);
912 notifier = virtio_queue_get_guest_notifier(vq);
913 if (k->guest_notifier_pending) {
914 if (k->guest_notifier_pending(vdev, queue_no)) {
915 msix_set_pending(dev, vector);
917 } else if (event_notifier_test_and_clear(notifier)) {
918 msix_set_pending(dev, vector);
923 static int virtio_pci_set_guest_notifier(DeviceState *d, int n, bool assign,
926 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
927 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
928 VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(vdev);
929 VirtQueue *vq = virtio_get_queue(vdev, n);
930 EventNotifier *notifier = virtio_queue_get_guest_notifier(vq);
933 int r = event_notifier_init(notifier, 0);
937 virtio_queue_set_guest_notifier_fd_handler(vq, true, with_irqfd);
939 virtio_queue_set_guest_notifier_fd_handler(vq, false, with_irqfd);
940 event_notifier_cleanup(notifier);
943 if (!msix_enabled(&proxy->pci_dev) &&
944 vdev->use_guest_notifier_mask &&
945 vdc->guest_notifier_mask) {
946 vdc->guest_notifier_mask(vdev, n, !assign);
952 static bool virtio_pci_query_guest_notifiers(DeviceState *d)
954 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
955 return msix_enabled(&proxy->pci_dev);
958 static int virtio_pci_set_guest_notifiers(DeviceState *d, int nvqs, bool assign)
960 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
961 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
962 VirtioDeviceClass *k = VIRTIO_DEVICE_GET_CLASS(vdev);
964 bool with_irqfd = msix_enabled(&proxy->pci_dev) &&
965 kvm_msi_via_irqfd_enabled();
967 nvqs = MIN(nvqs, VIRTIO_QUEUE_MAX);
969 /* When deassigning, pass a consistent nvqs value
970 * to avoid leaking notifiers.
972 assert(assign || nvqs == proxy->nvqs_with_notifiers);
974 proxy->nvqs_with_notifiers = nvqs;
976 /* Must unset vector notifier while guest notifier is still assigned */
977 if ((proxy->vector_irqfd || k->guest_notifier_mask) && !assign) {
978 msix_unset_vector_notifiers(&proxy->pci_dev);
979 if (proxy->vector_irqfd) {
980 kvm_virtio_pci_vector_release(proxy, nvqs);
981 g_free(proxy->vector_irqfd);
982 proxy->vector_irqfd = NULL;
986 for (n = 0; n < nvqs; n++) {
987 if (!virtio_queue_get_num(vdev, n)) {
991 r = virtio_pci_set_guest_notifier(d, n, assign, with_irqfd);
997 /* Must set vector notifier after guest notifier has been assigned */
998 if ((with_irqfd || k->guest_notifier_mask) && assign) {
1000 proxy->vector_irqfd =
1001 g_malloc0(sizeof(*proxy->vector_irqfd) *
1002 msix_nr_vectors_allocated(&proxy->pci_dev));
1003 r = kvm_virtio_pci_vector_use(proxy, nvqs);
1008 r = msix_set_vector_notifiers(&proxy->pci_dev,
1009 virtio_pci_vector_unmask,
1010 virtio_pci_vector_mask,
1011 virtio_pci_vector_poll);
1013 goto notifiers_error;
1022 kvm_virtio_pci_vector_release(proxy, nvqs);
1026 /* We get here on assignment failure. Recover by undoing for VQs 0 .. n. */
1029 virtio_pci_set_guest_notifier(d, n, !assign, with_irqfd);
1034 static int virtio_pci_set_host_notifier_mr(DeviceState *d, int n,
1035 MemoryRegion *mr, bool assign)
1037 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
1040 if (n >= VIRTIO_QUEUE_MAX || !virtio_pci_modern(proxy) ||
1041 virtio_pci_queue_mem_mult(proxy) != memory_region_size(mr)) {
1046 offset = virtio_pci_queue_mem_mult(proxy) * n;
1047 memory_region_add_subregion_overlap(&proxy->notify.mr, offset, mr, 1);
1049 memory_region_del_subregion(&proxy->notify.mr, mr);
1055 static void virtio_pci_vmstate_change(DeviceState *d, bool running)
1057 VirtIOPCIProxy *proxy = to_virtio_pci_proxy(d);
1058 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
1061 /* Old QEMU versions did not set bus master enable on status write.
1062 * Detect DRIVER set and enable it.
1064 if ((proxy->flags & VIRTIO_PCI_FLAG_BUS_MASTER_BUG_MIGRATION) &&
1065 (vdev->status & VIRTIO_CONFIG_S_DRIVER) &&
1066 !(proxy->pci_dev.config[PCI_COMMAND] & PCI_COMMAND_MASTER)) {
1067 pci_default_write_config(&proxy->pci_dev, PCI_COMMAND,
1068 proxy->pci_dev.config[PCI_COMMAND] |
1069 PCI_COMMAND_MASTER, 1);
1071 virtio_pci_start_ioeventfd(proxy);
1073 virtio_pci_stop_ioeventfd(proxy);
1078 * virtio-pci: This is the PCIDevice which has a virtio-pci-bus.
1081 static int virtio_pci_query_nvectors(DeviceState *d)
1083 VirtIOPCIProxy *proxy = VIRTIO_PCI(d);
1085 return proxy->nvectors;
1088 static AddressSpace *virtio_pci_get_dma_as(DeviceState *d)
1090 VirtIOPCIProxy *proxy = VIRTIO_PCI(d);
1091 PCIDevice *dev = &proxy->pci_dev;
1093 return pci_get_address_space(dev);
1096 static int virtio_pci_add_mem_cap(VirtIOPCIProxy *proxy,
1097 struct virtio_pci_cap *cap)
1099 PCIDevice *dev = &proxy->pci_dev;
1102 offset = pci_add_capability(dev, PCI_CAP_ID_VNDR, 0,
1103 cap->cap_len, &error_abort);
1105 assert(cap->cap_len >= sizeof *cap);
1106 memcpy(dev->config + offset + PCI_CAP_FLAGS, &cap->cap_len,
1107 cap->cap_len - PCI_CAP_FLAGS);
1112 static uint64_t virtio_pci_common_read(void *opaque, hwaddr addr,
1115 VirtIOPCIProxy *proxy = opaque;
1116 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
1121 case VIRTIO_PCI_COMMON_DFSELECT:
1122 val = proxy->dfselect;
1124 case VIRTIO_PCI_COMMON_DF:
1125 if (proxy->dfselect <= 1) {
1126 VirtioDeviceClass *vdc = VIRTIO_DEVICE_GET_CLASS(vdev);
1128 val = (vdev->host_features & ~vdc->legacy_features) >>
1129 (32 * proxy->dfselect);
1132 case VIRTIO_PCI_COMMON_GFSELECT:
1133 val = proxy->gfselect;
1135 case VIRTIO_PCI_COMMON_GF:
1136 if (proxy->gfselect < ARRAY_SIZE(proxy->guest_features)) {
1137 val = proxy->guest_features[proxy->gfselect];
1140 case VIRTIO_PCI_COMMON_MSIX:
1141 val = vdev->config_vector;
1143 case VIRTIO_PCI_COMMON_NUMQ:
1144 for (i = 0; i < VIRTIO_QUEUE_MAX; ++i) {
1145 if (virtio_queue_get_num(vdev, i)) {
1150 case VIRTIO_PCI_COMMON_STATUS:
1153 case VIRTIO_PCI_COMMON_CFGGENERATION:
1154 val = vdev->generation;
1156 case VIRTIO_PCI_COMMON_Q_SELECT:
1157 val = vdev->queue_sel;
1159 case VIRTIO_PCI_COMMON_Q_SIZE:
1160 val = virtio_queue_get_num(vdev, vdev->queue_sel);
1162 case VIRTIO_PCI_COMMON_Q_MSIX:
1163 val = virtio_queue_vector(vdev, vdev->queue_sel);
1165 case VIRTIO_PCI_COMMON_Q_ENABLE:
1166 val = proxy->vqs[vdev->queue_sel].enabled;
1168 case VIRTIO_PCI_COMMON_Q_NOFF:
1169 /* Simply map queues in order */
1170 val = vdev->queue_sel;
1172 case VIRTIO_PCI_COMMON_Q_DESCLO:
1173 val = proxy->vqs[vdev->queue_sel].desc[0];
1175 case VIRTIO_PCI_COMMON_Q_DESCHI:
1176 val = proxy->vqs[vdev->queue_sel].desc[1];
1178 case VIRTIO_PCI_COMMON_Q_AVAILLO:
1179 val = proxy->vqs[vdev->queue_sel].avail[0];
1181 case VIRTIO_PCI_COMMON_Q_AVAILHI:
1182 val = proxy->vqs[vdev->queue_sel].avail[1];
1184 case VIRTIO_PCI_COMMON_Q_USEDLO:
1185 val = proxy->vqs[vdev->queue_sel].used[0];
1187 case VIRTIO_PCI_COMMON_Q_USEDHI:
1188 val = proxy->vqs[vdev->queue_sel].used[1];
1197 static void virtio_pci_common_write(void *opaque, hwaddr addr,
1198 uint64_t val, unsigned size)
1200 VirtIOPCIProxy *proxy = opaque;
1201 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
1204 case VIRTIO_PCI_COMMON_DFSELECT:
1205 proxy->dfselect = val;
1207 case VIRTIO_PCI_COMMON_GFSELECT:
1208 proxy->gfselect = val;
1210 case VIRTIO_PCI_COMMON_GF:
1211 if (proxy->gfselect < ARRAY_SIZE(proxy->guest_features)) {
1212 proxy->guest_features[proxy->gfselect] = val;
1213 virtio_set_features(vdev,
1214 (((uint64_t)proxy->guest_features[1]) << 32) |
1215 proxy->guest_features[0]);
1218 case VIRTIO_PCI_COMMON_MSIX:
1219 msix_vector_unuse(&proxy->pci_dev, vdev->config_vector);
1220 /* Make it possible for guest to discover an error took place. */
1221 if (msix_vector_use(&proxy->pci_dev, val) < 0) {
1222 val = VIRTIO_NO_VECTOR;
1224 vdev->config_vector = val;
1226 case VIRTIO_PCI_COMMON_STATUS:
1227 if (!(val & VIRTIO_CONFIG_S_DRIVER_OK)) {
1228 virtio_pci_stop_ioeventfd(proxy);
1231 virtio_set_status(vdev, val & 0xFF);
1233 if (val & VIRTIO_CONFIG_S_DRIVER_OK) {
1234 virtio_pci_start_ioeventfd(proxy);
1237 if (vdev->status == 0) {
1238 virtio_pci_reset(DEVICE(proxy));
1242 case VIRTIO_PCI_COMMON_Q_SELECT:
1243 if (val < VIRTIO_QUEUE_MAX) {
1244 vdev->queue_sel = val;
1247 case VIRTIO_PCI_COMMON_Q_SIZE:
1248 proxy->vqs[vdev->queue_sel].num = val;
1250 case VIRTIO_PCI_COMMON_Q_MSIX:
1251 msix_vector_unuse(&proxy->pci_dev,
1252 virtio_queue_vector(vdev, vdev->queue_sel));
1253 /* Make it possible for guest to discover an error took place. */
1254 if (msix_vector_use(&proxy->pci_dev, val) < 0) {
1255 val = VIRTIO_NO_VECTOR;
1257 virtio_queue_set_vector(vdev, vdev->queue_sel, val);
1259 case VIRTIO_PCI_COMMON_Q_ENABLE:
1260 virtio_queue_set_num(vdev, vdev->queue_sel,
1261 proxy->vqs[vdev->queue_sel].num);
1262 virtio_queue_set_rings(vdev, vdev->queue_sel,
1263 ((uint64_t)proxy->vqs[vdev->queue_sel].desc[1]) << 32 |
1264 proxy->vqs[vdev->queue_sel].desc[0],
1265 ((uint64_t)proxy->vqs[vdev->queue_sel].avail[1]) << 32 |
1266 proxy->vqs[vdev->queue_sel].avail[0],
1267 ((uint64_t)proxy->vqs[vdev->queue_sel].used[1]) << 32 |
1268 proxy->vqs[vdev->queue_sel].used[0]);
1269 proxy->vqs[vdev->queue_sel].enabled = 1;
1271 case VIRTIO_PCI_COMMON_Q_DESCLO:
1272 proxy->vqs[vdev->queue_sel].desc[0] = val;
1274 case VIRTIO_PCI_COMMON_Q_DESCHI:
1275 proxy->vqs[vdev->queue_sel].desc[1] = val;
1277 case VIRTIO_PCI_COMMON_Q_AVAILLO:
1278 proxy->vqs[vdev->queue_sel].avail[0] = val;
1280 case VIRTIO_PCI_COMMON_Q_AVAILHI:
1281 proxy->vqs[vdev->queue_sel].avail[1] = val;
1283 case VIRTIO_PCI_COMMON_Q_USEDLO:
1284 proxy->vqs[vdev->queue_sel].used[0] = val;
1286 case VIRTIO_PCI_COMMON_Q_USEDHI:
1287 proxy->vqs[vdev->queue_sel].used[1] = val;
1295 static uint64_t virtio_pci_notify_read(void *opaque, hwaddr addr,
1301 static void virtio_pci_notify_write(void *opaque, hwaddr addr,
1302 uint64_t val, unsigned size)
1304 VirtIODevice *vdev = opaque;
1305 VirtIOPCIProxy *proxy = VIRTIO_PCI(DEVICE(vdev)->parent_bus->parent);
1306 unsigned queue = addr / virtio_pci_queue_mem_mult(proxy);
1308 if (queue < VIRTIO_QUEUE_MAX) {
1309 virtio_queue_notify(vdev, queue);
1313 static void virtio_pci_notify_write_pio(void *opaque, hwaddr addr,
1314 uint64_t val, unsigned size)
1316 VirtIODevice *vdev = opaque;
1317 unsigned queue = val;
1319 if (queue < VIRTIO_QUEUE_MAX) {
1320 virtio_queue_notify(vdev, queue);
1324 static uint64_t virtio_pci_isr_read(void *opaque, hwaddr addr,
1327 VirtIOPCIProxy *proxy = opaque;
1328 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
1329 uint64_t val = atomic_xchg(&vdev->isr, 0);
1330 pci_irq_deassert(&proxy->pci_dev);
1335 static void virtio_pci_isr_write(void *opaque, hwaddr addr,
1336 uint64_t val, unsigned size)
1340 static uint64_t virtio_pci_device_read(void *opaque, hwaddr addr,
1343 VirtIODevice *vdev = opaque;
1348 val = virtio_config_modern_readb(vdev, addr);
1351 val = virtio_config_modern_readw(vdev, addr);
1354 val = virtio_config_modern_readl(vdev, addr);
1360 static void virtio_pci_device_write(void *opaque, hwaddr addr,
1361 uint64_t val, unsigned size)
1363 VirtIODevice *vdev = opaque;
1366 virtio_config_modern_writeb(vdev, addr, val);
1369 virtio_config_modern_writew(vdev, addr, val);
1372 virtio_config_modern_writel(vdev, addr, val);
1377 static void virtio_pci_modern_regions_init(VirtIOPCIProxy *proxy)
1379 static const MemoryRegionOps common_ops = {
1380 .read = virtio_pci_common_read,
1381 .write = virtio_pci_common_write,
1383 .min_access_size = 1,
1384 .max_access_size = 4,
1386 .endianness = DEVICE_LITTLE_ENDIAN,
1388 static const MemoryRegionOps isr_ops = {
1389 .read = virtio_pci_isr_read,
1390 .write = virtio_pci_isr_write,
1392 .min_access_size = 1,
1393 .max_access_size = 4,
1395 .endianness = DEVICE_LITTLE_ENDIAN,
1397 static const MemoryRegionOps device_ops = {
1398 .read = virtio_pci_device_read,
1399 .write = virtio_pci_device_write,
1401 .min_access_size = 1,
1402 .max_access_size = 4,
1404 .endianness = DEVICE_LITTLE_ENDIAN,
1406 static const MemoryRegionOps notify_ops = {
1407 .read = virtio_pci_notify_read,
1408 .write = virtio_pci_notify_write,
1410 .min_access_size = 1,
1411 .max_access_size = 4,
1413 .endianness = DEVICE_LITTLE_ENDIAN,
1415 static const MemoryRegionOps notify_pio_ops = {
1416 .read = virtio_pci_notify_read,
1417 .write = virtio_pci_notify_write_pio,
1419 .min_access_size = 1,
1420 .max_access_size = 4,
1422 .endianness = DEVICE_LITTLE_ENDIAN,
1426 memory_region_init_io(&proxy->common.mr, OBJECT(proxy),
1429 "virtio-pci-common",
1430 proxy->common.size);
1432 memory_region_init_io(&proxy->isr.mr, OBJECT(proxy),
1438 memory_region_init_io(&proxy->device.mr, OBJECT(proxy),
1440 virtio_bus_get_device(&proxy->bus),
1441 "virtio-pci-device",
1442 proxy->device.size);
1444 memory_region_init_io(&proxy->notify.mr, OBJECT(proxy),
1446 virtio_bus_get_device(&proxy->bus),
1447 "virtio-pci-notify",
1448 proxy->notify.size);
1450 memory_region_init_io(&proxy->notify_pio.mr, OBJECT(proxy),
1452 virtio_bus_get_device(&proxy->bus),
1453 "virtio-pci-notify-pio",
1454 proxy->notify_pio.size);
1457 static void virtio_pci_modern_region_map(VirtIOPCIProxy *proxy,
1458 VirtIOPCIRegion *region,
1459 struct virtio_pci_cap *cap,
1463 memory_region_add_subregion(mr, region->offset, ®ion->mr);
1465 cap->cfg_type = region->type;
1467 cap->offset = cpu_to_le32(region->offset);
1468 cap->length = cpu_to_le32(region->size);
1469 virtio_pci_add_mem_cap(proxy, cap);
1473 static void virtio_pci_modern_mem_region_map(VirtIOPCIProxy *proxy,
1474 VirtIOPCIRegion *region,
1475 struct virtio_pci_cap *cap)
1477 virtio_pci_modern_region_map(proxy, region, cap,
1478 &proxy->modern_bar, proxy->modern_mem_bar_idx);
1481 static void virtio_pci_modern_io_region_map(VirtIOPCIProxy *proxy,
1482 VirtIOPCIRegion *region,
1483 struct virtio_pci_cap *cap)
1485 virtio_pci_modern_region_map(proxy, region, cap,
1486 &proxy->io_bar, proxy->modern_io_bar_idx);
1489 static void virtio_pci_modern_mem_region_unmap(VirtIOPCIProxy *proxy,
1490 VirtIOPCIRegion *region)
1492 memory_region_del_subregion(&proxy->modern_bar,
1496 static void virtio_pci_modern_io_region_unmap(VirtIOPCIProxy *proxy,
1497 VirtIOPCIRegion *region)
1499 memory_region_del_subregion(&proxy->io_bar,
1503 static void virtio_pci_pre_plugged(DeviceState *d, Error **errp)
1505 VirtIOPCIProxy *proxy = VIRTIO_PCI(d);
1506 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
1508 if (virtio_pci_modern(proxy)) {
1509 virtio_add_feature(&vdev->host_features, VIRTIO_F_VERSION_1);
1512 virtio_add_feature(&vdev->host_features, VIRTIO_F_BAD_FEATURE);
1515 /* This is called by virtio-bus just after the device is plugged. */
1516 static void virtio_pci_device_plugged(DeviceState *d, Error **errp)
1518 VirtIOPCIProxy *proxy = VIRTIO_PCI(d);
1519 VirtioBusState *bus = &proxy->bus;
1520 bool legacy = virtio_pci_legacy(proxy);
1522 bool modern_pio = proxy->flags & VIRTIO_PCI_FLAG_MODERN_PIO_NOTIFY;
1525 VirtIODevice *vdev = virtio_bus_get_device(&proxy->bus);
1528 * Virtio capabilities present without
1529 * VIRTIO_F_VERSION_1 confuses guests
1531 if (!proxy->ignore_backend_features &&
1532 !virtio_has_feature(vdev->host_features, VIRTIO_F_VERSION_1)) {
1533 virtio_pci_disable_modern(proxy);
1536 error_setg(errp, "Device doesn't support modern mode, and legacy"
1537 " mode is disabled");
1538 error_append_hint(errp, "Set disable-legacy to off\n");
1544 modern = virtio_pci_modern(proxy);
1546 config = proxy->pci_dev.config;
1547 if (proxy->class_code) {
1548 pci_config_set_class(config, proxy->class_code);
1552 if (virtio_host_has_feature(vdev, VIRTIO_F_IOMMU_PLATFORM)) {
1553 error_setg(errp, "VIRTIO_F_IOMMU_PLATFORM was supported by"
1554 " neither legacy nor transitional device");
1558 * Legacy and transitional devices use specific subsystem IDs.
1559 * Note that the subsystem vendor ID (config + PCI_SUBSYSTEM_VENDOR_ID)
1560 * is set to PCI_SUBVENDOR_ID_REDHAT_QUMRANET by default.
1562 pci_set_word(config + PCI_SUBSYSTEM_ID, virtio_bus_get_vdev_id(bus));
1564 /* pure virtio-1.0 */
1565 pci_set_word(config + PCI_VENDOR_ID,
1566 PCI_VENDOR_ID_REDHAT_QUMRANET);
1567 pci_set_word(config + PCI_DEVICE_ID,
1568 0x1040 + virtio_bus_get_vdev_id(bus));
1569 pci_config_set_revision(config, 1);
1571 config[PCI_INTERRUPT_PIN] = 1;
1575 struct virtio_pci_cap cap = {
1576 .cap_len = sizeof cap,
1578 struct virtio_pci_notify_cap notify = {
1579 .cap.cap_len = sizeof notify,
1580 .notify_off_multiplier =
1581 cpu_to_le32(virtio_pci_queue_mem_mult(proxy)),
1583 struct virtio_pci_cfg_cap cfg = {
1584 .cap.cap_len = sizeof cfg,
1585 .cap.cfg_type = VIRTIO_PCI_CAP_PCI_CFG,
1587 struct virtio_pci_notify_cap notify_pio = {
1588 .cap.cap_len = sizeof notify,
1589 .notify_off_multiplier = cpu_to_le32(0x0),
1592 struct virtio_pci_cfg_cap *cfg_mask;
1594 virtio_pci_modern_regions_init(proxy);
1596 virtio_pci_modern_mem_region_map(proxy, &proxy->common, &cap);
1597 virtio_pci_modern_mem_region_map(proxy, &proxy->isr, &cap);
1598 virtio_pci_modern_mem_region_map(proxy, &proxy->device, &cap);
1599 virtio_pci_modern_mem_region_map(proxy, &proxy->notify, ¬ify.cap);
1602 memory_region_init(&proxy->io_bar, OBJECT(proxy),
1603 "virtio-pci-io", 0x4);
1605 pci_register_bar(&proxy->pci_dev, proxy->modern_io_bar_idx,
1606 PCI_BASE_ADDRESS_SPACE_IO, &proxy->io_bar);
1608 virtio_pci_modern_io_region_map(proxy, &proxy->notify_pio,
1612 pci_register_bar(&proxy->pci_dev, proxy->modern_mem_bar_idx,
1613 PCI_BASE_ADDRESS_SPACE_MEMORY |
1614 PCI_BASE_ADDRESS_MEM_PREFETCH |
1615 PCI_BASE_ADDRESS_MEM_TYPE_64,
1616 &proxy->modern_bar);
1618 proxy->config_cap = virtio_pci_add_mem_cap(proxy, &cfg.cap);
1619 cfg_mask = (void *)(proxy->pci_dev.wmask + proxy->config_cap);
1620 pci_set_byte(&cfg_mask->cap.bar, ~0x0);
1621 pci_set_long((uint8_t *)&cfg_mask->cap.offset, ~0x0);
1622 pci_set_long((uint8_t *)&cfg_mask->cap.length, ~0x0);
1623 pci_set_long(cfg_mask->pci_cfg_data, ~0x0);
1626 if (proxy->nvectors) {
1627 int err = msix_init_exclusive_bar(&proxy->pci_dev, proxy->nvectors,
1628 proxy->msix_bar_idx, NULL);
1630 /* Notice when a system that supports MSIx can't initialize it */
1631 if (err != -ENOTSUP) {
1632 warn_report("unable to init msix vectors to %" PRIu32,
1635 proxy->nvectors = 0;
1639 proxy->pci_dev.config_write = virtio_write_config;
1640 proxy->pci_dev.config_read = virtio_read_config;
1643 size = VIRTIO_PCI_REGION_SIZE(&proxy->pci_dev)
1644 + virtio_bus_get_vdev_config_len(bus);
1645 size = pow2ceil(size);
1647 memory_region_init_io(&proxy->bar, OBJECT(proxy),
1648 &virtio_pci_config_ops,
1649 proxy, "virtio-pci", size);
1651 pci_register_bar(&proxy->pci_dev, proxy->legacy_io_bar_idx,
1652 PCI_BASE_ADDRESS_SPACE_IO, &proxy->bar);
1656 static void virtio_pci_device_unplugged(DeviceState *d)
1658 VirtIOPCIProxy *proxy = VIRTIO_PCI(d);
1659 bool modern = virtio_pci_modern(proxy);
1660 bool modern_pio = proxy->flags & VIRTIO_PCI_FLAG_MODERN_PIO_NOTIFY;
1662 virtio_pci_stop_ioeventfd(proxy);
1665 virtio_pci_modern_mem_region_unmap(proxy, &proxy->common);
1666 virtio_pci_modern_mem_region_unmap(proxy, &proxy->isr);
1667 virtio_pci_modern_mem_region_unmap(proxy, &proxy->device);
1668 virtio_pci_modern_mem_region_unmap(proxy, &proxy->notify);
1670 virtio_pci_modern_io_region_unmap(proxy, &proxy->notify_pio);
1675 static void virtio_pci_realize(PCIDevice *pci_dev, Error **errp)
1677 VirtIOPCIProxy *proxy = VIRTIO_PCI(pci_dev);
1678 VirtioPCIClass *k = VIRTIO_PCI_GET_CLASS(pci_dev);
1679 bool pcie_port = pci_bus_is_express(pci_get_bus(pci_dev)) &&
1680 !pci_bus_is_root(pci_get_bus(pci_dev));
1682 if (kvm_enabled() && !kvm_has_many_ioeventfds()) {
1683 proxy->flags &= ~VIRTIO_PCI_FLAG_USE_IOEVENTFD;
1687 * virtio pci bar layout used by default.
1688 * subclasses can re-arrange things if needed.
1690 * region 0 -- virtio legacy io bar
1691 * region 1 -- msi-x bar
1692 * region 4+5 -- virtio modern memory (64bit) bar
1695 proxy->legacy_io_bar_idx = 0;
1696 proxy->msix_bar_idx = 1;
1697 proxy->modern_io_bar_idx = 2;
1698 proxy->modern_mem_bar_idx = 4;
1700 proxy->common.offset = 0x0;
1701 proxy->common.size = 0x1000;
1702 proxy->common.type = VIRTIO_PCI_CAP_COMMON_CFG;
1704 proxy->isr.offset = 0x1000;
1705 proxy->isr.size = 0x1000;
1706 proxy->isr.type = VIRTIO_PCI_CAP_ISR_CFG;
1708 proxy->device.offset = 0x2000;
1709 proxy->device.size = 0x1000;
1710 proxy->device.type = VIRTIO_PCI_CAP_DEVICE_CFG;
1712 proxy->notify.offset = 0x3000;
1713 proxy->notify.size = virtio_pci_queue_mem_mult(proxy) * VIRTIO_QUEUE_MAX;
1714 proxy->notify.type = VIRTIO_PCI_CAP_NOTIFY_CFG;
1716 proxy->notify_pio.offset = 0x0;
1717 proxy->notify_pio.size = 0x4;
1718 proxy->notify_pio.type = VIRTIO_PCI_CAP_NOTIFY_CFG;
1720 /* subclasses can enforce modern, so do this unconditionally */
1721 memory_region_init(&proxy->modern_bar, OBJECT(proxy), "virtio-pci",
1722 /* PCI BAR regions must be powers of 2 */
1723 pow2ceil(proxy->notify.offset + proxy->notify.size));
1725 if ((proxy->disable_legacy == ON_OFF_AUTO_ON) ||
1726 ((proxy->disable_legacy == ON_OFF_AUTO_AUTO) && pcie_port)) {
1727 if (proxy->disable_modern) {
1728 error_setg(errp, "device cannot work as neither modern nor "
1729 "legacy mode is enabled");
1730 error_append_hint(errp, "Set either disable-modern or "
1731 "disable-legacy to off\n");
1734 proxy->mode = VIRTIO_PCI_MODE_MODERN;
1736 if (proxy->disable_modern) {
1737 proxy->mode = VIRTIO_PCI_MODE_LEGACY;
1739 proxy->mode = VIRTIO_PCI_MODE_TRANSITIONAL;
1743 if (pcie_port && pci_is_express(pci_dev)) {
1746 pos = pcie_endpoint_cap_init(pci_dev, 0);
1749 pos = pci_add_capability(pci_dev, PCI_CAP_ID_PM, 0,
1750 PCI_PM_SIZEOF, errp);
1755 pci_dev->exp.pm_cap = pos;
1758 * Indicates that this function complies with revision 1.2 of the
1759 * PCI Power Management Interface Specification.
1761 pci_set_word(pci_dev->config + pos + PCI_PM_PMC, 0x3);
1763 if (proxy->flags & VIRTIO_PCI_FLAG_INIT_DEVERR) {
1764 /* Init error enabling flags */
1765 pcie_cap_deverr_init(pci_dev);
1768 if (proxy->flags & VIRTIO_PCI_FLAG_INIT_LNKCTL) {
1769 /* Init Link Control Register */
1770 pcie_cap_lnkctl_init(pci_dev);
1773 if (proxy->flags & VIRTIO_PCI_FLAG_INIT_PM) {
1774 /* Init Power Management Control Register */
1775 pci_set_word(pci_dev->wmask + pos + PCI_PM_CTRL,
1776 PCI_PM_CTRL_STATE_MASK);
1779 if (proxy->flags & VIRTIO_PCI_FLAG_ATS) {
1780 pcie_ats_init(pci_dev, 256);
1785 * make future invocations of pci_is_express() return false
1786 * and pci_config_size() return PCI_CONFIG_SPACE_SIZE.
1788 pci_dev->cap_present &= ~QEMU_PCI_CAP_EXPRESS;
1791 virtio_pci_bus_new(&proxy->bus, sizeof(proxy->bus), proxy);
1793 k->realize(proxy, errp);
1797 static void virtio_pci_exit(PCIDevice *pci_dev)
1799 msix_uninit_exclusive_bar(pci_dev);
1802 static void virtio_pci_reset(DeviceState *qdev)
1804 VirtIOPCIProxy *proxy = VIRTIO_PCI(qdev);
1805 VirtioBusState *bus = VIRTIO_BUS(&proxy->bus);
1806 PCIDevice *dev = PCI_DEVICE(qdev);
1809 virtio_pci_stop_ioeventfd(proxy);
1810 virtio_bus_reset(bus);
1811 msix_unuse_all_vectors(&proxy->pci_dev);
1813 for (i = 0; i < VIRTIO_QUEUE_MAX; i++) {
1814 proxy->vqs[i].enabled = 0;
1815 proxy->vqs[i].num = 0;
1816 proxy->vqs[i].desc[0] = proxy->vqs[i].desc[1] = 0;
1817 proxy->vqs[i].avail[0] = proxy->vqs[i].avail[1] = 0;
1818 proxy->vqs[i].used[0] = proxy->vqs[i].used[1] = 0;
1821 if (pci_is_express(dev)) {
1822 pcie_cap_deverr_reset(dev);
1823 pcie_cap_lnkctl_reset(dev);
1825 pci_set_word(dev->config + dev->exp.pm_cap + PCI_PM_CTRL, 0);
1829 static Property virtio_pci_properties[] = {
1830 DEFINE_PROP_BIT("virtio-pci-bus-master-bug-migration", VirtIOPCIProxy, flags,
1831 VIRTIO_PCI_FLAG_BUS_MASTER_BUG_MIGRATION_BIT, false),
1832 DEFINE_PROP_BIT("migrate-extra", VirtIOPCIProxy, flags,
1833 VIRTIO_PCI_FLAG_MIGRATE_EXTRA_BIT, true),
1834 DEFINE_PROP_BIT("modern-pio-notify", VirtIOPCIProxy, flags,
1835 VIRTIO_PCI_FLAG_MODERN_PIO_NOTIFY_BIT, false),
1836 DEFINE_PROP_BIT("x-disable-pcie", VirtIOPCIProxy, flags,
1837 VIRTIO_PCI_FLAG_DISABLE_PCIE_BIT, false),
1838 DEFINE_PROP_BIT("page-per-vq", VirtIOPCIProxy, flags,
1839 VIRTIO_PCI_FLAG_PAGE_PER_VQ_BIT, false),
1840 DEFINE_PROP_BOOL("x-ignore-backend-features", VirtIOPCIProxy,
1841 ignore_backend_features, false),
1842 DEFINE_PROP_BIT("ats", VirtIOPCIProxy, flags,
1843 VIRTIO_PCI_FLAG_ATS_BIT, false),
1844 DEFINE_PROP_BIT("x-pcie-deverr-init", VirtIOPCIProxy, flags,
1845 VIRTIO_PCI_FLAG_INIT_DEVERR_BIT, true),
1846 DEFINE_PROP_BIT("x-pcie-lnkctl-init", VirtIOPCIProxy, flags,
1847 VIRTIO_PCI_FLAG_INIT_LNKCTL_BIT, true),
1848 DEFINE_PROP_BIT("x-pcie-pm-init", VirtIOPCIProxy, flags,
1849 VIRTIO_PCI_FLAG_INIT_PM_BIT, true),
1850 DEFINE_PROP_END_OF_LIST(),
1853 static void virtio_pci_dc_realize(DeviceState *qdev, Error **errp)
1855 VirtioPCIClass *vpciklass = VIRTIO_PCI_GET_CLASS(qdev);
1856 VirtIOPCIProxy *proxy = VIRTIO_PCI(qdev);
1857 PCIDevice *pci_dev = &proxy->pci_dev;
1859 if (!(proxy->flags & VIRTIO_PCI_FLAG_DISABLE_PCIE) &&
1860 virtio_pci_modern(proxy)) {
1861 pci_dev->cap_present |= QEMU_PCI_CAP_EXPRESS;
1864 vpciklass->parent_dc_realize(qdev, errp);
1867 static void virtio_pci_class_init(ObjectClass *klass, void *data)
1869 DeviceClass *dc = DEVICE_CLASS(klass);
1870 PCIDeviceClass *k = PCI_DEVICE_CLASS(klass);
1871 VirtioPCIClass *vpciklass = VIRTIO_PCI_CLASS(klass);
1873 dc->props = virtio_pci_properties;
1874 k->realize = virtio_pci_realize;
1875 k->exit = virtio_pci_exit;
1876 k->vendor_id = PCI_VENDOR_ID_REDHAT_QUMRANET;
1877 k->revision = VIRTIO_PCI_ABI_VERSION;
1878 k->class_id = PCI_CLASS_OTHERS;
1879 device_class_set_parent_realize(dc, virtio_pci_dc_realize,
1880 &vpciklass->parent_dc_realize);
1881 dc->reset = virtio_pci_reset;
1884 static const TypeInfo virtio_pci_info = {
1885 .name = TYPE_VIRTIO_PCI,
1886 .parent = TYPE_PCI_DEVICE,
1887 .instance_size = sizeof(VirtIOPCIProxy),
1888 .class_init = virtio_pci_class_init,
1889 .class_size = sizeof(VirtioPCIClass),
1893 static Property virtio_pci_generic_properties[] = {
1894 DEFINE_PROP_ON_OFF_AUTO("disable-legacy", VirtIOPCIProxy, disable_legacy,
1896 DEFINE_PROP_BOOL("disable-modern", VirtIOPCIProxy, disable_modern, false),
1897 DEFINE_PROP_END_OF_LIST(),
1900 static void virtio_pci_base_class_init(ObjectClass *klass, void *data)
1902 const VirtioPCIDeviceTypeInfo *t = data;
1903 if (t->class_init) {
1904 t->class_init(klass, NULL);
1908 static void virtio_pci_generic_class_init(ObjectClass *klass, void *data)
1910 DeviceClass *dc = DEVICE_CLASS(klass);
1912 dc->props = virtio_pci_generic_properties;
1915 /* Used when the generic type and the base type is the same */
1916 static void virtio_pci_generic_base_class_init(ObjectClass *klass, void *data)
1918 virtio_pci_base_class_init(klass, data);
1919 virtio_pci_generic_class_init(klass, NULL);
1922 static void virtio_pci_transitional_instance_init(Object *obj)
1924 VirtIOPCIProxy *proxy = VIRTIO_PCI(obj);
1926 proxy->disable_legacy = ON_OFF_AUTO_OFF;
1927 proxy->disable_modern = false;
1930 static void virtio_pci_non_transitional_instance_init(Object *obj)
1932 VirtIOPCIProxy *proxy = VIRTIO_PCI(obj);
1934 proxy->disable_legacy = ON_OFF_AUTO_ON;
1935 proxy->disable_modern = false;
1938 void virtio_pci_types_register(const VirtioPCIDeviceTypeInfo *t)
1940 TypeInfo base_type_info = {
1941 .name = t->base_name,
1942 .parent = t->parent ? t->parent : TYPE_VIRTIO_PCI,
1943 .instance_size = t->instance_size,
1944 .instance_init = t->instance_init,
1945 .class_size = t->class_size,
1946 .class_init = virtio_pci_base_class_init,
1947 .class_data = (void *)t,
1950 TypeInfo generic_type_info = {
1951 .name = t->generic_name,
1952 .parent = base_type_info.name,
1953 .class_init = virtio_pci_generic_class_init,
1954 .interfaces = (InterfaceInfo[]) {
1955 { INTERFACE_PCIE_DEVICE },
1956 { INTERFACE_CONVENTIONAL_PCI_DEVICE },
1961 if (!base_type_info.name) {
1962 /* No base type -> register a single generic device type */
1963 base_type_info.name = t->generic_name;
1964 base_type_info.class_init = virtio_pci_generic_base_class_init;
1965 base_type_info.interfaces = generic_type_info.interfaces;
1966 base_type_info.abstract = false;
1967 generic_type_info.name = NULL;
1968 assert(!t->non_transitional_name);
1969 assert(!t->transitional_name);
1972 type_register(&base_type_info);
1973 if (generic_type_info.name) {
1974 type_register(&generic_type_info);
1977 if (t->non_transitional_name) {
1978 const TypeInfo non_transitional_type_info = {
1979 .name = t->non_transitional_name,
1980 .parent = base_type_info.name,
1981 .instance_init = virtio_pci_non_transitional_instance_init,
1982 .interfaces = (InterfaceInfo[]) {
1983 { INTERFACE_PCIE_DEVICE },
1984 { INTERFACE_CONVENTIONAL_PCI_DEVICE },
1988 type_register(&non_transitional_type_info);
1991 if (t->transitional_name) {
1992 const TypeInfo transitional_type_info = {
1993 .name = t->transitional_name,
1994 .parent = base_type_info.name,
1995 .instance_init = virtio_pci_transitional_instance_init,
1996 .interfaces = (InterfaceInfo[]) {
1998 * Transitional virtio devices work only as Conventional PCI
1999 * devices because they require PIO ports.
2001 { INTERFACE_CONVENTIONAL_PCI_DEVICE },
2005 type_register(&transitional_type_info);
2009 /* virtio-pci-bus */
2011 static void virtio_pci_bus_new(VirtioBusState *bus, size_t bus_size,
2012 VirtIOPCIProxy *dev)
2014 DeviceState *qdev = DEVICE(dev);
2015 char virtio_bus_name[] = "virtio-bus";
2017 qbus_create_inplace(bus, bus_size, TYPE_VIRTIO_PCI_BUS, qdev,
2021 static void virtio_pci_bus_class_init(ObjectClass *klass, void *data)
2023 BusClass *bus_class = BUS_CLASS(klass);
2024 VirtioBusClass *k = VIRTIO_BUS_CLASS(klass);
2025 bus_class->max_dev = 1;
2026 k->notify = virtio_pci_notify;
2027 k->save_config = virtio_pci_save_config;
2028 k->load_config = virtio_pci_load_config;
2029 k->save_queue = virtio_pci_save_queue;
2030 k->load_queue = virtio_pci_load_queue;
2031 k->save_extra_state = virtio_pci_save_extra_state;
2032 k->load_extra_state = virtio_pci_load_extra_state;
2033 k->has_extra_state = virtio_pci_has_extra_state;
2034 k->query_guest_notifiers = virtio_pci_query_guest_notifiers;
2035 k->set_guest_notifiers = virtio_pci_set_guest_notifiers;
2036 k->set_host_notifier_mr = virtio_pci_set_host_notifier_mr;
2037 k->vmstate_change = virtio_pci_vmstate_change;
2038 k->pre_plugged = virtio_pci_pre_plugged;
2039 k->device_plugged = virtio_pci_device_plugged;
2040 k->device_unplugged = virtio_pci_device_unplugged;
2041 k->query_nvectors = virtio_pci_query_nvectors;
2042 k->ioeventfd_enabled = virtio_pci_ioeventfd_enabled;
2043 k->ioeventfd_assign = virtio_pci_ioeventfd_assign;
2044 k->get_dma_as = virtio_pci_get_dma_as;
2047 static const TypeInfo virtio_pci_bus_info = {
2048 .name = TYPE_VIRTIO_PCI_BUS,
2049 .parent = TYPE_VIRTIO_BUS,
2050 .instance_size = sizeof(VirtioPCIBusState),
2051 .class_init = virtio_pci_bus_class_init,
2054 static void virtio_pci_register_types(void)
2057 type_register_static(&virtio_pci_bus_info);
2058 type_register_static(&virtio_pci_info);
2061 type_init(virtio_pci_register_types)