// SPDX-License-Identifier: GPL-2.0
/*
 * Physical device callbacks for vfio_ccw
 *
 * Copyright IBM Corp. 2017
 * Copyright Red Hat, Inc. 2019
 */
13 #include <linux/vfio.h>
14 #include <linux/nospec.h>
15 #include <linux/slab.h>
17 #include "vfio_ccw_private.h"
19 static const struct vfio_device_ops vfio_ccw_dev_ops;
21 static int vfio_ccw_mdev_reset(struct vfio_ccw_private *private)
24 * If the FSM state is seen as Not Operational after closing
25 * and re-opening the mdev, return an error.
27 vfio_ccw_fsm_event(private, VFIO_CCW_EVENT_CLOSE);
28 vfio_ccw_fsm_event(private, VFIO_CCW_EVENT_OPEN);
29 if (private->state == VFIO_CCW_STATE_NOT_OPER)
35 static void vfio_ccw_dma_unmap(struct vfio_device *vdev, u64 iova, u64 length)
37 struct vfio_ccw_private *private =
38 container_of(vdev, struct vfio_ccw_private, vdev);
40 /* Drivers MUST unpin pages in response to an invalidation. */
41 if (!cp_iova_pinned(&private->cp, iova, length))
44 vfio_ccw_mdev_reset(private);
47 static int vfio_ccw_mdev_init_dev(struct vfio_device *vdev)
49 struct vfio_ccw_private *private =
50 container_of(vdev, struct vfio_ccw_private, vdev);
52 init_completion(&private->release_comp);
56 static int vfio_ccw_mdev_probe(struct mdev_device *mdev)
58 struct vfio_ccw_private *private = dev_get_drvdata(mdev->dev.parent);
61 if (private->state == VFIO_CCW_STATE_NOT_OPER)
64 ret = vfio_init_device(&private->vdev, &mdev->dev, &vfio_ccw_dev_ops);
68 VFIO_CCW_MSG_EVENT(2, "sch %x.%x.%04x: create\n",
69 private->sch->schid.cssid,
70 private->sch->schid.ssid,
71 private->sch->schid.sch_no);
73 ret = vfio_register_emulated_iommu_dev(&private->vdev);
76 dev_set_drvdata(&mdev->dev, private);
80 vfio_put_device(&private->vdev);
84 static void vfio_ccw_mdev_release_dev(struct vfio_device *vdev)
86 struct vfio_ccw_private *private =
87 container_of(vdev, struct vfio_ccw_private, vdev);
90 * We cannot free vfio_ccw_private here because it includes
91 * parent info which must be free'ed by css driver.
93 * Use a workaround by memset'ing the core device part and
94 * then notifying the remove path that all active references
95 * to this device have been released.
97 memset(vdev, 0, sizeof(*vdev));
98 complete(&private->release_comp);
101 static void vfio_ccw_mdev_remove(struct mdev_device *mdev)
103 struct vfio_ccw_private *private = dev_get_drvdata(mdev->dev.parent);
105 VFIO_CCW_MSG_EVENT(2, "sch %x.%x.%04x: remove\n",
106 private->sch->schid.cssid,
107 private->sch->schid.ssid,
108 private->sch->schid.sch_no);
110 vfio_unregister_group_dev(&private->vdev);
112 vfio_put_device(&private->vdev);
114 * Wait for all active references on mdev are released so it
115 * is safe to defer kfree() to a later point.
117 * TODO: the clean fix is to split parent/mdev info from ccw
118 * private structure so each can be managed in its own life
121 wait_for_completion(&private->release_comp);
124 static int vfio_ccw_mdev_open_device(struct vfio_device *vdev)
126 struct vfio_ccw_private *private =
127 container_of(vdev, struct vfio_ccw_private, vdev);
130 /* Device cannot simply be opened again from this state */
131 if (private->state == VFIO_CCW_STATE_NOT_OPER)
134 ret = vfio_ccw_register_async_dev_regions(private);
138 ret = vfio_ccw_register_schib_dev_regions(private);
142 ret = vfio_ccw_register_crw_dev_regions(private);
146 vfio_ccw_fsm_event(private, VFIO_CCW_EVENT_OPEN);
147 if (private->state == VFIO_CCW_STATE_NOT_OPER) {
155 vfio_ccw_unregister_dev_regions(private);
159 static void vfio_ccw_mdev_close_device(struct vfio_device *vdev)
161 struct vfio_ccw_private *private =
162 container_of(vdev, struct vfio_ccw_private, vdev);
164 vfio_ccw_fsm_event(private, VFIO_CCW_EVENT_CLOSE);
165 vfio_ccw_unregister_dev_regions(private);
168 static ssize_t vfio_ccw_mdev_read_io_region(struct vfio_ccw_private *private,
169 char __user *buf, size_t count,
172 loff_t pos = *ppos & VFIO_CCW_OFFSET_MASK;
173 struct ccw_io_region *region;
176 if (pos + count > sizeof(*region))
179 mutex_lock(&private->io_mutex);
180 region = private->io_region;
181 if (copy_to_user(buf, (void *)region + pos, count))
185 mutex_unlock(&private->io_mutex);
189 static ssize_t vfio_ccw_mdev_read(struct vfio_device *vdev,
194 struct vfio_ccw_private *private =
195 container_of(vdev, struct vfio_ccw_private, vdev);
196 unsigned int index = VFIO_CCW_OFFSET_TO_INDEX(*ppos);
198 if (index >= VFIO_CCW_NUM_REGIONS + private->num_regions)
202 case VFIO_CCW_CONFIG_REGION_INDEX:
203 return vfio_ccw_mdev_read_io_region(private, buf, count, ppos);
205 index -= VFIO_CCW_NUM_REGIONS;
206 return private->region[index].ops->read(private, buf, count,
213 static ssize_t vfio_ccw_mdev_write_io_region(struct vfio_ccw_private *private,
214 const char __user *buf,
215 size_t count, loff_t *ppos)
217 loff_t pos = *ppos & VFIO_CCW_OFFSET_MASK;
218 struct ccw_io_region *region;
221 if (pos + count > sizeof(*region))
224 if (!mutex_trylock(&private->io_mutex))
227 region = private->io_region;
228 if (copy_from_user((void *)region + pos, buf, count)) {
233 vfio_ccw_fsm_event(private, VFIO_CCW_EVENT_IO_REQ);
234 ret = (region->ret_code != 0) ? region->ret_code : count;
237 mutex_unlock(&private->io_mutex);
241 static ssize_t vfio_ccw_mdev_write(struct vfio_device *vdev,
242 const char __user *buf,
246 struct vfio_ccw_private *private =
247 container_of(vdev, struct vfio_ccw_private, vdev);
248 unsigned int index = VFIO_CCW_OFFSET_TO_INDEX(*ppos);
250 if (index >= VFIO_CCW_NUM_REGIONS + private->num_regions)
254 case VFIO_CCW_CONFIG_REGION_INDEX:
255 return vfio_ccw_mdev_write_io_region(private, buf, count, ppos);
257 index -= VFIO_CCW_NUM_REGIONS;
258 return private->region[index].ops->write(private, buf, count,
265 static int vfio_ccw_mdev_get_device_info(struct vfio_ccw_private *private,
266 struct vfio_device_info *info)
268 info->flags = VFIO_DEVICE_FLAGS_CCW | VFIO_DEVICE_FLAGS_RESET;
269 info->num_regions = VFIO_CCW_NUM_REGIONS + private->num_regions;
270 info->num_irqs = VFIO_CCW_NUM_IRQS;
275 static int vfio_ccw_mdev_get_region_info(struct vfio_ccw_private *private,
276 struct vfio_region_info *info,
281 switch (info->index) {
282 case VFIO_CCW_CONFIG_REGION_INDEX:
284 info->size = sizeof(struct ccw_io_region);
285 info->flags = VFIO_REGION_INFO_FLAG_READ
286 | VFIO_REGION_INFO_FLAG_WRITE;
288 default: /* all other regions are handled via capability chain */
290 struct vfio_info_cap caps = { .buf = NULL, .size = 0 };
291 struct vfio_region_info_cap_type cap_type = {
292 .header.id = VFIO_REGION_INFO_CAP_TYPE,
293 .header.version = 1 };
297 VFIO_CCW_NUM_REGIONS + private->num_regions)
300 info->index = array_index_nospec(info->index,
301 VFIO_CCW_NUM_REGIONS +
302 private->num_regions);
304 i = info->index - VFIO_CCW_NUM_REGIONS;
306 info->offset = VFIO_CCW_INDEX_TO_OFFSET(info->index);
307 info->size = private->region[i].size;
308 info->flags = private->region[i].flags;
310 cap_type.type = private->region[i].type;
311 cap_type.subtype = private->region[i].subtype;
313 ret = vfio_info_add_capability(&caps, &cap_type.header,
318 info->flags |= VFIO_REGION_INFO_FLAG_CAPS;
319 if (info->argsz < sizeof(*info) + caps.size) {
320 info->argsz = sizeof(*info) + caps.size;
321 info->cap_offset = 0;
323 vfio_info_cap_shift(&caps, sizeof(*info));
324 if (copy_to_user((void __user *)arg + sizeof(*info),
325 caps.buf, caps.size)) {
329 info->cap_offset = sizeof(*info);
339 static int vfio_ccw_mdev_get_irq_info(struct vfio_irq_info *info)
341 switch (info->index) {
342 case VFIO_CCW_IO_IRQ_INDEX:
343 case VFIO_CCW_CRW_IRQ_INDEX:
344 case VFIO_CCW_REQ_IRQ_INDEX:
346 info->flags = VFIO_IRQ_INFO_EVENTFD;
355 static int vfio_ccw_mdev_set_irqs(struct vfio_ccw_private *private,
360 struct eventfd_ctx **ctx;
362 if (!(flags & VFIO_IRQ_SET_ACTION_TRIGGER))
366 case VFIO_CCW_IO_IRQ_INDEX:
367 ctx = &private->io_trigger;
369 case VFIO_CCW_CRW_IRQ_INDEX:
370 ctx = &private->crw_trigger;
372 case VFIO_CCW_REQ_IRQ_INDEX:
373 ctx = &private->req_trigger;
379 switch (flags & VFIO_IRQ_SET_DATA_TYPE_MASK) {
380 case VFIO_IRQ_SET_DATA_NONE:
383 eventfd_signal(*ctx, 1);
386 case VFIO_IRQ_SET_DATA_BOOL:
390 if (get_user(trigger, (uint8_t __user *)data))
394 eventfd_signal(*ctx, 1);
397 case VFIO_IRQ_SET_DATA_EVENTFD:
401 if (get_user(fd, (int32_t __user *)data))
406 eventfd_ctx_put(*ctx);
408 } else if (fd >= 0) {
409 struct eventfd_ctx *efdctx;
411 efdctx = eventfd_ctx_fdget(fd);
413 return PTR_ERR(efdctx);
416 eventfd_ctx_put(*ctx);
429 int vfio_ccw_register_dev_region(struct vfio_ccw_private *private,
430 unsigned int subtype,
431 const struct vfio_ccw_regops *ops,
432 size_t size, u32 flags, void *data)
434 struct vfio_ccw_region *region;
436 region = krealloc(private->region,
437 (private->num_regions + 1) * sizeof(*region),
442 private->region = region;
443 private->region[private->num_regions].type = VFIO_REGION_TYPE_CCW;
444 private->region[private->num_regions].subtype = subtype;
445 private->region[private->num_regions].ops = ops;
446 private->region[private->num_regions].size = size;
447 private->region[private->num_regions].flags = flags;
448 private->region[private->num_regions].data = data;
450 private->num_regions++;
455 void vfio_ccw_unregister_dev_regions(struct vfio_ccw_private *private)
459 for (i = 0; i < private->num_regions; i++)
460 private->region[i].ops->release(private, &private->region[i]);
461 private->num_regions = 0;
462 kfree(private->region);
463 private->region = NULL;
466 static ssize_t vfio_ccw_mdev_ioctl(struct vfio_device *vdev,
470 struct vfio_ccw_private *private =
471 container_of(vdev, struct vfio_ccw_private, vdev);
476 case VFIO_DEVICE_GET_INFO:
478 struct vfio_device_info info;
480 minsz = offsetofend(struct vfio_device_info, num_irqs);
482 if (copy_from_user(&info, (void __user *)arg, minsz))
485 if (info.argsz < minsz)
488 ret = vfio_ccw_mdev_get_device_info(private, &info);
492 return copy_to_user((void __user *)arg, &info, minsz) ? -EFAULT : 0;
494 case VFIO_DEVICE_GET_REGION_INFO:
496 struct vfio_region_info info;
498 minsz = offsetofend(struct vfio_region_info, offset);
500 if (copy_from_user(&info, (void __user *)arg, minsz))
503 if (info.argsz < minsz)
506 ret = vfio_ccw_mdev_get_region_info(private, &info, arg);
510 return copy_to_user((void __user *)arg, &info, minsz) ? -EFAULT : 0;
512 case VFIO_DEVICE_GET_IRQ_INFO:
514 struct vfio_irq_info info;
516 minsz = offsetofend(struct vfio_irq_info, count);
518 if (copy_from_user(&info, (void __user *)arg, minsz))
521 if (info.argsz < minsz || info.index >= VFIO_CCW_NUM_IRQS)
524 ret = vfio_ccw_mdev_get_irq_info(&info);
528 if (info.count == -1)
531 return copy_to_user((void __user *)arg, &info, minsz) ? -EFAULT : 0;
533 case VFIO_DEVICE_SET_IRQS:
535 struct vfio_irq_set hdr;
539 minsz = offsetofend(struct vfio_irq_set, count);
541 if (copy_from_user(&hdr, (void __user *)arg, minsz))
544 ret = vfio_set_irqs_validate_and_prepare(&hdr, 1,
550 data = (void __user *)(arg + minsz);
551 return vfio_ccw_mdev_set_irqs(private, hdr.flags, hdr.index,
554 case VFIO_DEVICE_RESET:
555 return vfio_ccw_mdev_reset(private);
561 /* Request removal of the device*/
562 static void vfio_ccw_mdev_request(struct vfio_device *vdev, unsigned int count)
564 struct vfio_ccw_private *private =
565 container_of(vdev, struct vfio_ccw_private, vdev);
566 struct device *dev = vdev->dev;
568 if (private->req_trigger) {
570 dev_notice_ratelimited(dev,
571 "Relaying device request to user (#%u)\n",
574 eventfd_signal(private->req_trigger, 1);
575 } else if (count == 0) {
577 "No device request channel registered, blocked until released by user\n");
581 static const struct vfio_device_ops vfio_ccw_dev_ops = {
582 .init = vfio_ccw_mdev_init_dev,
583 .release = vfio_ccw_mdev_release_dev,
584 .open_device = vfio_ccw_mdev_open_device,
585 .close_device = vfio_ccw_mdev_close_device,
586 .read = vfio_ccw_mdev_read,
587 .write = vfio_ccw_mdev_write,
588 .ioctl = vfio_ccw_mdev_ioctl,
589 .request = vfio_ccw_mdev_request,
590 .dma_unmap = vfio_ccw_dma_unmap,
593 struct mdev_driver vfio_ccw_mdev_driver = {
594 .device_api = VFIO_DEVICE_API_CCW_STRING,
597 .name = "vfio_ccw_mdev",
598 .owner = THIS_MODULE,
599 .mod_name = KBUILD_MODNAME,
601 .probe = vfio_ccw_mdev_probe,
602 .remove = vfio_ccw_mdev_remove,