/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * VFIO API definition
 *
 * Copyright (C) 2012 Red Hat, Inc.  All rights reserved.
 *     Author: Alex Williamson <alex.williamson@redhat.com>
 */
8#ifndef VFIO_H
9#define VFIO_H
10
Alex Williamsoncba33452012-07-31 08:16:22 -060011
12#include <linux/iommu.h>
13#include <linux/mm.h>
Antonios Motakis7e992d62015-03-16 14:08:54 -060014#include <linux/workqueue.h>
15#include <linux/poll.h>
David Howells607ca462012-10-13 10:46:48 +010016#include <uapi/linux/vfio.h>
Yishai Hadas80c4b922022-09-08 21:34:43 +030017#include <linux/iova_bitmap.h>
Alex Williamsoncba33452012-07-31 08:16:22 -060018
Jason Gunthorpeba70a892022-05-04 16:14:44 -030019struct kvm;
20
Jason Gunthorpe2fd585f2021-08-05 22:19:00 -030021/*
22 * VFIO devices can be placed in a set, this allows all devices to share this
23 * structure and the VFIO core will provide a lock that is held around
24 * open_device()/close_device() for all devices in the set.
25 */
26struct vfio_device_set {
27 void *set_id;
28 struct mutex lock;
29 struct list_head device_list;
30 unsigned int device_count;
31};
32
Jason Gunthorpe0bfc6a42021-03-30 09:53:05 -060033struct vfio_device {
34 struct device *dev;
35 const struct vfio_device_ops *ops;
Yishai Hadas6e97eba2022-06-28 18:59:10 +030036 /*
Yishai Hadas80c4b922022-09-08 21:34:43 +030037 * mig_ops/log_ops is a static property of the vfio_device which must
38 * be set prior to registering the vfio_device.
Yishai Hadas6e97eba2022-06-28 18:59:10 +030039 */
40 const struct vfio_migration_ops *mig_ops;
Yishai Hadas80c4b922022-09-08 21:34:43 +030041 const struct vfio_log_ops *log_ops;
Jason Gunthorpe0bfc6a42021-03-30 09:53:05 -060042 struct vfio_group *group;
Jason Gunthorpe2fd585f2021-08-05 22:19:00 -030043 struct vfio_device_set *dev_set;
44 struct list_head dev_set_list;
Jason Gunthorpe8cb3d832022-02-24 16:20:19 +020045 unsigned int migration_flags;
Matthew Rosato421cfe62022-05-19 14:33:11 -040046 /* Driver must reference the kvm during open_device or never touch it */
47 struct kvm *kvm;
Jason Gunthorpe0bfc6a42021-03-30 09:53:05 -060048
49 /* Members below here are private, not for driver use */
Yi Liu3c28a762022-09-21 18:44:01 +080050 unsigned int index;
51 struct device device; /* device.kref covers object life circle */
Kevin Tiancb9ff3f2022-09-21 18:43:47 +080052 refcount_t refcount; /* user count on registered device*/
Jason Gunthorpe2fd585f2021-08-05 22:19:00 -030053 unsigned int open_count;
Jason Gunthorpe0bfc6a42021-03-30 09:53:05 -060054 struct completion comp;
55 struct list_head group_next;
Jason Gunthorpe8cfc5b62022-07-19 21:02:49 -030056 struct list_head iommu_entry;
Jason Gunthorpe0bfc6a42021-03-30 09:53:05 -060057};
58
Alex Williamsoncba33452012-07-31 08:16:22 -060059/**
60 * struct vfio_device_ops - VFIO bus driver device callbacks
61 *
Kevin Tiancb9ff3f2022-09-21 18:43:47 +080062 * @init: initialize private fields in device structure
63 * @release: Reclaim private fields in device structure
Jason Gunthorpe2fd585f2021-08-05 22:19:00 -030064 * @open_device: Called when the first file descriptor is opened for this device
65 * @close_device: Opposite of open_device
Alex Williamsoncba33452012-07-31 08:16:22 -060066 * @read: Perform read(2) on device file descriptor
67 * @write: Perform write(2) on device file descriptor
68 * @ioctl: Perform ioctl(2) on device file descriptor, supporting VFIO_DEVICE_*
69 * operations documented below
70 * @mmap: Perform mmap(2) on a region of the device file descriptor
Alex Williamson13060b62015-02-06 15:05:07 -070071 * @request: Request for the bus driver to release the device
Alex Williamson5f3874c2020-03-24 09:28:25 -060072 * @match: Optional device name match callback (return: 0 for no-match, >0 for
73 * match, -errno for abort (ex. match with insufficient or incorrect
74 * additional args)
Jason Gunthorpece4b46572022-07-19 21:02:48 -030075 * @dma_unmap: Called when userspace unmaps IOVA from the container
76 * this device is attached to.
Jason Gunthorpe445ad492022-02-24 16:20:17 +020077 * @device_feature: Optional, fill in the VFIO_DEVICE_FEATURE ioctl
Alex Williamsoncba33452012-07-31 08:16:22 -060078 */
79struct vfio_device_ops {
80 char *name;
Kevin Tiancb9ff3f2022-09-21 18:43:47 +080081 int (*init)(struct vfio_device *vdev);
82 void (*release)(struct vfio_device *vdev);
Jason Gunthorpe2fd585f2021-08-05 22:19:00 -030083 int (*open_device)(struct vfio_device *vdev);
84 void (*close_device)(struct vfio_device *vdev);
Jason Gunthorpe6df62c52021-03-30 09:53:08 -060085 ssize_t (*read)(struct vfio_device *vdev, char __user *buf,
Alex Williamsoncba33452012-07-31 08:16:22 -060086 size_t count, loff_t *ppos);
Jason Gunthorpe6df62c52021-03-30 09:53:08 -060087 ssize_t (*write)(struct vfio_device *vdev, const char __user *buf,
Alex Williamsoncba33452012-07-31 08:16:22 -060088 size_t count, loff_t *size);
Jason Gunthorpe6df62c52021-03-30 09:53:08 -060089 long (*ioctl)(struct vfio_device *vdev, unsigned int cmd,
Alex Williamsoncba33452012-07-31 08:16:22 -060090 unsigned long arg);
Jason Gunthorpe6df62c52021-03-30 09:53:08 -060091 int (*mmap)(struct vfio_device *vdev, struct vm_area_struct *vma);
92 void (*request)(struct vfio_device *vdev, unsigned int count);
93 int (*match)(struct vfio_device *vdev, char *buf);
Jason Gunthorpece4b46572022-07-19 21:02:48 -030094 void (*dma_unmap)(struct vfio_device *vdev, u64 iova, u64 length);
Jason Gunthorpe445ad492022-02-24 16:20:17 +020095 int (*device_feature)(struct vfio_device *device, u32 flags,
96 void __user *arg, size_t argsz);
Yishai Hadas6e97eba2022-06-28 18:59:10 +030097};
98
/**
 * struct vfio_migration_ops - VFIO bus device driver migration callbacks
 *
 * @migration_set_state: Optional callback to change the migration state for
 *         devices that support migration. It's mandatory for
 *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
 *         The returned FD is used for data transfer according to the FSM
 *         definition. The driver is responsible to ensure that FD reaches end
 *         of stream or error whenever the migration FSM leaves a data transfer
 *         state or before close_device() returns.
 * @migration_get_state: Optional callback to get the migration state for
 *         devices that support migration. It's mandatory for
 *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
 */
struct vfio_migration_ops {
	struct file *(*migration_set_state)(
		struct vfio_device *device,
		enum vfio_device_mig_state new_state);
	int (*migration_get_state)(struct vfio_device *device,
				   enum vfio_device_mig_state *curr_state);
};

Jason Gunthorpe445ad492022-02-24 16:20:17 +0200119/**
Yishai Hadas80c4b922022-09-08 21:34:43 +0300120 * @log_start: Optional callback to ask the device start DMA logging.
121 * @log_stop: Optional callback to ask the device stop DMA logging.
122 * @log_read_and_clear: Optional callback to ask the device read
123 * and clear the dirty DMAs in some given range.
124 *
125 * The vfio core implementation of the DEVICE_FEATURE_DMA_LOGGING_ set
126 * of features does not track logging state relative to the device,
127 * therefore the device implementation of vfio_log_ops must handle
128 * arbitrary user requests. This includes rejecting subsequent calls
129 * to log_start without an intervening log_stop, as well as graceful
130 * handling of log_stop and log_read_and_clear from invalid states.
131 */
132struct vfio_log_ops {
133 int (*log_start)(struct vfio_device *device,
134 struct rb_root_cached *ranges, u32 nnodes, u64 *page_size);
135 int (*log_stop)(struct vfio_device *device);
136 int (*log_read_and_clear)(struct vfio_device *device,
137 unsigned long iova, unsigned long length,
138 struct iova_bitmap *dirty);
139};
140
141/**
Jason Gunthorpe445ad492022-02-24 16:20:17 +0200142 * vfio_check_feature - Validate user input for the VFIO_DEVICE_FEATURE ioctl
143 * @flags: Arg from the device_feature op
144 * @argsz: Arg from the device_feature op
145 * @supported_ops: Combination of VFIO_DEVICE_FEATURE_GET and SET the driver
146 * supports
147 * @minsz: Minimum data size the driver accepts
148 *
149 * For use in a driver's device_feature op. Checks that the inputs to the
150 * VFIO_DEVICE_FEATURE ioctl are correct for the driver's feature. Returns 1 if
151 * the driver should execute the get or set, otherwise the relevant
152 * value should be returned.
153 */
154static inline int vfio_check_feature(u32 flags, size_t argsz, u32 supported_ops,
155 size_t minsz)
156{
157 if ((flags & (VFIO_DEVICE_FEATURE_GET | VFIO_DEVICE_FEATURE_SET)) &
158 ~supported_ops)
159 return -EINVAL;
160 if (flags & VFIO_DEVICE_FEATURE_PROBE)
161 return 0;
162 /* Without PROBE one of GET or SET must be requested */
163 if (!(flags & (VFIO_DEVICE_FEATURE_GET | VFIO_DEVICE_FEATURE_SET)))
164 return -EINVAL;
165 if (argsz < minsz)
166 return -EINVAL;
167 return 1;
168}
169
struct vfio_device *_vfio_alloc_device(size_t size, struct device *dev,
				       const struct vfio_device_ops *ops);
/*
 * Wrapper around _vfio_alloc_device() for a driver structure that embeds a
 * struct vfio_device as @member.  The BUILD_BUG_ON_ZERO(offsetof(...)) term
 * adds 0 to the size and fails the build unless @member sits at offset 0 of
 * struct @dev_struct; container_of() then converts the returned pointer to
 * a struct @dev_struct pointer.
 */
#define vfio_alloc_device(dev_struct, member, dev, ops)				\
	container_of(_vfio_alloc_device(sizeof(struct dev_struct) +		\
					BUILD_BUG_ON_ZERO(offsetof(		\
						struct dev_struct, member)),	\
				       dev, ops),				\
		     struct dev_struct, member)

179int vfio_init_device(struct vfio_device *device, struct device *dev,
180 const struct vfio_device_ops *ops);
181void vfio_free_device(struct vfio_device *device);
Kevin Tiancb9ff3f2022-09-21 18:43:47 +0800182static inline void vfio_put_device(struct vfio_device *device)
183{
Yi Liu3c28a762022-09-21 18:44:01 +0800184 put_device(&device->device);
Kevin Tiancb9ff3f2022-09-21 18:43:47 +0800185}
186
int vfio_register_group_dev(struct vfio_device *device);
int vfio_register_emulated_iommu_dev(struct vfio_device *device);
void vfio_unregister_group_dev(struct vfio_device *device);

int vfio_assign_device_set(struct vfio_device *device, void *set_id);
unsigned int vfio_device_set_open_count(struct vfio_device_set *dev_set);

int vfio_mig_get_next_state(struct vfio_device *device,
			    enum vfio_device_mig_state cur_fsm,
			    enum vfio_device_mig_state new_fsm,
			    enum vfio_device_mig_state *next_fsm);

Alexey Kardashevskiy6cdd97822013-08-05 10:52:36 -0600199/*
200 * External user API
201 */
Alex Williamsond1877e62022-06-08 12:55:13 -0600202struct iommu_group *vfio_file_iommu_group(struct file *file);
Jason Gunthorpe4b22ef02022-10-07 11:04:39 -0300203bool vfio_file_is_group(struct file *file);
Alex Williamsond1877e62022-06-08 12:55:13 -0600204bool vfio_file_enforced_coherent(struct file *file);
205void vfio_file_set_kvm(struct file *file, struct kvm *kvm);
206bool vfio_file_has_dev(struct file *file, struct vfio_device *device);
Alexey Kardashevskiy6cdd97822013-08-05 10:52:36 -0600207
Kirti Wankhede21690372016-11-17 02:16:17 +0530208#define VFIO_PIN_PAGES_MAX_ENTRIES (PAGE_SIZE/sizeof(unsigned long))
209
Nicolin Chen44abdd12022-07-22 19:02:51 -0700210int vfio_pin_pages(struct vfio_device *device, dma_addr_t iova,
Nicolin Chen34a255e62022-07-22 19:02:56 -0700211 int npage, int prot, struct page **pages);
Nicolin Chen44abdd12022-07-22 19:02:51 -0700212void vfio_unpin_pages(struct vfio_device *device, dma_addr_t iova, int npage);
Nicolin Chen8561aa42022-07-22 19:02:54 -0700213int vfio_dma_rw(struct vfio_device *device, dma_addr_t iova,
Alex Williamsond1877e62022-06-08 12:55:13 -0600214 void *data, size_t len, bool write);
Yan Zhao8d46c0c2020-03-24 09:27:57 -0600215
Alex Williamsond7a8d5e2016-02-22 16:02:33 -0700216/*
217 * Sub-module helpers
218 */
219struct vfio_info_cap {
220 struct vfio_info_cap_header *buf;
221 size_t size;
222};
Alex Williamsond1877e62022-06-08 12:55:13 -0600223struct vfio_info_cap_header *vfio_info_cap_add(struct vfio_info_cap *caps,
224 size_t size, u16 id,
225 u16 version);
226void vfio_info_cap_shift(struct vfio_info_cap *caps, size_t offset);
Alex Williamsond7a8d5e2016-02-22 16:02:33 -0700227
Alex Williamsond1877e62022-06-08 12:55:13 -0600228int vfio_info_add_capability(struct vfio_info_cap *caps,
229 struct vfio_info_cap_header *cap, size_t size);
Kirti Wankhedeb3c0a862016-11-17 02:16:25 +0530230
Alex Williamsond1877e62022-06-08 12:55:13 -0600231int vfio_set_irqs_validate_and_prepare(struct vfio_irq_set *hdr,
232 int num_irqs, int max_irq_type,
233 size_t *data_size);
Kirti Wankhedec747f08a2016-11-17 02:16:27 +0530234
Gavin Shan92d18a62014-08-08 10:36:20 -0600235struct pci_dev;
Murilo Opsfelder Araujobb67b492017-07-18 14:22:20 -0300236#if IS_ENABLED(CONFIG_VFIO_SPAPR_EEH)
Alex Williamsond1877e62022-06-08 12:55:13 -0600237void vfio_spapr_pci_eeh_open(struct pci_dev *pdev);
238void vfio_spapr_pci_eeh_release(struct pci_dev *pdev);
239long vfio_spapr_iommu_eeh_ioctl(struct iommu_group *group, unsigned int cmd,
240 unsigned long arg);
Gavin Shan1b69be52014-06-10 11:41:57 +1000241#else
Alexey Kardashevskiy9b936c92014-08-08 10:39:16 -0600242static inline void vfio_spapr_pci_eeh_open(struct pci_dev *pdev)
Gavin Shan1b69be52014-06-10 11:41:57 +1000243{
Gavin Shan1b69be52014-06-10 11:41:57 +1000244}
245
246static inline void vfio_spapr_pci_eeh_release(struct pci_dev *pdev)
247{
248}
249
250static inline long vfio_spapr_iommu_eeh_ioctl(struct iommu_group *group,
251 unsigned int cmd,
252 unsigned long arg)
253{
254 return -ENOTTY;
255}
Murilo Opsfelder Araujobb67b492017-07-18 14:22:20 -0300256#endif /* CONFIG_VFIO_SPAPR_EEH */
Antonios Motakis7e992d62015-03-16 14:08:54 -0600257
258/*
259 * IRQfd - generic
260 */
261struct virqfd {
262 void *opaque;
263 struct eventfd_ctx *eventfd;
264 int (*handler)(void *, void *);
265 void (*thread)(void *, void *);
266 void *data;
267 struct work_struct inject;
Ingo Molnarac6424b2017-06-20 12:06:13 +0200268 wait_queue_entry_t wait;
Antonios Motakis7e992d62015-03-16 14:08:54 -0600269 poll_table pt;
270 struct work_struct shutdown;
Alex Williamson33dc33f2024-03-29 15:38:51 -0600271 struct work_struct flush_inject;
Antonios Motakis7e992d62015-03-16 14:08:54 -0600272 struct virqfd **pvirqfd;
273};
274
Alex Williamsond1877e62022-06-08 12:55:13 -0600275int vfio_virqfd_enable(void *opaque, int (*handler)(void *, void *),
276 void (*thread)(void *, void *), void *data,
277 struct virqfd **pvirqfd, int fd);
278void vfio_virqfd_disable(struct virqfd **pvirqfd);
Alex Williamson33dc33f2024-03-29 15:38:51 -0600279void vfio_virqfd_flush_thread(struct virqfd **pvirqfd);
Antonios Motakis7e992d62015-03-16 14:08:54 -0600280
Alex Williamsoncba33452012-07-31 08:16:22 -0600281#endif /* VFIO_H */