Merge tag 'mm-hotfixes-stable-2025-07-11-16-16' of git://git.kernel.org/pub/scm/linux...
[linux-block.git] / include / linux / vfio.h
CommitLineData
/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * VFIO API definition
 *
 * Copyright (C) 2012 Red Hat, Inc.  All rights reserved.
 *     Author: Alex Williamson <alex.williamson@redhat.com>
 */
8#ifndef VFIO_H
9#define VFIO_H
10
cba3345c
AW
11
12#include <linux/iommu.h>
13#include <linux/mm.h>
7e992d69
AM
14#include <linux/workqueue.h>
15#include <linux/poll.h>
8b6f173a 16#include <linux/cdev.h>
607ca46e 17#include <uapi/linux/vfio.h>
80c4b92a 18#include <linux/iova_bitmap.h>
cba3345c 19
/* Forward declarations: only pointers to these types are used in this header. */
struct kvm;
struct iommufd_ctx;
struct iommufd_device;
struct iommufd_access;
ba70a89f 24
2fd585f4
JG
25/*
26 * VFIO devices can be placed in a set, this allows all devices to share this
27 * structure and the VFIO core will provide a lock that is held around
28 * open_device()/close_device() for all devices in the set.
29 */
30struct vfio_device_set {
31 void *set_id;
32 struct mutex lock;
33 struct list_head device_list;
34 unsigned int device_count;
35};
36
0bfc6a4e
JG
37struct vfio_device {
38 struct device *dev;
39 const struct vfio_device_ops *ops;
6e97eba8 40 /*
80c4b92a
YH
41 * mig_ops/log_ops is a static property of the vfio_device which must
42 * be set prior to registering the vfio_device.
6e97eba8
YH
43 */
44 const struct vfio_migration_ops *mig_ops;
80c4b92a 45 const struct vfio_log_ops *log_ops;
c1cce6d0 46#if IS_ENABLED(CONFIG_VFIO_GROUP)
0bfc6a4e 47 struct vfio_group *group;
c1cce6d0
YL
48 struct list_head group_next;
49 struct list_head iommu_entry;
50#endif
2fd585f4
JG
51 struct vfio_device_set *dev_set;
52 struct list_head dev_set_list;
8cb3d83b 53 unsigned int migration_flags;
421cfe65 54 struct kvm *kvm;
0bfc6a4e
JG
55
56 /* Members below here are private, not for driver use */
3c28a761
YL
57 unsigned int index;
58 struct device device; /* device.kref covers object life circle */
8b6f173a
YL
59#if IS_ENABLED(CONFIG_VFIO_DEVICE_CDEV)
60 struct cdev cdev;
61#endif
cb9ff3f3 62 refcount_t refcount; /* user count on registered device*/
2fd585f4 63 unsigned int open_count;
0bfc6a4e 64 struct completion comp;
4741f2e9 65 struct iommufd_access *iommufd_access;
2b48f52f 66 void (*put_kvm)(struct kvm *kvm);
b7c5e64f 67 struct inode *inode;
a4d1f91d
JG
68#if IS_ENABLED(CONFIG_IOMMUFD)
69 struct iommufd_device *iommufd_device;
29064134 70 struct ida pasids;
5fcc2696 71 u8 iommufd_attached:1;
a4d1f91d 72#endif
5fcc2696 73 u8 cdev_opened:1;
2202844e
LL
74#ifdef CONFIG_DEBUG_FS
75 /*
76 * debug_root is a static property of the vfio_device
77 * which must be set prior to registering the vfio_device.
78 */
79 struct dentry *debug_root;
80#endif
0bfc6a4e
JG
81};
82
cba3345c
AW
83/**
84 * struct vfio_device_ops - VFIO bus driver device callbacks
85 *
38e4614c 86 * @name: Name of the device driver.
cb9ff3f3
KT
87 * @init: initialize private fields in device structure
88 * @release: Reclaim private fields in device structure
fae90680
YL
89 * @bind_iommufd: Called when binding the device to an iommufd
90 * @unbind_iommufd: Opposite of bind_iommufd
91 * @attach_ioas: Called when attaching device to an IOAS/HWPT managed by the
9048c734
YL
92 * bound iommufd. Undo in unbind_iommufd if @detach_ioas is not
93 * called.
94 * @detach_ioas: Opposite of attach_ioas
29064134
YL
95 * @pasid_attach_ioas: The pasid variation of attach_ioas
96 * @pasid_detach_ioas: Opposite of pasid_attach_ioas
2fd585f4
JG
97 * @open_device: Called when the first file descriptor is opened for this device
98 * @close_device: Opposite of open_device
cba3345c
AW
99 * @read: Perform read(2) on device file descriptor
100 * @write: Perform write(2) on device file descriptor
101 * @ioctl: Perform ioctl(2) on device file descriptor, supporting VFIO_DEVICE_*
102 * operations documented below
103 * @mmap: Perform mmap(2) on a region of the device file descriptor
13060b64 104 * @request: Request for the bus driver to release the device
5f3874c2
AW
105 * @match: Optional device name match callback (return: 0 for no-match, >0 for
106 * match, -errno for abort (ex. match with insufficient or incorrect
107 * additional args)
ce4b4657
JG
108 * @dma_unmap: Called when userspace unmaps IOVA from the container
109 * this device is attached to.
445ad495 110 * @device_feature: Optional, fill in the VFIO_DEVICE_FEATURE ioctl
cba3345c
AW
111 */
112struct vfio_device_ops {
113 char *name;
cb9ff3f3
KT
114 int (*init)(struct vfio_device *vdev);
115 void (*release)(struct vfio_device *vdev);
a4d1f91d
JG
116 int (*bind_iommufd)(struct vfio_device *vdev,
117 struct iommufd_ctx *ictx, u32 *out_device_id);
118 void (*unbind_iommufd)(struct vfio_device *vdev);
119 int (*attach_ioas)(struct vfio_device *vdev, u32 *pt_id);
9048c734 120 void (*detach_ioas)(struct vfio_device *vdev);
29064134
YL
121 int (*pasid_attach_ioas)(struct vfio_device *vdev, u32 pasid,
122 u32 *pt_id);
123 void (*pasid_detach_ioas)(struct vfio_device *vdev, u32 pasid);
2fd585f4
JG
124 int (*open_device)(struct vfio_device *vdev);
125 void (*close_device)(struct vfio_device *vdev);
6df62c5b 126 ssize_t (*read)(struct vfio_device *vdev, char __user *buf,
cba3345c 127 size_t count, loff_t *ppos);
6df62c5b 128 ssize_t (*write)(struct vfio_device *vdev, const char __user *buf,
cba3345c 129 size_t count, loff_t *size);
6df62c5b 130 long (*ioctl)(struct vfio_device *vdev, unsigned int cmd,
cba3345c 131 unsigned long arg);
6df62c5b
JG
132 int (*mmap)(struct vfio_device *vdev, struct vm_area_struct *vma);
133 void (*request)(struct vfio_device *vdev, unsigned int count);
134 int (*match)(struct vfio_device *vdev, char *buf);
ce4b4657 135 void (*dma_unmap)(struct vfio_device *vdev, u64 iova, u64 length);
445ad495
JG
136 int (*device_feature)(struct vfio_device *device, u32 flags,
137 void __user *arg, size_t argsz);
6e97eba8
YH
138};
139
a4d1f91d 140#if IS_ENABLED(CONFIG_IOMMUFD)
9062ff40
YL
141struct iommufd_ctx *vfio_iommufd_device_ictx(struct vfio_device *vdev);
142int vfio_iommufd_get_dev_id(struct vfio_device *vdev, struct iommufd_ctx *ictx);
a4d1f91d
JG
143int vfio_iommufd_physical_bind(struct vfio_device *vdev,
144 struct iommufd_ctx *ictx, u32 *out_device_id);
145void vfio_iommufd_physical_unbind(struct vfio_device *vdev);
146int vfio_iommufd_physical_attach_ioas(struct vfio_device *vdev, u32 *pt_id);
9048c734 147void vfio_iommufd_physical_detach_ioas(struct vfio_device *vdev);
29064134
YL
148int vfio_iommufd_physical_pasid_attach_ioas(struct vfio_device *vdev,
149 u32 pasid, u32 *pt_id);
150void vfio_iommufd_physical_pasid_detach_ioas(struct vfio_device *vdev,
151 u32 pasid);
4741f2e9
JG
152int vfio_iommufd_emulated_bind(struct vfio_device *vdev,
153 struct iommufd_ctx *ictx, u32 *out_device_id);
154void vfio_iommufd_emulated_unbind(struct vfio_device *vdev);
155int vfio_iommufd_emulated_attach_ioas(struct vfio_device *vdev, u32 *pt_id);
8cfa7186 156void vfio_iommufd_emulated_detach_ioas(struct vfio_device *vdev);
a4d1f91d 157#else
9062ff40
YL
158static inline struct iommufd_ctx *
159vfio_iommufd_device_ictx(struct vfio_device *vdev)
160{
161 return NULL;
162}
163
164static inline int
165vfio_iommufd_get_dev_id(struct vfio_device *vdev, struct iommufd_ctx *ictx)
166{
167 return VFIO_PCI_DEVID_NOT_OWNED;
168}
169
a4d1f91d
JG
170#define vfio_iommufd_physical_bind \
171 ((int (*)(struct vfio_device *vdev, struct iommufd_ctx *ictx, \
172 u32 *out_device_id)) NULL)
173#define vfio_iommufd_physical_unbind \
174 ((void (*)(struct vfio_device *vdev)) NULL)
175#define vfio_iommufd_physical_attach_ioas \
176 ((int (*)(struct vfio_device *vdev, u32 *pt_id)) NULL)
9048c734
YL
177#define vfio_iommufd_physical_detach_ioas \
178 ((void (*)(struct vfio_device *vdev)) NULL)
29064134
YL
179#define vfio_iommufd_physical_pasid_attach_ioas \
180 ((int (*)(struct vfio_device *vdev, u32 pasid, u32 *pt_id)) NULL)
181#define vfio_iommufd_physical_pasid_detach_ioas \
182 ((void (*)(struct vfio_device *vdev, u32 pasid)) NULL)
4741f2e9
JG
183#define vfio_iommufd_emulated_bind \
184 ((int (*)(struct vfio_device *vdev, struct iommufd_ctx *ictx, \
185 u32 *out_device_id)) NULL)
186#define vfio_iommufd_emulated_unbind \
187 ((void (*)(struct vfio_device *vdev)) NULL)
188#define vfio_iommufd_emulated_attach_ioas \
189 ((int (*)(struct vfio_device *vdev, u32 *pt_id)) NULL)
8cfa7186
YL
190#define vfio_iommufd_emulated_detach_ioas \
191 ((void (*)(struct vfio_device *vdev)) NULL)
a4d1f91d
JG
192#endif
193
af949759
YL
194static inline bool vfio_device_cdev_opened(struct vfio_device *device)
195{
5fcc2696 196 return device->cdev_opened;
af949759
YL
197}
198
/**
 * struct vfio_migration_ops - VFIO bus device driver migration callbacks
 *
 * @migration_set_state: Optional callback to change the migration state for
 *         devices that support migration. It's mandatory for
 *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
 *         The returned FD is used for data transfer according to the FSM
 *         definition. The driver is responsible to ensure that FD reaches end
 *         of stream or error whenever the migration FSM leaves a data transfer
 *         state or before close_device() returns.
 * @migration_get_state: Optional callback to get the migration state for
 *         devices that support migration. It's mandatory for
 *         VFIO_DEVICE_FEATURE_MIGRATION migration support.
 * @migration_get_data_size: Optional callback to get the estimated data
 *         length that will be required to complete stop copy. It's mandatory
 *         for VFIO_DEVICE_FEATURE_MIGRATION migration support.
 */
struct vfio_migration_ops {
	struct file *(*migration_set_state)(
		struct vfio_device *device,
		enum vfio_device_mig_state new_state);
	int (*migration_get_state)(struct vfio_device *device,
				   enum vfio_device_mig_state *curr_state);
	int (*migration_get_data_size)(struct vfio_device *device,
				       unsigned long *stop_copy_length);
};
225
80c4b92a 226/**
38e4614c
SH
227 * struct vfio_log_ops - VFIO bus device driver logging callbacks
228 *
80c4b92a
YH
229 * @log_start: Optional callback to ask the device start DMA logging.
230 * @log_stop: Optional callback to ask the device stop DMA logging.
231 * @log_read_and_clear: Optional callback to ask the device read
232 * and clear the dirty DMAs in some given range.
233 *
234 * The vfio core implementation of the DEVICE_FEATURE_DMA_LOGGING_ set
235 * of features does not track logging state relative to the device,
236 * therefore the device implementation of vfio_log_ops must handle
237 * arbitrary user requests. This includes rejecting subsequent calls
238 * to log_start without an intervening log_stop, as well as graceful
239 * handling of log_stop and log_read_and_clear from invalid states.
240 */
241struct vfio_log_ops {
242 int (*log_start)(struct vfio_device *device,
243 struct rb_root_cached *ranges, u32 nnodes, u64 *page_size);
244 int (*log_stop)(struct vfio_device *device);
245 int (*log_read_and_clear)(struct vfio_device *device,
246 unsigned long iova, unsigned long length,
247 struct iova_bitmap *dirty);
248};
249
445ad495
JG
250/**
251 * vfio_check_feature - Validate user input for the VFIO_DEVICE_FEATURE ioctl
252 * @flags: Arg from the device_feature op
253 * @argsz: Arg from the device_feature op
254 * @supported_ops: Combination of VFIO_DEVICE_FEATURE_GET and SET the driver
255 * supports
256 * @minsz: Minimum data size the driver accepts
257 *
258 * For use in a driver's device_feature op. Checks that the inputs to the
259 * VFIO_DEVICE_FEATURE ioctl are correct for the driver's feature. Returns 1 if
260 * the driver should execute the get or set, otherwise the relevant
261 * value should be returned.
262 */
263static inline int vfio_check_feature(u32 flags, size_t argsz, u32 supported_ops,
264 size_t minsz)
265{
266 if ((flags & (VFIO_DEVICE_FEATURE_GET | VFIO_DEVICE_FEATURE_SET)) &
267 ~supported_ops)
268 return -EINVAL;
269 if (flags & VFIO_DEVICE_FEATURE_PROBE)
270 return 0;
271 /* Without PROBE one of GET or SET must be requested */
272 if (!(flags & (VFIO_DEVICE_FEATURE_GET | VFIO_DEVICE_FEATURE_SET)))
273 return -EINVAL;
274 if (argsz < minsz)
275 return -EINVAL;
276 return 1;
277}
278
cb9ff3f3
KT
struct vfio_device *_vfio_alloc_device(size_t size, struct device *dev,
				       const struct vfio_device_ops *ops);
/*
 * Allocate a driver structure of type 'struct dev_struct' that embeds a
 * struct vfio_device as @member, and return a pointer to the driver structure.
 *
 * The BUILD_BUG_ON_ZERO(offsetof(...)) term contributes 0 to the size and is
 * there to require that @member sits at offset 0 of the driver structure.
 */
#define vfio_alloc_device(dev_struct, member, dev, ops)				\
	container_of(_vfio_alloc_device(sizeof(struct dev_struct) +		\
					BUILD_BUG_ON_ZERO(offsetof(		\
						struct dev_struct, member)),	\
					dev, ops),				\
		     struct dev_struct, member)
287
cb9ff3f3
KT
288static inline void vfio_put_device(struct vfio_device *device)
289{
3c28a761 290 put_device(&device->device);
cb9ff3f3
KT
291}
292
0bfc6a4e 293int vfio_register_group_dev(struct vfio_device *device);
c68ea0d0 294int vfio_register_emulated_iommu_dev(struct vfio_device *device);
0bfc6a4e 295void vfio_unregister_group_dev(struct vfio_device *device);
cba3345c 296
2fd585f4 297int vfio_assign_device_set(struct vfio_device *device, void *set_id);
5cd189e4 298unsigned int vfio_device_set_open_count(struct vfio_device_set *dev_set);
a80e1de9
YL
299struct vfio_device *
300vfio_find_device_in_devset(struct vfio_device_set *dev_set,
301 struct device *dev);
2fd585f4 302
115dcec6
JG
303int vfio_mig_get_next_state(struct vfio_device *device,
304 enum vfio_device_mig_state cur_fsm,
305 enum vfio_device_mig_state new_fsm,
306 enum vfio_device_mig_state *next_fsm);
307
9a4087fa
BC
308void vfio_combine_iova_ranges(struct rb_root_cached *root, u32 cur_nodes,
309 u32 req_nodes);
310
6cdd9782
AK
311/*
312 * External user API
313 */
d1877e63 314struct iommu_group *vfio_file_iommu_group(struct file *file);
4ea95c04
SC
315
316#if IS_ENABLED(CONFIG_VFIO_GROUP)
4b22ef04 317bool vfio_file_is_group(struct file *file);
c1cce6d0
YL
318bool vfio_file_has_dev(struct file *file, struct vfio_device *device);
319#else
c1cce6d0
YL
320static inline bool vfio_file_is_group(struct file *file)
321{
322 return false;
323}
324
325static inline bool vfio_file_has_dev(struct file *file, struct vfio_device *device)
326{
327 return false;
328}
329#endif
b1a59be8 330bool vfio_file_is_valid(struct file *file);
d1877e63
AW
331bool vfio_file_enforced_coherent(struct file *file);
332void vfio_file_set_kvm(struct file *file, struct kvm *kvm);
6cdd9782 333
2169037d
KW
334#define VFIO_PIN_PAGES_MAX_ENTRIES (PAGE_SIZE/sizeof(unsigned long))
335
44abdd16 336int vfio_pin_pages(struct vfio_device *device, dma_addr_t iova,
34a255e6 337 int npage, int prot, struct page **pages);
44abdd16 338void vfio_unpin_pages(struct vfio_device *device, dma_addr_t iova, int npage);
8561aa4f 339int vfio_dma_rw(struct vfio_device *device, dma_addr_t iova,
d1877e63 340 void *data, size_t len, bool write);
8d46c0cc 341
d7a8d5ed
AW
342/*
343 * Sub-module helpers
344 */
345struct vfio_info_cap {
346 struct vfio_info_cap_header *buf;
347 size_t size;
348};
d1877e63
AW
349struct vfio_info_cap_header *vfio_info_cap_add(struct vfio_info_cap *caps,
350 size_t size, u16 id,
351 u16 version);
352void vfio_info_cap_shift(struct vfio_info_cap *caps, size_t offset);
d7a8d5ed 353
d1877e63
AW
354int vfio_info_add_capability(struct vfio_info_cap *caps,
355 struct vfio_info_cap_header *cap, size_t size);
b3c0a866 356
d1877e63
AW
357int vfio_set_irqs_validate_and_prepare(struct vfio_irq_set *hdr,
358 int num_irqs, int max_irq_type,
359 size_t *data_size);
c747f08a 360
7e992d69
AM
361/*
362 * IRQfd - generic
363 */
364struct virqfd {
365 void *opaque;
366 struct eventfd_ctx *eventfd;
367 int (*handler)(void *, void *);
368 void (*thread)(void *, void *);
369 void *data;
370 struct work_struct inject;
ac6424b9 371 wait_queue_entry_t wait;
7e992d69
AM
372 poll_table pt;
373 struct work_struct shutdown;
b620ecbd 374 struct work_struct flush_inject;
7e992d69
AM
375 struct virqfd **pvirqfd;
376};
377
d1877e63
AW
378int vfio_virqfd_enable(void *opaque, int (*handler)(void *, void *),
379 void (*thread)(void *, void *), void *data,
380 struct virqfd **pvirqfd, int fd);
381void vfio_virqfd_disable(struct virqfd **pvirqfd);
b620ecbd 382void vfio_virqfd_flush_thread(struct virqfd **pvirqfd);
7e992d69 383
cba3345c 384#endif /* VFIO_H */