2 * Copyright 2003 Tungsten Graphics, Inc., Cedar Park, Texas.
5 * Permission is hereby granted, free of charge, to any person obtaining a
6 * copy of this software and associated documentation files (the
7 * "Software"), to deal in the Software without restriction, including
8 * without limitation the rights to use, copy, modify, merge, publish,
9 * distribute, sub license, and/or sell copies of the Software, and to
10 * permit persons to whom the Software is furnished to do so, subject to
11 * the following conditions:
13 * The above copyright notice and this permission notice (including the
14 * next paragraph) shall be included in all copies or substantial portions
17 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
18 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
19 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
20 * IN NO EVENT SHALL TUNGSTEN GRAPHICS AND/OR ITS SUPPLIERS BE LIABLE FOR
21 * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
22 * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
23 * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
27 #ifndef _UAPI_I915_DRM_H_
28 #define _UAPI_I915_DRM_H_
32 #if defined(__cplusplus)
36 /* Please note that modifications to all structs defined here are
37 * subject to backwards-compatibility constraints.
41 * DOC: uevents generated by i915 on its device node
43 * I915_L3_PARITY_UEVENT - Generated when the driver receives a parity mismatch
44 * event from the GPU L3 cache. Additional information supplied is ROW,
45 * BANK, SUBBANK, SLICE of the affected cacheline. Userspace should keep
46 * track of these events, and if a specific cache-line seems to have a
47 * persistent error, remap it with the L3 remapping tool supplied in
48 * intel-gpu-tools. The value supplied with the event is always 1.
50 * I915_ERROR_UEVENT - Generated upon error detection, currently only via
51 * hangcheck. The error detection event is a good indicator of when things
52 * began to go badly. The value supplied with the event is a 1 upon error
53 * detection, and a 0 upon reset completion, signifying no more error
54 * exists. NOTE: Disabling hangcheck or reset via module parameter will
55 * cause the related events to not be seen.
57 * I915_RESET_UEVENT - Event is generated just before an attempt to reset the
58 * GPU. The value supplied with the event is always 1. NOTE: Disabling
59 * reset via module parameter will cause this event to not be seen.
/*
 * String identifiers for the three uevents documented above:
 * L3 parity error, error detection, and GPU reset.
 */
61 #define I915_L3_PARITY_UEVENT "L3_PARITY_ERROR"
62 #define I915_ERROR_UEVENT "ERROR"
63 #define I915_RESET_UEVENT "RESET"
66 * struct i915_user_extension - Base class for defining a chain of extensions
68 * Many interfaces need to grow over time. In most cases we can simply
69 * extend the struct and have userspace pass in more data. Another option,
70 * as demonstrated by Vulkan's approach to providing extensions for forward
71 * and backward compatibility, is to use a list of optional structs to
72 * provide those extra details.
74 * The key advantage to using an extension chain is that it allows us to
75 * redefine the interface more easily than an ever growing struct of
76 * increasing complexity, and for large parts of that interface to be
77 * entirely optional. The downside is more pointer chasing; chasing across
78 * the __user boundary with pointers encapsulated inside u64.
84 * struct i915_user_extension ext3 {
85 * .next_extension = 0, // end
88 * struct i915_user_extension ext2 {
89 * .next_extension = (uintptr_t)&ext3,
92 * struct i915_user_extension ext1 {
93 * .next_extension = (uintptr_t)&ext2,
97 * Typically the struct i915_user_extension would be embedded in some uAPI
98 * struct, and in this case we would feed it the head of the chain (i.e. ext1),
99 * which would then apply all of the above extensions.
102 struct i915_user_extension {
106 * Pointer to the next struct i915_user_extension, or zero if the end.
108 __u64 next_extension;
110 * @name: Name of the extension.
112 * Note that the name here is just some integer.
114 * Also note that the name space for this is not global for the whole
115 * driver, but rather its scope/meaning is limited to the specific piece
116 * of uAPI which has embedded the struct i915_user_extension.
122 * All undefined bits must be zero.
128 * Reserved for future use; must be zero.
134 * MOCS indexes used for GPU surfaces, defining the cacheability of the
135 * surface data and the coherency for this data wrt. CPU vs. GPU accesses.
137 enum i915_mocs_table_index {
139 * Not cached anywhere, coherency between CPU and GPU accesses is
144 * Cacheability and coherency controlled by the kernel automatically
145 * based on the DRM_I915_GEM_SET_CACHING IOCTL setting and the current
146 * usage of the surface (used for display scanout or not).
150 * Cached in all GPU caches available on the platform.
151 * Coherency between CPU and GPU accesses to the surface is not
152 * guaranteed without extra synchronization.
158 * enum drm_i915_gem_engine_class - uapi engine type enumeration
160 * Different engines serve different roles, and there may be more than one
161 * engine serving each role. This enum provides a classification of the role
162 * of the engine, which may be used when requesting operations to be performed
163 * on a certain subset of engines, or for providing information about that
166 enum drm_i915_gem_engine_class {
168 * @I915_ENGINE_CLASS_RENDER:
170 * Render engines support instructions used for 3D, Compute (GPGPU),
171 * and programmable media workloads. These instructions fetch data and
172 * dispatch individual work items to threads that operate in parallel.
173 * The threads run small programs (called "kernels" or "shaders") on
174 * the GPU's execution units (EUs).
176 I915_ENGINE_CLASS_RENDER = 0,
179 * @I915_ENGINE_CLASS_COPY:
181 * Copy engines (also referred to as "blitters") support instructions
182 * that move blocks of data from one location in memory to another,
183 * or that fill a specified location of memory with fixed data.
184 * Copy engines can perform pre-defined logical or bitwise operations
185 * on the source, destination, or pattern data.
187 I915_ENGINE_CLASS_COPY = 1,
190 * @I915_ENGINE_CLASS_VIDEO:
192 * Video engines (also referred to as "bit stream decode" (BSD) or
193 * "vdbox") support instructions that perform fixed-function media
196 I915_ENGINE_CLASS_VIDEO = 2,
199 * @I915_ENGINE_CLASS_VIDEO_ENHANCE:
201 * Video enhancement engines (also referred to as "vebox") support
202 * instructions related to image enhancement.
204 I915_ENGINE_CLASS_VIDEO_ENHANCE = 3,
207 * @I915_ENGINE_CLASS_COMPUTE:
209 * Compute engines support a subset of the instructions available
210 * on render engines: compute engines support Compute (GPGPU) and
211 * programmable media workloads, but do not support the 3D pipeline.
213 I915_ENGINE_CLASS_COMPUTE = 4,
215 /* Values in this enum should be kept compact. */
218 * @I915_ENGINE_CLASS_INVALID:
220 * Placeholder value to represent an invalid engine class assignment.
222 I915_ENGINE_CLASS_INVALID = -1
226 * struct i915_engine_class_instance - Engine class/instance identifier
228 * There may be more than one engine fulfilling any role within the system.
229 * Each engine of a class is given a unique instance number and therefore
230 * any engine can be specified by its class:instance tuple. APIs that allow
231 * access to any engine in the system will use struct i915_engine_class_instance
232 * for this identification.
234 struct i915_engine_class_instance {
238 * Engine class from enum drm_i915_gem_engine_class
241 #define I915_ENGINE_CLASS_INVALID_NONE -1
242 #define I915_ENGINE_CLASS_INVALID_VIRTUAL -2
249 __u16 engine_instance;
253 * DOC: perf_events exposed by i915 through /sys/bus/event_source/devices/i915
257 enum drm_i915_pmu_engine_sample {
258 I915_SAMPLE_BUSY = 0,
259 I915_SAMPLE_WAIT = 1,
/*
 * Bit layout of an engine counter id as assembled by __I915_PMU_ENGINE():
 * the instance is shifted left by I915_PMU_SAMPLE_BITS (4) and the class by
 * I915_PMU_CLASS_SHIFT (4 + 8 = 12).
 * NOTE(review): the sample presumably occupies the low 4 bits covered by
 * I915_PMU_SAMPLE_MASK -- confirm against the full __I915_PMU_ENGINE macro.
 */
263 #define I915_PMU_SAMPLE_BITS (4)
264 #define I915_PMU_SAMPLE_MASK (0xf)
265 #define I915_PMU_SAMPLE_INSTANCE_BITS (8)
/* Class field starts directly above the sample and instance fields. */
266 #define I915_PMU_CLASS_SHIFT \
267 (I915_PMU_SAMPLE_BITS + I915_PMU_SAMPLE_INSTANCE_BITS)
269 #define __I915_PMU_ENGINE(class, instance, sample) \
270 ((class) << I915_PMU_CLASS_SHIFT | \
271 (instance) << I915_PMU_SAMPLE_BITS | \
/*
 * Per-engine counter ids. Each macro forwards (class, instance) to
 * __I915_PMU_ENGINE() together with one fixed sample type:
 * I915_SAMPLE_BUSY, I915_SAMPLE_WAIT or I915_SAMPLE_SEMA.
 */
274 #define I915_PMU_ENGINE_BUSY(class, instance) \
275 __I915_PMU_ENGINE(class, instance, I915_SAMPLE_BUSY)
277 #define I915_PMU_ENGINE_WAIT(class, instance) \
278 __I915_PMU_ENGINE(class, instance, I915_SAMPLE_WAIT)
280 #define I915_PMU_ENGINE_SEMA(class, instance) \
281 __I915_PMU_ENGINE(class, instance, I915_SAMPLE_SEMA)
284 * Top 4 bits of every non-engine counter are GT id.
/* The GT id is placed at bit 60 and above of the 64-bit counter id. */
286 #define __I915_PMU_GT_SHIFT (60)
/*
 * Build a non-engine counter id: index x is offset by
 * __I915_PMU_ENGINE(0xff, 0xff, 0xf) + 1 and the GT id is OR-ed into the
 * top bits. Both halves are widened to __u64 before combining.
 * NOTE(review): __I915_PMU_ENGINE(0xff, 0xff, 0xf) is presumably the largest
 * possible engine counter id, so non-engine ids start right after the engine
 * range -- confirm against the full macro definition.
 */
288 #define ___I915_PMU_OTHER(gt, x) \
289 (((__u64)__I915_PMU_ENGINE(0xff, 0xff, 0xf) + 1 + (x)) | \
290 ((__u64)(gt) << __I915_PMU_GT_SHIFT))
/* Shorthand for a non-engine counter on GT 0. */
292 #define __I915_PMU_OTHER(x) ___I915_PMU_OTHER(0, x)
/* Non-engine counters for GT 0, indices 0..4. */
294 #define I915_PMU_ACTUAL_FREQUENCY __I915_PMU_OTHER(0)
295 #define I915_PMU_REQUESTED_FREQUENCY __I915_PMU_OTHER(1)
296 #define I915_PMU_INTERRUPTS __I915_PMU_OTHER(2)
297 #define I915_PMU_RC6_RESIDENCY __I915_PMU_OTHER(3)
298 #define I915_PMU_SOFTWARE_GT_AWAKE_TIME __I915_PMU_OTHER(4)
/*
 * Note: I915_PMU_LAST aliases index 3 (RC6 residency), not the highest index
 * defined above (4, I915_PMU_SOFTWARE_GT_AWAKE_TIME).
 */
300 #define I915_PMU_LAST /* Deprecated - do not use */ I915_PMU_RC6_RESIDENCY
/* Same counters as above, with an explicit GT id instead of GT 0. */
302 #define __I915_PMU_ACTUAL_FREQUENCY(gt) ___I915_PMU_OTHER(gt, 0)
303 #define __I915_PMU_REQUESTED_FREQUENCY(gt) ___I915_PMU_OTHER(gt, 1)
304 #define __I915_PMU_INTERRUPTS(gt) ___I915_PMU_OTHER(gt, 2)
305 #define __I915_PMU_RC6_RESIDENCY(gt) ___I915_PMU_OTHER(gt, 3)
306 #define __I915_PMU_SOFTWARE_GT_AWAKE_TIME(gt) ___I915_PMU_OTHER(gt, 4)
308 /* Each region is a minimum of 16k, and there are at most 255 of them.
310 #define I915_NR_TEX_REGIONS 255 /* table size 2k - maximum due to use
311 * of chars for next/prev indices */
312 #define I915_LOG_MIN_TEX_REGION_SIZE 14 /* log2 of the 16k minimum region size (1 << 14) */
314 typedef struct _drm_i915_init {
316 I915_INIT_DMA = 0x01,
317 I915_CLEANUP_DMA = 0x02,
318 I915_RESUME_DMA = 0x03
320 unsigned int mmio_offset;
321 int sarea_priv_offset;
322 unsigned int ring_start;
323 unsigned int ring_end;
324 unsigned int ring_size;
325 unsigned int front_offset;
326 unsigned int back_offset;
327 unsigned int depth_offset;
331 unsigned int pitch_bits;
332 unsigned int back_pitch;
333 unsigned int depth_pitch;
335 unsigned int chipset;
338 typedef struct _drm_i915_sarea {
339 struct drm_tex_region texList[I915_NR_TEX_REGIONS + 1];
340 int last_upload; /* last time texture was uploaded */
341 int last_enqueue; /* last time a buffer was enqueued */
342 int last_dispatch; /* age of the most recently dispatched buffer */
343 int ctxOwner; /* last context to upload state */
345 int pf_enabled; /* is pageflipping allowed? */
347 int pf_current_page; /* which buffer is being displayed? */
348 int perf_boxes; /* performance boxes to be displayed */
349 int width, height; /* screen size in pixels */
351 drm_handle_t front_handle;
355 drm_handle_t back_handle;
359 drm_handle_t depth_handle;
363 drm_handle_t tex_handle;
366 int log_tex_granularity;
368 int rotation; /* 0, 90, 180 or 270 */
372 int virtualX, virtualY;
374 unsigned int front_tiled;
375 unsigned int back_tiled;
376 unsigned int depth_tiled;
377 unsigned int rotated_tiled;
378 unsigned int rotated2_tiled;
389 /* fill out some space for old userspace triple buffer */
390 drm_handle_t unused_handle;
391 __u32 unused1, unused2, unused3;
393 /* buffer object handles for static buffers. May change
394 * over the lifetime of the client.
396 __u32 front_bo_handle;
397 __u32 back_bo_handle;
398 __u32 unused_bo_handle;
399 __u32 depth_bo_handle;
403 /* Due to userspace building against these headers we need some compat here:
 * each old planeX_* identifier is rewritten by the preprocessor to the
 * matching pipeX_* identifier (x, y, w, h for A and B).
 */
404 #define planeA_x pipeA_x
405 #define planeA_y pipeA_y
406 #define planeA_w pipeA_w
407 #define planeA_h pipeA_h
408 #define planeB_x pipeB_x
409 #define planeB_y pipeB_y
410 #define planeB_w pipeB_w
411 #define planeB_h pipeB_h
413 /* Flags for perf_boxes
/* Each flag is a distinct single bit (bits 0..4), so values can be OR-ed together. */
415 #define I915_BOX_RING_EMPTY 0x1
416 #define I915_BOX_FLIP 0x2
417 #define I915_BOX_WAIT 0x4
418 #define I915_BOX_TEXTURE_LOAD 0x8
419 #define I915_BOX_LOST_CONTEXT 0x10
422 * i915 specific ioctls.
424 * The device specific ioctl range is [DRM_COMMAND_BASE, DRM_COMMAND_END) ie
425 * [0x40, 0xa0) (a0 is excluded). The numbers below are defined as offset
426 * against DRM_COMMAND_BASE and should be between [0x0, 0x60).
/*
 * Command offsets relative to DRM_COMMAND_BASE; the DRM_IOCTL_I915_* macros
 * below add DRM_COMMAND_BASE to these. The highest value assigned here is
 * 0x3c, inside the [0x0, 0x60) range stated above.
 */
428 #define DRM_I915_INIT 0x00
429 #define DRM_I915_FLUSH 0x01
430 #define DRM_I915_FLIP 0x02
431 #define DRM_I915_BATCHBUFFER 0x03
432 #define DRM_I915_IRQ_EMIT 0x04
433 #define DRM_I915_IRQ_WAIT 0x05
434 #define DRM_I915_GETPARAM 0x06
435 #define DRM_I915_SETPARAM 0x07
436 #define DRM_I915_ALLOC 0x08
437 #define DRM_I915_FREE 0x09
438 #define DRM_I915_INIT_HEAP 0x0a
439 #define DRM_I915_CMDBUFFER 0x0b
440 #define DRM_I915_DESTROY_HEAP 0x0c
441 #define DRM_I915_SET_VBLANK_PIPE 0x0d
442 #define DRM_I915_GET_VBLANK_PIPE 0x0e
443 #define DRM_I915_VBLANK_SWAP 0x0f
/*
 * Offsets 0x10 and 0x12 are not assigned in this list.
 * NOTE(review): presumably retired numbers that must not be reused -- confirm.
 */
444 #define DRM_I915_HWS_ADDR 0x11
445 #define DRM_I915_GEM_INIT 0x13
446 #define DRM_I915_GEM_EXECBUFFER 0x14
447 #define DRM_I915_GEM_PIN 0x15
448 #define DRM_I915_GEM_UNPIN 0x16
449 #define DRM_I915_GEM_BUSY 0x17
450 #define DRM_I915_GEM_THROTTLE 0x18
451 #define DRM_I915_GEM_ENTERVT 0x19
452 #define DRM_I915_GEM_LEAVEVT 0x1a
453 #define DRM_I915_GEM_CREATE 0x1b
454 #define DRM_I915_GEM_PREAD 0x1c
455 #define DRM_I915_GEM_PWRITE 0x1d
456 #define DRM_I915_GEM_MMAP 0x1e
457 #define DRM_I915_GEM_SET_DOMAIN 0x1f
458 #define DRM_I915_GEM_SW_FINISH 0x20
459 #define DRM_I915_GEM_SET_TILING 0x21
460 #define DRM_I915_GEM_GET_TILING 0x22
461 #define DRM_I915_GEM_GET_APERTURE 0x23
462 #define DRM_I915_GEM_MMAP_GTT 0x24
463 #define DRM_I915_GET_PIPE_FROM_CRTC_ID 0x25
464 #define DRM_I915_GEM_MADVISE 0x26
465 #define DRM_I915_OVERLAY_PUT_IMAGE 0x27
466 #define DRM_I915_OVERLAY_ATTRS 0x28
467 #define DRM_I915_GEM_EXECBUFFER2 0x29
/* Alias: the _WR variant shares command number 0x29 with GEM_EXECBUFFER2. */
468 #define DRM_I915_GEM_EXECBUFFER2_WR DRM_I915_GEM_EXECBUFFER2
469 #define DRM_I915_GET_SPRITE_COLORKEY 0x2a
470 #define DRM_I915_SET_SPRITE_COLORKEY 0x2b
471 #define DRM_I915_GEM_WAIT 0x2c
472 #define DRM_I915_GEM_CONTEXT_CREATE 0x2d
473 #define DRM_I915_GEM_CONTEXT_DESTROY 0x2e
474 #define DRM_I915_GEM_SET_CACHING 0x2f
475 #define DRM_I915_GEM_GET_CACHING 0x30
476 #define DRM_I915_REG_READ 0x31
477 #define DRM_I915_GET_RESET_STATS 0x32
478 #define DRM_I915_GEM_USERPTR 0x33
479 #define DRM_I915_GEM_CONTEXT_GETPARAM 0x34
480 #define DRM_I915_GEM_CONTEXT_SETPARAM 0x35
481 #define DRM_I915_PERF_OPEN 0x36
482 #define DRM_I915_PERF_ADD_CONFIG 0x37
483 #define DRM_I915_PERF_REMOVE_CONFIG 0x38
484 #define DRM_I915_QUERY 0x39
485 #define DRM_I915_GEM_VM_CREATE 0x3a
486 #define DRM_I915_GEM_VM_DESTROY 0x3b
487 #define DRM_I915_GEM_CREATE_EXT 0x3c
488 /* Must be kept compact -- no holes */
/*
 * Full ioctl request codes for command offsets 0x00..0x0f. Each is built from
 * DRM_COMMAND_BASE + the matching DRM_I915_* offset; the argument types in
 * this group are the drm_i915_*_t typedefs. FLUSH and FLIP use DRM_IO and
 * name no argument type.
 */
490 #define DRM_IOCTL_I915_INIT DRM_IOW( DRM_COMMAND_BASE + DRM_I915_INIT, drm_i915_init_t)
491 #define DRM_IOCTL_I915_FLUSH DRM_IO ( DRM_COMMAND_BASE + DRM_I915_FLUSH)
492 #define DRM_IOCTL_I915_FLIP DRM_IO ( DRM_COMMAND_BASE + DRM_I915_FLIP)
493 #define DRM_IOCTL_I915_BATCHBUFFER DRM_IOW( DRM_COMMAND_BASE + DRM_I915_BATCHBUFFER, drm_i915_batchbuffer_t)
494 #define DRM_IOCTL_I915_IRQ_EMIT DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_IRQ_EMIT, drm_i915_irq_emit_t)
495 #define DRM_IOCTL_I915_IRQ_WAIT DRM_IOW( DRM_COMMAND_BASE + DRM_I915_IRQ_WAIT, drm_i915_irq_wait_t)
496 #define DRM_IOCTL_I915_GETPARAM DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GETPARAM, drm_i915_getparam_t)
497 #define DRM_IOCTL_I915_SETPARAM DRM_IOW( DRM_COMMAND_BASE + DRM_I915_SETPARAM, drm_i915_setparam_t)
498 #define DRM_IOCTL_I915_ALLOC DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_ALLOC, drm_i915_mem_alloc_t)
499 #define DRM_IOCTL_I915_FREE DRM_IOW( DRM_COMMAND_BASE + DRM_I915_FREE, drm_i915_mem_free_t)
500 #define DRM_IOCTL_I915_INIT_HEAP DRM_IOW( DRM_COMMAND_BASE + DRM_I915_INIT_HEAP, drm_i915_mem_init_heap_t)
501 #define DRM_IOCTL_I915_CMDBUFFER DRM_IOW( DRM_COMMAND_BASE + DRM_I915_CMDBUFFER, drm_i915_cmdbuffer_t)
502 #define DRM_IOCTL_I915_DESTROY_HEAP DRM_IOW( DRM_COMMAND_BASE + DRM_I915_DESTROY_HEAP, drm_i915_mem_destroy_heap_t)
503 #define DRM_IOCTL_I915_SET_VBLANK_PIPE DRM_IOW( DRM_COMMAND_BASE + DRM_I915_SET_VBLANK_PIPE, drm_i915_vblank_pipe_t)
504 #define DRM_IOCTL_I915_GET_VBLANK_PIPE DRM_IOR( DRM_COMMAND_BASE + DRM_I915_GET_VBLANK_PIPE, drm_i915_vblank_pipe_t)
505 #define DRM_IOCTL_I915_VBLANK_SWAP DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_VBLANK_SWAP, drm_i915_vblank_swap_t)
/*
 * Full ioctl request codes for the remaining commands; the argument types in
 * this group are named as struct types (or __u64 for PERF_REMOVE_CONFIG).
 * Several entries deliberately share a command number or an argument type;
 * those cases are called out inline.
 */
/*
 * HWS_ADDR is declared with struct drm_i915_gem_init, the same argument type
 * as GEM_INIT on the next line.
 * NOTE(review): this looks like a historical quirk; if the DRM_IOW encoding
 * includes the argument size, changing the type would change the request
 * code seen by userspace -- confirm before touching.
 */
506 #define DRM_IOCTL_I915_HWS_ADDR DRM_IOW(DRM_COMMAND_BASE + DRM_I915_HWS_ADDR, struct drm_i915_gem_init)
507 #define DRM_IOCTL_I915_GEM_INIT DRM_IOW(DRM_COMMAND_BASE + DRM_I915_GEM_INIT, struct drm_i915_gem_init)
508 #define DRM_IOCTL_I915_GEM_EXECBUFFER DRM_IOW(DRM_COMMAND_BASE + DRM_I915_GEM_EXECBUFFER, struct drm_i915_gem_execbuffer)
/*
 * EXECBUFFER2 and EXECBUFFER2_WR use the same command number and argument
 * struct; they differ only in the wrapper macro (DRM_IOW vs DRM_IOWR).
 */
509 #define DRM_IOCTL_I915_GEM_EXECBUFFER2 DRM_IOW(DRM_COMMAND_BASE + DRM_I915_GEM_EXECBUFFER2, struct drm_i915_gem_execbuffer2)
510 #define DRM_IOCTL_I915_GEM_EXECBUFFER2_WR DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_EXECBUFFER2_WR, struct drm_i915_gem_execbuffer2)
511 #define DRM_IOCTL_I915_GEM_PIN DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_PIN, struct drm_i915_gem_pin)
512 #define DRM_IOCTL_I915_GEM_UNPIN DRM_IOW(DRM_COMMAND_BASE + DRM_I915_GEM_UNPIN, struct drm_i915_gem_unpin)
513 #define DRM_IOCTL_I915_GEM_BUSY DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_BUSY, struct drm_i915_gem_busy)
514 #define DRM_IOCTL_I915_GEM_SET_CACHING DRM_IOW(DRM_COMMAND_BASE + DRM_I915_GEM_SET_CACHING, struct drm_i915_gem_caching)
515 #define DRM_IOCTL_I915_GEM_GET_CACHING DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_GET_CACHING, struct drm_i915_gem_caching)
516 #define DRM_IOCTL_I915_GEM_THROTTLE DRM_IO ( DRM_COMMAND_BASE + DRM_I915_GEM_THROTTLE)
517 #define DRM_IOCTL_I915_GEM_ENTERVT DRM_IO(DRM_COMMAND_BASE + DRM_I915_GEM_ENTERVT)
518 #define DRM_IOCTL_I915_GEM_LEAVEVT DRM_IO(DRM_COMMAND_BASE + DRM_I915_GEM_LEAVEVT)
519 #define DRM_IOCTL_I915_GEM_CREATE DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_CREATE, struct drm_i915_gem_create)
520 #define DRM_IOCTL_I915_GEM_CREATE_EXT DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_CREATE_EXT, struct drm_i915_gem_create_ext)
521 #define DRM_IOCTL_I915_GEM_PREAD DRM_IOW (DRM_COMMAND_BASE + DRM_I915_GEM_PREAD, struct drm_i915_gem_pread)
522 #define DRM_IOCTL_I915_GEM_PWRITE DRM_IOW (DRM_COMMAND_BASE + DRM_I915_GEM_PWRITE, struct drm_i915_gem_pwrite)
523 #define DRM_IOCTL_I915_GEM_MMAP DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MMAP, struct drm_i915_gem_mmap)
/*
 * MMAP_OFFSET reuses the DRM_I915_GEM_MMAP_GTT command number but names a
 * different argument struct (drm_i915_gem_mmap_offset).
 */
524 #define DRM_IOCTL_I915_GEM_MMAP_GTT DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MMAP_GTT, struct drm_i915_gem_mmap_gtt)
525 #define DRM_IOCTL_I915_GEM_MMAP_OFFSET DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MMAP_GTT, struct drm_i915_gem_mmap_offset)
526 #define DRM_IOCTL_I915_GEM_SET_DOMAIN DRM_IOW (DRM_COMMAND_BASE + DRM_I915_GEM_SET_DOMAIN, struct drm_i915_gem_set_domain)
527 #define DRM_IOCTL_I915_GEM_SW_FINISH DRM_IOW (DRM_COMMAND_BASE + DRM_I915_GEM_SW_FINISH, struct drm_i915_gem_sw_finish)
528 #define DRM_IOCTL_I915_GEM_SET_TILING DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_SET_TILING, struct drm_i915_gem_set_tiling)
529 #define DRM_IOCTL_I915_GEM_GET_TILING DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_GET_TILING, struct drm_i915_gem_get_tiling)
530 #define DRM_IOCTL_I915_GEM_GET_APERTURE DRM_IOR (DRM_COMMAND_BASE + DRM_I915_GEM_GET_APERTURE, struct drm_i915_gem_get_aperture)
531 #define DRM_IOCTL_I915_GET_PIPE_FROM_CRTC_ID DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GET_PIPE_FROM_CRTC_ID, struct drm_i915_get_pipe_from_crtc_id)
532 #define DRM_IOCTL_I915_GEM_MADVISE DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_MADVISE, struct drm_i915_gem_madvise)
533 #define DRM_IOCTL_I915_OVERLAY_PUT_IMAGE DRM_IOW(DRM_COMMAND_BASE + DRM_I915_OVERLAY_PUT_IMAGE, struct drm_intel_overlay_put_image)
534 #define DRM_IOCTL_I915_OVERLAY_ATTRS DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_OVERLAY_ATTRS, struct drm_intel_overlay_attrs)
535 #define DRM_IOCTL_I915_SET_SPRITE_COLORKEY DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_SET_SPRITE_COLORKEY, struct drm_intel_sprite_colorkey)
536 #define DRM_IOCTL_I915_GET_SPRITE_COLORKEY DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GET_SPRITE_COLORKEY, struct drm_intel_sprite_colorkey)
537 #define DRM_IOCTL_I915_GEM_WAIT DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_WAIT, struct drm_i915_gem_wait)
/*
 * CONTEXT_CREATE_EXT reuses the DRM_I915_GEM_CONTEXT_CREATE command number
 * but names the extended argument struct (drm_i915_gem_context_create_ext).
 */
538 #define DRM_IOCTL_I915_GEM_CONTEXT_CREATE DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_CONTEXT_CREATE, struct drm_i915_gem_context_create)
539 #define DRM_IOCTL_I915_GEM_CONTEXT_CREATE_EXT DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_CONTEXT_CREATE, struct drm_i915_gem_context_create_ext)
540 #define DRM_IOCTL_I915_GEM_CONTEXT_DESTROY DRM_IOW (DRM_COMMAND_BASE + DRM_I915_GEM_CONTEXT_DESTROY, struct drm_i915_gem_context_destroy)
541 #define DRM_IOCTL_I915_REG_READ DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_REG_READ, struct drm_i915_reg_read)
542 #define DRM_IOCTL_I915_GET_RESET_STATS DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GET_RESET_STATS, struct drm_i915_reset_stats)
543 #define DRM_IOCTL_I915_GEM_USERPTR DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_USERPTR, struct drm_i915_gem_userptr)
/* CONTEXT_GETPARAM and CONTEXT_SETPARAM share struct drm_i915_gem_context_param. */
544 #define DRM_IOCTL_I915_GEM_CONTEXT_GETPARAM DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_CONTEXT_GETPARAM, struct drm_i915_gem_context_param)
545 #define DRM_IOCTL_I915_GEM_CONTEXT_SETPARAM DRM_IOWR (DRM_COMMAND_BASE + DRM_I915_GEM_CONTEXT_SETPARAM, struct drm_i915_gem_context_param)
546 #define DRM_IOCTL_I915_PERF_OPEN DRM_IOW(DRM_COMMAND_BASE + DRM_I915_PERF_OPEN, struct drm_i915_perf_open_param)
547 #define DRM_IOCTL_I915_PERF_ADD_CONFIG DRM_IOW(DRM_COMMAND_BASE + DRM_I915_PERF_ADD_CONFIG, struct drm_i915_perf_oa_config)
/* PERF_REMOVE_CONFIG names a bare __u64 as its argument type, not a struct. */
548 #define DRM_IOCTL_I915_PERF_REMOVE_CONFIG DRM_IOW(DRM_COMMAND_BASE + DRM_I915_PERF_REMOVE_CONFIG, __u64)
549 #define DRM_IOCTL_I915_QUERY DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_QUERY, struct drm_i915_query)
/* VM_CREATE and VM_DESTROY share struct drm_i915_gem_vm_control. */
550 #define DRM_IOCTL_I915_GEM_VM_CREATE DRM_IOWR(DRM_COMMAND_BASE + DRM_I915_GEM_VM_CREATE, struct drm_i915_gem_vm_control)
551 #define DRM_IOCTL_I915_GEM_VM_DESTROY DRM_IOW (DRM_COMMAND_BASE + DRM_I915_GEM_VM_DESTROY, struct drm_i915_gem_vm_control)
553 /* Allow drivers to submit batchbuffers directly to hardware, relying
554 * on the security mechanisms provided by hardware.
/* Argument type named by DRM_IOCTL_I915_BATCHBUFFER (as drm_i915_batchbuffer_t). */
556 typedef struct drm_i915_batchbuffer {
557 int start; /* agp offset */
558 int used; /* nr bytes in use */
559 int DR1; /* hw flags for GFX_OP_DRAWRECT_INFO */
560 int DR4; /* window origin for GFX_OP_DRAWRECT_INFO */
561 int num_cliprects; /* multipass with multiple cliprects? */
562 struct drm_clip_rect __user *cliprects; /* pointer to userspace cliprects */
563 } drm_i915_batchbuffer_t;
565 /* As above, but pass a pointer to userspace buffer which can be
566 * validated by the kernel prior to sending to hardware.
/*
 * Argument type named by DRM_IOCTL_I915_CMDBUFFER (as drm_i915_cmdbuffer_t).
 * Carries the same DR1/DR4/cliprect fields as drm_i915_batchbuffer, but
 * identifies the commands by a userspace pointer and byte count.
 */
568 typedef struct _drm_i915_cmdbuffer {
569 char __user *buf; /* pointer to userspace command buffer */
570 int sz; /* nr bytes in buf */
571 int DR1; /* hw flags for GFX_OP_DRAWRECT_INFO */
572 int DR4; /* window origin for GFX_OP_DRAWRECT_INFO */
573 int num_cliprects; /* multipass with multiple cliprects? */
574 struct drm_clip_rect __user *cliprects; /* pointer to userspace cliprects */
575 } drm_i915_cmdbuffer_t;
577 /* Userspace can request & wait on irq's:
579 typedef struct drm_i915_irq_emit {
581 } drm_i915_irq_emit_t;
583 typedef struct drm_i915_irq_wait {
585 } drm_i915_irq_wait_t;
588 * Different modes of per-process Graphics Translation Table,
589 * see I915_PARAM_HAS_ALIASING_PPGTT
/*
 * PPGTT mode values, numbered 0..2.
 * NOTE(review): presumably the values reported for
 * I915_PARAM_HAS_ALIASING_PPGTT -- confirm against the getparam handler.
 */
591 #define I915_GEM_PPGTT_NONE 0
592 #define I915_GEM_PPGTT_ALIASING 1
593 #define I915_GEM_PPGTT_FULL 2
595 /* Ioctl to query kernel params:
/*
 * Parameter ids for the kernel-parameter query ioctl (the "param" member of
 * struct drm_i915_getparam). Ids run consecutively from 1 to 40 in this
 * group; ids 41 and up follow below with individual descriptions.
 */
597 #define I915_PARAM_IRQ_ACTIVE 1
598 #define I915_PARAM_ALLOW_BATCHBUFFER 2
599 #define I915_PARAM_LAST_DISPATCH 3
600 #define I915_PARAM_CHIPSET_ID 4
601 #define I915_PARAM_HAS_GEM 5
602 #define I915_PARAM_NUM_FENCES_AVAIL 6
603 #define I915_PARAM_HAS_OVERLAY 7
604 #define I915_PARAM_HAS_PAGEFLIPPING 8
605 #define I915_PARAM_HAS_EXECBUF2 9
606 #define I915_PARAM_HAS_BSD 10
607 #define I915_PARAM_HAS_BLT 11
608 #define I915_PARAM_HAS_RELAXED_FENCING 12
609 #define I915_PARAM_HAS_COHERENT_RINGS 13
610 #define I915_PARAM_HAS_EXEC_CONSTANTS 14
611 #define I915_PARAM_HAS_RELAXED_DELTA 15
612 #define I915_PARAM_HAS_GEN7_SOL_RESET 16
613 #define I915_PARAM_HAS_LLC 17
614 #define I915_PARAM_HAS_ALIASING_PPGTT 18
615 #define I915_PARAM_HAS_WAIT_TIMEOUT 19
616 #define I915_PARAM_HAS_SEMAPHORES 20
617 #define I915_PARAM_HAS_PRIME_VMAP_FLUSH 21
618 #define I915_PARAM_HAS_VEBOX 22
619 #define I915_PARAM_HAS_SECURE_BATCHES 23
620 #define I915_PARAM_HAS_PINNED_BATCHES 24
621 #define I915_PARAM_HAS_EXEC_NO_RELOC 25
622 #define I915_PARAM_HAS_EXEC_HANDLE_LUT 26
623 #define I915_PARAM_HAS_WT 27
624 #define I915_PARAM_CMD_PARSER_VERSION 28
625 #define I915_PARAM_HAS_COHERENT_PHYS_GTT 29
626 #define I915_PARAM_MMAP_VERSION 30
627 #define I915_PARAM_HAS_BSD2 31
628 #define I915_PARAM_REVISION 32
629 #define I915_PARAM_SUBSLICE_TOTAL 33
630 #define I915_PARAM_EU_TOTAL 34
631 #define I915_PARAM_HAS_GPU_RESET 35
632 #define I915_PARAM_HAS_RESOURCE_STREAMER 36
633 #define I915_PARAM_HAS_EXEC_SOFTPIN 37
634 #define I915_PARAM_HAS_POOLED_EU 38
635 #define I915_PARAM_MIN_EU_IN_POOL 39
636 #define I915_PARAM_MMAP_GTT_VERSION 40
639 * Query whether DRM_I915_GEM_EXECBUFFER2 supports user defined execution
640 * priorities and the driver will attempt to execute batches in priority order.
641 * The param returns a capability bitmask, nonzero implies that the scheduler
642 * is enabled, with different features present according to the mask.
644 * The initial priority for each batch is supplied by the context and is
645 * controlled via I915_CONTEXT_PARAM_PRIORITY.
647 #define I915_PARAM_HAS_SCHEDULER 41
/* Bits 0..4 of the capability bitmask returned for I915_PARAM_HAS_SCHEDULER. */
648 #define I915_SCHEDULER_CAP_ENABLED (1ul << 0)
649 #define I915_SCHEDULER_CAP_PRIORITY (1ul << 1)
650 #define I915_SCHEDULER_CAP_PREEMPTION (1ul << 2)
651 #define I915_SCHEDULER_CAP_SEMAPHORES (1ul << 3)
652 #define I915_SCHEDULER_CAP_ENGINE_BUSY_STATS (1ul << 4)
654 * Indicates the 2k user priority levels are statically mapped into 3 buckets as
657 * -1k to -1 Low priority
659 * 1 to 1k Highest priority
661 #define I915_SCHEDULER_CAP_STATIC_PRIORITY_MAP (1ul << 5) /* next capability bit after ENGINE_BUSY_STATS (bit 4) */
664 * Query the status of HuC load.
666 * The query can fail in the following scenarios with the listed error codes:
667 * -ENODEV if HuC is not present on this platform,
668 * -EOPNOTSUPP if HuC firmware usage is disabled,
669 * -ENOPKG if HuC firmware fetch failed,
670 * -ENOEXEC if HuC firmware is invalid or mismatched,
671 * -ENOMEM if i915 failed to prepare the FW objects for transfer to the uC,
672 * -EIO if the FW transfer or the FW authentication failed.
674 * If the IOCTL is successful, the returned parameter will be set to one of the
676 * * 0 if HuC firmware load is not complete,
677 * * 1 if HuC firmware is loaded and fully authenticated,
678 * * 2 if HuC firmware is loaded and authenticated for clear media only
680 #define I915_PARAM_HUC_STATUS 42
682 /* Query whether DRM_I915_GEM_EXECBUFFER2 supports the ability to opt-out of
683 * synchronisation with implicit fencing on individual objects.
684 * See EXEC_OBJECT_ASYNC.
686 #define I915_PARAM_HAS_EXEC_ASYNC 43
688 /* Query whether DRM_I915_GEM_EXECBUFFER2 supports explicit fence support -
689 * both being able to pass in a sync_file fd to wait upon before executing,
690 * and being able to return a new sync_file fd that is signaled when the
691 * current request is complete. See I915_EXEC_FENCE_IN and I915_EXEC_FENCE_OUT.
693 #define I915_PARAM_HAS_EXEC_FENCE 44
695 /* Query whether DRM_I915_GEM_EXECBUFFER2 supports the ability to capture
696 * user-specified buffers for post-mortem debugging of GPU hangs. See
697 * EXEC_OBJECT_CAPTURE.
699 #define I915_PARAM_HAS_EXEC_CAPTURE 45
701 #define I915_PARAM_SLICE_MASK 46
703 /* Assuming it's uniform for each slice, this queries the mask of subslices
704 * per-slice for this system.
706 #define I915_PARAM_SUBSLICE_MASK 47
709 * Query whether DRM_I915_GEM_EXECBUFFER2 supports supplying the batch buffer
710 * as the first execobject as opposed to the last. See I915_EXEC_BATCH_FIRST.
712 #define I915_PARAM_HAS_EXEC_BATCH_FIRST 48
714 /* Query whether DRM_I915_GEM_EXECBUFFER2 supports supplying an array of
715 * drm_i915_gem_exec_fence structures. See I915_EXEC_FENCE_ARRAY.
717 #define I915_PARAM_HAS_EXEC_FENCE_ARRAY 49
720 * Query whether every context (both per-file default and user created) is
721 * isolated (insofar as HW supports). If this parameter is not true, then
722 * freshly created contexts may inherit values from an existing context,
723 * rather than default HW values. If true, it also ensures (insofar as HW
724 * supports) that all state set by this context will not leak to any other
727 * As not every engine across every gen supports contexts, the returned
728 * value reports the support of context isolation for individual engines by
729 * returning a bitmask of each engine class set to true if that class supports
732 #define I915_PARAM_HAS_CONTEXT_ISOLATION 50
734 /* Frequency of the command streamer timestamps given by the *_TIMESTAMP
735 * registers. This used to be fixed per platform but from CNL onwards, this
736 * might vary depending on the parts.
738 #define I915_PARAM_CS_TIMESTAMP_FREQUENCY 51
741 * Once upon a time we supposed that writes through the GGTT would be
742 * immediately in physical memory (once flushed out of the CPU path). However,
743 * on a few different processors and chipsets, this is not necessarily the case
744 * as the writes appear to be buffered internally. Thus a read of the backing
745 * storage (physical memory) via a different path (with different physical tags
746 * to the indirect write via the GGTT) will see stale values from before
747 * the GGTT write. Inside the kernel, we can for the most part keep track of
748 * the different read/write domains in use (e.g. set-domain), but the assumption
749 * of coherency is baked into the ABI, hence reporting its true state in this
752 * Reports true when writes via mmap_gtt are immediately visible following an
753 * lfence to flush the WCB.
755 * Reports false when writes via mmap_gtt are indeterminately delayed in an
756 * internal buffer and are _not_ immediately visible to third parties accessing
757 * directly via mmap_cpu/mmap_wc. Use of mmap_gtt as part of an IPC
758 * communications channel when reporting false is strongly discouraged.
760 #define I915_PARAM_MMAP_GTT_COHERENT 52
763 * Query whether DRM_I915_GEM_EXECBUFFER2 supports coordination of parallel
764 * execution through use of explicit fence support.
765 * See I915_EXEC_FENCE_OUT and I915_EXEC_FENCE_SUBMIT.
767 #define I915_PARAM_HAS_EXEC_SUBMIT_FENCE 53
770 * Revision of the i915-perf uAPI. The value returned helps determine what
771 * i915-perf features are available. See drm_i915_perf_property_id.
773 #define I915_PARAM_PERF_REVISION 54
775 /* Query whether DRM_I915_GEM_EXECBUFFER2 supports supplying an array of
776 * timeline syncobj through drm_i915_gem_execbuffer_ext_timeline_fences. See
777 * I915_EXEC_USE_EXTENSIONS.
779 #define I915_PARAM_HAS_EXEC_TIMELINE_FENCES 55
781 /* Query if the kernel supports the I915_USERPTR_PROBE flag. */
782 #define I915_PARAM_HAS_USERPTR_PROBE 56
785 * Frequency of the timestamps in OA reports. This used to be the same as the CS
786 * timestamp frequency, but differs on some platforms.
788 #define I915_PARAM_OA_TIMESTAMP_FREQUENCY 57
791 * Query the status of PXP support in i915.
793 * The query can fail in the following scenarios with the listed error codes:
794 * -ENODEV = PXP support is not available on the GPU device or in the
795 * kernel due to missing component drivers or kernel configs.
797 * If the IOCTL is successful, the returned parameter will be set to one of
798 * the following values:
799 * 1 = PXP feature is supported and is ready for use.
800 * 2 = PXP feature is supported but not ready yet; it should be ready soon
801 * (pending initialization of non-i915 system dependencies).
803 * NOTE: When param is supported (positive return values), user space should
804 * still refer to the GEM PXP context-creation UAPI header specs to be
805 * aware of possible failure due to system state machine at the time.
807 #define I915_PARAM_PXP_STATUS 58
810 * Query if kernel allows marking a context to send a Freq hint to SLPC. This
811 * will enable use of the strategies allowed by the SLPC algorithm.
813 #define I915_PARAM_HAS_CONTEXT_FREQ_HINT 59
815 /* Must be kept compact -- no holes and well documented */
818 * struct drm_i915_getparam - Driver parameter query structure.
820 struct drm_i915_getparam {
821 /** @param: Driver parameter to query. */
825 * @value: Address of memory where queried value should be put.
827 * WARNING: Using pointers instead of fixed-size u64 means we need to write
828 * compat32 code. Don't repeat this mistake.
834 * typedef drm_i915_getparam_t - Driver parameter query structure.
835 * See struct drm_i915_getparam.
837 typedef struct drm_i915_getparam drm_i915_getparam_t;
839 /* Ioctl to set kernel params:
841 #define I915_SETPARAM_USE_MI_BATCHBUFFER_START 1
842 #define I915_SETPARAM_TEX_LRU_LOG_GRANULARITY 2
843 #define I915_SETPARAM_ALLOW_BATCHBUFFER 3
844 #define I915_SETPARAM_NUM_USED_FENCES 4
845 /* Must be kept compact -- no holes */
847 typedef struct drm_i915_setparam {
850 } drm_i915_setparam_t;
852 /* A memory manager for regions of shared memory:
854 #define I915_MEM_REGION_AGP 1
856 typedef struct drm_i915_mem_alloc {
860 int __user *region_offset; /* offset from start of fb or agp */
861 } drm_i915_mem_alloc_t;
863 typedef struct drm_i915_mem_free {
866 } drm_i915_mem_free_t;
868 typedef struct drm_i915_mem_init_heap {
872 } drm_i915_mem_init_heap_t;
874 /* Allow memory manager to be torn down and re-initialized (eg on
877 typedef struct drm_i915_mem_destroy_heap {
879 } drm_i915_mem_destroy_heap_t;
881 /* Allow X server to configure which pipes to monitor for vblank signals
883 #define DRM_I915_VBLANK_PIPE_A 1
884 #define DRM_I915_VBLANK_PIPE_B 2
886 typedef struct drm_i915_vblank_pipe {
888 } drm_i915_vblank_pipe_t;
890 /* Schedule buffer swap at given vertical blank:
892 typedef struct drm_i915_vblank_swap {
893 drm_drawable_t drawable;
894 enum drm_vblank_seq_type seqtype;
895 unsigned int sequence;
896 } drm_i915_vblank_swap_t;
898 typedef struct drm_i915_hws_addr {
900 } drm_i915_hws_addr_t;
902 struct drm_i915_gem_init {
904 * Beginning offset in the GTT to be managed by the DRM memory
909 * Ending offset in the GTT to be managed by the DRM memory
915 struct drm_i915_gem_create {
917 * Requested size for the object.
919 * The (page-aligned) allocated size for the object will be returned.
923 * Returned handle for the object.
925 * Object handles are nonzero.
931 struct drm_i915_gem_pread {
932 /** Handle for the object being read. */
935 /** Offset into the object to read from */
937 /** Length of data to read */
940 * Pointer to write the data into.
942 * This is a fixed-size type for 32/64 compatibility.
947 struct drm_i915_gem_pwrite {
948 /** Handle for the object being written to. */
951 /** Offset into the object to write to */
953 /** Length of data to write */
956 * Pointer to read the data from.
958 * This is a fixed-size type for 32/64 compatibility.
963 struct drm_i915_gem_mmap {
964 /** Handle for the object being mapped. */
967 /** Offset in the object to map. */
970 * Length of data to map.
972 * The value will be page-aligned.
976 * Returned pointer the data was mapped at.
978 * This is a fixed-size type for 32/64 compatibility.
983 * Flags for extended behaviour.
985 * Added in version 2.
988 #define I915_MMAP_WC 0x1
991 struct drm_i915_gem_mmap_gtt {
992 /** Handle for the object being mapped. */
996 * Fake offset to use for subsequent mmap call
998 * This is a fixed-size type for 32/64 compatibility.
1004 * struct drm_i915_gem_mmap_offset - Retrieve an offset so we can mmap this buffer object.
1006 * This struct is passed as argument to the `DRM_IOCTL_I915_GEM_MMAP_OFFSET` ioctl,
1007 * and is used to retrieve the fake offset to mmap an object specified by &handle.
1009 * The legacy way of using `DRM_IOCTL_I915_GEM_MMAP` is removed on gen12+.
1010 * `DRM_IOCTL_I915_GEM_MMAP_GTT` is an older supported alias to this struct, but will behave
1011 * as setting the &extensions to 0, and &flags to `I915_MMAP_OFFSET_GTT`.
1013 struct drm_i915_gem_mmap_offset {
1014 /** @handle: Handle for the object being mapped. */
1016 /** @pad: Must be zero */
1019 * @offset: The fake offset to use for subsequent mmap call
1021 * This is a fixed-size type for 32/64 compatibility.
1026 * @flags: Flags for extended behaviour.
1028 * It is mandatory that one of the `MMAP_OFFSET` types
1029 * should be included:
1031 * - `I915_MMAP_OFFSET_GTT`: Use mmap with the object bound to GTT. (Write-Combined)
1032 * - `I915_MMAP_OFFSET_WC`: Use Write-Combined caching.
1033 * - `I915_MMAP_OFFSET_WB`: Use Write-Back caching.
1034 * - `I915_MMAP_OFFSET_FIXED`: Use object placement to determine caching.
1036 * On devices with local memory `I915_MMAP_OFFSET_FIXED` is the only valid
1037 * type. On devices without local memory, this caching mode is invalid.
1039 * As caching mode when specifying `I915_MMAP_OFFSET_FIXED`, WC or WB will
1040 * be used, depending on the object placement on creation. WB will be used
1041 * when the object can only exist in system memory, WC otherwise.
1045 #define I915_MMAP_OFFSET_GTT 0
1046 #define I915_MMAP_OFFSET_WC 1
1047 #define I915_MMAP_OFFSET_WB 2
1048 #define I915_MMAP_OFFSET_UC 3
1049 #define I915_MMAP_OFFSET_FIXED 4
1052 * @extensions: Zero-terminated chain of extensions.
1054 * No current extensions defined; mbz.
1060 * struct drm_i915_gem_set_domain - Adjust the object's write or read domain, in
1061 * preparation for accessing the pages via some CPU domain.
1063 * Specifying a new write or read domain will flush the object out of the
1064 * previous domain (if required), before then updating the object's domain
1065 * tracking with the new domain.
1067 * Note this might involve waiting for the object first if it is still active on
1070 * Supported values for @read_domains and @write_domain:
1072 * - I915_GEM_DOMAIN_WC: Uncached write-combined domain
1073 * - I915_GEM_DOMAIN_CPU: CPU cache domain
1074 * - I915_GEM_DOMAIN_GTT: Mappable aperture domain
1076 * All other domains are rejected.
1078 * Note that for discrete, starting from DG1, this is no longer supported, and
1079 * is instead rejected. On such platforms the CPU domain is effectively static,
1080 * where we also only support a single &drm_i915_gem_mmap_offset cache mode,
1081 * which can't be set explicitly and instead depends on the object placements,
1084 * Implicit caching rules, starting from DG1:
1086 * - If any of the object placements (see &drm_i915_gem_create_ext_memory_regions)
1087 * contain I915_MEMORY_CLASS_DEVICE then the object will be allocated and
1088 * mapped as write-combined only.
1090 * - Everything else is always allocated and mapped as write-back, with the
1091 * guarantee that everything is also coherent with the GPU.
1093 * Note that this is likely to change in the future again, where we might need
1094 * more flexibility on future devices, so making this all explicit as part of a
1095 * new &drm_i915_gem_create_ext extension is probable.
1097 struct drm_i915_gem_set_domain {
1098 /** @handle: Handle for the object. */
1101 /** @read_domains: New read domains. */
1105 * @write_domain: New write domain.
1107 * Note that having something in the write domain implies it's in the
1108 * read domain, and only that read domain.
1113 struct drm_i915_gem_sw_finish {
1114 /** Handle for the object */
1118 struct drm_i915_gem_relocation_entry {
1120 * Handle of the buffer being pointed to by this relocation entry.
1122 * It's appealing to make this be an index into the mm_validate_entry
1123 * list to refer to the buffer, but this allows the driver to create
1124 * a relocation list for state buffers and not re-write it per
1125 * exec using the buffer.
1127 __u32 target_handle;
1130 * Value to be added to the offset of the target buffer to make up
1131 * the relocation entry.
1135 /** Offset in the buffer the relocation entry will be written into */
1139 * Offset value of the target buffer that the relocation entry was last
1142 * If the buffer has the same offset as last time, we can skip syncing
1143 * and writing the relocation. This value is written back out by
1144 * the execbuffer ioctl when the relocation is written.
1146 __u64 presumed_offset;
1149 * Target memory domains read by this operation.
1154 * Target memory domains written by this operation.
1156 * Note that only one domain may be written by the whole
1157 * execbuffer operation, so that where there are conflicts,
1158 * the application will get -EINVAL back.
1164 * Intel memory domains
1166 * Most of these just align with the various caches in
1167 * the system and are used to flush and invalidate as
1168 * objects end up cached in different domains.
1171 #define I915_GEM_DOMAIN_CPU 0x00000001
1172 /** Render cache, used by 2D and 3D drawing */
1173 #define I915_GEM_DOMAIN_RENDER 0x00000002
1174 /** Sampler cache, used by texture engine */
1175 #define I915_GEM_DOMAIN_SAMPLER 0x00000004
1176 /** Command queue, used to load batch buffers */
1177 #define I915_GEM_DOMAIN_COMMAND 0x00000008
1178 /** Instruction cache, used by shader programs */
1179 #define I915_GEM_DOMAIN_INSTRUCTION 0x00000010
1180 /** Vertex address cache */
1181 #define I915_GEM_DOMAIN_VERTEX 0x00000020
1182 /** GTT domain - aperture and scanout */
1183 #define I915_GEM_DOMAIN_GTT 0x00000040
1184 /** WC domain - uncached access */
1185 #define I915_GEM_DOMAIN_WC 0x00000080
1188 struct drm_i915_gem_exec_object {
1190 * User's handle for a buffer to be bound into the GTT for this
1195 /** Number of relocations to be performed on this buffer */
1196 __u32 relocation_count;
1198 * Pointer to array of struct drm_i915_gem_relocation_entry containing
1199 * the relocations to be performed in this buffer.
1203 /** Required alignment in graphics aperture */
1207 * Returned value of the updated offset of the object, for future
1208 * presumed_offset writes.
1213 /* DRM_IOCTL_I915_GEM_EXECBUFFER was removed in Linux 5.13 */
1214 struct drm_i915_gem_execbuffer {
1216 * List of buffers to be validated with their relocations to be
1217 * performed on them.
1219 * This is a pointer to an array of struct drm_i915_gem_validate_entry.
1221 * These buffers must be listed in an order such that all relocations
1222 * a buffer is performing refer to buffers that have already appeared
1223 * in the validate list.
1228 /** Offset in the batchbuffer to start execution from. */
1229 __u32 batch_start_offset;
1230 /** Bytes used in batchbuffer from batch_start_offset */
1234 __u32 num_cliprects;
1235 /** This is a struct drm_clip_rect *cliprects */
1236 __u64 cliprects_ptr;
1239 struct drm_i915_gem_exec_object2 {
1241 * User's handle for a buffer to be bound into the GTT for this
1246 /** Number of relocations to be performed on this buffer */
1247 __u32 relocation_count;
1249 * Pointer to array of struct drm_i915_gem_relocation_entry containing
1250 * the relocations to be performed in this buffer.
1254 /** Required alignment in graphics aperture */
1258 * When the EXEC_OBJECT_PINNED flag is specified this is populated by
1259 * the user with the GTT offset at which this object will be pinned.
1261 * When the I915_EXEC_NO_RELOC flag is specified this must contain the
1262 * presumed_offset of the object.
1264 * During execbuffer2 the kernel populates it with the value of the
1265 * current GTT offset of the object, for future presumed_offset writes.
1267 * See struct drm_i915_gem_create_ext for the rules when dealing with
1268 * alignment restrictions with I915_MEMORY_CLASS_DEVICE, on devices with
1269 * minimum page sizes, like DG2.
1273 #define EXEC_OBJECT_NEEDS_FENCE (1<<0)
1274 #define EXEC_OBJECT_NEEDS_GTT (1<<1)
1275 #define EXEC_OBJECT_WRITE (1<<2)
1276 #define EXEC_OBJECT_SUPPORTS_48B_ADDRESS (1<<3)
1277 #define EXEC_OBJECT_PINNED (1<<4)
1278 #define EXEC_OBJECT_PAD_TO_SIZE (1<<5)
1279 /* The kernel implicitly tracks GPU activity on all GEM objects, and
1280 * synchronises operations with outstanding rendering. This includes
1281 * rendering on other devices if exported via dma-buf. However, sometimes
1282 * this tracking is too coarse and the user knows better. For example,
1283 * if the object is split into non-overlapping ranges shared between different
1284 * clients or engines (i.e. suballocating objects), the implicit tracking
1285 * by kernel assumes that each operation affects the whole object rather
1286 * than an individual range, causing needless synchronisation between clients.
1287 * The kernel will also forgo any CPU cache flushes prior to rendering from
1288 * the object as the client is expected to be also handling such domain
1291 * The kernel maintains the implicit tracking in order to manage resources
1292 * used by the GPU - this flag only disables the synchronisation prior to
1293 * rendering with this object in this execbuf.
1295 * Opting out of implicit synchronisation requires the user to do its own
1296 * explicit tracking to avoid rendering corruption. See, for example,
1297 * I915_PARAM_HAS_EXEC_FENCE to order execbufs and execute them asynchronously.
1299 #define EXEC_OBJECT_ASYNC (1<<6)
1300 /* Request that the contents of this execobject be copied into the error
1301 * state upon a GPU hang involving this batch for post-mortem debugging.
1302 * These buffers are recorded in no particular order as "user" in
1303 * /sys/class/drm/cardN/error. Query I915_PARAM_HAS_EXEC_CAPTURE to see
1304 * if the kernel supports this flag.
1306 #define EXEC_OBJECT_CAPTURE (1<<7)
1307 /* All remaining bits are MBZ and RESERVED FOR FUTURE USE; this mask selects every bit above EXEC_OBJECT_CAPTURE. */
1308 #define __EXEC_OBJECT_UNKNOWN_FLAGS (-(EXEC_OBJECT_CAPTURE<<1))
1319 * struct drm_i915_gem_exec_fence - An input or output fence for the execbuf
1322 * The request will wait for input fence to signal before submission.
1324 * The returned output fence will be signaled after the completion of the
1327 struct drm_i915_gem_exec_fence {
1328 /** @handle: User's handle for a drm_syncobj to wait on or signal. */
1332 * @flags: Supported flags are:
1334 * I915_EXEC_FENCE_WAIT:
1335 * Wait for the input fence before request submission.
1337 * I915_EXEC_FENCE_SIGNAL:
1338 * Return request completion fence as output
1341 #define I915_EXEC_FENCE_WAIT (1<<0)
1342 #define I915_EXEC_FENCE_SIGNAL (1<<1)
1343 #define __I915_EXEC_FENCE_UNKNOWN_FLAGS (-(I915_EXEC_FENCE_SIGNAL << 1))
1347 * struct drm_i915_gem_execbuffer_ext_timeline_fences - Timeline fences
1348 * for execbuf ioctl.
1350 * This structure describes an array of drm_syncobj and associated points for
1351 * timeline variants of drm_syncobj. It is invalid to append this structure to
1352 * the execbuf if I915_EXEC_FENCE_ARRAY is set.
1354 struct drm_i915_gem_execbuffer_ext_timeline_fences {
1355 #define DRM_I915_GEM_EXECBUFFER_EXT_TIMELINE_FENCES 0
1356 /** @base: Extension link. See struct i915_user_extension. */
1357 struct i915_user_extension base;
1360 * @fence_count: Number of elements in the @handles_ptr & @values_ptr
1366 * @handles_ptr: Pointer to an array of struct drm_i915_gem_exec_fence
1367 * of length @fence_count.
1372 * @values_ptr: Pointer to an array of u64 values of length
1374 * Values must be 0 for a binary drm_syncobj. A Value of 0 for a
1375 * timeline drm_syncobj is invalid as it turns a drm_syncobj into a
1382 * struct drm_i915_gem_execbuffer2 - Structure for DRM_I915_GEM_EXECBUFFER2
1385 struct drm_i915_gem_execbuffer2 {
1386 /** @buffers_ptr: Pointer to a list of gem_exec_object2 structs */
1389 /** @buffer_count: Number of elements in @buffers_ptr array */
1393 * @batch_start_offset: Offset in the batchbuffer to start execution
1396 __u32 batch_start_offset;
1399 * @batch_len: Length in bytes of the batch buffer, starting from the
1400 * @batch_start_offset. If 0, length is assumed to be the batch buffer
1405 /** @DR1: deprecated */
1408 /** @DR4: deprecated */
1411 /** @num_cliprects: See @cliprects_ptr */
1412 __u32 num_cliprects;
1415 * @cliprects_ptr: Kernel clipping was a DRI1 misfeature.
1417 * It is invalid to use this field if I915_EXEC_FENCE_ARRAY or
1418 * I915_EXEC_USE_EXTENSIONS flags are not set.
1420 * If I915_EXEC_FENCE_ARRAY is set, then this is a pointer to an array
1421 * of &drm_i915_gem_exec_fence and @num_cliprects is the length of the
1424 * If I915_EXEC_USE_EXTENSIONS is set, then this is a pointer to a
1425 * single &i915_user_extension and num_cliprects is 0.
1427 __u64 cliprects_ptr;
1429 /** @flags: Execbuf flags */
1431 #define I915_EXEC_RING_MASK (0x3f)
1432 #define I915_EXEC_DEFAULT (0<<0)
1433 #define I915_EXEC_RENDER (1<<0)
1434 #define I915_EXEC_BSD (2<<0)
1435 #define I915_EXEC_BLT (3<<0)
1436 #define I915_EXEC_VEBOX (4<<0)
1438 /* Used for switching the constants addressing mode on gen4+ RENDER ring.
1439 * Gen6+ only supports relative addressing to dynamic state (default) and
1440 * absolute addressing.
1442 * These flags are ignored for the BSD and BLT rings.
1444 #define I915_EXEC_CONSTANTS_MASK (3<<6)
1445 #define I915_EXEC_CONSTANTS_REL_GENERAL (0<<6) /* default */
1446 #define I915_EXEC_CONSTANTS_ABSOLUTE (1<<6)
1447 #define I915_EXEC_CONSTANTS_REL_SURFACE (2<<6) /* gen4/5 only */
1449 /** Resets the SO write offset registers for transform feedback on gen7. */
1450 #define I915_EXEC_GEN7_SOL_RESET (1<<8)
1452 /** Request a privileged ("secure") batch buffer. Note only available for
1453 * DRM_ROOT_ONLY | DRM_MASTER processes.
1455 #define I915_EXEC_SECURE (1<<9)
1457 /** Inform the kernel that the batch is and will always be pinned. This
1458 * negates the requirement for a workaround to be performed to avoid
1459 * an incoherent CS (such as can be found on 830/845). If this flag is
1460 * not passed, the kernel will endeavour to make sure the batch is
1461 * coherent with the CS before execution. If this flag is passed,
1462 * userspace assumes the responsibility for ensuring the same.
1464 #define I915_EXEC_IS_PINNED (1<<10)
1466 /** Provide a hint to the kernel that the command stream and auxiliary
1467 * state buffers already hold the correct presumed addresses and so the
1468 * relocation process may be skipped if no buffers need to be moved in
1469 * preparation for the execbuffer.
1471 #define I915_EXEC_NO_RELOC (1<<11)
1473 /** Use the reloc.handle as an index into the exec object array rather
1474 * than as the per-file handle.
1476 #define I915_EXEC_HANDLE_LUT (1<<12)
1478 /** Used for switching BSD rings on the platforms with two BSD rings */
1479 #define I915_EXEC_BSD_SHIFT (13)
1480 #define I915_EXEC_BSD_MASK (3 << I915_EXEC_BSD_SHIFT)
1481 /* default ping-pong mode */
1482 #define I915_EXEC_BSD_DEFAULT (0 << I915_EXEC_BSD_SHIFT)
1483 #define I915_EXEC_BSD_RING1 (1 << I915_EXEC_BSD_SHIFT)
1484 #define I915_EXEC_BSD_RING2 (2 << I915_EXEC_BSD_SHIFT)
1486 /** Tell the kernel that the batchbuffer is processed by
1487 * the resource streamer.
1489 #define I915_EXEC_RESOURCE_STREAMER (1<<15)
1491 /* Setting I915_EXEC_FENCE_IN implies that lower_32_bits(rsvd2) represent
1492 * a sync_file fd to wait upon (in a nonblocking manner) prior to executing
1495 * Returns -EINVAL if the sync_file fd cannot be found.
1497 #define I915_EXEC_FENCE_IN (1<<16)
1499 /* Setting I915_EXEC_FENCE_OUT causes the ioctl to return a sync_file fd
1500 * in the upper_32_bits(rsvd2) upon success. Ownership of the fd is given
1501 * to the caller, and it should be closed with close() after use. (The fd is a regular
1502 * file descriptor and will be cleaned up on process termination. It holds
1503 * a reference to the request, but nothing else.)
1505 * The sync_file fd can be combined with other sync_file and passed either
1506 * to execbuf using I915_EXEC_FENCE_IN, to atomic KMS ioctls (so that a flip
1507 * will only occur after this request completes), or to other devices.
1509 * Using I915_EXEC_FENCE_OUT requires use of
1510 * DRM_IOCTL_I915_GEM_EXECBUFFER2_WR ioctl so that the result is written
1511 * back to userspace. Failure to do so will cause the out-fence to always
1512 * be reported as zero, and the real fence fd to be leaked.
1514 #define I915_EXEC_FENCE_OUT (1<<17)
1517 * Traditionally the execbuf ioctl has only considered the final element in
1518 * the execobject[] to be the executable batch. Often though, the client
1519 * will know the batch object prior to construction and being able to place
1520 * it into the execobject[] array first can simplify the relocation tracking.
1521 * Setting I915_EXEC_BATCH_FIRST tells execbuf to use element 0 of the
1522 * execobject[] as the batch instead (the default is to use the last
1525 #define I915_EXEC_BATCH_FIRST (1<<18)
1527 /* Setting I915_EXEC_FENCE_ARRAY implies that num_cliprects and cliprects_ptr
1528 * define an array of drm_i915_gem_exec_fence structures which specify a set of
1529 * dma fences to wait upon or signal.
1531 #define I915_EXEC_FENCE_ARRAY (1<<19)
1534 * Setting I915_EXEC_FENCE_SUBMIT implies that lower_32_bits(rsvd2) represent
1535 * a sync_file fd to wait upon (in a nonblocking manner) prior to executing
1538 * Returns -EINVAL if the sync_file fd cannot be found.
1540 #define I915_EXEC_FENCE_SUBMIT (1 << 20)
1543 * Setting I915_EXEC_USE_EXTENSIONS implies that
1544 * drm_i915_gem_execbuffer2.cliprects_ptr is treated as a pointer to a linked
1545 * list of i915_user_extension. Each i915_user_extension node is the base of a
1546 * larger structure. The list of supported structures are listed in the
1547 * drm_i915_gem_execbuffer_ext enum.
1549 #define I915_EXEC_USE_EXTENSIONS (1 << 21)
1550 #define __I915_EXEC_UNKNOWN_FLAGS (-(I915_EXEC_USE_EXTENSIONS << 1))
1552 /** @rsvd1: Context id */
1556 * @rsvd2: in and out sync_file file descriptors.
1558 * When I915_EXEC_FENCE_IN or I915_EXEC_FENCE_SUBMIT flag is set, the
1559 * lower 32 bits of this field will have the in sync_file fd (input).
1561 * When I915_EXEC_FENCE_OUT flag is set, the upper 32 bits of this
1562 * field will have the out sync_file fd (output).
1567 #define I915_EXEC_CONTEXT_ID_MASK (0xffffffff)
1568 #define i915_execbuffer2_set_context_id(eb2, context) \
1569 (eb2).rsvd1 = (context) & I915_EXEC_CONTEXT_ID_MASK /* (context) is parenthesised so the mask applies to the whole argument expression */
1570 #define i915_execbuffer2_get_context_id(eb2) \
1571 ((eb2).rsvd1 & I915_EXEC_CONTEXT_ID_MASK)
1573 struct drm_i915_gem_pin {
1574 /** Handle of the buffer to be pinned. */
1578 /** alignment required within the aperture */
1581 /** Returned GTT offset of the buffer. */
1585 struct drm_i915_gem_unpin {
1586 /** Handle of the buffer to be unpinned. */
1591 struct drm_i915_gem_busy {
1592 /** Handle of the buffer to check for busy */
1595 /** Return busy status
1597 * A return of 0 implies that the object is idle (after
1598 * having flushed any pending activity), and a non-zero return that
1599 * the object is still in-flight on the GPU. (The GPU has not yet
1600 * signaled completion for all pending requests that reference the
1601 * object.) An object is guaranteed to become idle eventually (so
1602 * long as no new GPU commands are executed upon it). Due to the
1603 * asynchronous nature of the hardware, an object reported
1604 * as busy may become idle before the ioctl is completed.
1606 * Furthermore, if the object is busy, which engine is busy is only
1607 * provided as a guide and only indirectly by reporting its class
1608 * (there may be more than one engine in each class). There are race
1609 * conditions which prevent the report of which engines are busy from
1610 * being always accurate. However, the converse is not true. If the
1611 * object is idle, the result of the ioctl, that all engines are idle,
1614 * The returned dword is split into two fields to indicate both
1615 * the engine classes on which the object is being read, and the
1616 * engine class on which it is currently being written (if any).
1618 * The low word (bits 0:15) indicates if the object is being written
1619 * to by any engine (there can only be one, as the GEM implicit
1620 * synchronisation rules force writes to be serialised). Only the
1621 * engine class (offset by 1, I915_ENGINE_CLASS_RENDER is reported as
1622 * 1 not 0 etc) for the last write is reported.
1624 * The high word (bits 16:31) is a bitmask of which engine classes
1625 * are currently reading from the object. Multiple engines may be
1626 * reading from the object simultaneously.
1628 * The value of each engine class is the same as specified in the
1629 * I915_CONTEXT_PARAM_ENGINES context parameter and via perf, i.e.
1630 * I915_ENGINE_CLASS_RENDER, I915_ENGINE_CLASS_COPY, etc.
1631 * Some hardware may have parallel execution engines, e.g. multiple
1632 * media engines, which are mapped to the same class identifier and so
1633 * are not separately reported for busyness.
1636 * Only the boolean result of this query is reliable; that is whether
1637 * the object is idle or busy. The report of which engines are busy
1638 * should be only used as a heuristic.
1644 * struct drm_i915_gem_caching - Set or get the caching for given object
1647 * Allow userspace to control the GTT caching bits for a given object when the
1648 * object is later mapped through the ppGTT(or GGTT on older platforms lacking
1649 * ppGTT support, or if the object is used for scanout). Note that this might
1650 * require unbinding the object from the GTT first, if its current caching value
1653 * Note that this all changes on discrete platforms, starting from DG1, the
1654 * set/get caching is no longer supported, and is now rejected. Instead the CPU
1655 * caching attributes(WB vs WC) will become an immutable creation time property
1656 * for the object, along with the GTT caching level. For now we don't expose any
1657 * new uAPI for this, instead on DG1 this is all implicit, although this largely
1658 * shouldn't matter since DG1 is coherent by default(without any way of
1661 * Implicit caching rules, starting from DG1:
1663 * - If any of the object placements (see &drm_i915_gem_create_ext_memory_regions)
1664 * contain I915_MEMORY_CLASS_DEVICE then the object will be allocated and
1665 * mapped as write-combined only.
1667 * - Everything else is always allocated and mapped as write-back, with the
1668 * guarantee that everything is also coherent with the GPU.
1670 * Note that this is likely to change in the future again, where we might need
1671 * more flexibility on future devices, so making this all explicit as part of a
1672 * new &drm_i915_gem_create_ext extension is probable.
1674 * Side note: Part of the reason for this is that changing the at-allocation-time CPU
1675 * caching attributes for the pages might be required(and is expensive) if we
1676 * need to then CPU map the pages later with different caching attributes. This
1677 * inconsistent caching behaviour, while supported on x86, is not universally
1678 * supported on other architectures. So for simplicity we opt for setting
1679 * everything at creation time, whilst also making it immutable, on discrete
1682 struct drm_i915_gem_caching {
1684 * @handle: Handle of the buffer to set/get the caching level.
1689 * @caching: The GTT caching level to apply or possible return value.
1691 * The supported @caching values:
1693 * I915_CACHING_NONE:
1695 * GPU access is not coherent with CPU caches. Default for machines
1696 * without an LLC. This means manual flushing might be needed, if we
1697 * want GPU access to be coherent.
1699 * I915_CACHING_CACHED:
1701 * GPU access is coherent with CPU caches and furthermore the data is
1702 * cached in last-level caches shared between CPU cores and the GPU GT.
1704 * I915_CACHING_DISPLAY:
1706 * Special GPU caching mode which is coherent with the scanout engines.
1707 * Transparently falls back to I915_CACHING_NONE on platforms where no
1708 * special cache mode (like write-through or gfdt flushing) is
1709 * available. The kernel automatically sets this mode when using a
1710 * buffer as a scanout target. Userspace can manually set this mode to
1711 * avoid a costly stall and clflush in the hotpath of drawing the first
1714 #define I915_CACHING_NONE 0
1715 #define I915_CACHING_CACHED 1
1716 #define I915_CACHING_DISPLAY 2
1720 #define I915_TILING_NONE 0
1721 #define I915_TILING_X 1
1722 #define I915_TILING_Y 2
1724 * Do not add new tiling types here. The I915_TILING_* values are for
1725 * de-tiling fence registers that no longer exist on modern platforms. Although
1726 * the hardware may support new types of tiling in general (e.g., Tile4), we
1727 * do not need to add them to the uapi that is specific to now-defunct ioctls.
1729 #define I915_TILING_LAST I915_TILING_Y
1731 #define I915_BIT_6_SWIZZLE_NONE 0
1732 #define I915_BIT_6_SWIZZLE_9 1
1733 #define I915_BIT_6_SWIZZLE_9_10 2
1734 #define I915_BIT_6_SWIZZLE_9_11 3
1735 #define I915_BIT_6_SWIZZLE_9_10_11 4
1736 /* Not seen by userland */
1737 #define I915_BIT_6_SWIZZLE_UNKNOWN 5
1738 /* Seen by userland. */
1739 #define I915_BIT_6_SWIZZLE_9_17 6
1740 #define I915_BIT_6_SWIZZLE_9_10_17 7
1742 struct drm_i915_gem_set_tiling {
1743 /** Handle of the buffer to have its tiling state updated */
1747 * Tiling mode for the object (I915_TILING_NONE, I915_TILING_X,
1750 * This value is to be set on request, and will be updated by the
1751 * kernel on successful return with the actual chosen tiling layout.
1753 * The tiling mode may be demoted to I915_TILING_NONE when the system
1754 * has bit 6 swizzling that can't be managed correctly by GEM.
1756 * Buffer contents become undefined when changing tiling_mode.
1761 * Stride in bytes for the object when in I915_TILING_X or
1767 * Returned address bit 6 swizzling required for CPU access through
1773 struct drm_i915_gem_get_tiling {
1774 /** Handle of the buffer to get tiling state for. */
1778 * Current tiling mode for the object (I915_TILING_NONE, I915_TILING_X,
1784 * Returned address bit 6 swizzling required for CPU access through
1790 * Returned address bit 6 swizzling required for CPU access through
1791 * mmap mapping whilst bound.
1793 __u32 phys_swizzle_mode;
1796 struct drm_i915_gem_get_aperture {
1797 /** Total size of the aperture used by i915_gem_execbuffer, in bytes */
1801 * Available space in the aperture used by i915_gem_execbuffer, in
1804 __u64 aper_available_size;
1807 struct drm_i915_get_pipe_from_crtc_id {
1808 /** ID of CRTC being requested **/
1811 /** pipe of requested CRTC **/
1815 #define I915_MADV_WILLNEED 0
1816 #define I915_MADV_DONTNEED 1
1817 #define __I915_MADV_PURGED 2 /* internal state */
1819 struct drm_i915_gem_madvise {
1820 /** Handle of the buffer to change the backing store advice */
1823 /* Advice: either the buffer will be needed again in the near future,
1824 * or won't be and could be discarded under memory pressure.
1828 /** Whether the backing store still exists. */
1833 #define I915_OVERLAY_TYPE_MASK 0xff
1834 #define I915_OVERLAY_YUV_PLANAR 0x01
1835 #define I915_OVERLAY_YUV_PACKED 0x02
1836 #define I915_OVERLAY_RGB 0x03
1838 #define I915_OVERLAY_DEPTH_MASK 0xff00
1839 #define I915_OVERLAY_RGB24 0x1000
1840 #define I915_OVERLAY_RGB16 0x2000
1841 #define I915_OVERLAY_RGB15 0x3000
1842 #define I915_OVERLAY_YUV422 0x0100
1843 #define I915_OVERLAY_YUV411 0x0200
1844 #define I915_OVERLAY_YUV420 0x0300
1845 #define I915_OVERLAY_YUV410 0x0400
1847 #define I915_OVERLAY_SWAP_MASK 0xff0000
1848 #define I915_OVERLAY_NO_SWAP 0x000000
1849 #define I915_OVERLAY_UV_SWAP 0x010000
1850 #define I915_OVERLAY_Y_SWAP 0x020000
1851 #define I915_OVERLAY_Y_AND_UV_SWAP 0x030000
1853 #define I915_OVERLAY_FLAGS_MASK 0xff000000
1854 #define I915_OVERLAY_ENABLE 0x01000000
1856 struct drm_intel_overlay_put_image {
1857 /* various flags and src format description */
1859 /* source picture description */
1861 /* stride values and offsets are in bytes, buffer relative */
1862 __u16 stride_Y; /* stride for packed formats */
1864 __u32 offset_Y; /* offset for packed formats */
1870 /* to compensate the scaling factors for partially covered surfaces */
1871 __u16 src_scan_width;
1872 __u16 src_scan_height;
1873 /* output crtc description */
1882 #define I915_OVERLAY_UPDATE_ATTRS (1<<0)
1883 #define I915_OVERLAY_UPDATE_GAMMA (1<<1)
1884 #define I915_OVERLAY_DISABLE_DEST_COLORKEY (1<<2)
1885 struct drm_intel_overlay_attrs {
1900 * Intel sprite handling
1902 * Color keying works with a min/mask/max tuple. Both source and destination
1903 * color keying is allowed.
1906 * Sprite pixels within the min & max values, masked against the color channels
1907 * specified in the mask field, will be transparent. All other pixels will
1908 * be displayed on top of the primary plane. For RGB surfaces, only the min
1909 * and mask fields will be used; ranged compares are not allowed.
1911 * Destination keying:
1912 * Primary plane pixels that match the min value, masked against the color
1913 * channels specified in the mask field, will be replaced by corresponding
1914 * pixels from the sprite plane.
1916 * Note that source & destination keying are exclusive; only one can be
1917 * active on a given plane.
1920 #define I915_SET_COLORKEY_NONE (1<<0) /* Deprecated. Instead set
1921 * flags==0 to disable colorkeying.
1923 #define I915_SET_COLORKEY_DESTINATION (1<<1)
1924 #define I915_SET_COLORKEY_SOURCE (1<<2)
1925 struct drm_intel_sprite_colorkey {
1933 struct drm_i915_gem_wait {
1934 /** Handle of BO we shall wait on */
1937 /** Number of nanoseconds to wait, Returns time remaining. */
1941 struct drm_i915_gem_context_create {
1942 __u32 ctx_id; /* output: id of the new context */
1947 * struct drm_i915_gem_context_create_ext - Structure for creating contexts.
1949 struct drm_i915_gem_context_create_ext {
1950 /** @ctx_id: Id of the created context (output) */
1954 * @flags: Supported flags are:
1956 * I915_CONTEXT_CREATE_FLAGS_USE_EXTENSIONS:
1958 * Extensions may be appended to this structure and driver must check
1959 * for those. See @extensions.
1961 * I915_CONTEXT_CREATE_FLAGS_SINGLE_TIMELINE
1963 * Created context will have single timeline.
1966 #define I915_CONTEXT_CREATE_FLAGS_USE_EXTENSIONS (1u << 0)
1967 #define I915_CONTEXT_CREATE_FLAGS_SINGLE_TIMELINE (1u << 1)
1968 #define I915_CONTEXT_CREATE_FLAGS_UNKNOWN \
1969 (-(I915_CONTEXT_CREATE_FLAGS_SINGLE_TIMELINE << 1))
1972 * @extensions: Zero-terminated chain of extensions.
1974 * I915_CONTEXT_CREATE_EXT_SETPARAM:
1975 * Context parameter to set or query during context creation.
1976 * See struct drm_i915_gem_context_create_ext_setparam.
1978 * I915_CONTEXT_CREATE_EXT_CLONE:
1979 * This extension has been removed. On the off chance someone somewhere
1980 * has attempted to use it, never re-use this extension number.
1983 #define I915_CONTEXT_CREATE_EXT_SETPARAM 0
1984 #define I915_CONTEXT_CREATE_EXT_CLONE 1
1988 * struct drm_i915_gem_context_param - Context parameter to set or query.
1990 struct drm_i915_gem_context_param {
1991 /** @ctx_id: Context id */
1994 /** @size: Size of the parameter @value */
1997 /** @param: Parameter to set or query */
1999 #define I915_CONTEXT_PARAM_BAN_PERIOD 0x1
2000 /* I915_CONTEXT_PARAM_NO_ZEROMAP has been removed. On the off chance
2001 * someone somewhere has attempted to use it, never re-use this context
2004 #define I915_CONTEXT_PARAM_NO_ZEROMAP 0x2
2005 #define I915_CONTEXT_PARAM_GTT_SIZE 0x3
2006 #define I915_CONTEXT_PARAM_NO_ERROR_CAPTURE 0x4
2007 #define I915_CONTEXT_PARAM_BANNABLE 0x5
2008 #define I915_CONTEXT_PARAM_PRIORITY 0x6
2009 #define I915_CONTEXT_MAX_USER_PRIORITY 1023 /* inclusive */
2010 #define I915_CONTEXT_DEFAULT_PRIORITY 0
2011 #define I915_CONTEXT_MIN_USER_PRIORITY -1023 /* inclusive */
2013 * When using the following param, value should be a pointer to
2014 * drm_i915_gem_context_param_sseu.
2016 #define I915_CONTEXT_PARAM_SSEU 0x7
2019 * Not all clients may want to attempt automatic recovery of a context after
2020 * a hang (for example, some clients may only submit very small incremental
2021 * batches relying on known logical state of previous batches which will never
2022 * recover correctly and each attempt will hang), and so would prefer that
2023 * the context is forever banned instead.
2025 * If set to false (0), after a reset, subsequent (and in flight) rendering
2026 * from this context is discarded, and the client will need to create a new
2027 * context to use instead.
2029 * If set to true (1), the kernel will automatically attempt to recover the
2030 * context by skipping the hanging batch and executing the next batch starting
2031 * from the default context state (discarding the incomplete logical context
2032 * state lost due to the reset).
2034 * On creation, all new contexts are marked as recoverable.
2036 #define I915_CONTEXT_PARAM_RECOVERABLE 0x8
2039 * The id of the associated virtual memory address space (ppGTT) of
2040 * this context. Can be retrieved and passed to another context
2041 * (on the same fd) for both to use the same ppGTT and so share
2042 * address layouts, and avoid reloading the page tables on context
2043 * switches between themselves.
2045 * See DRM_I915_GEM_VM_CREATE and DRM_I915_GEM_VM_DESTROY.
2047 #define I915_CONTEXT_PARAM_VM 0x9
2050 * I915_CONTEXT_PARAM_ENGINES:
2052 * Bind this context to operate on this subset of available engines. Henceforth,
2053 * the I915_EXEC_RING selector for DRM_IOCTL_I915_GEM_EXECBUFFER2 operates as
2054 * an index into this array of engines; I915_EXEC_DEFAULT selecting engine[0]
2055 * and upwards. Slots 0...N are filled in using the specified (class, instance).
2057 * engine_class: I915_ENGINE_CLASS_INVALID,
2058 * engine_instance: I915_ENGINE_CLASS_INVALID_NONE
2059 * to specify a gap in the array that can be filled in later, e.g. by a
2060 * virtual engine used for load balancing.
2062 * Setting the number of engines bound to the context to 0, by passing a zero
2063 * sized argument, will revert back to default settings.
2065 * See struct i915_context_param_engines.
2068 * i915_context_engines_load_balance (I915_CONTEXT_ENGINES_EXT_LOAD_BALANCE)
2069 * i915_context_engines_bond (I915_CONTEXT_ENGINES_EXT_BOND)
2070 * i915_context_engines_parallel_submit (I915_CONTEXT_ENGINES_EXT_PARALLEL_SUBMIT)
2072 #define I915_CONTEXT_PARAM_ENGINES 0xa
2075 * I915_CONTEXT_PARAM_PERSISTENCE:
2077 * Allow the context and active rendering to survive the process until
2078 * completion. Persistence allows fire-and-forget clients to queue up a
2079 * bunch of work, hand the output over to a display server and then quit.
2080 * If the context is marked as not persistent, upon closing (either via
2081 * an explicit DRM_I915_GEM_CONTEXT_DESTROY or implicitly from file closure
2082 * or process termination), the context and any outstanding requests will be
2083 * cancelled (and exported fences for cancelled requests marked as -EIO).
2085 * By default, new contexts allow persistence.
2087 #define I915_CONTEXT_PARAM_PERSISTENCE 0xb
2089 /* This API has been removed. On the off chance someone somewhere has
2090 * attempted to use it, never re-use this context param number.
2092 #define I915_CONTEXT_PARAM_RINGSIZE 0xc
2095 * I915_CONTEXT_PARAM_PROTECTED_CONTENT:
2097 * Mark that the context makes use of protected content, which will result
2098 * in the context being invalidated when the protected content session is.
2099 * Given that the protected content session is killed on suspend, the device
2100 * is kept awake for the lifetime of a protected context, so the user should
2101 * make sure to dispose of them once done.
2102 * This flag can only be set at context creation time and, when set to true,
2103 * must be preceded by an explicit setting of I915_CONTEXT_PARAM_RECOVERABLE
2104 * to false. This flag can't be set to true in conjunction with setting the
2105 * I915_CONTEXT_PARAM_BANNABLE flag to false. Creation example:
2109 * struct drm_i915_gem_context_create_ext_setparam p_protected = {
2111 * .name = I915_CONTEXT_CREATE_EXT_SETPARAM,
2114 * .param = I915_CONTEXT_PARAM_PROTECTED_CONTENT,
2118 * struct drm_i915_gem_context_create_ext_setparam p_norecover = {
2120 * .name = I915_CONTEXT_CREATE_EXT_SETPARAM,
2121 * .next_extension = to_user_pointer(&p_protected),
2124 * .param = I915_CONTEXT_PARAM_RECOVERABLE,
2128 * struct drm_i915_gem_context_create_ext create = {
2129 * .flags = I915_CONTEXT_CREATE_FLAGS_USE_EXTENSIONS,
2130 * .extensions = to_user_pointer(&p_norecover),
2133 * ctx_id = gem_context_create_ext(drm_fd, &create);
2135 * In addition to the normal failure cases, setting this flag during context
2136 * creation can result in the following errors:
2138 * -ENODEV: feature not available
2139 * -EPERM: trying to mark a recoverable or not bannable context as protected
2140 * -ENXIO: A dependency such as a component driver or firmware is not yet
2141 * loaded so user space may need to attempt again. Depending on the
2142 * device, this error may be reported if protected context creation is
2143 * attempted very early after kernel start because the internal timeout
2144 * waiting for such dependencies is not guaranteed to be larger than
2145 * required (numbers differ depending on system and kernel config):
2146 * - ADL/RPL: dependencies may take up to 3 seconds from kernel start
2147 * while context creation internal timeout is 250 milliseconds
2148 * - MTL: dependencies may take up to 8 seconds from kernel start
2149 * while context creation internal timeout is 250 milliseconds
2150 * NOTE: such dependencies happen once, so a subsequent call to create a
2151 * protected context after a prior successful call will not experience
2152 * such timeouts and will not return -ENXIO (unless the driver is reloaded,
2153 * or, depending on the device, resumes from a suspended state).
2154 * -EIO: The firmware did not succeed in creating the protected context.
2156 #define I915_CONTEXT_PARAM_PROTECTED_CONTENT 0xd
2159 * I915_CONTEXT_PARAM_LOW_LATENCY:
2161 * Mark this context as a low latency workload which requires aggressive GT
2162 * frequency scaling. Use I915_PARAM_HAS_CONTEXT_FREQ_HINT to check if the kernel
2163 * supports this per context flag.
2165 #define I915_CONTEXT_PARAM_LOW_LATENCY 0xe
2168 * I915_CONTEXT_PARAM_CONTEXT_IMAGE:
2170 * Allows userspace to provide own context images.
2172 * Note that this is a debug API not available on production kernel builds.
2174 #define I915_CONTEXT_PARAM_CONTEXT_IMAGE 0xf
2175 /* Must be kept compact -- no holes and well documented */
2177 /** @value: Context parameter value to be set or queried */
2182 * Context SSEU programming
2184 * It may be necessary for either functional or performance reason to configure
2185 * a context to run with a reduced number of SSEU (where SSEU stands for Slice/
2188 * This is done by configuring SSEU configuration using the below
2189 * @struct drm_i915_gem_context_param_sseu for every supported engine which
2190 * userspace intends to use.
2192 * Not all GPUs or engines support this functionality in which case an error
2193 * code -ENODEV will be returned.
2195 * Also, flexibility of possible SSEU configuration permutations varies between
2196 * GPU generations and software imposed limitations. Requesting an unsupported
2197 * combination will return an error code of -EINVAL.
2199 * NOTE: When perf/OA is active the context's SSEU configuration is ignored in
2200 * favour of a single global setting.
2202 struct drm_i915_gem_context_param_sseu {
2204 * Engine class & instance to be configured or queried.
2206 struct i915_engine_class_instance engine;
2209 * Unknown flags must be cleared to zero.
2212 #define I915_CONTEXT_SSEU_FLAG_ENGINE_INDEX (1u << 0)
2215 * Mask of slices to enable for the context. Valid values are a subset
2216 * of the bitmask value returned for I915_PARAM_SLICE_MASK.
2221 * Mask of subslices to enable for the context. Valid values are a
2222 * subset of the bitmask value returned by I915_PARAM_SUBSLICE_MASK.
2224 __u64 subslice_mask;
2227 * Minimum/Maximum number of EUs to enable per subslice for the
2228 * context. min_eus_per_subslice must be less than or equal to
2229 * max_eus_per_subslice.
2231 __u16 min_eus_per_subslice;
2232 __u16 max_eus_per_subslice;
2235 * Unused for now. Must be cleared to zero.
2241 * DOC: Virtual Engine uAPI
2243 * Virtual engine is a concept where userspace is able to configure a set of
2244 * physical engines, submit a batch buffer, and let the driver execute it on any
2245 * engine from the set as it sees fit.
2247 * This is primarily useful on parts which have multiple instances of the same
2248 * engine class, for example GT3+ Skylake parts with their two VCS engines.
2250 * For instance userspace can enumerate all engines of a certain class using the
2251 * previously described `Engine Discovery uAPI`_. After that userspace can
2252 * create a GEM context with a placeholder slot for the virtual engine (using
2253 * `I915_ENGINE_CLASS_INVALID` and `I915_ENGINE_CLASS_INVALID_NONE` for class
2254 * and instance respectively) and finally using the
2255 * `I915_CONTEXT_ENGINES_EXT_LOAD_BALANCE` extension place a virtual engine in
2256 * the same reserved slot.
2258 * Example of creating a virtual engine and submitting a batch buffer to it:
2262 * I915_DEFINE_CONTEXT_ENGINES_LOAD_BALANCE(virtual, 2) = {
2263 * .base.name = I915_CONTEXT_ENGINES_EXT_LOAD_BALANCE,
2264 * .engine_index = 0, // Place this virtual engine into engine map slot 0
2265 * .num_siblings = 2,
2266 * .engines = { { I915_ENGINE_CLASS_VIDEO, 0 },
2267 * { I915_ENGINE_CLASS_VIDEO, 1 }, },
2269 * I915_DEFINE_CONTEXT_PARAM_ENGINES(engines, 1) = {
2270 * .engines = { { I915_ENGINE_CLASS_INVALID,
2271 * I915_ENGINE_CLASS_INVALID_NONE } },
2272 * .extensions = to_user_pointer(&virtual), // Chains after load_balance extension
2274 * struct drm_i915_gem_context_create_ext_setparam p_engines = {
2276 * .name = I915_CONTEXT_CREATE_EXT_SETPARAM,
2279 * .param = I915_CONTEXT_PARAM_ENGINES,
2280 * .value = to_user_pointer(&engines),
2281 * .size = sizeof(engines),
2284 * struct drm_i915_gem_context_create_ext create = {
2285 * .flags = I915_CONTEXT_CREATE_FLAGS_USE_EXTENSIONS,
2286 * .extensions = to_user_pointer(&p_engines),
2289 * ctx_id = gem_context_create_ext(drm_fd, &create);
2291 * // Now we have created a GEM context with its engine map containing a
2292 * // single virtual engine. Submissions to this slot can go either to
2293 * // vcs0 or vcs1, depending on the load balancing algorithm used inside
2294 * // the driver. The load balancing is dynamic from one batch buffer to
2295 * // another and transparent to userspace.
2298 * execbuf.rsvd1 = ctx_id;
2299 * execbuf.flags = 0; // Submits to index 0 which is the virtual engine
2300 * gem_execbuf(drm_fd, &execbuf);
2304 * i915_context_engines_load_balance:
2306 * Enable load balancing across this set of engines.
2308 * Into the I915_EXEC_DEFAULT slot [0], a virtual engine is created that when
2309 * used will proxy the execbuffer request onto one of the set of engines
2310 * in such a way as to distribute the load evenly across the set.
2312 * The set of engines must be compatible (e.g. the same HW class) as they
2313 * will share the same logical GPU context and ring.
2315 * To intermix rendering with the virtual engine and direct rendering onto
2316 * the backing engines (bypassing the load balancing proxy), the context must
2317 * be defined to use a single timeline for all engines.
2319 struct i915_context_engines_load_balance {
2320 struct i915_user_extension base;
2324 __u32 flags; /* all undefined flags must be zero */
2326 __u64 mbz64; /* reserved for future use; must be zero */
2328 struct i915_engine_class_instance engines[];
2329 } __attribute__((packed));
2331 #define I915_DEFINE_CONTEXT_ENGINES_LOAD_BALANCE(name__, N__) struct { \
2332 struct i915_user_extension base; \
2333 __u16 engine_index; \
2334 __u16 num_siblings; \
2337 struct i915_engine_class_instance engines[N__]; \
2338 } __attribute__((packed)) name__
2341 * i915_context_engines_bond:
2343 * Construct bonded pairs for execution within a virtual engine.
2345 * All engines are equal, but some are more equal than others. Given
2346 * the distribution of resources in the HW, it may be preferable to run
2347 * a request on a given subset of engines in parallel to a request on a
2348 * specific engine. We enable this selection of engines within a virtual
2349 * engine by specifying bonding pairs, for any given master engine we will
2350 * only execute on one of the corresponding siblings within the virtual engine.
2352 * To execute a request in parallel on the master engine and a sibling requires
2353 * coordination with a I915_EXEC_FENCE_SUBMIT.
2355 struct i915_context_engines_bond {
2356 struct i915_user_extension base;
2358 struct i915_engine_class_instance master;
2360 __u16 virtual_index; /* index of virtual engine in ctx->engines[] */
2363 __u64 flags; /* all undefined flags must be zero */
2364 __u64 mbz64[4]; /* reserved for future use; must be zero */
2366 struct i915_engine_class_instance engines[];
2367 } __attribute__((packed));
2369 #define I915_DEFINE_CONTEXT_ENGINES_BOND(name__, N__) struct { \
2370 struct i915_user_extension base; \
2371 struct i915_engine_class_instance master; \
2372 __u16 virtual_index; \
2376 struct i915_engine_class_instance engines[N__]; \
2377 } __attribute__((packed)) name__
2380 * struct i915_context_engines_parallel_submit - Configure engine for
2381 * parallel submission.
2383 * Setup a slot in the context engine map to allow multiple BBs to be submitted
2384 * in a single execbuf IOCTL. Those BBs will then be scheduled to run on the GPU
2385 * in parallel. Multiple hardware contexts are created internally in the i915 to
2386 * run these BBs. Once a slot is configured for N BBs only N BBs can be
2387 * submitted in each execbuf IOCTL and this is implicit behavior e.g. The user
2388 * doesn't tell the execbuf IOCTL there are N BBs, the execbuf IOCTL knows how
2389 * many BBs there are based on the slot's configuration. The N BBs are the last
2390 * N buffer objects or first N if I915_EXEC_BATCH_FIRST is set.
2392 * The default placement behavior is to create implicit bonds between each
2393 * context if each context maps to more than 1 physical engine (e.g. context is
2394 * a virtual engine). Also we only allow contexts of same engine class and these
2395 * contexts must be in logically contiguous order. Examples of the placement
2396 * behavior are described below. Lastly, the default is to not allow BBs to be
2397 * preempted mid-batch. Rather insert coordinated preemption points on all
2398 * hardware contexts between each set of BBs. Flags could be added in the future
2399 * to change both of these default behaviors.
2401 * Returns -EINVAL if hardware context placement configuration is invalid or if
2402 * the placement configuration isn't supported on the platform / submission
2404 * Returns -ENODEV if extension isn't supported on the platform / submission
2407 * .. code-block:: none
2410 * CS[X] = generic engine of same class, logical instance X
2411 * INVALID = I915_ENGINE_CLASS_INVALID, I915_ENGINE_CLASS_INVALID_NONE
2413 * Example 1 pseudo code:
2414 * set_engines(INVALID)
2415 * set_parallel(engine_index=0, width=2, num_siblings=1,
2416 * engines=CS[0],CS[1])
2418 * Results in the following valid placement:
2421 * Example 2 pseudo code:
2422 * set_engines(INVALID)
2423 * set_parallel(engine_index=0, width=2, num_siblings=2,
2424 * engines=CS[0],CS[2],CS[1],CS[3])
2426 * Results in the following valid placements:
2430 * This can be thought of as two virtual engines, each containing two
2431 * engines thereby making a 2D array. However, there are bonds tying the
2432 * entries together and placing restrictions on how they can be scheduled.
2433 * Specifically, the scheduler can choose only vertical columns from the 2D
2434 * array. That is, CS[0] is bonded to CS[1] and CS[2] to CS[3]. So if the
2435 * scheduler wants to submit to CS[0], it must also choose CS[1] and vice
2436 * versa. Same for CS[2] requires also using CS[3].
2437 * VE[0] = CS[0], CS[2]
2438 * VE[1] = CS[1], CS[3]
2440 * Example 3 pseudo code:
2441 * set_engines(INVALID)
2442 * set_parallel(engine_index=0, width=2, num_siblings=2,
2443 * engines=CS[0],CS[1],CS[1],CS[3])
2445 * Results in the following valid and invalid placements:
2447 * CS[1], CS[3] - Not logically contiguous, return -EINVAL
2449 struct i915_context_engines_parallel_submit {
2451 * @base: base user extension.
2453 struct i915_user_extension base;
2456 * @engine_index: slot for parallel engine
2461 * @width: number of contexts per parallel engine or in other words the
2462 * number of batches in each submission
2467 * @num_siblings: number of siblings per context or in other words the
2468 * number of possible placements for each submission
2473 * @mbz16: reserved for future use; must be zero
2478 * @flags: all undefined flags must be zero; currently no flags are defined
2483 * @mbz64: reserved for future use; must be zero
2488 * @engines: 2-d array of engine instances to configure parallel engine
2490 * length = width (i) * num_siblings (j)
2491 * index = j + i * num_siblings
2493 struct i915_engine_class_instance engines[];
2497 #define I915_DEFINE_CONTEXT_ENGINES_PARALLEL_SUBMIT(name__, N__) struct { \
2498 struct i915_user_extension base; \
2499 __u16 engine_index; \
2501 __u16 num_siblings; \
2505 struct i915_engine_class_instance engines[N__]; \
2506 } __attribute__((packed)) name__
2509 * DOC: Context Engine Map uAPI
2511 * Context engine map is a new way of addressing engines when submitting batch-
2512 * buffers, replacing the existing way of using identifiers like `I915_EXEC_BLT`
2513 * inside the flags field of `struct drm_i915_gem_execbuffer2`.
2515 * To use it, created GEM contexts need to be configured with a list of engines
2516 * the user is intending to submit to. This is accomplished using the
2517 * `I915_CONTEXT_PARAM_ENGINES` parameter and `struct
2518 * i915_context_param_engines`.
2520 * For such contexts the `I915_EXEC_RING_MASK` field becomes an index into the
2523 * Example of creating such context and submitting against it:
2527 * I915_DEFINE_CONTEXT_PARAM_ENGINES(engines, 2) = {
2528 * .engines = { { I915_ENGINE_CLASS_RENDER, 0 },
2529 * { I915_ENGINE_CLASS_COPY, 0 } }
2531 * struct drm_i915_gem_context_create_ext_setparam p_engines = {
2533 * .name = I915_CONTEXT_CREATE_EXT_SETPARAM,
2536 * .param = I915_CONTEXT_PARAM_ENGINES,
2537 * .value = to_user_pointer(&engines),
2538 * .size = sizeof(engines),
2541 * struct drm_i915_gem_context_create_ext create = {
2542 * .flags = I915_CONTEXT_CREATE_FLAGS_USE_EXTENSIONS,
2543 * .extensions = to_user_pointer(&p_engines),
2546 * ctx_id = gem_context_create_ext(drm_fd, &create);
2548 * // We have now created a GEM context with two engines in the map:
2549 * // Index 0 points to rcs0 while index 1 points to bcs0. Other engines
2550 * // will not be accessible from this context.
2553 * execbuf.rsvd1 = ctx_id;
2554 * execbuf.flags = 0; // Submits to index 0, which is rcs0 for this context
2555 * gem_execbuf(drm_fd, &execbuf);
2558 * execbuf.rsvd1 = ctx_id;
2559 * execbuf.flags = 1; // Submits to index 1, which is bcs0 for this context
2560 * gem_execbuf(drm_fd, &execbuf);
2563 struct i915_context_param_engines {
2564 __u64 extensions; /* linked chain of extension blocks, 0 terminates */
2565 #define I915_CONTEXT_ENGINES_EXT_LOAD_BALANCE 0 /* see i915_context_engines_load_balance */
2566 #define I915_CONTEXT_ENGINES_EXT_BOND 1 /* see i915_context_engines_bond */
2567 #define I915_CONTEXT_ENGINES_EXT_PARALLEL_SUBMIT 2 /* see i915_context_engines_parallel_submit */
2568 struct i915_engine_class_instance engines[];
2569 } __attribute__((packed));
2571 #define I915_DEFINE_CONTEXT_PARAM_ENGINES(name__, N__) struct { \
2573 struct i915_engine_class_instance engines[N__]; \
2574 } __attribute__((packed)) name__
2576 struct i915_gem_context_param_context_image {
2577 /** @engine: Engine class & instance to be configured. */
2578 struct i915_engine_class_instance engine;
2580 /** @flags: One of the supported flags or zero. */
2582 #define I915_CONTEXT_IMAGE_FLAG_ENGINE_INDEX (1u << 0)
2584 /** @size: Size of the image blob pointed to by @image. */
2587 /** @mbz: Must be zero. */
2590 /** @image: Userspace memory containing the context image. */
2592 } __attribute__((packed));
2595 * struct drm_i915_gem_context_create_ext_setparam - Context parameter
2596 * to set or query during context creation.
2598 struct drm_i915_gem_context_create_ext_setparam {
2599 /** @base: Extension link. See struct i915_user_extension. */
2600 struct i915_user_extension base;
2603 * @param: Context parameter to set or query.
2604 * See struct drm_i915_gem_context_param.
2606 struct drm_i915_gem_context_param param;
2609 struct drm_i915_gem_context_destroy {
2615 * struct drm_i915_gem_vm_control - Structure to create or destroy VM.
2617 * DRM_I915_GEM_VM_CREATE -
2619 * Create a new virtual memory address space (ppGTT) for use within a context
2620 * on the same file. Extensions can be provided to configure exactly how the
2621 * address space is setup upon creation.
2623 * The id of new VM (bound to the fd) for use with I915_CONTEXT_PARAM_VM is
2624 * returned in the outparam @id.
2626 * An extension chain may be provided, starting with @extensions, and terminated
2627 * by the @next_extension being 0. Currently, no extensions are defined.
2629 * DRM_I915_GEM_VM_DESTROY -
2631 * Destroys a previously created VM id, specified in @vm_id.
2633 * No extensions or flags are allowed currently, and so must be zero.
2635 struct drm_i915_gem_vm_control {
2636 /** @extensions: Zero-terminated chain of extensions. */
2639 /** @flags: reserved for future usage, currently MBZ */
2642 /** @vm_id: Id of the VM created or to be destroyed */
2646 struct drm_i915_reg_read {
2649 * For 64bit wide registers where the upper 32bits don't immediately
2650 * follow the lower 32bits, the offset of the lower 32bits must
2654 #define I915_REG_READ_8B_WA (1ul << 0)
2656 __u64 val; /* Return value */
2661 * Render engine timestamp - 0x2358 + 64bit - gen7+
2662 * - Note this register returns an invalid value if using the default
2663 * single instruction 8byte read, in order to workaround that pass
2664 * flag I915_REG_READ_8B_WA in offset field.
2669 * struct drm_i915_reset_stats - Return global reset and other context stats
2671 * The driver keeps a few stats for each context, as well as a global reset count.
2672 * This struct can be used to query those stats.
2674 struct drm_i915_reset_stats {
2675 /** @ctx_id: ID of the requested context */
2681 /** @reset_count: All resets since boot/module reload, for all contexts */
2684 /** @batch_active: Number of batches lost when active in GPU, for this context */
2687 /** @batch_pending: Number of batches lost pending for execution, for this context */
2688 __u32 batch_pending;
2695 * struct drm_i915_gem_userptr - Create GEM object from user allocated memory.
2697 * Userptr objects have several restrictions on what ioctls can be used with the
2700 struct drm_i915_gem_userptr {
2702 * @user_ptr: The pointer to the allocated memory.
2704 * Needs to be aligned to PAGE_SIZE.
2711 * The size in bytes for the allocated memory. This will also become the
2714 * Needs to be aligned to PAGE_SIZE, and should be at least PAGE_SIZE,
2724 * I915_USERPTR_READ_ONLY:
2726 * Mark the object as readonly, this also means GPU access can only be
2727 * readonly. This is only supported on HW which supports readonly access
2728 * through the GTT. If the HW can't support readonly access, an error is
2731 * I915_USERPTR_PROBE:
2733 * Probe the provided @user_ptr range and validate that the @user_ptr is
2734 * indeed pointing to normal memory and that the range is also valid.
2735 * For example if some garbage address is given to the kernel, then this
2738 * Returns -EFAULT if the probe failed.
2740 * Note that this doesn't populate the backing pages, and also doesn't
2741 * guarantee that the object will remain valid when the object is
2744 * The kernel supports this feature if I915_PARAM_HAS_USERPTR_PROBE
2745 * returns a non-zero value.
2747 * I915_USERPTR_UNSYNCHRONIZED:
2749 * NOT USED. Setting this flag will result in an error.
2752 #define I915_USERPTR_READ_ONLY 0x1
2753 #define I915_USERPTR_PROBE 0x2
2754 #define I915_USERPTR_UNSYNCHRONIZED 0x80000000
2756 * @handle: Returned handle for the object.
2758 * Object handles are nonzero.
2763 enum drm_i915_oa_format {
2764 I915_OA_FORMAT_A13 = 1, /* HSW only */
2765 I915_OA_FORMAT_A29, /* HSW only */
2766 I915_OA_FORMAT_A13_B8_C8, /* HSW only */
2767 I915_OA_FORMAT_B4_C8, /* HSW only */
2768 I915_OA_FORMAT_A45_B8_C8, /* HSW only */
2769 I915_OA_FORMAT_B4_C8_A16, /* HSW only */
2770 I915_OA_FORMAT_C4_B8, /* HSW+ */
2774 I915_OA_FORMAT_A12_B8_C8,
2775 I915_OA_FORMAT_A32u40_A4u32_B8_C8,
2778 I915_OAR_FORMAT_A32u40_A4u32_B8_C8,
2779 I915_OA_FORMAT_A24u40_A14u32_B8_C8,
2782 I915_OAM_FORMAT_MPEC8u64_B8_C8,
2783 I915_OAM_FORMAT_MPEC8u32_B8_C8,
2785 I915_OA_FORMAT_MAX /* non-ABI */
2788 enum drm_i915_perf_property_id {
2790 * Open the stream for a specific context handle (as used with
2791 * execbuffer2). A stream opened for a specific context this way
2792 * won't typically require root privileges.
2794 * This property is available in perf revision 1.
2796 DRM_I915_PERF_PROP_CTX_HANDLE = 1,
2799 * A value of 1 requests the inclusion of raw OA unit reports as
2800 * part of stream samples.
2802 * This property is available in perf revision 1.
2804 DRM_I915_PERF_PROP_SAMPLE_OA,
2807 * The value specifies which set of OA unit metrics should be
2808 * configured, defining the contents of any OA unit reports.
2810 * This property is available in perf revision 1.
2812 DRM_I915_PERF_PROP_OA_METRICS_SET,
2815 * The value specifies the size and layout of OA unit reports.
2817 * This property is available in perf revision 1.
2819 DRM_I915_PERF_PROP_OA_FORMAT,
2822 * Specifying this property implicitly requests periodic OA unit
2823 * sampling and (at least on Haswell) the sampling frequency is derived
2824 * from this exponent as follows:
2826 * 80ns * 2^(period_exponent + 1)
2828 * This property is available in perf revision 1.
2830 DRM_I915_PERF_PROP_OA_EXPONENT,
2833 * Specifying this property is only valid when specifying a context to
2834 * filter with DRM_I915_PERF_PROP_CTX_HANDLE. Specifying this property
2835 * will hold preemption of the particular context we want to gather
2836 * performance data about. The execbuf2 submissions must include a
2837 * drm_i915_gem_execbuffer_ext_perf parameter for this to apply.
2839 * This property is available in perf revision 3.
2841 DRM_I915_PERF_PROP_HOLD_PREEMPTION,
2844 * Specifying this pins all contexts to the specified SSEU power
2845 * configuration for the duration of the recording.
2847 * This parameter's value is a pointer to a struct
2848 * drm_i915_gem_context_param_sseu.
2850 * This property is available in perf revision 4.
2852 DRM_I915_PERF_PROP_GLOBAL_SSEU,
2855 * This optional parameter specifies the timer interval in nanoseconds
2856 * at which the i915 driver will check the OA buffer for available data.
2857 * Minimum allowed value is 100 microseconds. A default value is used by
2858 * the driver if this parameter is not specified. Note that larger timer
2859 * values will reduce cpu consumption during OA perf captures. However,
2860 * excessively large values would potentially result in OA buffer
2861 * overwrites as captures reach end of the OA buffer.
2863 * This property is available in perf revision 5.
2865 DRM_I915_PERF_PROP_POLL_OA_PERIOD,
2868 * Multiple engines may be mapped to the same OA unit. The OA unit is
2869 * identified by class:instance of any engine mapped to it.
2871 * This parameter specifies the engine class and must be passed along
2872 * with DRM_I915_PERF_PROP_OA_ENGINE_INSTANCE.
2874 * This property is available in perf revision 6.
2876 DRM_I915_PERF_PROP_OA_ENGINE_CLASS,
2879 * This parameter specifies the engine instance and must be passed along
2880 * with DRM_I915_PERF_PROP_OA_ENGINE_CLASS.
2882 * This property is available in perf revision 6.
2884 DRM_I915_PERF_PROP_OA_ENGINE_INSTANCE,
2886 DRM_I915_PERF_PROP_MAX /* non-ABI */
2889 struct drm_i915_perf_open_param {
2891 #define I915_PERF_FLAG_FD_CLOEXEC (1<<0)
2892 #define I915_PERF_FLAG_FD_NONBLOCK (1<<1)
2893 #define I915_PERF_FLAG_DISABLED (1<<2)
2895 /** The number of u64 (id, value) pairs */
2896 __u32 num_properties;
2899 * Pointer to array of u64 (id, value) pairs configuring the stream
2902 __u64 properties_ptr;
2906 * Enable data capture for a stream that was either opened in a disabled state
2907 * via I915_PERF_FLAG_DISABLED or was later disabled via
2908 * I915_PERF_IOCTL_DISABLE.
2910 * It is intended to be cheaper to disable and enable a stream than it may be
2911 * to close and re-open a stream with the same configuration.
2913 * It's undefined whether any pending data for the stream will be lost.
2915 * This ioctl is available in perf revision 1.
2917 #define I915_PERF_IOCTL_ENABLE _IO('i', 0x0)
2920 * Disable data capture for a stream.
2922 * It is an error to try and read a stream that is disabled.
2924 * This ioctl is available in perf revision 1.
2926 #define I915_PERF_IOCTL_DISABLE _IO('i', 0x1)
2929 * Change metrics_set captured by a stream.
2931 * If the stream is bound to a specific context, the configuration change
2932 * will be performed inline with that context such that it takes effect before
2933 * the next execbuf submission.
2935 * Returns the previously bound metrics set id, or a negative error code.
2937 * This ioctl is available in perf revision 2.
2939 #define I915_PERF_IOCTL_CONFIG _IO('i', 0x2)
2942 * Common to all i915 perf records
2944 struct drm_i915_perf_record_header {
2950 enum drm_i915_perf_record_type {
2953 * Samples are the work horse record type whose contents are extensible
2954 * and defined when opening an i915 perf stream based on the given
2957 * Boolean properties following the naming convention
2958 * DRM_I915_PERF_SAMPLE_xyz_PROP request the inclusion of 'xyz' data in
2961 * The order of these sample properties given by userspace has no
2962 * effect on the ordering of data within a sample. The order is
2966 * struct drm_i915_perf_record_header header;
2968 * { u32 oa_report[]; } && DRM_I915_PERF_PROP_SAMPLE_OA
2971 DRM_I915_PERF_RECORD_SAMPLE = 1,
2974 * Indicates that one or more OA reports were not written by the
2975 * hardware. This can happen for example if an MI_REPORT_PERF_COUNT
2976 * command collides with periodic sampling - which would be more likely
2977 * at higher sampling frequencies.
2979 DRM_I915_PERF_RECORD_OA_REPORT_LOST = 2,
2982 * An error occurred that resulted in all pending OA reports being lost.
2984 DRM_I915_PERF_RECORD_OA_BUFFER_LOST = 3,
2986 DRM_I915_PERF_RECORD_MAX /* non-ABI */
2990 * struct drm_i915_perf_oa_config
2992 * Structure to upload perf dynamic configuration into the kernel.
2994 struct drm_i915_perf_oa_config {
2998 * String formatted like "%\08x-%\04x-%\04x-%\04x-%\012x"
3005 * Number of mux regs in &mux_regs_ptr.
3012 * Number of boolean regs in &boolean_regs_ptr.
3014 __u32 n_boolean_regs;
3019 * Number of flex regs in &flex_regs_ptr.
3026 * Pointer to tuples of u32 values (register address, value) for mux
3027 * registers. Expected length of buffer is (2 * sizeof(u32) *
3033 * @boolean_regs_ptr:
3035 * Pointer to tuples of u32 values (register address, value) for boolean
3036 * registers. Expected length of buffer is (2 * sizeof(u32) *
3039 __u64 boolean_regs_ptr;
3044 * Pointer to tuples of u32 values (register address, value) for flex
3045 * registers. Expected length of buffer is (2 * sizeof(u32) *
3048 __u64 flex_regs_ptr;
3052 * struct drm_i915_query_item - An individual query for the kernel to process.
3054 * The behaviour is determined by the @query_id. Note that exactly what
3055 * @data_ptr points to also depends on the specific @query_id.
3057 struct drm_i915_query_item {
3061 * The id for this query. Currently accepted query IDs are:
3062 * - %DRM_I915_QUERY_TOPOLOGY_INFO (see struct drm_i915_query_topology_info)
3063 * - %DRM_I915_QUERY_ENGINE_INFO (see struct drm_i915_query_engine_info)
3064 * - %DRM_I915_QUERY_PERF_CONFIG (see struct drm_i915_query_perf_config)
3065 * - %DRM_I915_QUERY_MEMORY_REGIONS (see struct drm_i915_query_memory_regions)
3066 * - %DRM_I915_QUERY_HWCONFIG_BLOB (see `GuC HWCONFIG blob uAPI`)
3067 * - %DRM_I915_QUERY_GEOMETRY_SUBSLICES (see struct drm_i915_query_topology_info)
3068 * - %DRM_I915_QUERY_GUC_SUBMISSION_VERSION (see struct drm_i915_query_guc_submission_version)
3071 #define DRM_I915_QUERY_TOPOLOGY_INFO 1
3072 #define DRM_I915_QUERY_ENGINE_INFO 2
3073 #define DRM_I915_QUERY_PERF_CONFIG 3
3074 #define DRM_I915_QUERY_MEMORY_REGIONS 4
3075 #define DRM_I915_QUERY_HWCONFIG_BLOB 5
3076 #define DRM_I915_QUERY_GEOMETRY_SUBSLICES 6
3077 #define DRM_I915_QUERY_GUC_SUBMISSION_VERSION 7
3078 /* Must be kept compact -- no holes and well documented */
3083 * When set to zero by userspace, this is filled with the size of the
3084 * data to be written at the @data_ptr pointer. The kernel sets this
3085 * value to a negative value to signal an error on a particular query
3093 * When &query_id == %DRM_I915_QUERY_TOPOLOGY_INFO, must be 0.
3095 * When &query_id == %DRM_I915_QUERY_PERF_CONFIG, must be one of the
3098 * - %DRM_I915_QUERY_PERF_CONFIG_LIST
3099 * - %DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID
3100 * - %DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID
3102 * When &query_id == %DRM_I915_QUERY_GEOMETRY_SUBSLICES must contain
3103 * a struct i915_engine_class_instance that references a render engine.
3106 #define DRM_I915_QUERY_PERF_CONFIG_LIST 1
3107 #define DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID 2
3108 #define DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID 3
3113 * Data will be written at the location pointed by @data_ptr when the
3114 * value of @length matches the length of the data to be written by the
3121 * struct drm_i915_query - Supply an array of struct drm_i915_query_item for the
3122 * kernel to fill out.
3124 * Note that this is generally a two step process for each struct
3125 * drm_i915_query_item in the array:
3127 * 1. Call the DRM_IOCTL_I915_QUERY, giving it our array of struct
3128 * drm_i915_query_item, with &drm_i915_query_item.length set to zero. The
3129 * kernel will then fill in the size, in bytes, which tells userspace how
3130 * much memory it needs to allocate for the blob (say for an array of properties).
3132 * 2. Next we call DRM_IOCTL_I915_QUERY again, this time with the
3133 * &drm_i915_query_item.data_ptr equal to our newly allocated blob. Note that
3134 * the &drm_i915_query_item.length should still be the same as what the
3135 * kernel previously set. At this point the kernel can fill in the blob.
3137 * Note that for some query items it can make sense for userspace to just pass
3138 * in a buffer/blob equal to or larger than the required size. In this case only
3139 * a single ioctl call is needed. For some smaller query items this can work
3143 struct drm_i915_query {
3144 /** @num_items: The number of elements in the @items_ptr array */
3148 * @flags: Unused for now. Must be cleared to zero.
3155 * Pointer to an array of struct drm_i915_query_item. The number of
3156 * array elements is @num_items.
3162 * struct drm_i915_query_topology_info
3164 * Describes slice/subslice/EU information queried by
3165 * %DRM_I915_QUERY_TOPOLOGY_INFO
3167 struct drm_i915_query_topology_info {
3171 * Unused for now. Must be cleared to zero.
3178 * The number of bits used to express the slice mask.
3185 * The number of bits used to express the subslice mask.
3187 __u16 max_subslices;
3190 * @max_eus_per_subslice:
3192 * The number of bits in the EU mask that correspond to a single
3195 __u16 max_eus_per_subslice;
3200 * Offset in data[] at which the subslice masks are stored.
3202 __u16 subslice_offset;
3207 * Stride at which each of the subslice masks for each slice are
3210 __u16 subslice_stride;
3215 * Offset in data[] at which the EU masks are stored.
3222 * Stride at which each of the EU masks for each subslice are stored.
3229 * Contains 3 pieces of information :
3231 * - The slice mask with one bit per slice telling whether a slice is
3232 * available. The availability of slice X can be queried with the
3233 * following formula :
3237 * (data[X / 8] >> (X % 8)) & 1
3239 * Starting with Xe_HP platforms, Intel hardware no longer has
3240 * traditional slices so i915 will always report a single slice
3241 * (hardcoded slicemask = 0x1) which contains all of the platform's
3242 * subslices. I.e., the mask here does not reflect any of the newer
3243 * hardware concepts such as "gslices" or "cslices" since userspace
3244 * is capable of inferring those from the subslice mask.
3246 * - The subslice mask for each slice with one bit per subslice telling
3247 * whether a subslice is available. Starting with Gen12 we use the
3248 * term "subslice" to refer to what the hardware documentation
3249 * describes as "dual-subslices." The availability of subslice Y
3250 * in slice X can be queried with the following formula :
3254 * (data[subslice_offset + X * subslice_stride + Y / 8] >> (Y % 8)) & 1
3256 * - The EU mask for each subslice in each slice, with one bit per EU
3257 * telling whether an EU is available. The availability of EU Z in
3258 * subslice Y in slice X can be queried with the following formula :
3263 * (X * max_subslices + Y) * eu_stride +
3271 * DOC: Engine Discovery uAPI
3273 * Engine discovery uAPI is a way of enumerating physical engines present in a
3274 * GPU associated with an open i915 DRM file descriptor. This supersedes the old
3275 * way of using `DRM_IOCTL_I915_GETPARAM` and engine identifiers like
3276 * `I915_PARAM_HAS_BLT`.
3278 * The need for this interface came starting with Icelake and newer GPUs, which
3279 * started to establish a pattern of having multiple engines of the same class,
3280 * where not all instances were always completely functionally equivalent.
3282 * Entry point for this uapi is `DRM_IOCTL_I915_QUERY` with the
3283 * `DRM_I915_QUERY_ENGINE_INFO` as the queried item id.
3285 * Example for getting the list of engines:
3289 * struct drm_i915_query_engine_info *info;
3290 * struct drm_i915_query_item item = {
3291 * .query_id = DRM_I915_QUERY_ENGINE_INFO,
3293 * struct drm_i915_query query = {
3295 * .items_ptr = (uintptr_t)&item,
3299 * // First query the size of the blob we need, this needs to be large
3300 * // enough to hold our array of engines. The kernel will fill out the
3301 * // item.length for us, which is the number of bytes we need.
3303 * // Alternatively a large buffer can be allocated straightaway enabling
3304 * // querying in one pass, in which case item.length should contain the
3305 * // length of the provided buffer.
3306 * err = ioctl(fd, DRM_IOCTL_I915_QUERY, &query);
3309 * info = calloc(1, item.length);
3310 * // Now that we allocated the required number of bytes, we call the ioctl
3311 * // again, this time with the data_ptr pointing to our newly allocated
3312 * // blob, which the kernel can then populate with info on all engines.
3313 * item.data_ptr = (uintptr_t)info;
3315 * err = ioctl(fd, DRM_IOCTL_I915_QUERY, &query);
3318 * // We can now access each engine in the array
3319 * for (i = 0; i < info->num_engines; i++) {
3320 * struct drm_i915_engine_info einfo = info->engines[i];
3321 * u16 class = einfo.engine.engine_class;
3322 * u16 instance = einfo.engine.engine_instance;
3328 * Each of the enumerated engines, apart from being defined by its class and
3329 * instance (see `struct i915_engine_class_instance`), also can have flags and
3330 * capabilities defined as documented in i915_drm.h.
3332 * For instance video engines which support HEVC encoding will have the
3333 * `I915_VIDEO_CLASS_CAPABILITY_HEVC` capability bit set.
3335 * Engine discovery only fully comes into its own when combined with the new way
3336 * of addressing engines when submitting batch buffers using contexts with
3337 * engine maps configured.
3341 * struct drm_i915_engine_info
3343 * Describes one engine and its capabilities as known to the driver.
3345 struct drm_i915_engine_info {
3346 /** @engine: Engine class and instance. */
3347 struct i915_engine_class_instance engine;
3349 /** @rsvd0: Reserved field. */
3352 /** @flags: Engine flags. */
3354 #define I915_ENGINE_INFO_HAS_LOGICAL_INSTANCE (1 << 0)
3356 /** @capabilities: Capabilities of this engine. */
3358 #define I915_VIDEO_CLASS_CAPABILITY_HEVC (1 << 0)
3359 #define I915_VIDEO_AND_ENHANCE_CLASS_CAPABILITY_SFC (1 << 1)
3361 /** @logical_instance: Logical instance of engine */
3362 __u16 logical_instance;
3364 /** @rsvd1: Reserved fields. */
3366 /** @rsvd2: Reserved fields. */
3371 * struct drm_i915_query_engine_info
3373 * Engine info query enumerates all engines known to the driver by filling in
3374 * an array of struct drm_i915_engine_info structures.
3376 struct drm_i915_query_engine_info {
3377 /** @num_engines: Number of struct drm_i915_engine_info structs following. */
3383 /** @engines: Marker for drm_i915_engine_info structures. */
3384 struct drm_i915_engine_info engines[];
3388 * struct drm_i915_query_perf_config
3390 * Data written by the kernel with query %DRM_I915_QUERY_PERF_CONFIG.
3391 * (%DRM_I915_QUERY_GEOMETRY_SUBSLICES uses struct drm_i915_query_topology_info.)
3393 struct drm_i915_query_perf_config {
3398 * When &drm_i915_query_item.flags ==
3399 * %DRM_I915_QUERY_PERF_CONFIG_LIST, i915 sets this field to
3400 * the number of configurations available.
3407 * When &drm_i915_query_item.flags ==
3408 * %DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID, i915 will use the
3409 * value in this field as configuration identifier to decide
3410 * what data to write into config_ptr.
3417 * When &drm_i915_query_item.flags ==
3418 * %DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID, i915 will use the
3419 * value in this field as configuration identifier to decide
3420 * what data to write into config_ptr.
3422 * String formatted like "%08x-%04x-%04x-%04x-%012x"
3430 * Unused for now. Must be cleared to zero.
3437 * When &drm_i915_query_item.flags == %DRM_I915_QUERY_PERF_CONFIG_LIST,
3438 * i915 will write an array of __u64 of configuration identifiers.
3440 * When &drm_i915_query_item.flags is one of
3441 * %DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_UUID or %DRM_I915_QUERY_PERF_CONFIG_DATA_FOR_ID,
3442 * i915 will write a struct drm_i915_perf_oa_config. If the following fields of
3443 * struct drm_i915_perf_oa_config are not set to 0, i915 will write into the
3444 * associated pointers the values submitted when the configuration was created :
3446 * - &drm_i915_perf_oa_config.n_mux_regs
3447 * - &drm_i915_perf_oa_config.n_boolean_regs
3448 * - &drm_i915_perf_oa_config.n_flex_regs
3454 * enum drm_i915_gem_memory_class - Supported memory classes
3456 enum drm_i915_gem_memory_class {
3457 /** @I915_MEMORY_CLASS_SYSTEM: System memory */
3458 I915_MEMORY_CLASS_SYSTEM = 0,
3459 /** @I915_MEMORY_CLASS_DEVICE: Device local-memory */
3460 I915_MEMORY_CLASS_DEVICE,
3464 * struct drm_i915_gem_memory_class_instance - Identify particular memory region
3466 struct drm_i915_gem_memory_class_instance {
3467 /** @memory_class: See enum drm_i915_gem_memory_class */
3470 /** @memory_instance: Which instance */
3471 __u16 memory_instance;
3475 * struct drm_i915_memory_region_info - Describes one region as known to the
3478 * Note this is using both struct drm_i915_query_item and struct drm_i915_query.
3479 * For this new query we are adding the new query id DRM_I915_QUERY_MEMORY_REGIONS
3480 * at &drm_i915_query_item.query_id.
3482 struct drm_i915_memory_region_info {
3483 /** @region: The class:instance pair encoding */
3484 struct drm_i915_gem_memory_class_instance region;
3490 * @probed_size: Memory probed by the driver
3492 * Note that it should not be possible to ever encounter a zero value
3493 * here, also note that no current region type will ever return -1 here.
3494 * Although for future region types, this might be a possibility. The
3495 * same applies to the other size fields.
3500 * @unallocated_size: Estimate of memory remaining
3502 * Requires CAP_PERFMON or CAP_SYS_ADMIN to get reliable accounting.
3503 * Without this (or if this is an older kernel) the value here will
3504 * always equal the @probed_size. Note this is only currently tracked
3505 * for I915_MEMORY_CLASS_DEVICE regions (for other types the value here
3506 * will always equal the @probed_size).
3508 __u64 unallocated_size;
3515 * @probed_cpu_visible_size: Memory probed by the driver
3516 * that is CPU accessible.
3518 * This will always be <= @probed_size, and the
3519 * remainder (if there is any) will not be CPU
3522 * On systems without small BAR, the @probed_size will
3523 * always equal the @probed_cpu_visible_size, since all
3524 * of it will be CPU accessible.
3526 * Note this is only tracked for
3527 * I915_MEMORY_CLASS_DEVICE regions (for other types the
3528 * value here will always equal the @probed_size).
3530 * Note that if the value returned here is zero, then
3531 * this must be an old kernel which lacks the relevant
3532 * small-bar uAPI support (including
3533 * I915_GEM_CREATE_EXT_FLAG_NEEDS_CPU_ACCESS), but on
3534 * such systems we should never actually end up with a
3535 * small BAR configuration, assuming we are able to load
3536 * the kernel module. Hence it should be safe to treat
3537 * this the same as when @probed_cpu_visible_size ==
3540 __u64 probed_cpu_visible_size;
3543 * @unallocated_cpu_visible_size: Estimate of CPU
3544 * visible memory remaining.
3546 * Note this is only tracked for
3547 * I915_MEMORY_CLASS_DEVICE regions (for other types the
3548 * value here will always equal the
3549 * @probed_cpu_visible_size).
3551 * Requires CAP_PERFMON or CAP_SYS_ADMIN to get reliable
3552 * accounting. Without this the value here will always
3553 * equal the @probed_cpu_visible_size. Note this is only
3554 * currently tracked for I915_MEMORY_CLASS_DEVICE
3555 * regions (for other types the value here will also
3556 * always equal the @probed_cpu_visible_size).
3558 * If this is an older kernel the value here will be
3559 * zero, see also @probed_cpu_visible_size.
3561 __u64 unallocated_cpu_visible_size;
3567 * struct drm_i915_query_memory_regions
3569 * The region info query enumerates all regions known to the driver by filling
3570 * in an array of struct drm_i915_memory_region_info structures.
3572 * Example for getting the list of supported regions:
3576 * struct drm_i915_query_memory_regions *info;
3577 * struct drm_i915_query_item item = {
3578 * .query_id = DRM_I915_QUERY_MEMORY_REGIONS,
3580 * struct drm_i915_query query = {
3582 * .items_ptr = (uintptr_t)&item,
3586 * // First query the size of the blob we need, this needs to be large
3587 * // enough to hold our array of regions. The kernel will fill out the
3588 * // item.length for us, which is the number of bytes we need.
3589 * err = ioctl(fd, DRM_IOCTL_I915_QUERY, &query);
3592 * info = calloc(1, item.length);
3593 * // Now that we allocated the required number of bytes, we call the ioctl
3594 * // again, this time with the data_ptr pointing to our newly allocated
3595 * // blob, which the kernel can then populate with all the region info.
3596 * item.data_ptr = (uintptr_t)info;
3598 * err = ioctl(fd, DRM_IOCTL_I915_QUERY, &query);
3601 * // We can now access each region in the array
3602 * for (i = 0; i < info->num_regions; i++) {
3603 * struct drm_i915_memory_region_info mr = info->regions[i];
3604 * u16 class = mr.region.memory_class;
3605 * u16 instance = mr.region.memory_instance;
3612 struct drm_i915_query_memory_regions {
3613 /** @num_regions: Number of supported regions */
3619 /** @regions: Info about each supported region */
3620 struct drm_i915_memory_region_info regions[];
3624 * struct drm_i915_query_guc_submission_version - query GuC submission interface version
3626 struct drm_i915_query_guc_submission_version {
3627 /** @branch: Firmware branch version. */
3629 /** @major: Firmware major version. */
3631 /** @minor: Firmware minor version. */
3633 /** @patch: Firmware patch version. */
3638 * DOC: GuC HWCONFIG blob uAPI
3640 * The GuC produces a blob with information about the current device.
3641 * i915 reads this blob from GuC and makes it available via this uAPI.
3643 * The format and meaning of the blob content are documented in the
3644 * Programmer's Reference Manual.
3648 * struct drm_i915_gem_create_ext - Existing gem_create behaviour, with added
3649 * extension support using struct i915_user_extension.
3651 * Note that new buffer flags should be added here, at least for the stuff that
3652 * is immutable. Previously we would have two ioctls, one to create the object
3653 * with gem_create, and another to apply various parameters, however this
3654 * creates some ambiguity for the params which are considered immutable. Also in
3655 * general we're phasing out the various SET/GET ioctls.
3657 struct drm_i915_gem_create_ext {
3659 * @size: Requested size for the object.
3661 * The (page-aligned) allocated size for the object will be returned.
3663 * On platforms like DG2/ATS the kernel will always use 64K or larger
3664 * pages for I915_MEMORY_CLASS_DEVICE. The kernel also requires a
3665 * minimum of 64K GTT alignment for such objects.
3667 * NOTE: Previously the ABI here required a minimum GTT alignment of 2M
3668 * on DG2/ATS, due to how the hardware implemented 64K GTT page support,
3669 * where we had the following complications:
3671 * 1) The entire PDE (which covers a 2MB virtual address range), must
3672 * contain only 64K PTEs, i.e mixing 4K and 64K PTEs in the same
3673 * PDE is forbidden by the hardware.
3675 * 2) We still need to support 4K PTEs for I915_MEMORY_CLASS_SYSTEM
3678 * However on actual production HW this was completely changed to now
3679 * allow setting a TLB hint at the PTE level (see PS64), which is a lot
3680 * more flexible than the above. With this the 2M restriction was
3681 * dropped where we now only require 64K.
3686 * @handle: Returned handle for the object.
3688 * Object handles are nonzero.
3693 * @flags: Optional flags.
3697 * I915_GEM_CREATE_EXT_FLAG_NEEDS_CPU_ACCESS - Signal to the kernel that
3698 * the object will need to be accessed via the CPU.
3700 * Only valid when placing objects in I915_MEMORY_CLASS_DEVICE, and only
3701 * strictly required on configurations where some subset of the device
3702 * memory is directly visible/mappable through the CPU (which we also
3703 * call small BAR), like on some DG2+ systems. Note that this is quite
3704 * undesirable, but due to various factors like the client CPU, BIOS etc
3705 * it's something we can expect to see in the wild. See
3706 * &drm_i915_memory_region_info.probed_cpu_visible_size for how to
3707 * determine if this system applies.
3709 * Note that one of the placements MUST be I915_MEMORY_CLASS_SYSTEM, to
3710 * ensure the kernel can always spill the allocation to system memory,
3711 * if the object can't be allocated in the mappable part of
3712 * I915_MEMORY_CLASS_DEVICE.
3714 * Also note that since the kernel only supports flat-CCS on objects
3715 * that can *only* be placed in I915_MEMORY_CLASS_DEVICE, we therefore
3716 * don't support I915_GEM_CREATE_EXT_FLAG_NEEDS_CPU_ACCESS together with
3719 * Without this hint, the kernel will assume that non-mappable
3720 * I915_MEMORY_CLASS_DEVICE is preferred for this object. Note that the
3721 * kernel can still migrate the object to the mappable part, as a last
3722 * resort, if userspace ever CPU faults this object, but this might be
3723 * expensive, and so ideally should be avoided.
3725 * On older kernels which lack the relevant small-bar uAPI support (see
3726 * also &drm_i915_memory_region_info.probed_cpu_visible_size),
3727 * usage of the flag will result in an error, but it should NEVER be
3728 * possible to end up with a small BAR configuration, assuming we can
3729 * also successfully load the i915 kernel module. In such cases the
3730 * entire I915_MEMORY_CLASS_DEVICE region will be CPU accessible, and as
3731 * such there are zero restrictions on where the object can be placed.
3733 #define I915_GEM_CREATE_EXT_FLAG_NEEDS_CPU_ACCESS (1 << 0)
3737 * @extensions: The chain of extensions to apply to this object.
3739 * This will be useful in the future when we need to support several
3740 * different extensions, and we need to apply more than one when
3741 * creating the object. See struct i915_user_extension.
3743 * If we don't supply any extensions then we get the same old gem_create
3746 * For I915_GEM_CREATE_EXT_MEMORY_REGIONS usage see
3747 * struct drm_i915_gem_create_ext_memory_regions.
3749 * For I915_GEM_CREATE_EXT_PROTECTED_CONTENT usage see
3750 * struct drm_i915_gem_create_ext_protected_content.
3752 * For I915_GEM_CREATE_EXT_SET_PAT usage see
3753 * struct drm_i915_gem_create_ext_set_pat.
3755 #define I915_GEM_CREATE_EXT_MEMORY_REGIONS 0
3756 #define I915_GEM_CREATE_EXT_PROTECTED_CONTENT 1
3757 #define I915_GEM_CREATE_EXT_SET_PAT 2
3762 * struct drm_i915_gem_create_ext_memory_regions - The
3763 * I915_GEM_CREATE_EXT_MEMORY_REGIONS extension.
3765 * Set the object with the desired set of placements/regions in priority
3766 * order. Each entry must be unique and supported by the device.
3768 * This is provided as an array of struct drm_i915_gem_memory_class_instance, or
3769 * an equivalent layout of class:instance pair encodings. See struct
3770 * drm_i915_query_memory_regions and DRM_I915_QUERY_MEMORY_REGIONS for how to
3771 * query the supported regions for a device.
3773 * As an example, on discrete devices, if we wish to set the placement as
3774 * device local-memory we can do something like:
3778 * struct drm_i915_gem_memory_class_instance region_lmem = {
3779 * .memory_class = I915_MEMORY_CLASS_DEVICE,
3780 * .memory_instance = 0,
3782 * struct drm_i915_gem_create_ext_memory_regions regions = {
3783 * .base = { .name = I915_GEM_CREATE_EXT_MEMORY_REGIONS },
3784 * .regions = (uintptr_t)&region_lmem,
3787 * struct drm_i915_gem_create_ext create_ext = {
3788 * .size = 16 * PAGE_SIZE,
3789 * .extensions = (uintptr_t)&regions,
3792 * int err = ioctl(fd, DRM_IOCTL_I915_GEM_CREATE_EXT, &create_ext);
3795 * At which point we get the object handle in &drm_i915_gem_create_ext.handle,
3796 * along with the final object size in &drm_i915_gem_create_ext.size, which
3797 * should account for any rounding up, if required.
3799 * Note that userspace has no means of knowing the current backing region
3800 * for objects where @num_regions is larger than one. The kernel will only
3801 * ensure that the priority order of the @regions array is honoured, either
3802 * when initially placing the object, or when moving memory around due to
3805 * On Flat-CCS capable HW, compression is supported for the objects residing
3806 * in I915_MEMORY_CLASS_DEVICE. When such objects (compressed) have other
3807 * memory class in @regions and migrated (by i915, due to memory
3808 * constraints) to the non I915_MEMORY_CLASS_DEVICE region, then i915 needs to
3809 * decompress the content. But i915 doesn't have the required information to
3810 * decompress the userspace compressed objects.
3812 * So i915 supports Flat-CCS, on the objects which can reside only on
3813 * I915_MEMORY_CLASS_DEVICE regions.
3815 struct drm_i915_gem_create_ext_memory_regions {
3816 /** @base: Extension link. See struct i915_user_extension. */
3817 struct i915_user_extension base;
3821 /** @num_regions: Number of elements in the @regions array. */
3824 * @regions: The regions/placements array.
3826 * An array of struct drm_i915_gem_memory_class_instance.
3832 * struct drm_i915_gem_create_ext_protected_content - The
3833 * I915_GEM_CREATE_EXT_PROTECTED_CONTENT extension.
3835 * If this extension is provided, buffer contents are expected to be protected
3836 * by PXP encryption and require decryption for scan out and processing. This
3837 * is only possible on platforms that have PXP enabled; in all other scenarios
3838 * using this extension will cause the ioctl to fail and return -ENODEV. The
3839 * flags parameter is reserved for future expansion and must currently be set
3842 * The buffer contents are considered invalid after a PXP session teardown.
3844 * The encryption is guaranteed to be processed correctly only if the object
3845 * is submitted with a context created using the
3846 * I915_CONTEXT_PARAM_PROTECTED_CONTENT flag. This will also enable extra checks
3847 * at submission time on the validity of the objects involved.
3849 * Below is an example on how to create a protected object:
3853 * struct drm_i915_gem_create_ext_protected_content protected_ext = {
3854 * .base = { .name = I915_GEM_CREATE_EXT_PROTECTED_CONTENT },
3857 * struct drm_i915_gem_create_ext create_ext = {
3858 * .size = PAGE_SIZE,
3859 * .extensions = (uintptr_t)&protected_ext,
3862 * int err = ioctl(fd, DRM_IOCTL_I915_GEM_CREATE_EXT, &create_ext);
3865 struct drm_i915_gem_create_ext_protected_content {
3866 /** @base: Extension link. See struct i915_user_extension. */
3867 struct i915_user_extension base;
3868 /** @flags: reserved for future usage, currently MBZ */
3873 * struct drm_i915_gem_create_ext_set_pat - The
3874 * I915_GEM_CREATE_EXT_SET_PAT extension.
3876 * If this extension is provided, the specified caching policy (PAT index) is
3877 * applied to the buffer object.
3879 * Below is an example on how to create an object with specific caching policy:
3883 * struct drm_i915_gem_create_ext_set_pat set_pat_ext = {
3884 * .base = { .name = I915_GEM_CREATE_EXT_SET_PAT },
3887 * struct drm_i915_gem_create_ext create_ext = {
3888 * .size = PAGE_SIZE,
3889 * .extensions = (uintptr_t)&set_pat_ext,
3892 * int err = ioctl(fd, DRM_IOCTL_I915_GEM_CREATE_EXT, &create_ext);
3895 struct drm_i915_gem_create_ext_set_pat {
3896 /** @base: Extension link. See struct i915_user_extension. */
3897 struct i915_user_extension base;
3899 * @pat_index: PAT index to be set
3900 * PAT index is a bit field in Page Table Entry to control caching
3901 * behaviors for GPU accesses. The definition of PAT index is
3902 * platform dependent and can be found in hardware specifications,
3905 /** @rsvd: reserved for future use */
3909 /* ID of the protected content session managed by i915 when PXP is active */
3910 #define I915_PROTECTED_CONTENT_DEFAULT_SESSION 0xf
3912 #if defined(__cplusplus)
3916 #endif /* _UAPI_I915_DRM_H_ */