2 * SPDX-License-Identifier: MIT
4 * Copyright © 2016 Intel Corporation
7 #include <linux/highmem.h>
8 #include <linux/prime_numbers.h>
10 #include "gem/i915_gem_internal.h"
11 #include "gem/i915_gem_lmem.h"
12 #include "gem/i915_gem_region.h"
13 #include "gem/i915_gem_ttm.h"
14 #include "gem/i915_gem_ttm_move.h"
15 #include "gt/intel_engine_pm.h"
16 #include "gt/intel_gpu_commands.h"
17 #include "gt/intel_gt.h"
18 #include "gt/intel_gt_pm.h"
19 #include "gt/intel_migrate.h"
20 #include "i915_ttm_buddy_manager.h"
22 #include "huge_gem_object.h"
23 #include "i915_selftest.h"
24 #include "selftests/i915_random.h"
25 #include "selftests/igt_flush_test.h"
26 #include "selftests/igt_reset.h"
27 #include "selftests/igt_mmap.h"
38 static u64 swizzle_bit(unsigned int bit, u64 offset)
40 return (offset & BIT_ULL(bit)) >> (bit - 6);
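/*
 * Convert a linear byte offset into the offset that the fenced, tiled
 * layout will actually touch: split the address into (x, y) within the
 * tile row, rebase to the start of the tile, then apply the bit-6
 * swizzle pattern. The partial-mmap checks below use this to predict
 * which backing page a write through the GTT should land in.
 */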
43 static u64 tiled_offset(const struct tile *tile, u64 v)
47 if (tile->tiling == I915_TILING_NONE)
50 y = div64_u64_rem(v, tile->stride, &x);
51 v = div64_u64_rem(y, tile->height, &y) * tile->stride * tile->height;
53 if (tile->tiling == I915_TILING_X) {
55 v += div64_u64_rem(x, tile->width, &x) << tile->size;
57 } else if (tile->width == 128) {
58 const unsigned int ytile_span = 16;
59 const unsigned int ytile_height = 512;
62 v += div64_u64_rem(x, ytile_span, &x) * ytile_height;
65 const unsigned int ytile_span = 32;
66 const unsigned int ytile_height = 256;
69 v += div64_u64_rem(x, ytile_span, &x) * ytile_height;
73 switch (tile->swizzle) {
74 case I915_BIT_6_SWIZZLE_9:
75 v ^= swizzle_bit(9, v);
77 case I915_BIT_6_SWIZZLE_9_10:
78 v ^= swizzle_bit(9, v) ^ swizzle_bit(10, v);
80 case I915_BIT_6_SWIZZLE_9_11:
81 v ^= swizzle_bit(9, v) ^ swizzle_bit(11, v);
83 case I915_BIT_6_SWIZZLE_9_10_11:
84 v ^= swizzle_bit(9, v) ^ swizzle_bit(10, v) ^ swizzle_bit(11, v);
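/*
 * Exercise a single, randomly chosen page: apply the requested tiling,
 * pin a partial GGTT view around the page with PIN_MAPPABLE, write the
 * page index through the fenced iomap, then kmap the backing page that
 * tiled_offset() predicts and verify the value landed there.
 */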
91 static int check_partial_mapping(struct drm_i915_gem_object *obj,
92 const struct tile *tile,
93 struct rnd_state *prng)
95 const unsigned long npages = obj->base.size / PAGE_SIZE;
96 struct drm_i915_private *i915 = to_i915(obj->base.dev);
97 struct i915_gtt_view view;
107 err = i915_gem_object_set_tiling(obj, tile->tiling, tile->stride);
109 pr_err("Failed to set tiling mode=%u, stride=%u, err=%d\n",
110 tile->tiling, tile->stride, err);
114 GEM_BUG_ON(i915_gem_object_get_tiling(obj) != tile->tiling);
115 GEM_BUG_ON(i915_gem_object_get_stride(obj) != tile->stride);
117 i915_gem_object_lock(obj, NULL);
118 err = i915_gem_object_set_to_gtt_domain(obj, true);
119 i915_gem_object_unlock(obj);
121 pr_err("Failed to flush to GTT write domain; err=%d\n", err);
125 page = i915_prandom_u32_max_state(npages, prng);
126 view = compute_partial_view(obj, page, MIN_CHUNK_PAGES);
128 vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, PIN_MAPPABLE);
130 pr_err("Failed to pin partial view: offset=%lu; err=%d\n",
131 page, (int)PTR_ERR(vma));
135 n = page - view.partial.offset;
136 GEM_BUG_ON(n >= view.partial.size);
138 io = i915_vma_pin_iomap(vma);
141 pr_err("Failed to iomap partial view: offset=%lu; err=%d\n",
142 page, (int)PTR_ERR(io));
147 iowrite32(page, io + n * PAGE_SIZE / sizeof(*io));
148 i915_vma_unpin_iomap(vma);
150 offset = tiled_offset(tile, page << PAGE_SHIFT);
151 if (offset >= obj->base.size)
154 intel_gt_flush_ggtt_writes(to_gt(i915));
156 p = i915_gem_object_get_page(obj, offset >> PAGE_SHIFT);
157 cpu = kmap(p) + offset_in_page(offset);
158 drm_clflush_virt_range(cpu, sizeof(*cpu));
159 if (*cpu != (u32)page) {
160 pr_err("Partial view for %lu [%u] (offset=%llu, size=%u [%llu, row size %u], fence=%d, tiling=%d, stride=%d) misalignment, expected write to page (%llu + %u [0x%llx]) of 0x%x, found 0x%x\n",
164 vma->size >> PAGE_SHIFT,
165 tile->tiling ? tile_row_pages(obj) : 0,
166 vma->fence ? vma->fence->id : -1, tile->tiling, tile->stride,
167 offset >> PAGE_SHIFT,
168 (unsigned int)offset_in_page(offset),
174 drm_clflush_virt_range(cpu, sizeof(*cpu));
178 i915_gem_object_lock(obj, NULL);
179 i915_vma_destroy(vma);
180 i915_gem_object_unlock(obj);
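/*
 * Same check as above, but walking every prime-numbered page of the
 * object until the timeout fires, so that many different partial-view
 * offsets and chunk sizes are covered for a given tiling and stride.
 */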
184 static int check_partial_mappings(struct drm_i915_gem_object *obj,
185 const struct tile *tile,
186 unsigned long end_time)
188 const unsigned int nreal = obj->scratch / PAGE_SIZE;
189 const unsigned long npages = obj->base.size / PAGE_SIZE;
190 struct drm_i915_private *i915 = to_i915(obj->base.dev);
191 struct i915_vma *vma;
195 err = i915_gem_object_set_tiling(obj, tile->tiling, tile->stride);
197 pr_err("Failed to set tiling mode=%u, stride=%u, err=%d\n",
198 tile->tiling, tile->stride, err);
202 GEM_BUG_ON(i915_gem_object_get_tiling(obj) != tile->tiling);
203 GEM_BUG_ON(i915_gem_object_get_stride(obj) != tile->stride);
205 i915_gem_object_lock(obj, NULL);
206 err = i915_gem_object_set_to_gtt_domain(obj, true);
207 i915_gem_object_unlock(obj);
209 pr_err("Failed to flush to GTT write domain; err=%d\n", err);
213 for_each_prime_number_from(page, 1, npages) {
214 struct i915_gtt_view view =
215 compute_partial_view(obj, page, MIN_CHUNK_PAGES);
222 GEM_BUG_ON(view.partial.size > nreal);
225 vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, PIN_MAPPABLE);
227 pr_err("Failed to pin partial view: offset=%lu; err=%d\n",
228 page, (int)PTR_ERR(vma));
232 n = page - view.partial.offset;
233 GEM_BUG_ON(n >= view.partial.size);
235 io = i915_vma_pin_iomap(vma);
238 pr_err("Failed to iomap partial view: offset=%lu; err=%d\n",
239 page, (int)PTR_ERR(io));
243 iowrite32(page, io + n * PAGE_SIZE / sizeof(*io));
244 i915_vma_unpin_iomap(vma);
246 offset = tiled_offset(tile, page << PAGE_SHIFT);
247 if (offset >= obj->base.size)
250 intel_gt_flush_ggtt_writes(to_gt(i915));
252 p = i915_gem_object_get_page(obj, offset >> PAGE_SHIFT);
253 cpu = kmap(p) + offset_in_page(offset);
254 drm_clflush_virt_range(cpu, sizeof(*cpu));
255 if (*cpu != (u32)page) {
256 pr_err("Partial view for %lu [%u] (offset=%llu, size=%u [%llu, row size %u], fence=%d, tiling=%d, stride=%d) misalignment, expected write to page (%llu + %u [0x%llx]) of 0x%x, found 0x%x\n",
260 vma->size >> PAGE_SHIFT,
261 tile->tiling ? tile_row_pages(obj) : 0,
262 vma->fence ? vma->fence->id : -1, tile->tiling, tile->stride,
263 offset >> PAGE_SHIFT,
264 (unsigned int)offset_in_page(offset),
270 drm_clflush_virt_range(cpu, sizeof(*cpu));
275 i915_gem_object_lock(obj, NULL);
276 i915_vma_destroy(vma);
277 i915_gem_object_unlock(obj);
279 if (igt_timeout(end_time,
280 "%s: timed out after tiling=%d stride=%d\n",
281 __func__, tile->tiling, tile->stride))
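/*
 * Fill in the tile geometry for the platform: 2KiB 128x16 tiles on gen2,
 * 128-byte Y tiles where supported, otherwise 512x8 4KiB tiles. Returns
 * the maximum fence pitch, in tiles, for this generation.
 */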
289 setup_tile_size(struct tile *tile, struct drm_i915_private *i915)
291 if (GRAPHICS_VER(i915) <= 2) {
295 } else if (tile->tiling == I915_TILING_Y &&
296 HAS_128_BYTE_Y_TILING(i915)) {
306 if (GRAPHICS_VER(i915) < 4)
307 return 8192 / tile->width;
308 else if (GRAPHICS_VER(i915) < 7)
309 return 128 * I965_FENCE_MAX_PITCH_VAL / tile->width;
311 return 128 * GEN7_FENCE_MAX_PITCH_VAL / tile->width;
314 static int igt_partial_tiling(void *arg)
316 const unsigned int nreal = 1 << 12; /* largest tile row x2 */
317 struct drm_i915_private *i915 = arg;
318 struct drm_i915_gem_object *obj;
319 intel_wakeref_t wakeref;
323 if (!i915_ggtt_has_aperture(to_gt(i915)->ggtt))
326 /* We want to check the page mapping and fencing of a large object
327 * mmapped through the GTT. The object we create is larger than can
328 * possibly be mmapped as a whole, and so we must use partial GGTT vmas.
329 * We then check that a write through each partial GGTT vma ends up
330 * in the right set of pages within the object, and with the expected
331 * tiling, which we verify by manual swizzling.
334 obj = huge_gem_object(i915,
336 (1 + next_prime_number(to_gt(i915)->ggtt->vm.total >> PAGE_SHIFT)) << PAGE_SHIFT);
340 err = i915_gem_object_pin_pages_unlocked(obj);
342 pr_err("Failed to allocate %u pages (%lu total), err=%d\n",
343 nreal, obj->base.size / PAGE_SIZE, err);
347 wakeref = intel_runtime_pm_get(&i915->runtime_pm);
357 tile.swizzle = I915_BIT_6_SWIZZLE_NONE;
358 tile.tiling = I915_TILING_NONE;
360 err = check_partial_mappings(obj, &tile, end);
361 if (err && err != -EINTR)
365 for (tiling = I915_TILING_X; tiling <= I915_TILING_Y; tiling++) {
367 unsigned int max_pitch;
371 if (i915->gem_quirks & GEM_QUIRK_PIN_SWIZZLED_PAGES)
373 * The swizzling pattern is actually unknown as it
374 * varies based on physical address of each page.
375 * See i915_gem_detect_bit_6_swizzle().
379 tile.tiling = tiling;
382 tile.swizzle = to_gt(i915)->ggtt->bit_6_swizzle_x;
385 tile.swizzle = to_gt(i915)->ggtt->bit_6_swizzle_y;
389 GEM_BUG_ON(tile.swizzle == I915_BIT_6_SWIZZLE_UNKNOWN);
390 if (tile.swizzle == I915_BIT_6_SWIZZLE_9_17 ||
391 tile.swizzle == I915_BIT_6_SWIZZLE_9_10_17)
394 max_pitch = setup_tile_size(&tile, i915);
396 for (pitch = max_pitch; pitch; pitch >>= 1) {
397 tile.stride = tile.width * pitch;
398 err = check_partial_mappings(obj, &tile, end);
404 if (pitch > 2 && GRAPHICS_VER(i915) >= 4) {
405 tile.stride = tile.width * (pitch - 1);
406 err = check_partial_mappings(obj, &tile, end);
413 if (pitch < max_pitch && GRAPHICS_VER(i915) >= 4) {
414 tile.stride = tile.width * (pitch + 1);
415 err = check_partial_mappings(obj, &tile, end);
423 if (GRAPHICS_VER(i915) >= 4) {
424 for_each_prime_number(pitch, max_pitch) {
425 tile.stride = tile.width * pitch;
426 err = check_partial_mappings(obj, &tile, end);
438 intel_runtime_pm_put(&i915->runtime_pm, wakeref);
439 i915_gem_object_unpin_pages(obj);
441 i915_gem_object_put(obj);
445 static int igt_smoke_tiling(void *arg)
447 const unsigned int nreal = 1 << 12; /* largest tile row x2 */
448 struct drm_i915_private *i915 = arg;
449 struct drm_i915_gem_object *obj;
450 intel_wakeref_t wakeref;
451 I915_RND_STATE(prng);
456 if (!i915_ggtt_has_aperture(to_gt(i915)->ggtt))
460 * igt_partial_tiling() does an exhaustive check of partial tiling
461 * chunking, but will undoubtedly run out of time. Here, we do a
462 * randomised search and hope that over many 1s runs with different
463 * seeds we will achieve a thorough check.
465 * Remember to look at the st_seed if we see a flip-flop in BAT!
468 if (i915->gem_quirks & GEM_QUIRK_PIN_SWIZZLED_PAGES)
471 obj = huge_gem_object(i915,
473 (1 + next_prime_number(to_gt(i915)->ggtt->vm.total >> PAGE_SHIFT)) << PAGE_SHIFT);
477 err = i915_gem_object_pin_pages_unlocked(obj);
479 pr_err("Failed to allocate %u pages (%lu total), err=%d\n",
480 nreal, obj->base.size / PAGE_SIZE, err);
484 wakeref = intel_runtime_pm_get(&i915->runtime_pm);
491 i915_prandom_u32_max_state(I915_TILING_Y + 1, &prng);
492 switch (tile.tiling) {
493 case I915_TILING_NONE:
498 tile.swizzle = I915_BIT_6_SWIZZLE_NONE;
502 tile.swizzle = to_gt(i915)->ggtt->bit_6_swizzle_x;
505 tile.swizzle = to_gt(i915)->ggtt->bit_6_swizzle_y;
509 if (tile.swizzle == I915_BIT_6_SWIZZLE_9_17 ||
510 tile.swizzle == I915_BIT_6_SWIZZLE_9_10_17)
513 if (tile.tiling != I915_TILING_NONE) {
514 unsigned int max_pitch = setup_tile_size(&tile, i915);
517 i915_prandom_u32_max_state(max_pitch, &prng);
518 tile.stride = (1 + tile.stride) * tile.width;
519 if (GRAPHICS_VER(i915) < 4)
520 tile.stride = rounddown_pow_of_two(tile.stride);
523 err = check_partial_mapping(obj, &tile, &prng);
528 } while (!__igt_timeout(end, NULL));
530 pr_info("%s: Completed %lu trials\n", __func__, count);
532 intel_runtime_pm_put(&i915->runtime_pm, wakeref);
533 i915_gem_object_unpin_pages(obj);
535 i915_gem_object_put(obj);
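/*
 * Keep the object busy by submitting a trivial request against it on
 * every uabi engine, then drop our reference so that the object stays
 * alive only through its active reference until those requests retire.
 */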
539 static int make_obj_busy(struct drm_i915_gem_object *obj)
541 struct drm_i915_private *i915 = to_i915(obj->base.dev);
542 struct intel_engine_cs *engine;
544 for_each_uabi_engine(engine, i915) {
545 struct i915_request *rq;
546 struct i915_vma *vma;
547 struct i915_gem_ww_ctx ww;
550 vma = i915_vma_instance(obj, &engine->gt->ggtt->vm, NULL);
554 i915_gem_ww_ctx_init(&ww, false);
556 err = i915_gem_object_lock(obj, &ww);
558 err = i915_vma_pin_ww(vma, &ww, 0, 0, PIN_USER);
562 rq = intel_engine_create_kernel_request(engine);
568 err = i915_request_await_object(rq, vma->obj, true);
570 err = i915_vma_move_to_active(vma, rq,
573 i915_request_add(rq);
577 if (err == -EDEADLK) {
578 err = i915_gem_ww_ctx_backoff(&ww);
582 i915_gem_ww_ctx_fini(&ww);
587 i915_gem_object_put(obj); /* leave it only alive via its active ref */
591 static enum i915_mmap_type default_mapping(struct drm_i915_private *i915)
594 return I915_MMAP_TYPE_FIXED;
596 return I915_MMAP_TYPE_GTT;
599 static struct drm_i915_gem_object *
600 create_sys_or_internal(struct drm_i915_private *i915,
603 if (HAS_LMEM(i915)) {
604 struct intel_memory_region *sys_region =
605 i915->mm.regions[INTEL_REGION_SMEM];
607 return __i915_gem_object_create_user(i915, size, &sys_region, 1);
610 return i915_gem_object_create_internal(i915, size);
613 static bool assert_mmap_offset(struct drm_i915_private *i915,
617 struct drm_i915_gem_object *obj;
621 obj = create_sys_or_internal(i915, size);
623 return expected && expected == PTR_ERR(obj);
625 ret = __assign_mmap_offset(obj, default_mapping(i915), &offset, NULL);
626 i915_gem_object_put(obj);
628 return ret == expected;
631 static void disable_retire_worker(struct drm_i915_private *i915)
633 i915_gem_driver_unregister__shrinker(i915);
634 intel_gt_pm_get(to_gt(i915));
635 cancel_delayed_work_sync(&to_gt(i915)->requests.retire_work);
638 static void restore_retire_worker(struct drm_i915_private *i915)
640 igt_flush_test(i915);
641 intel_gt_pm_put(to_gt(i915));
642 i915_gem_driver_register__shrinker(i915);
645 static void mmap_offset_lock(struct drm_i915_private *i915)
646 __acquires(&i915->drm.vma_offset_manager->vm_lock)
648 write_lock(&i915->drm.vma_offset_manager->vm_lock);
651 static void mmap_offset_unlock(struct drm_i915_private *i915)
652 __releases(&i915->drm.vma_offset_manager->vm_lock)
654 write_unlock(&i915->drm.vma_offset_manager->vm_lock);
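/*
 * Shrink the mmap-offset address space down to a single page by
 * reserving every hole in the vma_offset_manager, then check that a
 * one-page object can still claim an offset, that a two-page object
 * cannot, and that once the last hole is filled new offsets only become
 * available again after busy, dead objects are reaped.
 */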
657 static int igt_mmap_offset_exhaustion(void *arg)
659 struct drm_i915_private *i915 = arg;
660 struct drm_mm *mm = &i915->drm.vma_offset_manager->vm_addr_space_mm;
661 struct drm_i915_gem_object *obj;
662 struct drm_mm_node *hole, *next;
665 int enospc = HAS_LMEM(i915) ? -ENXIO : -ENOSPC;
667 /* Disable background reaper */
668 disable_retire_worker(i915);
669 GEM_BUG_ON(!to_gt(i915)->awake);
670 intel_gt_retire_requests(to_gt(i915));
671 i915_gem_drain_freed_objects(i915);
673 /* Trim the device mmap space to only a page */
674 mmap_offset_lock(i915);
675 loop = 1; /* PAGE_SIZE units */
676 list_for_each_entry_safe(hole, next, &mm->hole_stack, hole_stack) {
677 struct drm_mm_node *resv;
679 resv = kzalloc(sizeof(*resv), GFP_NOWAIT);
685 resv->start = drm_mm_hole_node_start(hole) + loop;
686 resv->size = hole->hole_size - loop;
695 pr_debug("Reserving hole [%llx + %llx]\n",
696 resv->start, resv->size);
698 err = drm_mm_reserve_node(mm, resv);
700 pr_err("Failed to trim VMA manager, err=%d\n", err);
705 GEM_BUG_ON(!list_is_singular(&mm->hole_stack));
706 mmap_offset_unlock(i915);
709 if (!assert_mmap_offset(i915, PAGE_SIZE, 0)) {
710 pr_err("Unable to insert object into single page hole\n");
716 if (!assert_mmap_offset(i915, 2 * PAGE_SIZE, enospc)) {
717 pr_err("Unexpectedly succeeded in inserting too large object into single page hole\n");
722 /* Fill the hole, further allocation attempts should then fail */
723 obj = create_sys_or_internal(i915, PAGE_SIZE);
726 pr_err("Unable to create object for reclaimed hole\n");
730 err = __assign_mmap_offset(obj, default_mapping(i915), &offset, NULL);
732 pr_err("Unable to insert object into reclaimed hole\n");
736 if (!assert_mmap_offset(i915, PAGE_SIZE, enospc)) {
737 pr_err("Unexpectedly succeeded in inserting object into no holes!\n");
742 i915_gem_object_put(obj);
744 /* Now fill with busy dead objects that we expect to reap */
745 for (loop = 0; loop < 3; loop++) {
746 if (intel_gt_is_wedged(to_gt(i915)))
749 obj = i915_gem_object_create_internal(i915, PAGE_SIZE);
755 err = make_obj_busy(obj);
757 pr_err("[loop %d] Failed to busy the object\n", loop);
763 mmap_offset_lock(i915);
765 drm_mm_for_each_node_safe(hole, next, mm) {
766 if (hole->color != -1ul)
769 drm_mm_remove_node(hole);
772 mmap_offset_unlock(i915);
773 restore_retire_worker(i915);
776 i915_gem_object_put(obj);
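/*
 * Poison helpers for the mmap tests: gtt_set()/wc_set() fill the object
 * with POISON_INUSE through a GGTT iomap or a WC CPU map, and
 * gtt_check()/wc_check() verify that a later POISON_FREE write made it
 * into the backing store via the same paths.
 */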
780 static int gtt_set(struct drm_i915_gem_object *obj)
782 struct i915_vma *vma;
786 vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0, PIN_MAPPABLE);
790 intel_gt_pm_get(vma->vm->gt);
791 map = i915_vma_pin_iomap(vma);
798 memset_io(map, POISON_INUSE, obj->base.size);
799 i915_vma_unpin_iomap(vma);
802 intel_gt_pm_put(vma->vm->gt);
806 static int gtt_check(struct drm_i915_gem_object *obj)
808 struct i915_vma *vma;
812 vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0, PIN_MAPPABLE);
816 intel_gt_pm_get(vma->vm->gt);
817 map = i915_vma_pin_iomap(vma);
824 if (memchr_inv((void __force *)map, POISON_FREE, obj->base.size)) {
825 pr_err("%s: Write via mmap did not land in backing store (GTT)\n",
826 obj->mm.region->name);
829 i915_vma_unpin_iomap(vma);
832 intel_gt_pm_put(vma->vm->gt);
836 static int wc_set(struct drm_i915_gem_object *obj)
840 vaddr = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC);
842 return PTR_ERR(vaddr);
844 memset(vaddr, POISON_INUSE, obj->base.size);
845 i915_gem_object_flush_map(obj);
846 i915_gem_object_unpin_map(obj);
851 static int wc_check(struct drm_i915_gem_object *obj)
856 vaddr = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC);
858 return PTR_ERR(vaddr);
860 if (memchr_inv(vaddr, POISON_FREE, obj->base.size)) {
861 pr_err("%s: Write via mmap did not land in backing store (WC)\n",
862 obj->mm.region->name);
865 i915_gem_object_unpin_map(obj);
870 static bool can_mmap(struct drm_i915_gem_object *obj, enum i915_mmap_type type)
872 struct drm_i915_private *i915 = to_i915(obj->base.dev);
875 if (obj->ops->mmap_offset)
876 return type == I915_MMAP_TYPE_FIXED;
877 else if (type == I915_MMAP_TYPE_FIXED)
880 if (type == I915_MMAP_TYPE_GTT &&
881 !i915_ggtt_has_aperture(to_gt(i915)->ggtt))
884 i915_gem_object_lock(obj, NULL);
885 no_map = (type != I915_MMAP_TYPE_GTT &&
886 !i915_gem_object_has_struct_page(obj) &&
887 !i915_gem_object_has_iomem(obj));
888 i915_gem_object_unlock(obj);
893 #define expand32(x) (((x) << 0) | ((x) << 8) | ((x) << 16) | ((x) << 24))
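/*
 * Core mmap check: create a fake mmap offset of the requested type, map
 * it as userspace would, read back the POISON_INUSE pattern previously
 * written through a kernel mapping, overwrite every dword with
 * POISON_FREE, and finally verify the new pattern from the kernel side.
 */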
894 static int __igt_mmap(struct drm_i915_private *i915,
895 struct drm_i915_gem_object *obj,
896 enum i915_mmap_type type)
898 struct vm_area_struct *area;
903 if (!can_mmap(obj, type))
912 err = __assign_mmap_offset(obj, type, &offset, NULL);
916 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED);
917 if (IS_ERR_VALUE(addr))
920 pr_debug("igt_mmap(%s, %d) @ %lx\n", obj->mm.region->name, type, addr);
922 mmap_read_lock(current->mm);
923 area = vma_lookup(current->mm, addr);
924 mmap_read_unlock(current->mm);
926 pr_err("%s: Did not create a vm_area_struct for the mmap\n",
927 obj->mm.region->name);
932 for (i = 0; i < obj->base.size / sizeof(u32); i++) {
933 u32 __user *ux = u64_to_user_ptr((u64)(addr + i * sizeof(*ux)));
936 if (get_user(x, ux)) {
937 pr_err("%s: Unable to read from mmap, offset:%zd\n",
938 obj->mm.region->name, i * sizeof(x));
943 if (x != expand32(POISON_INUSE)) {
944 pr_err("%s: Read incorrect value from mmap, offset:%zd, found:%x, expected:%x\n",
945 obj->mm.region->name,
946 i * sizeof(x), x, expand32(POISON_INUSE));
951 x = expand32(POISON_FREE);
952 if (put_user(x, ux)) {
953 pr_err("%s: Unable to write to mmap, offset:%zd\n",
954 obj->mm.region->name, i * sizeof(x));
960 if (type == I915_MMAP_TYPE_GTT)
961 intel_gt_flush_ggtt_writes(to_gt(i915));
965 err = gtt_check(obj);
967 vm_munmap(addr, obj->base.size);
971 static int igt_mmap(void *arg)
973 struct drm_i915_private *i915 = arg;
974 struct intel_memory_region *mr;
975 enum intel_region_id id;
977 for_each_memory_region(mr, i915, id) {
978 unsigned long sizes[] = {
988 for (i = 0; i < ARRAY_SIZE(sizes); i++) {
989 struct drm_i915_gem_object *obj;
992 obj = __i915_gem_object_create_user(i915, sizes[i], &mr, 1);
993 if (obj == ERR_PTR(-ENODEV))
999 err = __igt_mmap(i915, obj, I915_MMAP_TYPE_GTT);
1001 err = __igt_mmap(i915, obj, I915_MMAP_TYPE_WC);
1003 err = __igt_mmap(i915, obj, I915_MMAP_TYPE_FIXED);
1005 i915_gem_object_put(obj);
1014 static void igt_close_objects(struct drm_i915_private *i915,
1015 struct list_head *objects)
1017 struct drm_i915_gem_object *obj, *on;
1019 list_for_each_entry_safe(obj, on, objects, st_link) {
1020 i915_gem_object_lock(obj, NULL);
1021 if (i915_gem_object_has_pinned_pages(obj))
1022 i915_gem_object_unpin_pages(obj);
1023 /* No polluting the memory region between tests */
1024 __i915_gem_object_put_pages(obj);
1025 i915_gem_object_unlock(obj);
1026 list_del(&obj->st_link);
1027 i915_gem_object_put(obj);
1032 i915_gem_drain_freed_objects(i915);
1035 static void igt_make_evictable(struct list_head *objects)
1037 struct drm_i915_gem_object *obj;
1039 list_for_each_entry(obj, objects, st_link) {
1040 i915_gem_object_lock(obj, NULL);
1041 if (i915_gem_object_has_pinned_pages(obj))
1042 i915_gem_object_unpin_pages(obj);
1043 i915_gem_object_unlock(obj);
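/*
 * Fill the CPU-visible (mappable) portion of the region with pinned
 * objects, halving the allocation size towards min_page_size as
 * allocations start to fail, so that a later fault has to evict or
 * spill in order to find mappable space. Objects are tracked on the
 * list for igt_make_evictable()/igt_close_objects().
 */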
1049 static int igt_fill_mappable(struct intel_memory_region *mr,
1050 struct list_head *objects)
1058 struct drm_i915_gem_object *obj;
1060 obj = i915_gem_object_create_region(mr, size, 0, 0);
1066 list_add(&obj->st_link, objects);
1068 err = i915_gem_object_pin_pages_unlocked(obj);
1070 if (err != -ENXIO && err != -ENOMEM)
1073 if (size == mr->min_page_size) {
1082 total += obj->base.size;
1085 pr_info("%s filled=%lluMiB\n", __func__, total >> 20);
1089 igt_close_objects(mr->i915, objects);
1093 static int ___igt_mmap_migrate(struct drm_i915_private *i915,
1094 struct drm_i915_gem_object *obj,
1098 struct vm_area_struct *area;
1101 pr_info("igt_mmap(%s, %d) @ %lx\n",
1102 obj->mm.region->name, I915_MMAP_TYPE_FIXED, addr);
1104 mmap_read_lock(current->mm);
1105 area = vma_lookup(current->mm, addr);
1106 mmap_read_unlock(current->mm);
1108 pr_err("%s: Did not create a vm_area_struct for the mmap\n",
1109 obj->mm.region->name);
1114 for (i = 0; i < obj->base.size / sizeof(u32); i++) {
1115 u32 __user *ux = u64_to_user_ptr((u64)(addr + i * sizeof(*ux)));
1118 if (get_user(x, ux)) {
1121 pr_err("%s: Unable to read from mmap, offset:%zd\n",
1122 obj->mm.region->name, i * sizeof(x));
1130 pr_err("%s: Faulted unmappable memory\n",
1131 obj->mm.region->name);
1136 if (x != expand32(POISON_INUSE)) {
1137 pr_err("%s: Read incorrect value from mmap, offset:%zd, found:%x, expected:%x\n",
1138 obj->mm.region->name,
1139 i * sizeof(x), x, expand32(POISON_INUSE));
1144 x = expand32(POISON_FREE);
1145 if (put_user(x, ux)) {
1146 pr_err("%s: Unable to write to mmap, offset:%zd\n",
1147 obj->mm.region->name, i * sizeof(x));
1157 obj->flags &= ~I915_BO_ALLOC_GPU_ONLY;
1158 err = wc_check(obj);
1161 vm_munmap(addr, obj->base.size);
1165 #define IGT_MMAP_MIGRATE_TOPDOWN (1 << 0)
1166 #define IGT_MMAP_MIGRATE_FILL (1 << 1)
1167 #define IGT_MMAP_MIGRATE_EVICTABLE (1 << 2)
1168 #define IGT_MMAP_MIGRATE_UNFAULTABLE (1 << 3)
1169 #define IGT_MMAP_MIGRATE_FAIL_GPU (1 << 4)
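/*
 * Flags for __igt_mmap_migrate():
 *   TOPDOWN     - mark the object GPU_ONLY so it is placed in the
 *                 non-mappable portion of the region,
 *   FILL        - pre-fill the mappable portion so the fault must evict
 *                 or spill to make room,
 *   EVICTABLE   - unpin the filler objects so that eviction can succeed,
 *   UNFAULTABLE - the CPU fault is expected to fail (SIGBUS),
 *   FAIL_GPU    - inject a TTM move failure so the migration wedges the
 *                 GPU.
 */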
1170 static int __igt_mmap_migrate(struct intel_memory_region **placements,
1172 struct intel_memory_region *expected_mr,
1175 struct drm_i915_private *i915 = placements[0]->i915;
1176 struct drm_i915_gem_object *obj;
1177 struct i915_request *rq = NULL;
1183 obj = __i915_gem_object_create_user(i915, PAGE_SIZE,
1187 return PTR_ERR(obj);
1189 if (flags & IGT_MMAP_MIGRATE_TOPDOWN)
1190 obj->flags |= I915_BO_ALLOC_GPU_ONLY;
1192 err = __assign_mmap_offset(obj, I915_MMAP_TYPE_FIXED, &offset, NULL);
1197 * This will eventually create a GEM context, due to opening a dummy drm
1198 * file, which needs a tiny amount of mappable device memory for the
1199 * top-level paging structures (and perhaps scratch), so make sure we
1200 * allocate early, to avoid tears.
1202 addr = igt_mmap_offset(i915, offset, obj->base.size,
1203 PROT_WRITE, MAP_SHARED);
1204 if (IS_ERR_VALUE(addr)) {
1209 if (flags & IGT_MMAP_MIGRATE_FILL) {
1210 err = igt_fill_mappable(placements[0], &objects);
1215 err = i915_gem_object_lock(obj, NULL);
1219 err = i915_gem_object_pin_pages(obj);
1221 i915_gem_object_unlock(obj);
1225 err = intel_context_migrate_clear(to_gt(i915)->migrate.context, NULL,
1226 obj->mm.pages->sgl, obj->cache_level,
1227 i915_gem_object_is_lmem(obj),
1228 expand32(POISON_INUSE), &rq);
1229 i915_gem_object_unpin_pages(obj);
1231 err = dma_resv_reserve_fences(obj->base.resv, 1);
1233 dma_resv_add_fence(obj->base.resv, &rq->fence,
1234 DMA_RESV_USAGE_KERNEL);
1235 i915_request_put(rq);
1237 i915_gem_object_unlock(obj);
1241 if (flags & IGT_MMAP_MIGRATE_EVICTABLE)
1242 igt_make_evictable(&objects);
1244 if (flags & IGT_MMAP_MIGRATE_FAIL_GPU) {
1245 err = i915_gem_object_lock(obj, NULL);
1250 * Ensure we only simulate the GPU failure when faulting the
1253 err = i915_gem_object_wait_moving_fence(obj, true);
1254 i915_gem_object_unlock(obj);
1257 i915_ttm_migrate_set_failure_modes(true, false);
1260 err = ___igt_mmap_migrate(i915, obj, addr,
1261 flags & IGT_MMAP_MIGRATE_UNFAULTABLE);
1263 if (!err && obj->mm.region != expected_mr) {
1264 pr_err("%s region mismatch %s\n", __func__, expected_mr->name);
1268 if (flags & IGT_MMAP_MIGRATE_FAIL_GPU) {
1269 struct intel_gt *gt;
1272 i915_ttm_migrate_set_failure_modes(false, false);
1274 for_each_gt(gt, i915, id) {
1275 intel_wakeref_t wakeref;
1278 mutex_lock(&gt->reset.mutex);
1279 wedged = test_bit(I915_WEDGED, &gt->reset.flags);
1280 mutex_unlock(&gt->reset.mutex);
1282 pr_err("gt(%u) not wedged\n", id);
1287 wakeref = intel_runtime_pm_get(gt->uncore->rpm);
1288 igt_global_reset_lock(gt);
1289 intel_gt_reset(gt, ALL_ENGINES, NULL);
1290 igt_global_reset_unlock(gt);
1291 intel_runtime_pm_put(gt->uncore->rpm, wakeref);
1294 if (!i915_gem_object_has_unknown_state(obj)) {
1295 pr_err("object missing unknown_state\n");
1301 i915_gem_object_put(obj);
1302 igt_close_objects(i915, &objects);
1306 static int igt_mmap_migrate(void *arg)
1308 struct drm_i915_private *i915 = arg;
1309 struct intel_memory_region *system = i915->mm.regions[INTEL_REGION_SMEM];
1310 struct intel_memory_region *mr;
1311 enum intel_region_id id;
1313 for_each_memory_region(mr, i915, id) {
1314 struct intel_memory_region *mixed[] = { mr, system };
1315 struct intel_memory_region *single[] = { mr };
1316 struct ttm_resource_manager *man = mr->region_private;
1317 resource_size_t saved_io_size;
1327 * For testing purposes, let's force a small BAR if not already
1330 saved_io_size = mr->io_size;
1331 if (mr->io_size == mr->total) {
1332 resource_size_t io_size = mr->io_size;
1334 io_size = rounddown_pow_of_two(io_size >> 1);
1335 if (io_size < PAGE_SIZE)
1338 mr->io_size = io_size;
1339 i915_ttm_buddy_man_force_visible_size(man,
1340 io_size >> PAGE_SHIFT);
1344 * Allocate in the mappable portion; there should be no surprises here.
1346 err = __igt_mmap_migrate(mixed, ARRAY_SIZE(mixed), mr, 0);
1351 * Allocate in the non-mappable portion, but force migrating to
1352 * the mappable portion on fault (LMEM -> LMEM)
1354 err = __igt_mmap_migrate(single, ARRAY_SIZE(single), mr,
1355 IGT_MMAP_MIGRATE_TOPDOWN |
1356 IGT_MMAP_MIGRATE_FILL |
1357 IGT_MMAP_MIGRATE_EVICTABLE);
1362 * Allocate in the non-mappable portion, but force spilling into
1363 * system memory on fault (LMEM -> SMEM)
1365 err = __igt_mmap_migrate(mixed, ARRAY_SIZE(mixed), system,
1366 IGT_MMAP_MIGRATE_TOPDOWN |
1367 IGT_MMAP_MIGRATE_FILL);
1372 * Allocate in the non-mappable portion; since the mappable
1373 * portion is already full and we can't spill to system memory,
1374 * we should expect the fault to fail.
1376 err = __igt_mmap_migrate(single, ARRAY_SIZE(single), mr,
1377 IGT_MMAP_MIGRATE_TOPDOWN |
1378 IGT_MMAP_MIGRATE_FILL |
1379 IGT_MMAP_MIGRATE_UNFAULTABLE);
1384 * Allocate in the non-mappable portion, but force migrating to
1385 * the mappable portion on fault (LMEM -> LMEM). We then also
1386 * simulate a GPU error when moving the pages during the fault,
1387 * which should result in wedging the GPU and returning
1388 * SIGBUS from the fault handler, since we can't fall back to
1391 err = __igt_mmap_migrate(single, ARRAY_SIZE(single), mr,
1392 IGT_MMAP_MIGRATE_TOPDOWN |
1393 IGT_MMAP_MIGRATE_FILL |
1394 IGT_MMAP_MIGRATE_EVICTABLE |
1395 IGT_MMAP_MIGRATE_FAIL_GPU |
1396 IGT_MMAP_MIGRATE_UNFAULTABLE);
1398 mr->io_size = saved_io_size;
1399 i915_ttm_buddy_man_force_visible_size(man,
1400 mr->io_size >> PAGE_SHIFT);
1408 static const char *repr_mmap_type(enum i915_mmap_type type)
1411 case I915_MMAP_TYPE_GTT: return "gtt";
1412 case I915_MMAP_TYPE_WB: return "wb";
1413 case I915_MMAP_TYPE_WC: return "wc";
1414 case I915_MMAP_TYPE_UC: return "uc";
1415 case I915_MMAP_TYPE_FIXED: return "fixed";
1416 default: return "unknown";
1420 static bool can_access(struct drm_i915_gem_object *obj)
1424 i915_gem_object_lock(obj, NULL);
1425 access = i915_gem_object_has_struct_page(obj) ||
1426 i915_gem_object_has_iomem(obj);
1427 i915_gem_object_unlock(obj);
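/*
 * Verify that ptrace-style access via access_process_vm() agrees with
 * direct user access through the mmap: write A through the user pointer
 * and read it back with access_process_vm(), then write B via
 * access_process_vm() and read it back with __get_user().
 */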
1432 static int __igt_mmap_access(struct drm_i915_private *i915,
1433 struct drm_i915_gem_object *obj,
1434 enum i915_mmap_type type)
1436 unsigned long __user *ptr;
1443 memset(&A, 0xAA, sizeof(A));
1444 memset(&B, 0xBB, sizeof(B));
1446 if (!can_mmap(obj, type) || !can_access(obj))
1449 err = __assign_mmap_offset(obj, type, &offset, NULL);
1453 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED);
1454 if (IS_ERR_VALUE(addr))
1456 ptr = (unsigned long __user *)addr;
1458 err = __put_user(A, ptr);
1460 pr_err("%s(%s): failed to write into user mmap\n",
1461 obj->mm.region->name, repr_mmap_type(type));
1465 intel_gt_flush_ggtt_writes(to_gt(i915));
1467 err = access_process_vm(current, addr, &x, sizeof(x), 0);
1468 if (err != sizeof(x)) {
1469 pr_err("%s(%s): access_process_vm() read failed\n",
1470 obj->mm.region->name, repr_mmap_type(type));
1474 err = access_process_vm(current, addr, &B, sizeof(B), FOLL_WRITE);
1475 if (err != sizeof(B)) {
1476 pr_err("%s(%s): access_process_vm() write failed\n",
1477 obj->mm.region->name, repr_mmap_type(type));
1481 intel_gt_flush_ggtt_writes(to_gt(i915));
1483 err = __get_user(y, ptr);
1485 pr_err("%s(%s): failed to read from user mmap\n",
1486 obj->mm.region->name, repr_mmap_type(type));
1490 if (x != A || y != B) {
1491 pr_err("%s(%s): failed to read/write values, found (%lx, %lx)\n",
1492 obj->mm.region->name, repr_mmap_type(type),
1499 vm_munmap(addr, obj->base.size);
1503 static int igt_mmap_access(void *arg)
1505 struct drm_i915_private *i915 = arg;
1506 struct intel_memory_region *mr;
1507 enum intel_region_id id;
1509 for_each_memory_region(mr, i915, id) {
1510 struct drm_i915_gem_object *obj;
1516 obj = __i915_gem_object_create_user(i915, PAGE_SIZE, &mr, 1);
1517 if (obj == ERR_PTR(-ENODEV))
1521 return PTR_ERR(obj);
1523 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_GTT);
1525 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_WB);
1527 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_WC);
1529 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_UC);
1531 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_FIXED);
1533 i915_gem_object_put(obj);
1541 static int __igt_mmap_gpu(struct drm_i915_private *i915,
1542 struct drm_i915_gem_object *obj,
1543 enum i915_mmap_type type)
1545 struct intel_engine_cs *engine;
1553 * Verify that the mmap access into the backing store aligns with
1554 * that of the GPU, i.e. that mmap is indeed writing into the same
1555 * page as being read by the GPU.
1558 if (!can_mmap(obj, type))
1567 err = __assign_mmap_offset(obj, type, &offset, NULL);
1571 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED);
1572 if (IS_ERR_VALUE(addr))
1575 ux = u64_to_user_ptr((u64)addr);
1576 bbe = MI_BATCH_BUFFER_END;
1577 if (put_user(bbe, ux)) {
1578 pr_err("%s: Unable to write to mmap\n", obj->mm.region->name);
1583 if (type == I915_MMAP_TYPE_GTT)
1584 intel_gt_flush_ggtt_writes(to_gt(i915));
1586 for_each_uabi_engine(engine, i915) {
1587 struct i915_request *rq;
1588 struct i915_vma *vma;
1589 struct i915_gem_ww_ctx ww;
1591 vma = i915_vma_instance(obj, engine->kernel_context->vm, NULL);
1597 i915_gem_ww_ctx_init(&ww, false);
1599 err = i915_gem_object_lock(obj, &ww);
1601 err = i915_vma_pin_ww(vma, &ww, 0, 0, PIN_USER);
1605 rq = i915_request_create(engine->kernel_context);
1611 err = i915_request_await_object(rq, vma->obj, false);
1613 err = i915_vma_move_to_active(vma, rq, 0);
1615 err = engine->emit_bb_start(rq, vma->node.start, 0, 0);
1616 i915_request_get(rq);
1617 i915_request_add(rq);
1619 if (i915_request_wait(rq, 0, HZ / 5) < 0) {
1620 struct drm_printer p =
1621 drm_info_printer(engine->i915->drm.dev);
1623 pr_err("%s(%s, %s): Failed to execute batch\n",
1624 __func__, engine->name, obj->mm.region->name);
1625 intel_engine_dump(engine, &p,
1626 "%s\n", engine->name);
1628 intel_gt_set_wedged(engine->gt);
1631 i915_request_put(rq);
1634 i915_vma_unpin(vma);
1636 if (err == -EDEADLK) {
1637 err = i915_gem_ww_ctx_backoff(&ww);
1641 i915_gem_ww_ctx_fini(&ww);
1647 vm_munmap(addr, obj->base.size);
1651 static int igt_mmap_gpu(void *arg)
1653 struct drm_i915_private *i915 = arg;
1654 struct intel_memory_region *mr;
1655 enum intel_region_id id;
1657 for_each_memory_region(mr, i915, id) {
1658 struct drm_i915_gem_object *obj;
1664 obj = __i915_gem_object_create_user(i915, PAGE_SIZE, &mr, 1);
1665 if (obj == ERR_PTR(-ENODEV))
1669 return PTR_ERR(obj);
1671 err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_GTT);
1673 err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_WC);
1675 err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_FIXED);
1677 i915_gem_object_put(obj);
1685 static int check_present_pte(pte_t *pte, unsigned long addr, void *data)
1687 if (!pte_present(*pte) || pte_none(*pte)) {
1688 pr_err("missing PTE:%lx\n",
1689 (addr - (unsigned long)data) >> PAGE_SHIFT);
1696 static int check_absent_pte(pte_t *pte, unsigned long addr, void *data)
1698 if (pte_present(*pte) && !pte_none(*pte)) {
1699 pr_err("present PTE:%lx; expected to be revoked\n",
1700 (addr - (unsigned long)data) >> PAGE_SHIFT);
1707 static int check_present(unsigned long addr, unsigned long len)
1709 return apply_to_page_range(current->mm, addr, len,
1710 check_present_pte, (void *)addr);
1713 static int check_absent(unsigned long addr, unsigned long len)
1715 return apply_to_page_range(current->mm, addr, len,
1716 check_absent_pte, (void *)addr);
1719 static int prefault_range(u64 start, u64 len)
1721 const char __user *addr, *end;
1722 char __maybe_unused c;
1725 addr = u64_to_user_ptr(start);
1728 for (; addr < end; addr += PAGE_SIZE) {
1729 err = __get_user(c, addr);
1734 return __get_user(c, end - 1);
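/*
 * Prefault the whole mapping and confirm every PTE is present, then
 * unbind the object from the GGTT (and, for non-GTT mmaps, drop its
 * pages) and confirm every PTE has been revoked, so that a stale
 * userspace mapping can no longer reach memory that may be reused.
 */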
1737 static int __igt_mmap_revoke(struct drm_i915_private *i915,
1738 struct drm_i915_gem_object *obj,
1739 enum i915_mmap_type type)
1745 if (!can_mmap(obj, type))
1748 err = __assign_mmap_offset(obj, type, &offset, NULL);
1752 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED);
1753 if (IS_ERR_VALUE(addr))
1756 err = prefault_range(addr, obj->base.size);
1760 err = check_present(addr, obj->base.size);
1762 pr_err("%s: was not present\n", obj->mm.region->name);
1767 * After unbinding the object from the GGTT, its address may be reused
1768 * for other objects. Ergo we have to revoke the previous mmap PTE
1769 * access as it no longer points to the same object.
1771 i915_gem_object_lock(obj, NULL);
1772 err = i915_gem_object_unbind(obj, I915_GEM_OBJECT_UNBIND_ACTIVE);
1773 i915_gem_object_unlock(obj);
1775 pr_err("Failed to unbind object!\n");
1779 if (type != I915_MMAP_TYPE_GTT) {
1780 i915_gem_object_lock(obj, NULL);
1781 __i915_gem_object_put_pages(obj);
1782 i915_gem_object_unlock(obj);
1783 if (i915_gem_object_has_pages(obj)) {
1784 pr_err("Failed to put-pages object!\n");
1790 err = check_absent(addr, obj->base.size);
1792 pr_err("%s: was not absent\n", obj->mm.region->name);
1797 vm_munmap(addr, obj->base.size);
1801 static int igt_mmap_revoke(void *arg)
1803 struct drm_i915_private *i915 = arg;
1804 struct intel_memory_region *mr;
1805 enum intel_region_id id;
1807 for_each_memory_region(mr, i915, id) {
1808 struct drm_i915_gem_object *obj;
1814 obj = __i915_gem_object_create_user(i915, PAGE_SIZE, &mr, 1);
1815 if (obj == ERR_PTR(-ENODEV))
1819 return PTR_ERR(obj);
1821 err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_GTT);
1823 err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_WC);
1825 err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_FIXED);
1827 i915_gem_object_put(obj);
1835 int i915_gem_mman_live_selftests(struct drm_i915_private *i915)
1837 static const struct i915_subtest tests[] = {
1838 SUBTEST(igt_partial_tiling),
1839 SUBTEST(igt_smoke_tiling),
1840 SUBTEST(igt_mmap_offset_exhaustion),
1842 SUBTEST(igt_mmap_migrate),
1843 SUBTEST(igt_mmap_access),
1844 SUBTEST(igt_mmap_revoke),
1845 SUBTEST(igt_mmap_gpu),
1848 return i915_live_subtests(tests, i915);