1 /* 2 * SPDX-License-Identifier: MIT 3 * 4 * Copyright © 2016 Intel Corporation 5 */ 6 7 #include <linux/prime_numbers.h> 8 9 #include "gt/intel_engine_pm.h" 10 #include "gt/intel_gpu_commands.h" 11 #include "gt/intel_gt.h" 12 #include "gt/intel_gt_pm.h" 13 #include "gem/i915_gem_region.h" 14 #include "huge_gem_object.h" 15 #include "i915_selftest.h" 16 #include "selftests/i915_random.h" 17 #include "selftests/igt_flush_test.h" 18 #include "selftests/igt_mmap.h" 19 20 struct tile { 21 unsigned int width; 22 unsigned int height; 23 unsigned int stride; 24 unsigned int size; 25 unsigned int tiling; 26 unsigned int swizzle; 27 }; 28 29 static u64 swizzle_bit(unsigned int bit, u64 offset) 30 { 31 return (offset & BIT_ULL(bit)) >> (bit - 6); 32 } 33 34 static u64 tiled_offset(const struct tile *tile, u64 v) 35 { 36 u64 x, y; 37 38 if (tile->tiling == I915_TILING_NONE) 39 return v; 40 41 y = div64_u64_rem(v, tile->stride, &x); 42 v = div64_u64_rem(y, tile->height, &y) * tile->stride * tile->height; 43 44 if (tile->tiling == I915_TILING_X) { 45 v += y * tile->width; 46 v += div64_u64_rem(x, tile->width, &x) << tile->size; 47 v += x; 48 } else if (tile->width == 128) { 49 const unsigned int ytile_span = 16; 50 const unsigned int ytile_height = 512; 51 52 v += y * ytile_span; 53 v += div64_u64_rem(x, ytile_span, &x) * ytile_height; 54 v += x; 55 } else { 56 const unsigned int ytile_span = 32; 57 const unsigned int ytile_height = 256; 58 59 v += y * ytile_span; 60 v += div64_u64_rem(x, ytile_span, &x) * ytile_height; 61 v += x; 62 } 63 64 switch (tile->swizzle) { 65 case I915_BIT_6_SWIZZLE_9: 66 v ^= swizzle_bit(9, v); 67 break; 68 case I915_BIT_6_SWIZZLE_9_10: 69 v ^= swizzle_bit(9, v) ^ swizzle_bit(10, v); 70 break; 71 case I915_BIT_6_SWIZZLE_9_11: 72 v ^= swizzle_bit(9, v) ^ swizzle_bit(11, v); 73 break; 74 case I915_BIT_6_SWIZZLE_9_10_11: 75 v ^= swizzle_bit(9, v) ^ swizzle_bit(10, v) ^ swizzle_bit(11, v); 76 break; 77 } 78 79 return v; 80 } 81 82 static int check_partial_mapping(struct drm_i915_gem_object *obj, 83 const struct tile *tile, 84 struct rnd_state *prng) 85 { 86 const unsigned long npages = obj->base.size / PAGE_SIZE; 87 struct i915_ggtt_view view; 88 struct i915_vma *vma; 89 unsigned long page; 90 u32 __iomem *io; 91 struct page *p; 92 unsigned int n; 93 u64 offset; 94 u32 *cpu; 95 int err; 96 97 err = i915_gem_object_set_tiling(obj, tile->tiling, tile->stride); 98 if (err) { 99 pr_err("Failed to set tiling mode=%u, stride=%u, err=%d\n", 100 tile->tiling, tile->stride, err); 101 return err; 102 } 103 104 GEM_BUG_ON(i915_gem_object_get_tiling(obj) != tile->tiling); 105 GEM_BUG_ON(i915_gem_object_get_stride(obj) != tile->stride); 106 107 i915_gem_object_lock(obj, NULL); 108 err = i915_gem_object_set_to_gtt_domain(obj, true); 109 i915_gem_object_unlock(obj); 110 if (err) { 111 pr_err("Failed to flush to GTT write domain; err=%d\n", err); 112 return err; 113 } 114 115 page = i915_prandom_u32_max_state(npages, prng); 116 view = compute_partial_view(obj, page, MIN_CHUNK_PAGES); 117 118 vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, PIN_MAPPABLE); 119 if (IS_ERR(vma)) { 120 pr_err("Failed to pin partial view: offset=%lu; err=%d\n", 121 page, (int)PTR_ERR(vma)); 122 return PTR_ERR(vma); 123 } 124 125 n = page - view.partial.offset; 126 GEM_BUG_ON(n >= view.partial.size); 127 128 io = i915_vma_pin_iomap(vma); 129 i915_vma_unpin(vma); 130 if (IS_ERR(io)) { 131 pr_err("Failed to iomap partial view: offset=%lu; err=%d\n", 132 page, (int)PTR_ERR(io)); 133 err = PTR_ERR(io); 134 goto out; 135 } 136 137 iowrite32(page, io + n * PAGE_SIZE / sizeof(*io)); 138 i915_vma_unpin_iomap(vma); 139 140 offset = tiled_offset(tile, page << PAGE_SHIFT); 141 if (offset >= obj->base.size) 142 goto out; 143 144 intel_gt_flush_ggtt_writes(&to_i915(obj->base.dev)->gt); 145 146 p = i915_gem_object_get_page(obj, offset >> PAGE_SHIFT); 147 cpu = kmap(p) + offset_in_page(offset); 148 drm_clflush_virt_range(cpu, sizeof(*cpu)); 149 if (*cpu != (u32)page) { 150 pr_err("Partial view for %lu [%u] (offset=%llu, size=%u [%llu, row size %u], fence=%d, tiling=%d, stride=%d) misalignment, expected write to page (%llu + %u [0x%llx]) of 0x%x, found 0x%x\n", 151 page, n, 152 view.partial.offset, 153 view.partial.size, 154 vma->size >> PAGE_SHIFT, 155 tile->tiling ? tile_row_pages(obj) : 0, 156 vma->fence ? vma->fence->id : -1, tile->tiling, tile->stride, 157 offset >> PAGE_SHIFT, 158 (unsigned int)offset_in_page(offset), 159 offset, 160 (u32)page, *cpu); 161 err = -EINVAL; 162 } 163 *cpu = 0; 164 drm_clflush_virt_range(cpu, sizeof(*cpu)); 165 kunmap(p); 166 167 out: 168 __i915_vma_put(vma); 169 return err; 170 } 171 172 static int check_partial_mappings(struct drm_i915_gem_object *obj, 173 const struct tile *tile, 174 unsigned long end_time) 175 { 176 const unsigned int nreal = obj->scratch / PAGE_SIZE; 177 const unsigned long npages = obj->base.size / PAGE_SIZE; 178 struct i915_vma *vma; 179 unsigned long page; 180 int err; 181 182 err = i915_gem_object_set_tiling(obj, tile->tiling, tile->stride); 183 if (err) { 184 pr_err("Failed to set tiling mode=%u, stride=%u, err=%d\n", 185 tile->tiling, tile->stride, err); 186 return err; 187 } 188 189 GEM_BUG_ON(i915_gem_object_get_tiling(obj) != tile->tiling); 190 GEM_BUG_ON(i915_gem_object_get_stride(obj) != tile->stride); 191 192 i915_gem_object_lock(obj, NULL); 193 err = i915_gem_object_set_to_gtt_domain(obj, true); 194 i915_gem_object_unlock(obj); 195 if (err) { 196 pr_err("Failed to flush to GTT write domain; err=%d\n", err); 197 return err; 198 } 199 200 for_each_prime_number_from(page, 1, npages) { 201 struct i915_ggtt_view view = 202 compute_partial_view(obj, page, MIN_CHUNK_PAGES); 203 u32 __iomem *io; 204 struct page *p; 205 unsigned int n; 206 u64 offset; 207 u32 *cpu; 208 209 GEM_BUG_ON(view.partial.size > nreal); 210 cond_resched(); 211 212 vma = i915_gem_object_ggtt_pin(obj, &view, 0, 0, PIN_MAPPABLE); 213 if (IS_ERR(vma)) { 214 pr_err("Failed to pin partial view: offset=%lu; err=%d\n", 215 page, (int)PTR_ERR(vma)); 216 return PTR_ERR(vma); 217 } 218 219 n = page - view.partial.offset; 220 GEM_BUG_ON(n >= view.partial.size); 221 222 io = i915_vma_pin_iomap(vma); 223 i915_vma_unpin(vma); 224 if (IS_ERR(io)) { 225 pr_err("Failed to iomap partial view: offset=%lu; err=%d\n", 226 page, (int)PTR_ERR(io)); 227 return PTR_ERR(io); 228 } 229 230 iowrite32(page, io + n * PAGE_SIZE / sizeof(*io)); 231 i915_vma_unpin_iomap(vma); 232 233 offset = tiled_offset(tile, page << PAGE_SHIFT); 234 if (offset >= obj->base.size) 235 continue; 236 237 intel_gt_flush_ggtt_writes(&to_i915(obj->base.dev)->gt); 238 239 p = i915_gem_object_get_page(obj, offset >> PAGE_SHIFT); 240 cpu = kmap(p) + offset_in_page(offset); 241 drm_clflush_virt_range(cpu, sizeof(*cpu)); 242 if (*cpu != (u32)page) { 243 pr_err("Partial view for %lu [%u] (offset=%llu, size=%u [%llu, row size %u], fence=%d, tiling=%d, stride=%d) misalignment, expected write to page (%llu + %u [0x%llx]) of 0x%x, found 0x%x\n", 244 page, n, 245 view.partial.offset, 246 view.partial.size, 247 vma->size >> PAGE_SHIFT, 248 tile->tiling ? tile_row_pages(obj) : 0, 249 vma->fence ? vma->fence->id : -1, tile->tiling, tile->stride, 250 offset >> PAGE_SHIFT, 251 (unsigned int)offset_in_page(offset), 252 offset, 253 (u32)page, *cpu); 254 err = -EINVAL; 255 } 256 *cpu = 0; 257 drm_clflush_virt_range(cpu, sizeof(*cpu)); 258 kunmap(p); 259 if (err) 260 return err; 261 262 __i915_vma_put(vma); 263 264 if (igt_timeout(end_time, 265 "%s: timed out after tiling=%d stride=%d\n", 266 __func__, tile->tiling, tile->stride)) 267 return -EINTR; 268 } 269 270 return 0; 271 } 272 273 static unsigned int 274 setup_tile_size(struct tile *tile, struct drm_i915_private *i915) 275 { 276 if (GRAPHICS_VER(i915) <= 2) { 277 tile->height = 16; 278 tile->width = 128; 279 tile->size = 11; 280 } else if (tile->tiling == I915_TILING_Y && 281 HAS_128_BYTE_Y_TILING(i915)) { 282 tile->height = 32; 283 tile->width = 128; 284 tile->size = 12; 285 } else { 286 tile->height = 8; 287 tile->width = 512; 288 tile->size = 12; 289 } 290 291 if (GRAPHICS_VER(i915) < 4) 292 return 8192 / tile->width; 293 else if (GRAPHICS_VER(i915) < 7) 294 return 128 * I965_FENCE_MAX_PITCH_VAL / tile->width; 295 else 296 return 128 * GEN7_FENCE_MAX_PITCH_VAL / tile->width; 297 } 298 299 static int igt_partial_tiling(void *arg) 300 { 301 const unsigned int nreal = 1 << 12; /* largest tile row x2 */ 302 struct drm_i915_private *i915 = arg; 303 struct drm_i915_gem_object *obj; 304 intel_wakeref_t wakeref; 305 int tiling; 306 int err; 307 308 if (!i915_ggtt_has_aperture(&i915->ggtt)) 309 return 0; 310 311 /* We want to check the page mapping and fencing of a large object 312 * mmapped through the GTT. The object we create is larger than can 313 * possibly be mmaped as a whole, and so we must use partial GGTT vma. 314 * We then check that a write through each partial GGTT vma ends up 315 * in the right set of pages within the object, and with the expected 316 * tiling, which we verify by manual swizzling. 317 */ 318 319 obj = huge_gem_object(i915, 320 nreal << PAGE_SHIFT, 321 (1 + next_prime_number(i915->ggtt.vm.total >> PAGE_SHIFT)) << PAGE_SHIFT); 322 if (IS_ERR(obj)) 323 return PTR_ERR(obj); 324 325 err = i915_gem_object_pin_pages_unlocked(obj); 326 if (err) { 327 pr_err("Failed to allocate %u pages (%lu total), err=%d\n", 328 nreal, obj->base.size / PAGE_SIZE, err); 329 goto out; 330 } 331 332 wakeref = intel_runtime_pm_get(&i915->runtime_pm); 333 334 if (1) { 335 IGT_TIMEOUT(end); 336 struct tile tile; 337 338 tile.height = 1; 339 tile.width = 1; 340 tile.size = 0; 341 tile.stride = 0; 342 tile.swizzle = I915_BIT_6_SWIZZLE_NONE; 343 tile.tiling = I915_TILING_NONE; 344 345 err = check_partial_mappings(obj, &tile, end); 346 if (err && err != -EINTR) 347 goto out_unlock; 348 } 349 350 for (tiling = I915_TILING_X; tiling <= I915_TILING_Y; tiling++) { 351 IGT_TIMEOUT(end); 352 unsigned int max_pitch; 353 unsigned int pitch; 354 struct tile tile; 355 356 if (i915->quirks & QUIRK_PIN_SWIZZLED_PAGES) 357 /* 358 * The swizzling pattern is actually unknown as it 359 * varies based on physical address of each page. 360 * See i915_gem_detect_bit_6_swizzle(). 361 */ 362 break; 363 364 tile.tiling = tiling; 365 switch (tiling) { 366 case I915_TILING_X: 367 tile.swizzle = i915->ggtt.bit_6_swizzle_x; 368 break; 369 case I915_TILING_Y: 370 tile.swizzle = i915->ggtt.bit_6_swizzle_y; 371 break; 372 } 373 374 GEM_BUG_ON(tile.swizzle == I915_BIT_6_SWIZZLE_UNKNOWN); 375 if (tile.swizzle == I915_BIT_6_SWIZZLE_9_17 || 376 tile.swizzle == I915_BIT_6_SWIZZLE_9_10_17) 377 continue; 378 379 max_pitch = setup_tile_size(&tile, i915); 380 381 for (pitch = max_pitch; pitch; pitch >>= 1) { 382 tile.stride = tile.width * pitch; 383 err = check_partial_mappings(obj, &tile, end); 384 if (err == -EINTR) 385 goto next_tiling; 386 if (err) 387 goto out_unlock; 388 389 if (pitch > 2 && GRAPHICS_VER(i915) >= 4) { 390 tile.stride = tile.width * (pitch - 1); 391 err = check_partial_mappings(obj, &tile, end); 392 if (err == -EINTR) 393 goto next_tiling; 394 if (err) 395 goto out_unlock; 396 } 397 398 if (pitch < max_pitch && GRAPHICS_VER(i915) >= 4) { 399 tile.stride = tile.width * (pitch + 1); 400 err = check_partial_mappings(obj, &tile, end); 401 if (err == -EINTR) 402 goto next_tiling; 403 if (err) 404 goto out_unlock; 405 } 406 } 407 408 if (GRAPHICS_VER(i915) >= 4) { 409 for_each_prime_number(pitch, max_pitch) { 410 tile.stride = tile.width * pitch; 411 err = check_partial_mappings(obj, &tile, end); 412 if (err == -EINTR) 413 goto next_tiling; 414 if (err) 415 goto out_unlock; 416 } 417 } 418 419 next_tiling: ; 420 } 421 422 out_unlock: 423 intel_runtime_pm_put(&i915->runtime_pm, wakeref); 424 i915_gem_object_unpin_pages(obj); 425 out: 426 i915_gem_object_put(obj); 427 return err; 428 } 429 430 static int igt_smoke_tiling(void *arg) 431 { 432 const unsigned int nreal = 1 << 12; /* largest tile row x2 */ 433 struct drm_i915_private *i915 = arg; 434 struct drm_i915_gem_object *obj; 435 intel_wakeref_t wakeref; 436 I915_RND_STATE(prng); 437 unsigned long count; 438 IGT_TIMEOUT(end); 439 int err; 440 441 if (!i915_ggtt_has_aperture(&i915->ggtt)) 442 return 0; 443 444 /* 445 * igt_partial_tiling() does an exhastive check of partial tiling 446 * chunking, but will undoubtably run out of time. Here, we do a 447 * randomised search and hope over many runs of 1s with different 448 * seeds we will do a thorough check. 449 * 450 * Remember to look at the st_seed if we see a flip-flop in BAT! 451 */ 452 453 if (i915->quirks & QUIRK_PIN_SWIZZLED_PAGES) 454 return 0; 455 456 obj = huge_gem_object(i915, 457 nreal << PAGE_SHIFT, 458 (1 + next_prime_number(i915->ggtt.vm.total >> PAGE_SHIFT)) << PAGE_SHIFT); 459 if (IS_ERR(obj)) 460 return PTR_ERR(obj); 461 462 err = i915_gem_object_pin_pages_unlocked(obj); 463 if (err) { 464 pr_err("Failed to allocate %u pages (%lu total), err=%d\n", 465 nreal, obj->base.size / PAGE_SIZE, err); 466 goto out; 467 } 468 469 wakeref = intel_runtime_pm_get(&i915->runtime_pm); 470 471 count = 0; 472 do { 473 struct tile tile; 474 475 tile.tiling = 476 i915_prandom_u32_max_state(I915_TILING_Y + 1, &prng); 477 switch (tile.tiling) { 478 case I915_TILING_NONE: 479 tile.height = 1; 480 tile.width = 1; 481 tile.size = 0; 482 tile.stride = 0; 483 tile.swizzle = I915_BIT_6_SWIZZLE_NONE; 484 break; 485 486 case I915_TILING_X: 487 tile.swizzle = i915->ggtt.bit_6_swizzle_x; 488 break; 489 case I915_TILING_Y: 490 tile.swizzle = i915->ggtt.bit_6_swizzle_y; 491 break; 492 } 493 494 if (tile.swizzle == I915_BIT_6_SWIZZLE_9_17 || 495 tile.swizzle == I915_BIT_6_SWIZZLE_9_10_17) 496 continue; 497 498 if (tile.tiling != I915_TILING_NONE) { 499 unsigned int max_pitch = setup_tile_size(&tile, i915); 500 501 tile.stride = 502 i915_prandom_u32_max_state(max_pitch, &prng); 503 tile.stride = (1 + tile.stride) * tile.width; 504 if (GRAPHICS_VER(i915) < 4) 505 tile.stride = rounddown_pow_of_two(tile.stride); 506 } 507 508 err = check_partial_mapping(obj, &tile, &prng); 509 if (err) 510 break; 511 512 count++; 513 } while (!__igt_timeout(end, NULL)); 514 515 pr_info("%s: Completed %lu trials\n", __func__, count); 516 517 intel_runtime_pm_put(&i915->runtime_pm, wakeref); 518 i915_gem_object_unpin_pages(obj); 519 out: 520 i915_gem_object_put(obj); 521 return err; 522 } 523 524 static int make_obj_busy(struct drm_i915_gem_object *obj) 525 { 526 struct drm_i915_private *i915 = to_i915(obj->base.dev); 527 struct intel_engine_cs *engine; 528 529 for_each_uabi_engine(engine, i915) { 530 struct i915_request *rq; 531 struct i915_vma *vma; 532 struct i915_gem_ww_ctx ww; 533 int err; 534 535 vma = i915_vma_instance(obj, &engine->gt->ggtt->vm, NULL); 536 if (IS_ERR(vma)) 537 return PTR_ERR(vma); 538 539 i915_gem_ww_ctx_init(&ww, false); 540 retry: 541 err = i915_gem_object_lock(obj, &ww); 542 if (!err) 543 err = i915_vma_pin_ww(vma, &ww, 0, 0, PIN_USER); 544 if (err) 545 goto err; 546 547 rq = intel_engine_create_kernel_request(engine); 548 if (IS_ERR(rq)) { 549 err = PTR_ERR(rq); 550 goto err_unpin; 551 } 552 553 err = i915_request_await_object(rq, vma->obj, true); 554 if (err == 0) 555 err = i915_vma_move_to_active(vma, rq, 556 EXEC_OBJECT_WRITE); 557 558 i915_request_add(rq); 559 err_unpin: 560 i915_vma_unpin(vma); 561 err: 562 if (err == -EDEADLK) { 563 err = i915_gem_ww_ctx_backoff(&ww); 564 if (!err) 565 goto retry; 566 } 567 i915_gem_ww_ctx_fini(&ww); 568 if (err) 569 return err; 570 } 571 572 i915_gem_object_put(obj); /* leave it only alive via its active ref */ 573 return 0; 574 } 575 576 static enum i915_mmap_type default_mapping(struct drm_i915_private *i915) 577 { 578 if (HAS_LMEM(i915)) 579 return I915_MMAP_TYPE_FIXED; 580 581 return I915_MMAP_TYPE_GTT; 582 } 583 584 static bool assert_mmap_offset(struct drm_i915_private *i915, 585 unsigned long size, 586 int expected) 587 { 588 struct drm_i915_gem_object *obj; 589 u64 offset; 590 int ret; 591 592 obj = i915_gem_object_create_internal(i915, size); 593 if (IS_ERR(obj)) 594 return expected && expected == PTR_ERR(obj); 595 596 ret = __assign_mmap_offset(obj, default_mapping(i915), &offset, NULL); 597 i915_gem_object_put(obj); 598 599 return ret == expected; 600 } 601 602 static void disable_retire_worker(struct drm_i915_private *i915) 603 { 604 i915_gem_driver_unregister__shrinker(i915); 605 intel_gt_pm_get(&i915->gt); 606 cancel_delayed_work_sync(&i915->gt.requests.retire_work); 607 } 608 609 static void restore_retire_worker(struct drm_i915_private *i915) 610 { 611 igt_flush_test(i915); 612 intel_gt_pm_put(&i915->gt); 613 i915_gem_driver_register__shrinker(i915); 614 } 615 616 static void mmap_offset_lock(struct drm_i915_private *i915) 617 __acquires(&i915->drm.vma_offset_manager->vm_lock) 618 { 619 write_lock(&i915->drm.vma_offset_manager->vm_lock); 620 } 621 622 static void mmap_offset_unlock(struct drm_i915_private *i915) 623 __releases(&i915->drm.vma_offset_manager->vm_lock) 624 { 625 write_unlock(&i915->drm.vma_offset_manager->vm_lock); 626 } 627 628 static int igt_mmap_offset_exhaustion(void *arg) 629 { 630 struct drm_i915_private *i915 = arg; 631 struct drm_mm *mm = &i915->drm.vma_offset_manager->vm_addr_space_mm; 632 struct drm_i915_gem_object *obj; 633 struct drm_mm_node *hole, *next; 634 int loop, err = 0; 635 u64 offset; 636 637 /* Disable background reaper */ 638 disable_retire_worker(i915); 639 GEM_BUG_ON(!i915->gt.awake); 640 intel_gt_retire_requests(&i915->gt); 641 i915_gem_drain_freed_objects(i915); 642 643 /* Trim the device mmap space to only a page */ 644 mmap_offset_lock(i915); 645 loop = 1; /* PAGE_SIZE units */ 646 list_for_each_entry_safe(hole, next, &mm->hole_stack, hole_stack) { 647 struct drm_mm_node *resv; 648 649 resv = kzalloc(sizeof(*resv), GFP_NOWAIT); 650 if (!resv) { 651 err = -ENOMEM; 652 goto out_park; 653 } 654 655 resv->start = drm_mm_hole_node_start(hole) + loop; 656 resv->size = hole->hole_size - loop; 657 resv->color = -1ul; 658 loop = 0; 659 660 if (!resv->size) { 661 kfree(resv); 662 continue; 663 } 664 665 pr_debug("Reserving hole [%llx + %llx]\n", 666 resv->start, resv->size); 667 668 err = drm_mm_reserve_node(mm, resv); 669 if (err) { 670 pr_err("Failed to trim VMA manager, err=%d\n", err); 671 kfree(resv); 672 goto out_park; 673 } 674 } 675 GEM_BUG_ON(!list_is_singular(&mm->hole_stack)); 676 mmap_offset_unlock(i915); 677 678 /* Just fits! */ 679 if (!assert_mmap_offset(i915, PAGE_SIZE, 0)) { 680 pr_err("Unable to insert object into single page hole\n"); 681 err = -EINVAL; 682 goto out; 683 } 684 685 /* Too large */ 686 if (!assert_mmap_offset(i915, 2 * PAGE_SIZE, -ENOSPC)) { 687 pr_err("Unexpectedly succeeded in inserting too large object into single page hole\n"); 688 err = -EINVAL; 689 goto out; 690 } 691 692 /* Fill the hole, further allocation attempts should then fail */ 693 obj = i915_gem_object_create_internal(i915, PAGE_SIZE); 694 if (IS_ERR(obj)) { 695 err = PTR_ERR(obj); 696 pr_err("Unable to create object for reclaimed hole\n"); 697 goto out; 698 } 699 700 err = __assign_mmap_offset(obj, default_mapping(i915), &offset, NULL); 701 if (err) { 702 pr_err("Unable to insert object into reclaimed hole\n"); 703 goto err_obj; 704 } 705 706 if (!assert_mmap_offset(i915, PAGE_SIZE, -ENOSPC)) { 707 pr_err("Unexpectedly succeeded in inserting object into no holes!\n"); 708 err = -EINVAL; 709 goto err_obj; 710 } 711 712 i915_gem_object_put(obj); 713 714 /* Now fill with busy dead objects that we expect to reap */ 715 for (loop = 0; loop < 3; loop++) { 716 if (intel_gt_is_wedged(&i915->gt)) 717 break; 718 719 obj = i915_gem_object_create_internal(i915, PAGE_SIZE); 720 if (IS_ERR(obj)) { 721 err = PTR_ERR(obj); 722 goto out; 723 } 724 725 err = make_obj_busy(obj); 726 if (err) { 727 pr_err("[loop %d] Failed to busy the object\n", loop); 728 goto err_obj; 729 } 730 } 731 732 out: 733 mmap_offset_lock(i915); 734 out_park: 735 drm_mm_for_each_node_safe(hole, next, mm) { 736 if (hole->color != -1ul) 737 continue; 738 739 drm_mm_remove_node(hole); 740 kfree(hole); 741 } 742 mmap_offset_unlock(i915); 743 restore_retire_worker(i915); 744 return err; 745 err_obj: 746 i915_gem_object_put(obj); 747 goto out; 748 } 749 750 static int gtt_set(struct drm_i915_gem_object *obj) 751 { 752 struct i915_vma *vma; 753 void __iomem *map; 754 int err = 0; 755 756 vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0, PIN_MAPPABLE); 757 if (IS_ERR(vma)) 758 return PTR_ERR(vma); 759 760 intel_gt_pm_get(vma->vm->gt); 761 map = i915_vma_pin_iomap(vma); 762 i915_vma_unpin(vma); 763 if (IS_ERR(map)) { 764 err = PTR_ERR(map); 765 goto out; 766 } 767 768 memset_io(map, POISON_INUSE, obj->base.size); 769 i915_vma_unpin_iomap(vma); 770 771 out: 772 intel_gt_pm_put(vma->vm->gt); 773 return err; 774 } 775 776 static int gtt_check(struct drm_i915_gem_object *obj) 777 { 778 struct i915_vma *vma; 779 void __iomem *map; 780 int err = 0; 781 782 vma = i915_gem_object_ggtt_pin(obj, NULL, 0, 0, PIN_MAPPABLE); 783 if (IS_ERR(vma)) 784 return PTR_ERR(vma); 785 786 intel_gt_pm_get(vma->vm->gt); 787 map = i915_vma_pin_iomap(vma); 788 i915_vma_unpin(vma); 789 if (IS_ERR(map)) { 790 err = PTR_ERR(map); 791 goto out; 792 } 793 794 if (memchr_inv((void __force *)map, POISON_FREE, obj->base.size)) { 795 pr_err("%s: Write via mmap did not land in backing store (GTT)\n", 796 obj->mm.region->name); 797 err = -EINVAL; 798 } 799 i915_vma_unpin_iomap(vma); 800 801 out: 802 intel_gt_pm_put(vma->vm->gt); 803 return err; 804 } 805 806 static int wc_set(struct drm_i915_gem_object *obj) 807 { 808 void *vaddr; 809 810 vaddr = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC); 811 if (IS_ERR(vaddr)) 812 return PTR_ERR(vaddr); 813 814 memset(vaddr, POISON_INUSE, obj->base.size); 815 i915_gem_object_flush_map(obj); 816 i915_gem_object_unpin_map(obj); 817 818 return 0; 819 } 820 821 static int wc_check(struct drm_i915_gem_object *obj) 822 { 823 void *vaddr; 824 int err = 0; 825 826 vaddr = i915_gem_object_pin_map_unlocked(obj, I915_MAP_WC); 827 if (IS_ERR(vaddr)) 828 return PTR_ERR(vaddr); 829 830 if (memchr_inv(vaddr, POISON_FREE, obj->base.size)) { 831 pr_err("%s: Write via mmap did not land in backing store (WC)\n", 832 obj->mm.region->name); 833 err = -EINVAL; 834 } 835 i915_gem_object_unpin_map(obj); 836 837 return err; 838 } 839 840 static bool can_mmap(struct drm_i915_gem_object *obj, enum i915_mmap_type type) 841 { 842 struct drm_i915_private *i915 = to_i915(obj->base.dev); 843 bool no_map; 844 845 if (HAS_LMEM(i915)) 846 return type == I915_MMAP_TYPE_FIXED; 847 else if (type == I915_MMAP_TYPE_FIXED) 848 return false; 849 850 if (type == I915_MMAP_TYPE_GTT && 851 !i915_ggtt_has_aperture(&to_i915(obj->base.dev)->ggtt)) 852 return false; 853 854 i915_gem_object_lock(obj, NULL); 855 no_map = (type != I915_MMAP_TYPE_GTT && 856 !i915_gem_object_has_struct_page(obj) && 857 !i915_gem_object_has_iomem(obj)); 858 i915_gem_object_unlock(obj); 859 860 return !no_map; 861 } 862 863 #define expand32(x) (((x) << 0) | ((x) << 8) | ((x) << 16) | ((x) << 24)) 864 static int __igt_mmap(struct drm_i915_private *i915, 865 struct drm_i915_gem_object *obj, 866 enum i915_mmap_type type) 867 { 868 struct vm_area_struct *area; 869 unsigned long addr; 870 int err, i; 871 u64 offset; 872 873 if (!can_mmap(obj, type)) 874 return 0; 875 876 err = wc_set(obj); 877 if (err == -ENXIO) 878 err = gtt_set(obj); 879 if (err) 880 return err; 881 882 err = __assign_mmap_offset(obj, type, &offset, NULL); 883 if (err) 884 return err; 885 886 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED); 887 if (IS_ERR_VALUE(addr)) 888 return addr; 889 890 pr_debug("igt_mmap(%s, %d) @ %lx\n", obj->mm.region->name, type, addr); 891 892 area = vma_lookup(current->mm, addr); 893 if (!area) { 894 pr_err("%s: Did not create a vm_area_struct for the mmap\n", 895 obj->mm.region->name); 896 err = -EINVAL; 897 goto out_unmap; 898 } 899 900 for (i = 0; i < obj->base.size / sizeof(u32); i++) { 901 u32 __user *ux = u64_to_user_ptr((u64)(addr + i * sizeof(*ux))); 902 u32 x; 903 904 if (get_user(x, ux)) { 905 pr_err("%s: Unable to read from mmap, offset:%zd\n", 906 obj->mm.region->name, i * sizeof(x)); 907 err = -EFAULT; 908 goto out_unmap; 909 } 910 911 if (x != expand32(POISON_INUSE)) { 912 pr_err("%s: Read incorrect value from mmap, offset:%zd, found:%x, expected:%x\n", 913 obj->mm.region->name, 914 i * sizeof(x), x, expand32(POISON_INUSE)); 915 err = -EINVAL; 916 goto out_unmap; 917 } 918 919 x = expand32(POISON_FREE); 920 if (put_user(x, ux)) { 921 pr_err("%s: Unable to write to mmap, offset:%zd\n", 922 obj->mm.region->name, i * sizeof(x)); 923 err = -EFAULT; 924 goto out_unmap; 925 } 926 } 927 928 if (type == I915_MMAP_TYPE_GTT) 929 intel_gt_flush_ggtt_writes(&i915->gt); 930 931 err = wc_check(obj); 932 if (err == -ENXIO) 933 err = gtt_check(obj); 934 out_unmap: 935 vm_munmap(addr, obj->base.size); 936 return err; 937 } 938 939 static int igt_mmap(void *arg) 940 { 941 struct drm_i915_private *i915 = arg; 942 struct intel_memory_region *mr; 943 enum intel_region_id id; 944 945 for_each_memory_region(mr, i915, id) { 946 unsigned long sizes[] = { 947 PAGE_SIZE, 948 mr->min_page_size, 949 SZ_4M, 950 }; 951 int i; 952 953 for (i = 0; i < ARRAY_SIZE(sizes); i++) { 954 struct drm_i915_gem_object *obj; 955 int err; 956 957 obj = __i915_gem_object_create_user(i915, sizes[i], &mr, 1); 958 if (obj == ERR_PTR(-ENODEV)) 959 continue; 960 961 if (IS_ERR(obj)) 962 return PTR_ERR(obj); 963 964 err = __igt_mmap(i915, obj, I915_MMAP_TYPE_GTT); 965 if (err == 0) 966 err = __igt_mmap(i915, obj, I915_MMAP_TYPE_WC); 967 if (err == 0) 968 err = __igt_mmap(i915, obj, I915_MMAP_TYPE_FIXED); 969 970 i915_gem_object_put(obj); 971 if (err) 972 return err; 973 } 974 } 975 976 return 0; 977 } 978 979 static const char *repr_mmap_type(enum i915_mmap_type type) 980 { 981 switch (type) { 982 case I915_MMAP_TYPE_GTT: return "gtt"; 983 case I915_MMAP_TYPE_WB: return "wb"; 984 case I915_MMAP_TYPE_WC: return "wc"; 985 case I915_MMAP_TYPE_UC: return "uc"; 986 case I915_MMAP_TYPE_FIXED: return "fixed"; 987 default: return "unknown"; 988 } 989 } 990 991 static bool can_access(struct drm_i915_gem_object *obj) 992 { 993 bool access; 994 995 i915_gem_object_lock(obj, NULL); 996 access = i915_gem_object_has_struct_page(obj) || 997 i915_gem_object_has_iomem(obj); 998 i915_gem_object_unlock(obj); 999 1000 return access; 1001 } 1002 1003 static int __igt_mmap_access(struct drm_i915_private *i915, 1004 struct drm_i915_gem_object *obj, 1005 enum i915_mmap_type type) 1006 { 1007 unsigned long __user *ptr; 1008 unsigned long A, B; 1009 unsigned long x, y; 1010 unsigned long addr; 1011 int err; 1012 u64 offset; 1013 1014 memset(&A, 0xAA, sizeof(A)); 1015 memset(&B, 0xBB, sizeof(B)); 1016 1017 if (!can_mmap(obj, type) || !can_access(obj)) 1018 return 0; 1019 1020 err = __assign_mmap_offset(obj, type, &offset, NULL); 1021 if (err) 1022 return err; 1023 1024 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED); 1025 if (IS_ERR_VALUE(addr)) 1026 return addr; 1027 ptr = (unsigned long __user *)addr; 1028 1029 err = __put_user(A, ptr); 1030 if (err) { 1031 pr_err("%s(%s): failed to write into user mmap\n", 1032 obj->mm.region->name, repr_mmap_type(type)); 1033 goto out_unmap; 1034 } 1035 1036 intel_gt_flush_ggtt_writes(&i915->gt); 1037 1038 err = access_process_vm(current, addr, &x, sizeof(x), 0); 1039 if (err != sizeof(x)) { 1040 pr_err("%s(%s): access_process_vm() read failed\n", 1041 obj->mm.region->name, repr_mmap_type(type)); 1042 goto out_unmap; 1043 } 1044 1045 err = access_process_vm(current, addr, &B, sizeof(B), FOLL_WRITE); 1046 if (err != sizeof(B)) { 1047 pr_err("%s(%s): access_process_vm() write failed\n", 1048 obj->mm.region->name, repr_mmap_type(type)); 1049 goto out_unmap; 1050 } 1051 1052 intel_gt_flush_ggtt_writes(&i915->gt); 1053 1054 err = __get_user(y, ptr); 1055 if (err) { 1056 pr_err("%s(%s): failed to read from user mmap\n", 1057 obj->mm.region->name, repr_mmap_type(type)); 1058 goto out_unmap; 1059 } 1060 1061 if (x != A || y != B) { 1062 pr_err("%s(%s): failed to read/write values, found (%lx, %lx)\n", 1063 obj->mm.region->name, repr_mmap_type(type), 1064 x, y); 1065 err = -EINVAL; 1066 goto out_unmap; 1067 } 1068 1069 out_unmap: 1070 vm_munmap(addr, obj->base.size); 1071 return err; 1072 } 1073 1074 static int igt_mmap_access(void *arg) 1075 { 1076 struct drm_i915_private *i915 = arg; 1077 struct intel_memory_region *mr; 1078 enum intel_region_id id; 1079 1080 for_each_memory_region(mr, i915, id) { 1081 struct drm_i915_gem_object *obj; 1082 int err; 1083 1084 obj = __i915_gem_object_create_user(i915, PAGE_SIZE, &mr, 1); 1085 if (obj == ERR_PTR(-ENODEV)) 1086 continue; 1087 1088 if (IS_ERR(obj)) 1089 return PTR_ERR(obj); 1090 1091 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_GTT); 1092 if (err == 0) 1093 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_WB); 1094 if (err == 0) 1095 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_WC); 1096 if (err == 0) 1097 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_UC); 1098 if (err == 0) 1099 err = __igt_mmap_access(i915, obj, I915_MMAP_TYPE_FIXED); 1100 1101 i915_gem_object_put(obj); 1102 if (err) 1103 return err; 1104 } 1105 1106 return 0; 1107 } 1108 1109 static int __igt_mmap_gpu(struct drm_i915_private *i915, 1110 struct drm_i915_gem_object *obj, 1111 enum i915_mmap_type type) 1112 { 1113 struct intel_engine_cs *engine; 1114 unsigned long addr; 1115 u32 __user *ux; 1116 u32 bbe; 1117 int err; 1118 u64 offset; 1119 1120 /* 1121 * Verify that the mmap access into the backing store aligns with 1122 * that of the GPU, i.e. that mmap is indeed writing into the same 1123 * page as being read by the GPU. 1124 */ 1125 1126 if (!can_mmap(obj, type)) 1127 return 0; 1128 1129 err = wc_set(obj); 1130 if (err == -ENXIO) 1131 err = gtt_set(obj); 1132 if (err) 1133 return err; 1134 1135 err = __assign_mmap_offset(obj, type, &offset, NULL); 1136 if (err) 1137 return err; 1138 1139 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED); 1140 if (IS_ERR_VALUE(addr)) 1141 return addr; 1142 1143 ux = u64_to_user_ptr((u64)addr); 1144 bbe = MI_BATCH_BUFFER_END; 1145 if (put_user(bbe, ux)) { 1146 pr_err("%s: Unable to write to mmap\n", obj->mm.region->name); 1147 err = -EFAULT; 1148 goto out_unmap; 1149 } 1150 1151 if (type == I915_MMAP_TYPE_GTT) 1152 intel_gt_flush_ggtt_writes(&i915->gt); 1153 1154 for_each_uabi_engine(engine, i915) { 1155 struct i915_request *rq; 1156 struct i915_vma *vma; 1157 struct i915_gem_ww_ctx ww; 1158 1159 vma = i915_vma_instance(obj, engine->kernel_context->vm, NULL); 1160 if (IS_ERR(vma)) { 1161 err = PTR_ERR(vma); 1162 goto out_unmap; 1163 } 1164 1165 i915_gem_ww_ctx_init(&ww, false); 1166 retry: 1167 err = i915_gem_object_lock(obj, &ww); 1168 if (!err) 1169 err = i915_vma_pin_ww(vma, &ww, 0, 0, PIN_USER); 1170 if (err) 1171 goto out_ww; 1172 1173 rq = i915_request_create(engine->kernel_context); 1174 if (IS_ERR(rq)) { 1175 err = PTR_ERR(rq); 1176 goto out_unpin; 1177 } 1178 1179 err = i915_request_await_object(rq, vma->obj, false); 1180 if (err == 0) 1181 err = i915_vma_move_to_active(vma, rq, 0); 1182 1183 err = engine->emit_bb_start(rq, vma->node.start, 0, 0); 1184 i915_request_get(rq); 1185 i915_request_add(rq); 1186 1187 if (i915_request_wait(rq, 0, HZ / 5) < 0) { 1188 struct drm_printer p = 1189 drm_info_printer(engine->i915->drm.dev); 1190 1191 pr_err("%s(%s, %s): Failed to execute batch\n", 1192 __func__, engine->name, obj->mm.region->name); 1193 intel_engine_dump(engine, &p, 1194 "%s\n", engine->name); 1195 1196 intel_gt_set_wedged(engine->gt); 1197 err = -EIO; 1198 } 1199 i915_request_put(rq); 1200 1201 out_unpin: 1202 i915_vma_unpin(vma); 1203 out_ww: 1204 if (err == -EDEADLK) { 1205 err = i915_gem_ww_ctx_backoff(&ww); 1206 if (!err) 1207 goto retry; 1208 } 1209 i915_gem_ww_ctx_fini(&ww); 1210 if (err) 1211 goto out_unmap; 1212 } 1213 1214 out_unmap: 1215 vm_munmap(addr, obj->base.size); 1216 return err; 1217 } 1218 1219 static int igt_mmap_gpu(void *arg) 1220 { 1221 struct drm_i915_private *i915 = arg; 1222 struct intel_memory_region *mr; 1223 enum intel_region_id id; 1224 1225 for_each_memory_region(mr, i915, id) { 1226 struct drm_i915_gem_object *obj; 1227 int err; 1228 1229 obj = __i915_gem_object_create_user(i915, PAGE_SIZE, &mr, 1); 1230 if (obj == ERR_PTR(-ENODEV)) 1231 continue; 1232 1233 if (IS_ERR(obj)) 1234 return PTR_ERR(obj); 1235 1236 err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_GTT); 1237 if (err == 0) 1238 err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_WC); 1239 if (err == 0) 1240 err = __igt_mmap_gpu(i915, obj, I915_MMAP_TYPE_FIXED); 1241 1242 i915_gem_object_put(obj); 1243 if (err) 1244 return err; 1245 } 1246 1247 return 0; 1248 } 1249 1250 static int check_present_pte(pte_t *pte, unsigned long addr, void *data) 1251 { 1252 if (!pte_present(*pte) || pte_none(*pte)) { 1253 pr_err("missing PTE:%lx\n", 1254 (addr - (unsigned long)data) >> PAGE_SHIFT); 1255 return -EINVAL; 1256 } 1257 1258 return 0; 1259 } 1260 1261 static int check_absent_pte(pte_t *pte, unsigned long addr, void *data) 1262 { 1263 if (pte_present(*pte) && !pte_none(*pte)) { 1264 pr_err("present PTE:%lx; expected to be revoked\n", 1265 (addr - (unsigned long)data) >> PAGE_SHIFT); 1266 return -EINVAL; 1267 } 1268 1269 return 0; 1270 } 1271 1272 static int check_present(unsigned long addr, unsigned long len) 1273 { 1274 return apply_to_page_range(current->mm, addr, len, 1275 check_present_pte, (void *)addr); 1276 } 1277 1278 static int check_absent(unsigned long addr, unsigned long len) 1279 { 1280 return apply_to_page_range(current->mm, addr, len, 1281 check_absent_pte, (void *)addr); 1282 } 1283 1284 static int prefault_range(u64 start, u64 len) 1285 { 1286 const char __user *addr, *end; 1287 char __maybe_unused c; 1288 int err; 1289 1290 addr = u64_to_user_ptr(start); 1291 end = addr + len; 1292 1293 for (; addr < end; addr += PAGE_SIZE) { 1294 err = __get_user(c, addr); 1295 if (err) 1296 return err; 1297 } 1298 1299 return __get_user(c, end - 1); 1300 } 1301 1302 static int __igt_mmap_revoke(struct drm_i915_private *i915, 1303 struct drm_i915_gem_object *obj, 1304 enum i915_mmap_type type) 1305 { 1306 unsigned long addr; 1307 int err; 1308 u64 offset; 1309 1310 if (!can_mmap(obj, type)) 1311 return 0; 1312 1313 err = __assign_mmap_offset(obj, type, &offset, NULL); 1314 if (err) 1315 return err; 1316 1317 addr = igt_mmap_offset(i915, offset, obj->base.size, PROT_WRITE, MAP_SHARED); 1318 if (IS_ERR_VALUE(addr)) 1319 return addr; 1320 1321 err = prefault_range(addr, obj->base.size); 1322 if (err) 1323 goto out_unmap; 1324 1325 err = check_present(addr, obj->base.size); 1326 if (err) { 1327 pr_err("%s: was not present\n", obj->mm.region->name); 1328 goto out_unmap; 1329 } 1330 1331 /* 1332 * After unbinding the object from the GGTT, its address may be reused 1333 * for other objects. Ergo we have to revoke the previous mmap PTE 1334 * access as it no longer points to the same object. 1335 */ 1336 err = i915_gem_object_unbind(obj, I915_GEM_OBJECT_UNBIND_ACTIVE); 1337 if (err) { 1338 pr_err("Failed to unbind object!\n"); 1339 goto out_unmap; 1340 } 1341 1342 if (type != I915_MMAP_TYPE_GTT) { 1343 i915_gem_object_lock(obj, NULL); 1344 __i915_gem_object_put_pages(obj); 1345 i915_gem_object_unlock(obj); 1346 if (i915_gem_object_has_pages(obj)) { 1347 pr_err("Failed to put-pages object!\n"); 1348 err = -EINVAL; 1349 goto out_unmap; 1350 } 1351 } 1352 1353 if (!obj->ops->mmap_ops) { 1354 err = check_absent(addr, obj->base.size); 1355 if (err) { 1356 pr_err("%s: was not absent\n", obj->mm.region->name); 1357 goto out_unmap; 1358 } 1359 } else { 1360 /* ttm allows access to evicted regions by design */ 1361 1362 err = check_present(addr, obj->base.size); 1363 if (err) { 1364 pr_err("%s: was not present\n", obj->mm.region->name); 1365 goto out_unmap; 1366 } 1367 } 1368 1369 out_unmap: 1370 vm_munmap(addr, obj->base.size); 1371 return err; 1372 } 1373 1374 static int igt_mmap_revoke(void *arg) 1375 { 1376 struct drm_i915_private *i915 = arg; 1377 struct intel_memory_region *mr; 1378 enum intel_region_id id; 1379 1380 for_each_memory_region(mr, i915, id) { 1381 struct drm_i915_gem_object *obj; 1382 int err; 1383 1384 obj = __i915_gem_object_create_user(i915, PAGE_SIZE, &mr, 1); 1385 if (obj == ERR_PTR(-ENODEV)) 1386 continue; 1387 1388 if (IS_ERR(obj)) 1389 return PTR_ERR(obj); 1390 1391 err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_GTT); 1392 if (err == 0) 1393 err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_WC); 1394 if (err == 0) 1395 err = __igt_mmap_revoke(i915, obj, I915_MMAP_TYPE_FIXED); 1396 1397 i915_gem_object_put(obj); 1398 if (err) 1399 return err; 1400 } 1401 1402 return 0; 1403 } 1404 1405 int i915_gem_mman_live_selftests(struct drm_i915_private *i915) 1406 { 1407 static const struct i915_subtest tests[] = { 1408 SUBTEST(igt_partial_tiling), 1409 SUBTEST(igt_smoke_tiling), 1410 SUBTEST(igt_mmap_offset_exhaustion), 1411 SUBTEST(igt_mmap), 1412 SUBTEST(igt_mmap_access), 1413 SUBTEST(igt_mmap_revoke), 1414 SUBTEST(igt_mmap_gpu), 1415 }; 1416 1417 return i915_subtests(tests, i915); 1418 } 1419