1 /* 2 * Copyright © 2016 Intel Corporation 3 * 4 * Permission is hereby granted, free of charge, to any person obtaining a 5 * copy of this software and associated documentation files (the "Software"), 6 * to deal in the Software without restriction, including without limitation 7 * the rights to use, copy, modify, merge, publish, distribute, sublicense, 8 * and/or sell copies of the Software, and to permit persons to whom the 9 * Software is furnished to do so, subject to the following conditions: 10 * 11 * The above copyright notice and this permission notice (including the next 12 * paragraph) shall be included in all copies or substantial portions of the 13 * Software. 14 * 15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL 18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING 20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS 21 * IN THE SOFTWARE. 22 * 23 */ 24 25 #include <linux/list_sort.h> 26 #include <linux/prime_numbers.h> 27 28 #include "gem/i915_gem_context.h" 29 #include "gem/i915_gem_internal.h" 30 #include "gem/i915_gem_region.h" 31 #include "gem/selftests/mock_context.h" 32 #include "gt/intel_context.h" 33 #include "gt/intel_gpu_commands.h" 34 #include "gt/intel_gtt.h" 35 36 #include "i915_random.h" 37 #include "i915_selftest.h" 38 #include "i915_vma_resource.h" 39 40 #include "mock_drm.h" 41 #include "mock_gem_device.h" 42 #include "mock_gtt.h" 43 #include "igt_flush_test.h" 44 45 static void cleanup_freed_objects(struct drm_i915_private *i915) 46 { 47 i915_gem_drain_freed_objects(i915); 48 } 49 50 static void fake_free_pages(struct drm_i915_gem_object *obj, 51 struct sg_table *pages) 52 { 53 sg_free_table(pages); 54 kfree(pages); 55 } 56 57 static int fake_get_pages(struct drm_i915_gem_object *obj) 58 { 59 #define GFP (GFP_KERNEL | __GFP_NOWARN | __GFP_NORETRY) 60 #define PFN_BIAS 0x1000 61 struct sg_table *pages; 62 struct scatterlist *sg; 63 unsigned int sg_page_sizes; 64 typeof(obj->base.size) rem; 65 66 pages = kmalloc(sizeof(*pages), GFP); 67 if (!pages) 68 return -ENOMEM; 69 70 rem = round_up(obj->base.size, BIT(31)) >> 31; 71 if (sg_alloc_table(pages, rem, GFP)) { 72 kfree(pages); 73 return -ENOMEM; 74 } 75 76 sg_page_sizes = 0; 77 rem = obj->base.size; 78 for (sg = pages->sgl; sg; sg = sg_next(sg)) { 79 unsigned long len = min_t(typeof(rem), rem, BIT(31)); 80 81 GEM_BUG_ON(!len); 82 sg_set_page(sg, pfn_to_page(PFN_BIAS), len, 0); 83 sg_dma_address(sg) = page_to_phys(sg_page(sg)); 84 sg_dma_len(sg) = len; 85 sg_page_sizes |= len; 86 87 rem -= len; 88 } 89 GEM_BUG_ON(rem); 90 91 __i915_gem_object_set_pages(obj, pages, sg_page_sizes); 92 93 return 0; 94 #undef GFP 95 } 96 97 static void fake_put_pages(struct drm_i915_gem_object *obj, 98 struct sg_table *pages) 99 { 100 fake_free_pages(obj, pages); 101 obj->mm.dirty = false; 102 } 103 104 static const struct drm_i915_gem_object_ops fake_ops = { 105 .name = "fake-gem", 106 .flags = I915_GEM_OBJECT_IS_SHRINKABLE, 107 .get_pages = fake_get_pages, 108 .put_pages = fake_put_pages, 109 }; 110 111 static struct drm_i915_gem_object * 112 fake_dma_object(struct drm_i915_private *i915, u64 size) 113 { 114 static struct lock_class_key lock_class; 115 struct drm_i915_gem_object *obj; 116 117 GEM_BUG_ON(!size); 118 
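	/*
	 * The "backing storage" supplied by fake_get_pages() points every sg
	 * entry at the same biased pfn, so arbitrarily large objects can be
	 * created here without consuming real memory.
	 */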
	GEM_BUG_ON(!IS_ALIGNED(size, I915_GTT_PAGE_SIZE));

	if (overflows_type(size, obj->base.size))
		return ERR_PTR(-E2BIG);

	obj = i915_gem_object_alloc();
	if (!obj)
		goto err;

	drm_gem_private_object_init(&i915->drm, &obj->base, size);
	i915_gem_object_init(obj, &fake_ops, &lock_class, 0);

	i915_gem_object_set_volatile(obj);

	obj->write_domain = I915_GEM_DOMAIN_CPU;
	obj->read_domains = I915_GEM_DOMAIN_CPU;
	obj->cache_level = I915_CACHE_NONE;

	/* Preallocate the "backing storage" */
	if (i915_gem_object_pin_pages_unlocked(obj))
		goto err_obj;

	i915_gem_object_unpin_pages(obj);
	return obj;

err_obj:
	i915_gem_object_put(obj);
err:
	return ERR_PTR(-ENOMEM);
}

static int igt_ppgtt_alloc(void *arg)
{
	struct drm_i915_private *dev_priv = arg;
	struct i915_ppgtt *ppgtt;
	struct i915_gem_ww_ctx ww;
	u64 size, last, limit;
	int err = 0;

	/* Allocate a ppgtt and try to fill the entire range */

	if (!HAS_PPGTT(dev_priv))
		return 0;

	ppgtt = i915_ppgtt_create(to_gt(dev_priv), 0);
	if (IS_ERR(ppgtt))
		return PTR_ERR(ppgtt);

	if (!ppgtt->vm.allocate_va_range)
		goto err_ppgtt_cleanup;

	/*
	 * While we only allocate the page tables here and so we could
	 * address a much larger GTT than we could actually fit into
	 * RAM, a practical limit is the number of physical pages in the
	 * system. This should ensure that we do not run into the oomkiller
	 * during the test and take down the machine wilfully.
	 */
	limit = totalram_pages() << PAGE_SHIFT;
	limit = min(ppgtt->vm.total, limit);

	i915_gem_ww_ctx_init(&ww, false);
retry:
	err = i915_vm_lock_objects(&ppgtt->vm, &ww);
	if (err)
		goto err_ppgtt_cleanup;

	/* Check we can allocate the entire range */
	for (size = 4096; size <= limit; size <<= 2) {
		struct i915_vm_pt_stash stash = {};

		err = i915_vm_alloc_pt_stash(&ppgtt->vm, &stash, size);
		if (err)
			goto err_ppgtt_cleanup;

		err = i915_vm_map_pt_stash(&ppgtt->vm, &stash);
		if (err) {
			i915_vm_free_pt_stash(&ppgtt->vm, &stash);
			goto err_ppgtt_cleanup;
		}

		ppgtt->vm.allocate_va_range(&ppgtt->vm, &stash, 0, size);
		cond_resched();

		ppgtt->vm.clear_range(&ppgtt->vm, 0, size);

		i915_vm_free_pt_stash(&ppgtt->vm, &stash);
	}

	/* Check we can incrementally allocate the entire range */
	for (last = 0, size = 4096; size <= limit; last = size, size <<= 2) {
		struct i915_vm_pt_stash stash = {};

		err = i915_vm_alloc_pt_stash(&ppgtt->vm, &stash, size - last);
		if (err)
			goto err_ppgtt_cleanup;

		err = i915_vm_map_pt_stash(&ppgtt->vm, &stash);
		if (err) {
			i915_vm_free_pt_stash(&ppgtt->vm, &stash);
			goto err_ppgtt_cleanup;
		}

		ppgtt->vm.allocate_va_range(&ppgtt->vm, &stash,
					    last, size - last);
		cond_resched();

		i915_vm_free_pt_stash(&ppgtt->vm, &stash);
	}

err_ppgtt_cleanup:
	if (err == -EDEADLK) {
		err = i915_gem_ww_ctx_backoff(&ww);
		if (!err)
			goto retry;
	}
	i915_gem_ww_ctx_fini(&ww);

	i915_vm_put(&ppgtt->vm);
	return err;
}

static int lowlevel_hole(struct i915_address_space *vm,
			 u64 hole_start, u64 hole_end,
			 unsigned long end_time)
{
	const unsigned int min_alignment =
		i915_vm_min_alignment(vm, INTEL_MEMORY_SYSTEM);
	I915_RND_STATE(seed_prng);
	struct i915_vma_resource *mock_vma_res;
	unsigned int
size; 249 250 mock_vma_res = kzalloc(sizeof(*mock_vma_res), GFP_KERNEL); 251 if (!mock_vma_res) 252 return -ENOMEM; 253 254 /* Keep creating larger objects until one cannot fit into the hole */ 255 for (size = 12; (hole_end - hole_start) >> size; size++) { 256 I915_RND_SUBSTATE(prng, seed_prng); 257 struct drm_i915_gem_object *obj; 258 unsigned int *order, count, n; 259 u64 hole_size, aligned_size; 260 261 aligned_size = max_t(u32, ilog2(min_alignment), size); 262 hole_size = (hole_end - hole_start) >> aligned_size; 263 if (hole_size > KMALLOC_MAX_SIZE / sizeof(u32)) 264 hole_size = KMALLOC_MAX_SIZE / sizeof(u32); 265 count = hole_size >> 1; 266 if (!count) { 267 pr_debug("%s: hole is too small [%llx - %llx] >> %d: %lld\n", 268 __func__, hole_start, hole_end, size, hole_size); 269 break; 270 } 271 272 do { 273 order = i915_random_order(count, &prng); 274 if (order) 275 break; 276 } while (count >>= 1); 277 if (!count) { 278 kfree(mock_vma_res); 279 return -ENOMEM; 280 } 281 GEM_BUG_ON(!order); 282 283 GEM_BUG_ON(count * BIT_ULL(aligned_size) > vm->total); 284 GEM_BUG_ON(hole_start + count * BIT_ULL(aligned_size) > hole_end); 285 286 /* Ignore allocation failures (i.e. don't report them as 287 * a test failure) as we are purposefully allocating very 288 * large objects without checking that we have sufficient 289 * memory. We expect to hit -ENOMEM. 290 */ 291 292 obj = fake_dma_object(vm->i915, BIT_ULL(size)); 293 if (IS_ERR(obj)) { 294 kfree(order); 295 break; 296 } 297 298 GEM_BUG_ON(obj->base.size != BIT_ULL(size)); 299 300 if (i915_gem_object_pin_pages_unlocked(obj)) { 301 i915_gem_object_put(obj); 302 kfree(order); 303 break; 304 } 305 306 for (n = 0; n < count; n++) { 307 u64 addr = hole_start + order[n] * BIT_ULL(aligned_size); 308 intel_wakeref_t wakeref; 309 310 GEM_BUG_ON(addr + BIT_ULL(aligned_size) > vm->total); 311 312 if (igt_timeout(end_time, 313 "%s timed out before %d/%d\n", 314 __func__, n, count)) { 315 hole_end = hole_start; /* quit */ 316 break; 317 } 318 319 if (vm->allocate_va_range) { 320 struct i915_vm_pt_stash stash = {}; 321 struct i915_gem_ww_ctx ww; 322 int err; 323 324 i915_gem_ww_ctx_init(&ww, false); 325 retry: 326 err = i915_vm_lock_objects(vm, &ww); 327 if (err) 328 goto alloc_vm_end; 329 330 err = -ENOMEM; 331 if (i915_vm_alloc_pt_stash(vm, &stash, 332 BIT_ULL(size))) 333 goto alloc_vm_end; 334 335 err = i915_vm_map_pt_stash(vm, &stash); 336 if (!err) 337 vm->allocate_va_range(vm, &stash, 338 addr, BIT_ULL(size)); 339 i915_vm_free_pt_stash(vm, &stash); 340 alloc_vm_end: 341 if (err == -EDEADLK) { 342 err = i915_gem_ww_ctx_backoff(&ww); 343 if (!err) 344 goto retry; 345 } 346 i915_gem_ww_ctx_fini(&ww); 347 348 if (err) 349 break; 350 } 351 352 mock_vma_res->bi.pages = obj->mm.pages; 353 mock_vma_res->node_size = BIT_ULL(aligned_size); 354 mock_vma_res->start = addr; 355 356 with_intel_runtime_pm(vm->gt->uncore->rpm, wakeref) 357 vm->insert_entries(vm, mock_vma_res, 358 I915_CACHE_NONE, 0); 359 } 360 count = n; 361 362 i915_random_reorder(order, count, &prng); 363 for (n = 0; n < count; n++) { 364 u64 addr = hole_start + order[n] * BIT_ULL(aligned_size); 365 intel_wakeref_t wakeref; 366 367 GEM_BUG_ON(addr + BIT_ULL(size) > vm->total); 368 with_intel_runtime_pm(vm->gt->uncore->rpm, wakeref) 369 vm->clear_range(vm, addr, BIT_ULL(size)); 370 } 371 372 i915_gem_object_unpin_pages(obj); 373 i915_gem_object_put(obj); 374 375 kfree(order); 376 377 cleanup_freed_objects(vm->i915); 378 } 379 380 kfree(mock_vma_res); 381 return 0; 382 } 383 384 static void 
close_object_list(struct list_head *objects, 385 struct i915_address_space *vm) 386 { 387 struct drm_i915_gem_object *obj, *on; 388 int ignored; 389 390 list_for_each_entry_safe(obj, on, objects, st_link) { 391 struct i915_vma *vma; 392 393 vma = i915_vma_instance(obj, vm, NULL); 394 if (!IS_ERR(vma)) 395 ignored = i915_vma_unbind_unlocked(vma); 396 397 list_del(&obj->st_link); 398 i915_gem_object_put(obj); 399 } 400 } 401 402 static int fill_hole(struct i915_address_space *vm, 403 u64 hole_start, u64 hole_end, 404 unsigned long end_time) 405 { 406 const u64 hole_size = hole_end - hole_start; 407 struct drm_i915_gem_object *obj; 408 const unsigned int min_alignment = 409 i915_vm_min_alignment(vm, INTEL_MEMORY_SYSTEM); 410 const unsigned long max_pages = 411 min_t(u64, ULONG_MAX - 1, (hole_size / 2) >> ilog2(min_alignment)); 412 const unsigned long max_step = max(int_sqrt(max_pages), 2UL); 413 unsigned long npages, prime, flags; 414 struct i915_vma *vma; 415 LIST_HEAD(objects); 416 int err; 417 418 /* Try binding many VMA working inwards from either edge */ 419 420 flags = PIN_OFFSET_FIXED | PIN_USER; 421 if (i915_is_ggtt(vm)) 422 flags |= PIN_GLOBAL; 423 424 for_each_prime_number_from(prime, 2, max_step) { 425 for (npages = 1; npages <= max_pages; npages *= prime) { 426 const u64 full_size = npages << PAGE_SHIFT; 427 const struct { 428 const char *name; 429 u64 offset; 430 int step; 431 } phases[] = { 432 { "top-down", hole_end, -1, }, 433 { "bottom-up", hole_start, 1, }, 434 { } 435 }, *p; 436 437 obj = fake_dma_object(vm->i915, full_size); 438 if (IS_ERR(obj)) 439 break; 440 441 list_add(&obj->st_link, &objects); 442 443 /* Align differing sized objects against the edges, and 444 * check we don't walk off into the void when binding 445 * them into the GTT. 446 */ 447 for (p = phases; p->name; p++) { 448 u64 offset; 449 450 offset = p->offset; 451 list_for_each_entry(obj, &objects, st_link) { 452 u64 aligned_size = round_up(obj->base.size, 453 min_alignment); 454 455 vma = i915_vma_instance(obj, vm, NULL); 456 if (IS_ERR(vma)) 457 continue; 458 459 if (p->step < 0) { 460 if (offset < hole_start + aligned_size) 461 break; 462 offset -= aligned_size; 463 } 464 465 err = i915_vma_pin(vma, 0, 0, offset | flags); 466 if (err) { 467 pr_err("%s(%s) pin (forward) failed with err=%d on size=%lu pages (prime=%lu), offset=%llx\n", 468 __func__, p->name, err, npages, prime, offset); 469 goto err; 470 } 471 472 if (!drm_mm_node_allocated(&vma->node) || 473 i915_vma_misplaced(vma, 0, 0, offset | flags)) { 474 pr_err("%s(%s) (forward) insert failed: vma.node=%llx + %llx [allocated? 
%d], expected offset %llx\n", 475 __func__, p->name, vma->node.start, vma->node.size, drm_mm_node_allocated(&vma->node), 476 offset); 477 err = -EINVAL; 478 goto err; 479 } 480 481 i915_vma_unpin(vma); 482 483 if (p->step > 0) { 484 if (offset + aligned_size > hole_end) 485 break; 486 offset += aligned_size; 487 } 488 } 489 490 offset = p->offset; 491 list_for_each_entry(obj, &objects, st_link) { 492 u64 aligned_size = round_up(obj->base.size, 493 min_alignment); 494 495 vma = i915_vma_instance(obj, vm, NULL); 496 if (IS_ERR(vma)) 497 continue; 498 499 if (p->step < 0) { 500 if (offset < hole_start + aligned_size) 501 break; 502 offset -= aligned_size; 503 } 504 505 if (!drm_mm_node_allocated(&vma->node) || 506 i915_vma_misplaced(vma, 0, 0, offset | flags)) { 507 pr_err("%s(%s) (forward) moved vma.node=%llx + %llx, expected offset %llx\n", 508 __func__, p->name, vma->node.start, vma->node.size, 509 offset); 510 err = -EINVAL; 511 goto err; 512 } 513 514 err = i915_vma_unbind_unlocked(vma); 515 if (err) { 516 pr_err("%s(%s) (forward) unbind of vma.node=%llx + %llx failed with err=%d\n", 517 __func__, p->name, vma->node.start, vma->node.size, 518 err); 519 goto err; 520 } 521 522 if (p->step > 0) { 523 if (offset + aligned_size > hole_end) 524 break; 525 offset += aligned_size; 526 } 527 } 528 529 offset = p->offset; 530 list_for_each_entry_reverse(obj, &objects, st_link) { 531 u64 aligned_size = round_up(obj->base.size, 532 min_alignment); 533 534 vma = i915_vma_instance(obj, vm, NULL); 535 if (IS_ERR(vma)) 536 continue; 537 538 if (p->step < 0) { 539 if (offset < hole_start + aligned_size) 540 break; 541 offset -= aligned_size; 542 } 543 544 err = i915_vma_pin(vma, 0, 0, offset | flags); 545 if (err) { 546 pr_err("%s(%s) pin (backward) failed with err=%d on size=%lu pages (prime=%lu), offset=%llx\n", 547 __func__, p->name, err, npages, prime, offset); 548 goto err; 549 } 550 551 if (!drm_mm_node_allocated(&vma->node) || 552 i915_vma_misplaced(vma, 0, 0, offset | flags)) { 553 pr_err("%s(%s) (backward) insert failed: vma.node=%llx + %llx [allocated? %d], expected offset %llx\n", 554 __func__, p->name, vma->node.start, vma->node.size, drm_mm_node_allocated(&vma->node), 555 offset); 556 err = -EINVAL; 557 goto err; 558 } 559 560 i915_vma_unpin(vma); 561 562 if (p->step > 0) { 563 if (offset + aligned_size > hole_end) 564 break; 565 offset += aligned_size; 566 } 567 } 568 569 offset = p->offset; 570 list_for_each_entry_reverse(obj, &objects, st_link) { 571 u64 aligned_size = round_up(obj->base.size, 572 min_alignment); 573 574 vma = i915_vma_instance(obj, vm, NULL); 575 if (IS_ERR(vma)) 576 continue; 577 578 if (p->step < 0) { 579 if (offset < hole_start + aligned_size) 580 break; 581 offset -= aligned_size; 582 } 583 584 if (!drm_mm_node_allocated(&vma->node) || 585 i915_vma_misplaced(vma, 0, 0, offset | flags)) { 586 pr_err("%s(%s) (backward) moved vma.node=%llx + %llx [allocated? 
%d], expected offset %llx\n", 587 __func__, p->name, vma->node.start, vma->node.size, drm_mm_node_allocated(&vma->node), 588 offset); 589 err = -EINVAL; 590 goto err; 591 } 592 593 err = i915_vma_unbind_unlocked(vma); 594 if (err) { 595 pr_err("%s(%s) (backward) unbind of vma.node=%llx + %llx failed with err=%d\n", 596 __func__, p->name, vma->node.start, vma->node.size, 597 err); 598 goto err; 599 } 600 601 if (p->step > 0) { 602 if (offset + aligned_size > hole_end) 603 break; 604 offset += aligned_size; 605 } 606 } 607 } 608 609 if (igt_timeout(end_time, "%s timed out (npages=%lu, prime=%lu)\n", 610 __func__, npages, prime)) { 611 err = -EINTR; 612 goto err; 613 } 614 } 615 616 close_object_list(&objects, vm); 617 cleanup_freed_objects(vm->i915); 618 } 619 620 return 0; 621 622 err: 623 close_object_list(&objects, vm); 624 return err; 625 } 626 627 static int walk_hole(struct i915_address_space *vm, 628 u64 hole_start, u64 hole_end, 629 unsigned long end_time) 630 { 631 const u64 hole_size = hole_end - hole_start; 632 const unsigned long max_pages = 633 min_t(u64, ULONG_MAX - 1, hole_size >> PAGE_SHIFT); 634 unsigned long min_alignment; 635 unsigned long flags; 636 u64 size; 637 638 /* Try binding a single VMA in different positions within the hole */ 639 640 flags = PIN_OFFSET_FIXED | PIN_USER; 641 if (i915_is_ggtt(vm)) 642 flags |= PIN_GLOBAL; 643 644 min_alignment = i915_vm_min_alignment(vm, INTEL_MEMORY_SYSTEM); 645 646 for_each_prime_number_from(size, 1, max_pages) { 647 struct drm_i915_gem_object *obj; 648 struct i915_vma *vma; 649 u64 addr; 650 int err = 0; 651 652 obj = fake_dma_object(vm->i915, size << PAGE_SHIFT); 653 if (IS_ERR(obj)) 654 break; 655 656 vma = i915_vma_instance(obj, vm, NULL); 657 if (IS_ERR(vma)) { 658 err = PTR_ERR(vma); 659 goto err_put; 660 } 661 662 for (addr = hole_start; 663 addr + obj->base.size < hole_end; 664 addr += round_up(obj->base.size, min_alignment)) { 665 err = i915_vma_pin(vma, 0, 0, addr | flags); 666 if (err) { 667 pr_err("%s bind failed at %llx + %llx [hole %llx- %llx] with err=%d\n", 668 __func__, addr, vma->size, 669 hole_start, hole_end, err); 670 goto err_put; 671 } 672 i915_vma_unpin(vma); 673 674 if (!drm_mm_node_allocated(&vma->node) || 675 i915_vma_misplaced(vma, 0, 0, addr | flags)) { 676 pr_err("%s incorrect at %llx + %llx\n", 677 __func__, addr, vma->size); 678 err = -EINVAL; 679 goto err_put; 680 } 681 682 err = i915_vma_unbind_unlocked(vma); 683 if (err) { 684 pr_err("%s unbind failed at %llx + %llx with err=%d\n", 685 __func__, addr, vma->size, err); 686 goto err_put; 687 } 688 689 GEM_BUG_ON(drm_mm_node_allocated(&vma->node)); 690 691 if (igt_timeout(end_time, 692 "%s timed out at %llx\n", 693 __func__, addr)) { 694 err = -EINTR; 695 goto err_put; 696 } 697 } 698 699 err_put: 700 i915_gem_object_put(obj); 701 if (err) 702 return err; 703 704 cleanup_freed_objects(vm->i915); 705 } 706 707 return 0; 708 } 709 710 static int pot_hole(struct i915_address_space *vm, 711 u64 hole_start, u64 hole_end, 712 unsigned long end_time) 713 { 714 struct drm_i915_gem_object *obj; 715 struct i915_vma *vma; 716 unsigned int min_alignment; 717 unsigned long flags; 718 unsigned int pot; 719 int err = 0; 720 721 flags = PIN_OFFSET_FIXED | PIN_USER; 722 if (i915_is_ggtt(vm)) 723 flags |= PIN_GLOBAL; 724 725 min_alignment = i915_vm_min_alignment(vm, INTEL_MEMORY_SYSTEM); 726 727 obj = i915_gem_object_create_internal(vm->i915, 2 * I915_GTT_PAGE_SIZE); 728 if (IS_ERR(obj)) 729 return PTR_ERR(obj); 730 731 vma = i915_vma_instance(obj, vm, NULL); 732 
if (IS_ERR(vma)) { 733 err = PTR_ERR(vma); 734 goto err_obj; 735 } 736 737 /* Insert a pair of pages across every pot boundary within the hole */ 738 for (pot = fls64(hole_end - 1) - 1; 739 pot > ilog2(2 * min_alignment); 740 pot--) { 741 u64 step = BIT_ULL(pot); 742 u64 addr; 743 744 for (addr = round_up(hole_start + min_alignment, step) - min_alignment; 745 addr <= round_down(hole_end - (2 * min_alignment), step) - min_alignment; 746 addr += step) { 747 err = i915_vma_pin(vma, 0, 0, addr | flags); 748 if (err) { 749 pr_err("%s failed to pin object at %llx in hole [%llx - %llx], with err=%d\n", 750 __func__, 751 addr, 752 hole_start, hole_end, 753 err); 754 goto err_obj; 755 } 756 757 if (!drm_mm_node_allocated(&vma->node) || 758 i915_vma_misplaced(vma, 0, 0, addr | flags)) { 759 pr_err("%s incorrect at %llx + %llx\n", 760 __func__, addr, vma->size); 761 i915_vma_unpin(vma); 762 err = i915_vma_unbind_unlocked(vma); 763 err = -EINVAL; 764 goto err_obj; 765 } 766 767 i915_vma_unpin(vma); 768 err = i915_vma_unbind_unlocked(vma); 769 GEM_BUG_ON(err); 770 } 771 772 if (igt_timeout(end_time, 773 "%s timed out after %d/%d\n", 774 __func__, pot, fls64(hole_end - 1) - 1)) { 775 err = -EINTR; 776 goto err_obj; 777 } 778 } 779 780 err_obj: 781 i915_gem_object_put(obj); 782 return err; 783 } 784 785 static int drunk_hole(struct i915_address_space *vm, 786 u64 hole_start, u64 hole_end, 787 unsigned long end_time) 788 { 789 I915_RND_STATE(prng); 790 unsigned int min_alignment; 791 unsigned int size; 792 unsigned long flags; 793 794 flags = PIN_OFFSET_FIXED | PIN_USER; 795 if (i915_is_ggtt(vm)) 796 flags |= PIN_GLOBAL; 797 798 min_alignment = i915_vm_min_alignment(vm, INTEL_MEMORY_SYSTEM); 799 800 /* Keep creating larger objects until one cannot fit into the hole */ 801 for (size = 12; (hole_end - hole_start) >> size; size++) { 802 struct drm_i915_gem_object *obj; 803 unsigned int *order, count, n; 804 struct i915_vma *vma; 805 u64 hole_size, aligned_size; 806 int err = -ENODEV; 807 808 aligned_size = max_t(u32, ilog2(min_alignment), size); 809 hole_size = (hole_end - hole_start) >> aligned_size; 810 if (hole_size > KMALLOC_MAX_SIZE / sizeof(u32)) 811 hole_size = KMALLOC_MAX_SIZE / sizeof(u32); 812 count = hole_size >> 1; 813 if (!count) { 814 pr_debug("%s: hole is too small [%llx - %llx] >> %d: %lld\n", 815 __func__, hole_start, hole_end, size, hole_size); 816 break; 817 } 818 819 do { 820 order = i915_random_order(count, &prng); 821 if (order) 822 break; 823 } while (count >>= 1); 824 if (!count) 825 return -ENOMEM; 826 GEM_BUG_ON(!order); 827 828 /* Ignore allocation failures (i.e. don't report them as 829 * a test failure) as we are purposefully allocating very 830 * large objects without checking that we have sufficient 831 * memory. We expect to hit -ENOMEM. 
832 */ 833 834 obj = fake_dma_object(vm->i915, BIT_ULL(size)); 835 if (IS_ERR(obj)) { 836 kfree(order); 837 break; 838 } 839 840 vma = i915_vma_instance(obj, vm, NULL); 841 if (IS_ERR(vma)) { 842 err = PTR_ERR(vma); 843 goto err_obj; 844 } 845 846 GEM_BUG_ON(vma->size != BIT_ULL(size)); 847 848 for (n = 0; n < count; n++) { 849 u64 addr = hole_start + order[n] * BIT_ULL(aligned_size); 850 851 err = i915_vma_pin(vma, 0, 0, addr | flags); 852 if (err) { 853 pr_err("%s failed to pin object at %llx + %llx in hole [%llx - %llx], with err=%d\n", 854 __func__, 855 addr, BIT_ULL(size), 856 hole_start, hole_end, 857 err); 858 goto err_obj; 859 } 860 861 if (!drm_mm_node_allocated(&vma->node) || 862 i915_vma_misplaced(vma, 0, 0, addr | flags)) { 863 pr_err("%s incorrect at %llx + %llx\n", 864 __func__, addr, BIT_ULL(size)); 865 i915_vma_unpin(vma); 866 err = i915_vma_unbind_unlocked(vma); 867 err = -EINVAL; 868 goto err_obj; 869 } 870 871 i915_vma_unpin(vma); 872 err = i915_vma_unbind_unlocked(vma); 873 GEM_BUG_ON(err); 874 875 if (igt_timeout(end_time, 876 "%s timed out after %d/%d\n", 877 __func__, n, count)) { 878 err = -EINTR; 879 goto err_obj; 880 } 881 } 882 883 err_obj: 884 i915_gem_object_put(obj); 885 kfree(order); 886 if (err) 887 return err; 888 889 cleanup_freed_objects(vm->i915); 890 } 891 892 return 0; 893 } 894 895 static int __shrink_hole(struct i915_address_space *vm, 896 u64 hole_start, u64 hole_end, 897 unsigned long end_time) 898 { 899 struct drm_i915_gem_object *obj; 900 unsigned long flags = PIN_OFFSET_FIXED | PIN_USER; 901 unsigned int min_alignment; 902 unsigned int order = 12; 903 LIST_HEAD(objects); 904 int err = 0; 905 u64 addr; 906 907 min_alignment = i915_vm_min_alignment(vm, INTEL_MEMORY_SYSTEM); 908 909 /* Keep creating larger objects until one cannot fit into the hole */ 910 for (addr = hole_start; addr < hole_end; ) { 911 struct i915_vma *vma; 912 u64 size = BIT_ULL(order++); 913 914 size = min(size, hole_end - addr); 915 obj = fake_dma_object(vm->i915, size); 916 if (IS_ERR(obj)) { 917 err = PTR_ERR(obj); 918 break; 919 } 920 921 list_add(&obj->st_link, &objects); 922 923 vma = i915_vma_instance(obj, vm, NULL); 924 if (IS_ERR(vma)) { 925 err = PTR_ERR(vma); 926 break; 927 } 928 929 GEM_BUG_ON(vma->size != size); 930 931 err = i915_vma_pin(vma, 0, 0, addr | flags); 932 if (err) { 933 pr_err("%s failed to pin object at %llx + %llx in hole [%llx - %llx], with err=%d\n", 934 __func__, addr, size, hole_start, hole_end, err); 935 break; 936 } 937 938 if (!drm_mm_node_allocated(&vma->node) || 939 i915_vma_misplaced(vma, 0, 0, addr | flags)) { 940 pr_err("%s incorrect at %llx + %llx\n", 941 __func__, addr, size); 942 i915_vma_unpin(vma); 943 err = i915_vma_unbind_unlocked(vma); 944 err = -EINVAL; 945 break; 946 } 947 948 i915_vma_unpin(vma); 949 addr += round_up(size, min_alignment); 950 951 /* 952 * Since we are injecting allocation faults at random intervals, 953 * wait for this allocation to complete before we change the 954 * faultinjection. 
		 */
		err = i915_vma_sync(vma);
		if (err)
			break;

		if (igt_timeout(end_time,
				"%s timed out at offset %llx [%llx - %llx]\n",
				__func__, addr, hole_start, hole_end)) {
			err = -EINTR;
			break;
		}
	}

	close_object_list(&objects, vm);
	cleanup_freed_objects(vm->i915);
	return err;
}

static int shrink_hole(struct i915_address_space *vm,
		       u64 hole_start, u64 hole_end,
		       unsigned long end_time)
{
	unsigned long prime;
	int err;

	vm->fault_attr.probability = 999;
	atomic_set(&vm->fault_attr.times, -1);

	for_each_prime_number_from(prime, 0, ULONG_MAX - 1) {
		vm->fault_attr.interval = prime;
		err = __shrink_hole(vm, hole_start, hole_end, end_time);
		if (err)
			break;
	}

	memset(&vm->fault_attr, 0, sizeof(vm->fault_attr));

	return err;
}

static int shrink_boom(struct i915_address_space *vm,
		       u64 hole_start, u64 hole_end,
		       unsigned long end_time)
{
	unsigned int sizes[] = { SZ_2M, SZ_1G };
	struct drm_i915_gem_object *purge;
	struct drm_i915_gem_object *explode;
	int err;
	int i;

	/*
	 * Catch the case which shrink_hole seems to miss. The setup here
	 * requires invoking the shrinker as we do the alloc_pt/alloc_pd, while
	 * ensuring that all vma associated with the respective pd/pdp are
	 * unpinned at the time.
	 */

	for (i = 0; i < ARRAY_SIZE(sizes); ++i) {
		unsigned int flags = PIN_USER | PIN_OFFSET_FIXED;
		unsigned int size = sizes[i];
		struct i915_vma *vma;

		purge = fake_dma_object(vm->i915, size);
		if (IS_ERR(purge))
			return PTR_ERR(purge);

		vma = i915_vma_instance(purge, vm, NULL);
		if (IS_ERR(vma)) {
			err = PTR_ERR(vma);
			goto err_purge;
		}

		err = i915_vma_pin(vma, 0, 0, flags);
		if (err)
			goto err_purge;

		/* Should now be ripe for purging */
		i915_vma_unpin(vma);

		explode = fake_dma_object(vm->i915, size);
		if (IS_ERR(explode)) {
			err = PTR_ERR(explode);
			goto err_purge;
		}

		vm->fault_attr.probability = 100;
		vm->fault_attr.interval = 1;
		atomic_set(&vm->fault_attr.times, -1);

		vma = i915_vma_instance(explode, vm, NULL);
		if (IS_ERR(vma)) {
			err = PTR_ERR(vma);
			goto err_explode;
		}

		err = i915_vma_pin(vma, 0, 0, flags | size);
		if (err)
			goto err_explode;

		i915_vma_unpin(vma);

		i915_gem_object_put(purge);
		i915_gem_object_put(explode);

		memset(&vm->fault_attr, 0, sizeof(vm->fault_attr));
		cleanup_freed_objects(vm->i915);
	}

	return 0;

err_explode:
	i915_gem_object_put(explode);
err_purge:
	i915_gem_object_put(purge);
	memset(&vm->fault_attr, 0, sizeof(vm->fault_attr));
	return err;
}

static int misaligned_case(struct i915_address_space *vm, struct intel_memory_region *mr,
			   u64 addr, u64 size, unsigned long flags)
{
	struct drm_i915_gem_object *obj;
	struct i915_vma *vma;
	int err = 0;
	u64 expected_vma_size, expected_node_size;
	bool is_stolen = mr->type == INTEL_MEMORY_STOLEN_SYSTEM ||
			 mr->type == INTEL_MEMORY_STOLEN_LOCAL;

	obj = i915_gem_object_create_region(mr, size, 0, 0);
	if (IS_ERR(obj)) {
		/* if iGVT-g or DMAR is active, stolen mem will be uninitialized */
		if (PTR_ERR(obj) == -ENODEV && is_stolen)
			return 0;
		return PTR_ERR(obj);
	}

	vma =
i915_vma_instance(obj, vm, NULL); 1092 if (IS_ERR(vma)) { 1093 err = PTR_ERR(vma); 1094 goto err_put; 1095 } 1096 1097 err = i915_vma_pin(vma, 0, 0, addr | flags); 1098 if (err) 1099 goto err_put; 1100 i915_vma_unpin(vma); 1101 1102 if (!drm_mm_node_allocated(&vma->node)) { 1103 err = -EINVAL; 1104 goto err_put; 1105 } 1106 1107 if (i915_vma_misplaced(vma, 0, 0, addr | flags)) { 1108 err = -EINVAL; 1109 goto err_put; 1110 } 1111 1112 expected_vma_size = round_up(size, 1 << (ffs(vma->resource->page_sizes_gtt) - 1)); 1113 expected_node_size = expected_vma_size; 1114 1115 if (HAS_64K_PAGES(vm->i915) && i915_gem_object_is_lmem(obj)) { 1116 /* 1117 * The compact-pt should expand lmem node to 2MB for the ppGTT, 1118 * for all other cases we should only expect 64K. 1119 */ 1120 expected_vma_size = round_up(size, I915_GTT_PAGE_SIZE_64K); 1121 if (NEEDS_COMPACT_PT(vm->i915) && !i915_is_ggtt(vm)) 1122 expected_node_size = round_up(size, I915_GTT_PAGE_SIZE_2M); 1123 else 1124 expected_node_size = round_up(size, I915_GTT_PAGE_SIZE_64K); 1125 } 1126 1127 if (vma->size != expected_vma_size || vma->node.size != expected_node_size) { 1128 err = i915_vma_unbind_unlocked(vma); 1129 err = -EBADSLT; 1130 goto err_put; 1131 } 1132 1133 err = i915_vma_unbind_unlocked(vma); 1134 if (err) 1135 goto err_put; 1136 1137 GEM_BUG_ON(drm_mm_node_allocated(&vma->node)); 1138 1139 err_put: 1140 i915_gem_object_put(obj); 1141 cleanup_freed_objects(vm->i915); 1142 return err; 1143 } 1144 1145 static int misaligned_pin(struct i915_address_space *vm, 1146 u64 hole_start, u64 hole_end, 1147 unsigned long end_time) 1148 { 1149 struct intel_memory_region *mr; 1150 enum intel_region_id id; 1151 unsigned long flags = PIN_OFFSET_FIXED | PIN_USER; 1152 int err = 0; 1153 u64 hole_size = hole_end - hole_start; 1154 1155 if (i915_is_ggtt(vm)) 1156 flags |= PIN_GLOBAL; 1157 1158 for_each_memory_region(mr, vm->i915, id) { 1159 u64 min_alignment = i915_vm_min_alignment(vm, mr->type); 1160 u64 size = min_alignment; 1161 u64 addr = round_down(hole_start + (hole_size / 2), min_alignment); 1162 1163 /* avoid -ENOSPC on very small hole setups */ 1164 if (hole_size < 3 * min_alignment) 1165 continue; 1166 1167 /* we can't test < 4k alignment due to flags being encoded in lower bits */ 1168 if (min_alignment != I915_GTT_PAGE_SIZE_4K) { 1169 err = misaligned_case(vm, mr, addr + (min_alignment / 2), size, flags); 1170 /* misaligned should error with -EINVAL*/ 1171 if (!err) 1172 err = -EBADSLT; 1173 if (err != -EINVAL) 1174 return err; 1175 } 1176 1177 /* test for vma->size expansion to min page size */ 1178 err = misaligned_case(vm, mr, addr, PAGE_SIZE, flags); 1179 if (err) 1180 return err; 1181 1182 /* test for intermediate size not expanding vma->size for large alignments */ 1183 err = misaligned_case(vm, mr, addr, size / 2, flags); 1184 if (err) 1185 return err; 1186 } 1187 1188 return 0; 1189 } 1190 1191 static int exercise_ppgtt(struct drm_i915_private *dev_priv, 1192 int (*func)(struct i915_address_space *vm, 1193 u64 hole_start, u64 hole_end, 1194 unsigned long end_time)) 1195 { 1196 struct i915_ppgtt *ppgtt; 1197 IGT_TIMEOUT(end_time); 1198 struct file *file; 1199 int err; 1200 1201 if (!HAS_FULL_PPGTT(dev_priv)) 1202 return 0; 1203 1204 file = mock_file(dev_priv); 1205 if (IS_ERR(file)) 1206 return PTR_ERR(file); 1207 1208 ppgtt = i915_ppgtt_create(to_gt(dev_priv), 0); 1209 if (IS_ERR(ppgtt)) { 1210 err = PTR_ERR(ppgtt); 1211 goto out_free; 1212 } 1213 GEM_BUG_ON(offset_in_page(ppgtt->vm.total)); 1214 assert_vm_alive(&ppgtt->vm); 1215 
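	/* Exercise the selected hole function over the entire ppGTT range */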
1216 err = func(&ppgtt->vm, 0, ppgtt->vm.total, end_time); 1217 1218 i915_vm_put(&ppgtt->vm); 1219 1220 out_free: 1221 fput(file); 1222 return err; 1223 } 1224 1225 static int igt_ppgtt_fill(void *arg) 1226 { 1227 return exercise_ppgtt(arg, fill_hole); 1228 } 1229 1230 static int igt_ppgtt_walk(void *arg) 1231 { 1232 return exercise_ppgtt(arg, walk_hole); 1233 } 1234 1235 static int igt_ppgtt_pot(void *arg) 1236 { 1237 return exercise_ppgtt(arg, pot_hole); 1238 } 1239 1240 static int igt_ppgtt_drunk(void *arg) 1241 { 1242 return exercise_ppgtt(arg, drunk_hole); 1243 } 1244 1245 static int igt_ppgtt_lowlevel(void *arg) 1246 { 1247 return exercise_ppgtt(arg, lowlevel_hole); 1248 } 1249 1250 static int igt_ppgtt_shrink(void *arg) 1251 { 1252 return exercise_ppgtt(arg, shrink_hole); 1253 } 1254 1255 static int igt_ppgtt_shrink_boom(void *arg) 1256 { 1257 return exercise_ppgtt(arg, shrink_boom); 1258 } 1259 1260 static int igt_ppgtt_misaligned_pin(void *arg) 1261 { 1262 return exercise_ppgtt(arg, misaligned_pin); 1263 } 1264 1265 static int sort_holes(void *priv, const struct list_head *A, 1266 const struct list_head *B) 1267 { 1268 struct drm_mm_node *a = list_entry(A, typeof(*a), hole_stack); 1269 struct drm_mm_node *b = list_entry(B, typeof(*b), hole_stack); 1270 1271 if (a->start < b->start) 1272 return -1; 1273 else 1274 return 1; 1275 } 1276 1277 static int exercise_ggtt(struct drm_i915_private *i915, 1278 int (*func)(struct i915_address_space *vm, 1279 u64 hole_start, u64 hole_end, 1280 unsigned long end_time)) 1281 { 1282 struct i915_ggtt *ggtt = to_gt(i915)->ggtt; 1283 u64 hole_start, hole_end, last = 0; 1284 struct drm_mm_node *node; 1285 IGT_TIMEOUT(end_time); 1286 int err = 0; 1287 1288 restart: 1289 list_sort(NULL, &ggtt->vm.mm.hole_stack, sort_holes); 1290 drm_mm_for_each_hole(node, &ggtt->vm.mm, hole_start, hole_end) { 1291 if (hole_start < last) 1292 continue; 1293 1294 if (ggtt->vm.mm.color_adjust) 1295 ggtt->vm.mm.color_adjust(node, 0, 1296 &hole_start, &hole_end); 1297 if (hole_start >= hole_end) 1298 continue; 1299 1300 err = func(&ggtt->vm, hole_start, hole_end, end_time); 1301 if (err) 1302 break; 1303 1304 /* As we have manipulated the drm_mm, the list may be corrupt */ 1305 last = hole_end; 1306 goto restart; 1307 } 1308 1309 return err; 1310 } 1311 1312 static int igt_ggtt_fill(void *arg) 1313 { 1314 return exercise_ggtt(arg, fill_hole); 1315 } 1316 1317 static int igt_ggtt_walk(void *arg) 1318 { 1319 return exercise_ggtt(arg, walk_hole); 1320 } 1321 1322 static int igt_ggtt_pot(void *arg) 1323 { 1324 return exercise_ggtt(arg, pot_hole); 1325 } 1326 1327 static int igt_ggtt_drunk(void *arg) 1328 { 1329 return exercise_ggtt(arg, drunk_hole); 1330 } 1331 1332 static int igt_ggtt_lowlevel(void *arg) 1333 { 1334 return exercise_ggtt(arg, lowlevel_hole); 1335 } 1336 1337 static int igt_ggtt_misaligned_pin(void *arg) 1338 { 1339 return exercise_ggtt(arg, misaligned_pin); 1340 } 1341 1342 static int igt_ggtt_page(void *arg) 1343 { 1344 const unsigned int count = PAGE_SIZE/sizeof(u32); 1345 I915_RND_STATE(prng); 1346 struct drm_i915_private *i915 = arg; 1347 struct i915_ggtt *ggtt = to_gt(i915)->ggtt; 1348 struct drm_i915_gem_object *obj; 1349 intel_wakeref_t wakeref; 1350 struct drm_mm_node tmp; 1351 unsigned int *order, n; 1352 int err; 1353 1354 if (!i915_ggtt_has_aperture(ggtt)) 1355 return 0; 1356 1357 obj = i915_gem_object_create_internal(i915, PAGE_SIZE); 1358 if (IS_ERR(obj)) 1359 return PTR_ERR(obj); 1360 1361 err = i915_gem_object_pin_pages_unlocked(obj); 1362 if 
(err) 1363 goto out_free; 1364 1365 memset(&tmp, 0, sizeof(tmp)); 1366 mutex_lock(&ggtt->vm.mutex); 1367 err = drm_mm_insert_node_in_range(&ggtt->vm.mm, &tmp, 1368 count * PAGE_SIZE, 0, 1369 I915_COLOR_UNEVICTABLE, 1370 0, ggtt->mappable_end, 1371 DRM_MM_INSERT_LOW); 1372 mutex_unlock(&ggtt->vm.mutex); 1373 if (err) 1374 goto out_unpin; 1375 1376 wakeref = intel_runtime_pm_get(&i915->runtime_pm); 1377 1378 for (n = 0; n < count; n++) { 1379 u64 offset = tmp.start + n * PAGE_SIZE; 1380 1381 ggtt->vm.insert_page(&ggtt->vm, 1382 i915_gem_object_get_dma_address(obj, 0), 1383 offset, I915_CACHE_NONE, 0); 1384 } 1385 1386 order = i915_random_order(count, &prng); 1387 if (!order) { 1388 err = -ENOMEM; 1389 goto out_remove; 1390 } 1391 1392 for (n = 0; n < count; n++) { 1393 u64 offset = tmp.start + order[n] * PAGE_SIZE; 1394 u32 __iomem *vaddr; 1395 1396 vaddr = io_mapping_map_atomic_wc(&ggtt->iomap, offset); 1397 iowrite32(n, vaddr + n); 1398 io_mapping_unmap_atomic(vaddr); 1399 } 1400 intel_gt_flush_ggtt_writes(ggtt->vm.gt); 1401 1402 i915_random_reorder(order, count, &prng); 1403 for (n = 0; n < count; n++) { 1404 u64 offset = tmp.start + order[n] * PAGE_SIZE; 1405 u32 __iomem *vaddr; 1406 u32 val; 1407 1408 vaddr = io_mapping_map_atomic_wc(&ggtt->iomap, offset); 1409 val = ioread32(vaddr + n); 1410 io_mapping_unmap_atomic(vaddr); 1411 1412 if (val != n) { 1413 pr_err("insert page failed: found %d, expected %d\n", 1414 val, n); 1415 err = -EINVAL; 1416 break; 1417 } 1418 } 1419 1420 kfree(order); 1421 out_remove: 1422 ggtt->vm.clear_range(&ggtt->vm, tmp.start, tmp.size); 1423 intel_runtime_pm_put(&i915->runtime_pm, wakeref); 1424 mutex_lock(&ggtt->vm.mutex); 1425 drm_mm_remove_node(&tmp); 1426 mutex_unlock(&ggtt->vm.mutex); 1427 out_unpin: 1428 i915_gem_object_unpin_pages(obj); 1429 out_free: 1430 i915_gem_object_put(obj); 1431 return err; 1432 } 1433 1434 static void track_vma_bind(struct i915_vma *vma) 1435 { 1436 struct drm_i915_gem_object *obj = vma->obj; 1437 1438 __i915_gem_object_pin_pages(obj); 1439 1440 GEM_BUG_ON(atomic_read(&vma->pages_count)); 1441 atomic_set(&vma->pages_count, I915_VMA_PAGES_ACTIVE); 1442 __i915_gem_object_pin_pages(obj); 1443 vma->pages = obj->mm.pages; 1444 vma->resource->bi.pages = vma->pages; 1445 1446 mutex_lock(&vma->vm->mutex); 1447 list_move_tail(&vma->vm_link, &vma->vm->bound_list); 1448 mutex_unlock(&vma->vm->mutex); 1449 } 1450 1451 static int exercise_mock(struct drm_i915_private *i915, 1452 int (*func)(struct i915_address_space *vm, 1453 u64 hole_start, u64 hole_end, 1454 unsigned long end_time)) 1455 { 1456 const u64 limit = totalram_pages() << PAGE_SHIFT; 1457 struct i915_address_space *vm; 1458 struct i915_gem_context *ctx; 1459 IGT_TIMEOUT(end_time); 1460 int err; 1461 1462 ctx = mock_context(i915, "mock"); 1463 if (!ctx) 1464 return -ENOMEM; 1465 1466 vm = i915_gem_context_get_eb_vm(ctx); 1467 err = func(vm, 0, min(vm->total, limit), end_time); 1468 i915_vm_put(vm); 1469 1470 mock_context_close(ctx); 1471 return err; 1472 } 1473 1474 static int igt_mock_fill(void *arg) 1475 { 1476 struct i915_ggtt *ggtt = arg; 1477 1478 return exercise_mock(ggtt->vm.i915, fill_hole); 1479 } 1480 1481 static int igt_mock_walk(void *arg) 1482 { 1483 struct i915_ggtt *ggtt = arg; 1484 1485 return exercise_mock(ggtt->vm.i915, walk_hole); 1486 } 1487 1488 static int igt_mock_pot(void *arg) 1489 { 1490 struct i915_ggtt *ggtt = arg; 1491 1492 return exercise_mock(ggtt->vm.i915, pot_hole); 1493 } 1494 1495 static int igt_mock_drunk(void *arg) 1496 { 1497 struct i915_ggtt 
*ggtt = arg;

	return exercise_mock(ggtt->vm.i915, drunk_hole);
}

static int reserve_gtt_with_resource(struct i915_vma *vma, u64 offset)
{
	struct i915_address_space *vm = vma->vm;
	struct i915_vma_resource *vma_res;
	struct drm_i915_gem_object *obj = vma->obj;
	int err;

	vma_res = i915_vma_resource_alloc();
	if (IS_ERR(vma_res))
		return PTR_ERR(vma_res);

	mutex_lock(&vm->mutex);
	err = i915_gem_gtt_reserve(vm, NULL, &vma->node, obj->base.size,
				   offset,
				   obj->cache_level,
				   0);
	if (!err) {
		i915_vma_resource_init_from_vma(vma_res, vma);
		vma->resource = vma_res;
	} else {
		kfree(vma_res);
	}
	mutex_unlock(&vm->mutex);

	return err;
}

static int igt_gtt_reserve(void *arg)
{
	struct i915_ggtt *ggtt = arg;
	struct drm_i915_gem_object *obj, *on;
	I915_RND_STATE(prng);
	LIST_HEAD(objects);
	u64 total;
	int err = -ENODEV;

	/* i915_gem_gtt_reserve() tries to reserve the precise range
	 * for the node, and evicts if it has to. So our test checks that
	 * it can give us the requested space and prevent overlaps.
	 */

	/* Start by filling the GGTT */
	for (total = 0;
	     total + 2 * I915_GTT_PAGE_SIZE <= ggtt->vm.total;
	     total += 2 * I915_GTT_PAGE_SIZE) {
		struct i915_vma *vma;

		obj = i915_gem_object_create_internal(ggtt->vm.i915,
						      2 * PAGE_SIZE);
		if (IS_ERR(obj)) {
			err = PTR_ERR(obj);
			goto out;
		}

		err = i915_gem_object_pin_pages_unlocked(obj);
		if (err) {
			i915_gem_object_put(obj);
			goto out;
		}

		list_add(&obj->st_link, &objects);
		vma = i915_vma_instance(obj, &ggtt->vm, NULL);
		if (IS_ERR(vma)) {
			err = PTR_ERR(vma);
			goto out;
		}

		err = reserve_gtt_with_resource(vma, total);
		if (err) {
			pr_err("i915_gem_gtt_reserve (pass 1) failed at %llu/%llu with err=%d\n",
			       total, ggtt->vm.total, err);
			goto out;
		}
		track_vma_bind(vma);

		GEM_BUG_ON(!drm_mm_node_allocated(&vma->node));
		if (vma->node.start != total ||
		    vma->node.size != 2*I915_GTT_PAGE_SIZE) {
			pr_err("i915_gem_gtt_reserve (pass 1) placement failed, found (%llx + %llx), expected (%llx + %llx)\n",
			       vma->node.start, vma->node.size,
			       total, 2*I915_GTT_PAGE_SIZE);
			err = -EINVAL;
			goto out;
		}
	}

	/* Now we start forcing evictions */
	for (total = I915_GTT_PAGE_SIZE;
	     total + 2 * I915_GTT_PAGE_SIZE <= ggtt->vm.total;
	     total += 2 * I915_GTT_PAGE_SIZE) {
		struct i915_vma *vma;

		obj = i915_gem_object_create_internal(ggtt->vm.i915,
						      2 * PAGE_SIZE);
		if (IS_ERR(obj)) {
			err = PTR_ERR(obj);
			goto out;
		}

		err = i915_gem_object_pin_pages_unlocked(obj);
		if (err) {
			i915_gem_object_put(obj);
			goto out;
		}

		list_add(&obj->st_link, &objects);

		vma = i915_vma_instance(obj, &ggtt->vm, NULL);
		if (IS_ERR(vma)) {
			err = PTR_ERR(vma);
			goto out;
		}

		err = reserve_gtt_with_resource(vma, total);
		if (err) {
			pr_err("i915_gem_gtt_reserve (pass 2) failed at %llu/%llu with err=%d\n",
			       total, ggtt->vm.total, err);
			goto out;
		}
		track_vma_bind(vma);

		GEM_BUG_ON(!drm_mm_node_allocated(&vma->node));
		if (vma->node.start != total ||
		    vma->node.size != 2*I915_GTT_PAGE_SIZE) {
			pr_err("i915_gem_gtt_reserve (pass 2) placement failed, found (%llx +
%llx), expected (%llx + %llx)\n", 1627 vma->node.start, vma->node.size, 1628 total, 2*I915_GTT_PAGE_SIZE); 1629 err = -EINVAL; 1630 goto out; 1631 } 1632 } 1633 1634 /* And then try at random */ 1635 list_for_each_entry_safe(obj, on, &objects, st_link) { 1636 struct i915_vma *vma; 1637 u64 offset; 1638 1639 vma = i915_vma_instance(obj, &ggtt->vm, NULL); 1640 if (IS_ERR(vma)) { 1641 err = PTR_ERR(vma); 1642 goto out; 1643 } 1644 1645 err = i915_vma_unbind_unlocked(vma); 1646 if (err) { 1647 pr_err("i915_vma_unbind failed with err=%d!\n", err); 1648 goto out; 1649 } 1650 1651 offset = igt_random_offset(&prng, 1652 0, ggtt->vm.total, 1653 2 * I915_GTT_PAGE_SIZE, 1654 I915_GTT_MIN_ALIGNMENT); 1655 1656 err = reserve_gtt_with_resource(vma, offset); 1657 if (err) { 1658 pr_err("i915_gem_gtt_reserve (pass 3) failed at %llu/%llu with err=%d\n", 1659 total, ggtt->vm.total, err); 1660 goto out; 1661 } 1662 track_vma_bind(vma); 1663 1664 GEM_BUG_ON(!drm_mm_node_allocated(&vma->node)); 1665 if (vma->node.start != offset || 1666 vma->node.size != 2*I915_GTT_PAGE_SIZE) { 1667 pr_err("i915_gem_gtt_reserve (pass 3) placement failed, found (%llx + %llx), expected (%llx + %llx)\n", 1668 vma->node.start, vma->node.size, 1669 offset, 2*I915_GTT_PAGE_SIZE); 1670 err = -EINVAL; 1671 goto out; 1672 } 1673 } 1674 1675 out: 1676 list_for_each_entry_safe(obj, on, &objects, st_link) { 1677 i915_gem_object_unpin_pages(obj); 1678 i915_gem_object_put(obj); 1679 } 1680 return err; 1681 } 1682 1683 static int insert_gtt_with_resource(struct i915_vma *vma) 1684 { 1685 struct i915_address_space *vm = vma->vm; 1686 struct i915_vma_resource *vma_res; 1687 struct drm_i915_gem_object *obj = vma->obj; 1688 int err; 1689 1690 vma_res = i915_vma_resource_alloc(); 1691 if (IS_ERR(vma_res)) 1692 return PTR_ERR(vma_res); 1693 1694 mutex_lock(&vm->mutex); 1695 err = i915_gem_gtt_insert(vm, NULL, &vma->node, obj->base.size, 0, 1696 obj->cache_level, 0, vm->total, 0); 1697 if (!err) { 1698 i915_vma_resource_init_from_vma(vma_res, vma); 1699 vma->resource = vma_res; 1700 } else { 1701 kfree(vma_res); 1702 } 1703 mutex_unlock(&vm->mutex); 1704 1705 return err; 1706 } 1707 1708 static int igt_gtt_insert(void *arg) 1709 { 1710 struct i915_ggtt *ggtt = arg; 1711 struct drm_i915_gem_object *obj, *on; 1712 struct drm_mm_node tmp = {}; 1713 const struct invalid_insert { 1714 u64 size; 1715 u64 alignment; 1716 u64 start, end; 1717 } invalid_insert[] = { 1718 { 1719 ggtt->vm.total + I915_GTT_PAGE_SIZE, 0, 1720 0, ggtt->vm.total, 1721 }, 1722 { 1723 2*I915_GTT_PAGE_SIZE, 0, 1724 0, I915_GTT_PAGE_SIZE, 1725 }, 1726 { 1727 -(u64)I915_GTT_PAGE_SIZE, 0, 1728 0, 4*I915_GTT_PAGE_SIZE, 1729 }, 1730 { 1731 -(u64)2*I915_GTT_PAGE_SIZE, 2*I915_GTT_PAGE_SIZE, 1732 0, 4*I915_GTT_PAGE_SIZE, 1733 }, 1734 { 1735 I915_GTT_PAGE_SIZE, I915_GTT_MIN_ALIGNMENT << 1, 1736 I915_GTT_MIN_ALIGNMENT, I915_GTT_MIN_ALIGNMENT << 1, 1737 }, 1738 {} 1739 }, *ii; 1740 LIST_HEAD(objects); 1741 u64 total; 1742 int err = -ENODEV; 1743 1744 /* i915_gem_gtt_insert() tries to allocate some free space in the GTT 1745 * to the node, evicting if required. 
1746 */ 1747 1748 /* Check a couple of obviously invalid requests */ 1749 for (ii = invalid_insert; ii->size; ii++) { 1750 mutex_lock(&ggtt->vm.mutex); 1751 err = i915_gem_gtt_insert(&ggtt->vm, NULL, &tmp, 1752 ii->size, ii->alignment, 1753 I915_COLOR_UNEVICTABLE, 1754 ii->start, ii->end, 1755 0); 1756 mutex_unlock(&ggtt->vm.mutex); 1757 if (err != -ENOSPC) { 1758 pr_err("Invalid i915_gem_gtt_insert(.size=%llx, .alignment=%llx, .start=%llx, .end=%llx) succeeded (err=%d)\n", 1759 ii->size, ii->alignment, ii->start, ii->end, 1760 err); 1761 return -EINVAL; 1762 } 1763 } 1764 1765 /* Start by filling the GGTT */ 1766 for (total = 0; 1767 total + I915_GTT_PAGE_SIZE <= ggtt->vm.total; 1768 total += I915_GTT_PAGE_SIZE) { 1769 struct i915_vma *vma; 1770 1771 obj = i915_gem_object_create_internal(ggtt->vm.i915, 1772 I915_GTT_PAGE_SIZE); 1773 if (IS_ERR(obj)) { 1774 err = PTR_ERR(obj); 1775 goto out; 1776 } 1777 1778 err = i915_gem_object_pin_pages_unlocked(obj); 1779 if (err) { 1780 i915_gem_object_put(obj); 1781 goto out; 1782 } 1783 1784 list_add(&obj->st_link, &objects); 1785 1786 vma = i915_vma_instance(obj, &ggtt->vm, NULL); 1787 if (IS_ERR(vma)) { 1788 err = PTR_ERR(vma); 1789 goto out; 1790 } 1791 1792 err = insert_gtt_with_resource(vma); 1793 if (err == -ENOSPC) { 1794 /* maxed out the GGTT space */ 1795 i915_gem_object_put(obj); 1796 break; 1797 } 1798 if (err) { 1799 pr_err("i915_gem_gtt_insert (pass 1) failed at %llu/%llu with err=%d\n", 1800 total, ggtt->vm.total, err); 1801 goto out; 1802 } 1803 track_vma_bind(vma); 1804 __i915_vma_pin(vma); 1805 1806 GEM_BUG_ON(!drm_mm_node_allocated(&vma->node)); 1807 } 1808 1809 list_for_each_entry(obj, &objects, st_link) { 1810 struct i915_vma *vma; 1811 1812 vma = i915_vma_instance(obj, &ggtt->vm, NULL); 1813 if (IS_ERR(vma)) { 1814 err = PTR_ERR(vma); 1815 goto out; 1816 } 1817 1818 if (!drm_mm_node_allocated(&vma->node)) { 1819 pr_err("VMA was unexpectedly evicted!\n"); 1820 err = -EINVAL; 1821 goto out; 1822 } 1823 1824 __i915_vma_unpin(vma); 1825 } 1826 1827 /* If we then reinsert, we should find the same hole */ 1828 list_for_each_entry_safe(obj, on, &objects, st_link) { 1829 struct i915_vma *vma; 1830 u64 offset; 1831 1832 vma = i915_vma_instance(obj, &ggtt->vm, NULL); 1833 if (IS_ERR(vma)) { 1834 err = PTR_ERR(vma); 1835 goto out; 1836 } 1837 1838 GEM_BUG_ON(!drm_mm_node_allocated(&vma->node)); 1839 offset = vma->node.start; 1840 1841 err = i915_vma_unbind_unlocked(vma); 1842 if (err) { 1843 pr_err("i915_vma_unbind failed with err=%d!\n", err); 1844 goto out; 1845 } 1846 1847 err = insert_gtt_with_resource(vma); 1848 if (err) { 1849 pr_err("i915_gem_gtt_insert (pass 2) failed at %llu/%llu with err=%d\n", 1850 total, ggtt->vm.total, err); 1851 goto out; 1852 } 1853 track_vma_bind(vma); 1854 1855 GEM_BUG_ON(!drm_mm_node_allocated(&vma->node)); 1856 if (vma->node.start != offset) { 1857 pr_err("i915_gem_gtt_insert did not return node to its previous location (the only hole), expected address %llx, found %llx\n", 1858 offset, vma->node.start); 1859 err = -EINVAL; 1860 goto out; 1861 } 1862 } 1863 1864 /* And then force evictions */ 1865 for (total = 0; 1866 total + 2 * I915_GTT_PAGE_SIZE <= ggtt->vm.total; 1867 total += 2 * I915_GTT_PAGE_SIZE) { 1868 struct i915_vma *vma; 1869 1870 obj = i915_gem_object_create_internal(ggtt->vm.i915, 1871 2 * I915_GTT_PAGE_SIZE); 1872 if (IS_ERR(obj)) { 1873 err = PTR_ERR(obj); 1874 goto out; 1875 } 1876 1877 err = i915_gem_object_pin_pages_unlocked(obj); 1878 if (err) { 1879 i915_gem_object_put(obj); 1880 
goto out; 1881 } 1882 1883 list_add(&obj->st_link, &objects); 1884 1885 vma = i915_vma_instance(obj, &ggtt->vm, NULL); 1886 if (IS_ERR(vma)) { 1887 err = PTR_ERR(vma); 1888 goto out; 1889 } 1890 1891 err = insert_gtt_with_resource(vma); 1892 if (err) { 1893 pr_err("i915_gem_gtt_insert (pass 3) failed at %llu/%llu with err=%d\n", 1894 total, ggtt->vm.total, err); 1895 goto out; 1896 } 1897 track_vma_bind(vma); 1898 1899 GEM_BUG_ON(!drm_mm_node_allocated(&vma->node)); 1900 } 1901 1902 out: 1903 list_for_each_entry_safe(obj, on, &objects, st_link) { 1904 i915_gem_object_unpin_pages(obj); 1905 i915_gem_object_put(obj); 1906 } 1907 return err; 1908 } 1909 1910 int i915_gem_gtt_mock_selftests(void) 1911 { 1912 static const struct i915_subtest tests[] = { 1913 SUBTEST(igt_mock_drunk), 1914 SUBTEST(igt_mock_walk), 1915 SUBTEST(igt_mock_pot), 1916 SUBTEST(igt_mock_fill), 1917 SUBTEST(igt_gtt_reserve), 1918 SUBTEST(igt_gtt_insert), 1919 }; 1920 struct drm_i915_private *i915; 1921 struct intel_gt *gt; 1922 int err; 1923 1924 i915 = mock_gem_device(); 1925 if (!i915) 1926 return -ENOMEM; 1927 1928 /* allocate the ggtt */ 1929 err = intel_gt_assign_ggtt(to_gt(i915)); 1930 if (err) 1931 goto out_put; 1932 1933 gt = to_gt(i915); 1934 1935 mock_init_ggtt(gt); 1936 1937 err = i915_subtests(tests, gt->ggtt); 1938 1939 mock_device_flush(i915); 1940 i915_gem_drain_freed_objects(i915); 1941 mock_fini_ggtt(gt->ggtt); 1942 1943 out_put: 1944 mock_destroy_device(i915); 1945 return err; 1946 } 1947 1948 static int context_sync(struct intel_context *ce) 1949 { 1950 struct i915_request *rq; 1951 long timeout; 1952 1953 rq = intel_context_create_request(ce); 1954 if (IS_ERR(rq)) 1955 return PTR_ERR(rq); 1956 1957 i915_request_get(rq); 1958 i915_request_add(rq); 1959 1960 timeout = i915_request_wait(rq, 0, HZ / 5); 1961 i915_request_put(rq); 1962 1963 return timeout < 0 ? -EIO : 0; 1964 } 1965 1966 static struct i915_request * 1967 submit_batch(struct intel_context *ce, u64 addr) 1968 { 1969 struct i915_request *rq; 1970 int err; 1971 1972 rq = intel_context_create_request(ce); 1973 if (IS_ERR(rq)) 1974 return rq; 1975 1976 err = 0; 1977 if (rq->engine->emit_init_breadcrumb) /* detect a hang */ 1978 err = rq->engine->emit_init_breadcrumb(rq); 1979 if (err == 0) 1980 err = rq->engine->emit_bb_start(rq, addr, 0, 0); 1981 1982 if (err == 0) 1983 i915_request_get(rq); 1984 i915_request_add(rq); 1985 1986 return err ? ERR_PTR(err) : rq; 1987 } 1988 1989 static u32 *spinner(u32 *batch, int i) 1990 { 1991 return batch + i * 64 / sizeof(*batch) + 4; 1992 } 1993 1994 static void end_spin(u32 *batch, int i) 1995 { 1996 *spinner(batch, i) = MI_BATCH_BUFFER_END; 1997 wmb(); 1998 } 1999 2000 static int igt_cs_tlb(void *arg) 2001 { 2002 const unsigned int count = PAGE_SIZE / 64; 2003 const unsigned int chunk_size = count * PAGE_SIZE; 2004 struct drm_i915_private *i915 = arg; 2005 struct drm_i915_gem_object *bbe, *act, *out; 2006 struct i915_gem_engines_iter it; 2007 struct i915_address_space *vm; 2008 struct i915_gem_context *ctx; 2009 struct intel_context *ce; 2010 struct i915_vma *vma; 2011 I915_RND_STATE(prng); 2012 struct file *file; 2013 unsigned int i; 2014 u32 *result; 2015 u32 *batch; 2016 int err = 0; 2017 2018 /* 2019 * Our mission here is to fool the hardware to execute something 2020 * from scratch as it has not seen the batch move (due to missing 2021 * the TLB invalidate). 
2022 */ 2023 2024 file = mock_file(i915); 2025 if (IS_ERR(file)) 2026 return PTR_ERR(file); 2027 2028 ctx = live_context(i915, file); 2029 if (IS_ERR(ctx)) { 2030 err = PTR_ERR(ctx); 2031 goto out_unlock; 2032 } 2033 2034 vm = i915_gem_context_get_eb_vm(ctx); 2035 if (i915_is_ggtt(vm)) 2036 goto out_vm; 2037 2038 /* Create two pages; dummy we prefill the TLB, and intended */ 2039 bbe = i915_gem_object_create_internal(i915, PAGE_SIZE); 2040 if (IS_ERR(bbe)) { 2041 err = PTR_ERR(bbe); 2042 goto out_vm; 2043 } 2044 2045 batch = i915_gem_object_pin_map_unlocked(bbe, I915_MAP_WC); 2046 if (IS_ERR(batch)) { 2047 err = PTR_ERR(batch); 2048 goto out_put_bbe; 2049 } 2050 memset32(batch, MI_BATCH_BUFFER_END, PAGE_SIZE / sizeof(u32)); 2051 i915_gem_object_flush_map(bbe); 2052 i915_gem_object_unpin_map(bbe); 2053 2054 act = i915_gem_object_create_internal(i915, PAGE_SIZE); 2055 if (IS_ERR(act)) { 2056 err = PTR_ERR(act); 2057 goto out_put_bbe; 2058 } 2059 2060 /* Track the execution of each request by writing into different slot */ 2061 batch = i915_gem_object_pin_map_unlocked(act, I915_MAP_WC); 2062 if (IS_ERR(batch)) { 2063 err = PTR_ERR(batch); 2064 goto out_put_act; 2065 } 2066 for (i = 0; i < count; i++) { 2067 u32 *cs = batch + i * 64 / sizeof(*cs); 2068 u64 addr = (vm->total - PAGE_SIZE) + i * sizeof(u32); 2069 2070 GEM_BUG_ON(GRAPHICS_VER(i915) < 6); 2071 cs[0] = MI_STORE_DWORD_IMM_GEN4; 2072 if (GRAPHICS_VER(i915) >= 8) { 2073 cs[1] = lower_32_bits(addr); 2074 cs[2] = upper_32_bits(addr); 2075 cs[3] = i; 2076 cs[4] = MI_NOOP; 2077 cs[5] = MI_BATCH_BUFFER_START_GEN8; 2078 } else { 2079 cs[1] = 0; 2080 cs[2] = lower_32_bits(addr); 2081 cs[3] = i; 2082 cs[4] = MI_NOOP; 2083 cs[5] = MI_BATCH_BUFFER_START; 2084 } 2085 } 2086 2087 out = i915_gem_object_create_internal(i915, PAGE_SIZE); 2088 if (IS_ERR(out)) { 2089 err = PTR_ERR(out); 2090 goto out_put_batch; 2091 } 2092 i915_gem_object_set_cache_coherency(out, I915_CACHING_CACHED); 2093 2094 vma = i915_vma_instance(out, vm, NULL); 2095 if (IS_ERR(vma)) { 2096 err = PTR_ERR(vma); 2097 goto out_put_out; 2098 } 2099 2100 err = i915_vma_pin(vma, 0, 0, 2101 PIN_USER | 2102 PIN_OFFSET_FIXED | 2103 (vm->total - PAGE_SIZE)); 2104 if (err) 2105 goto out_put_out; 2106 GEM_BUG_ON(vma->node.start != vm->total - PAGE_SIZE); 2107 2108 result = i915_gem_object_pin_map_unlocked(out, I915_MAP_WB); 2109 if (IS_ERR(result)) { 2110 err = PTR_ERR(result); 2111 goto out_put_out; 2112 } 2113 2114 for_each_gem_engine(ce, i915_gem_context_lock_engines(ctx), it) { 2115 IGT_TIMEOUT(end_time); 2116 unsigned long pass = 0; 2117 2118 if (!intel_engine_can_store_dword(ce->engine)) 2119 continue; 2120 2121 while (!__igt_timeout(end_time, NULL)) { 2122 struct i915_vm_pt_stash stash = {}; 2123 struct i915_request *rq; 2124 struct i915_gem_ww_ctx ww; 2125 struct i915_vma_resource *vma_res; 2126 u64 offset; 2127 2128 offset = igt_random_offset(&prng, 2129 0, vm->total - PAGE_SIZE, 2130 chunk_size, PAGE_SIZE); 2131 2132 memset32(result, STACK_MAGIC, PAGE_SIZE / sizeof(u32)); 2133 2134 vma = i915_vma_instance(bbe, vm, NULL); 2135 if (IS_ERR(vma)) { 2136 err = PTR_ERR(vma); 2137 goto end; 2138 } 2139 2140 i915_gem_object_lock(bbe, NULL); 2141 err = i915_vma_get_pages(vma); 2142 i915_gem_object_unlock(bbe); 2143 if (err) 2144 goto end; 2145 2146 vma_res = i915_vma_resource_alloc(); 2147 if (IS_ERR(vma_res)) { 2148 i915_vma_put_pages(vma); 2149 err = PTR_ERR(vma_res); 2150 goto end; 2151 } 2152 2153 i915_gem_ww_ctx_init(&ww, false); 2154 retry: 2155 err = i915_vm_lock_objects(vm, &ww); 
2156 if (err) 2157 goto end_ww; 2158 2159 err = i915_vm_alloc_pt_stash(vm, &stash, chunk_size); 2160 if (err) 2161 goto end_ww; 2162 2163 err = i915_vm_map_pt_stash(vm, &stash); 2164 if (!err) 2165 vm->allocate_va_range(vm, &stash, offset, chunk_size); 2166 i915_vm_free_pt_stash(vm, &stash); 2167 end_ww: 2168 if (err == -EDEADLK) { 2169 err = i915_gem_ww_ctx_backoff(&ww); 2170 if (!err) 2171 goto retry; 2172 } 2173 i915_gem_ww_ctx_fini(&ww); 2174 if (err) { 2175 kfree(vma_res); 2176 goto end; 2177 } 2178 2179 i915_vma_resource_init_from_vma(vma_res, vma); 2180 /* Prime the TLB with the dummy pages */ 2181 for (i = 0; i < count; i++) { 2182 vma_res->start = offset + i * PAGE_SIZE; 2183 vm->insert_entries(vm, vma_res, I915_CACHE_NONE, 2184 0); 2185 2186 rq = submit_batch(ce, vma_res->start); 2187 if (IS_ERR(rq)) { 2188 err = PTR_ERR(rq); 2189 i915_vma_resource_fini(vma_res); 2190 kfree(vma_res); 2191 goto end; 2192 } 2193 i915_request_put(rq); 2194 } 2195 i915_vma_resource_fini(vma_res); 2196 i915_vma_put_pages(vma); 2197 2198 err = context_sync(ce); 2199 if (err) { 2200 pr_err("%s: dummy setup timed out\n", 2201 ce->engine->name); 2202 kfree(vma_res); 2203 goto end; 2204 } 2205 2206 vma = i915_vma_instance(act, vm, NULL); 2207 if (IS_ERR(vma)) { 2208 kfree(vma_res); 2209 err = PTR_ERR(vma); 2210 goto end; 2211 } 2212 2213 i915_gem_object_lock(act, NULL); 2214 err = i915_vma_get_pages(vma); 2215 i915_gem_object_unlock(act); 2216 if (err) { 2217 kfree(vma_res); 2218 goto end; 2219 } 2220 2221 i915_vma_resource_init_from_vma(vma_res, vma); 2222 /* Replace the TLB with target batches */ 2223 for (i = 0; i < count; i++) { 2224 struct i915_request *rq; 2225 u32 *cs = batch + i * 64 / sizeof(*cs); 2226 u64 addr; 2227 2228 vma_res->start = offset + i * PAGE_SIZE; 2229 vm->insert_entries(vm, vma_res, I915_CACHE_NONE, 0); 2230 2231 addr = vma_res->start + i * 64; 2232 cs[4] = MI_NOOP; 2233 cs[6] = lower_32_bits(addr); 2234 cs[7] = upper_32_bits(addr); 2235 wmb(); 2236 2237 rq = submit_batch(ce, addr); 2238 if (IS_ERR(rq)) { 2239 err = PTR_ERR(rq); 2240 i915_vma_resource_fini(vma_res); 2241 kfree(vma_res); 2242 goto end; 2243 } 2244 2245 /* Wait until the context chain has started */ 2246 if (i == 0) { 2247 while (READ_ONCE(result[i]) && 2248 !i915_request_completed(rq)) 2249 cond_resched(); 2250 } else { 2251 end_spin(batch, i - 1); 2252 } 2253 2254 i915_request_put(rq); 2255 } 2256 end_spin(batch, count - 1); 2257 2258 i915_vma_resource_fini(vma_res); 2259 kfree(vma_res); 2260 i915_vma_put_pages(vma); 2261 2262 err = context_sync(ce); 2263 if (err) { 2264 pr_err("%s: writes timed out\n", 2265 ce->engine->name); 2266 goto end; 2267 } 2268 2269 for (i = 0; i < count; i++) { 2270 if (result[i] != i) { 2271 pr_err("%s: Write lost on pass %lu, at offset %llx, index %d, found %x, expected %x\n", 2272 ce->engine->name, pass, 2273 offset, i, result[i], i); 2274 err = -EINVAL; 2275 goto end; 2276 } 2277 } 2278 2279 vm->clear_range(vm, offset, chunk_size); 2280 pass++; 2281 } 2282 } 2283 end: 2284 if (igt_flush_test(i915)) 2285 err = -EIO; 2286 i915_gem_context_unlock_engines(ctx); 2287 i915_gem_object_unpin_map(out); 2288 out_put_out: 2289 i915_gem_object_put(out); 2290 out_put_batch: 2291 i915_gem_object_unpin_map(act); 2292 out_put_act: 2293 i915_gem_object_put(act); 2294 out_put_bbe: 2295 i915_gem_object_put(bbe); 2296 out_vm: 2297 i915_vm_put(vm); 2298 out_unlock: 2299 fput(file); 2300 return err; 2301 } 2302 2303 int i915_gem_gtt_live_selftests(struct drm_i915_private *i915) 2304 { 2305 static const 
struct i915_subtest tests[] = { 2306 SUBTEST(igt_ppgtt_alloc), 2307 SUBTEST(igt_ppgtt_lowlevel), 2308 SUBTEST(igt_ppgtt_drunk), 2309 SUBTEST(igt_ppgtt_walk), 2310 SUBTEST(igt_ppgtt_pot), 2311 SUBTEST(igt_ppgtt_fill), 2312 SUBTEST(igt_ppgtt_shrink), 2313 SUBTEST(igt_ppgtt_shrink_boom), 2314 SUBTEST(igt_ppgtt_misaligned_pin), 2315 SUBTEST(igt_ggtt_lowlevel), 2316 SUBTEST(igt_ggtt_drunk), 2317 SUBTEST(igt_ggtt_walk), 2318 SUBTEST(igt_ggtt_pot), 2319 SUBTEST(igt_ggtt_fill), 2320 SUBTEST(igt_ggtt_page), 2321 SUBTEST(igt_ggtt_misaligned_pin), 2322 SUBTEST(igt_cs_tlb), 2323 }; 2324 2325 GEM_BUG_ON(offset_in_page(to_gt(i915)->ggtt->vm.total)); 2326 2327 return i915_subtests(tests, i915); 2328 } 2329