// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2013 Red Hat
 * Author: Rob Clark <robdclark@gmail.com>
 */

#include <linux/dma-map-ops.h>
#include <linux/spinlock.h>
#include <linux/shmem_fs.h>
#include <linux/dma-buf.h>
#include <linux/pfn_t.h>

#include <drm/drm_prime.h>

#include "msm_drv.h"
#include "msm_fence.h"
#include "msm_gem.h"
#include "msm_gpu.h"
#include "msm_mmu.h"

static void update_inactive(struct msm_gem_object *msm_obj);

static dma_addr_t physaddr(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_drm_private *priv = obj->dev->dev_private;
	return (((dma_addr_t)msm_obj->vram_node->start) << PAGE_SHIFT) +
			priv->vram.paddr;
}

static bool use_pages(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	return !msm_obj->vram_node;
}

/*
 * Cache sync.. this is a bit over-complicated, to fit dma-mapping
 * API. Really GPU cache is out of scope here (handled on cmdstream)
 * and all we need to do is invalidate newly allocated pages before
 * mapping to CPU as uncached/writecombine.
 *
 * On top of this, we have the added headache, that depending on
 * display generation, the display's iommu may be wired up to either
 * the toplevel drm device (mdss), or to the mdp sub-node, meaning
 * that here we either have dma-direct or iommu ops.
 *
 * Let this be a cautionary tale of abstraction gone wrong.
 */

static void sync_for_device(struct msm_gem_object *msm_obj)
{
	struct device *dev = msm_obj->base.dev->dev;

	dma_map_sgtable(dev, msm_obj->sgt, DMA_BIDIRECTIONAL, 0);
}

static void sync_for_cpu(struct msm_gem_object *msm_obj)
{
	struct device *dev = msm_obj->base.dev->dev;

	dma_unmap_sgtable(dev, msm_obj->sgt, DMA_BIDIRECTIONAL, 0);
}

/* allocate pages from VRAM carveout, used when no IOMMU: */
static struct page **get_pages_vram(struct drm_gem_object *obj, int npages)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_drm_private *priv = obj->dev->dev_private;
	dma_addr_t paddr;
	struct page **p;
	int ret, i;

	p = kvmalloc_array(npages, sizeof(struct page *), GFP_KERNEL);
	if (!p)
		return ERR_PTR(-ENOMEM);

	spin_lock(&priv->vram.lock);
	ret = drm_mm_insert_node(&priv->vram.mm, msm_obj->vram_node, npages);
	spin_unlock(&priv->vram.lock);
	if (ret) {
		kvfree(p);
		return ERR_PTR(ret);
	}

	paddr = physaddr(obj);
	for (i = 0; i < npages; i++) {
		p[i] = phys_to_page(paddr);
		paddr += PAGE_SIZE;
	}

	return p;
}

static struct page **get_pages(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	if (!msm_obj->pages) {
		struct drm_device *dev = obj->dev;
		struct page **p;
		int npages = obj->size >> PAGE_SHIFT;

		if (use_pages(obj))
			p = drm_gem_get_pages(obj);
		else
			p = get_pages_vram(obj, npages);

		if (IS_ERR(p)) {
			DRM_DEV_ERROR(dev->dev, "could not get pages: %ld\n",
					PTR_ERR(p));
			return p;
		}

		msm_obj->pages = p;

		msm_obj->sgt = drm_prime_pages_to_sg(obj->dev, p, npages);
		if (IS_ERR(msm_obj->sgt)) {
			void *ptr = ERR_CAST(msm_obj->sgt);

			DRM_DEV_ERROR(dev->dev, "failed to allocate sgt\n");
			msm_obj->sgt = NULL;
			return ptr;
		}

		/* For non-cached buffers, ensure the new pages are clean
		 * because display controller, GPU, etc. are not coherent:
		 */
		if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
			sync_for_device(msm_obj);

		GEM_WARN_ON(msm_obj->active_count);
		update_inactive(msm_obj);
	}

	return msm_obj->pages;
}

static void put_pages_vram(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_drm_private *priv = obj->dev->dev_private;

	spin_lock(&priv->vram.lock);
	drm_mm_remove_node(msm_obj->vram_node);
	spin_unlock(&priv->vram.lock);

	kvfree(msm_obj->pages);
}

static void put_pages(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	if (msm_obj->pages) {
		if (msm_obj->sgt) {
			/* For non-cached buffers, ensure the new
			 * pages are clean because display controller,
			 * GPU, etc. are not coherent:
			 */
			if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED))
				sync_for_cpu(msm_obj);

			sg_free_table(msm_obj->sgt);
			kfree(msm_obj->sgt);
			msm_obj->sgt = NULL;
		}

		if (use_pages(obj))
			drm_gem_put_pages(obj, msm_obj->pages, true, false);
		else
			put_pages_vram(obj);

		msm_obj->pages = NULL;
	}
}

struct page **msm_gem_get_pages(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct page **p;

	msm_gem_lock(obj);

	if (GEM_WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED)) {
		msm_gem_unlock(obj);
		return ERR_PTR(-EBUSY);
	}

	p = get_pages(obj);
	msm_gem_unlock(obj);
	return p;
}

void msm_gem_put_pages(struct drm_gem_object *obj)
{
	/* when we start tracking the pin count, then do something here */
}

int msm_gem_mmap_obj(struct drm_gem_object *obj,
		struct vm_area_struct *vma)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	vma->vm_flags &= ~VM_PFNMAP;
	vma->vm_flags |= VM_MIXEDMAP;

	if (msm_obj->flags & MSM_BO_WC) {
		vma->vm_page_prot = pgprot_writecombine(vm_get_page_prot(vma->vm_flags));
	} else if (msm_obj->flags & MSM_BO_UNCACHED) {
		vma->vm_page_prot = pgprot_noncached(vm_get_page_prot(vma->vm_flags));
	} else {
		/*
		 * Shunt off cached objs to shmem file so they have their own
		 * address_space (so unmap_mapping_range does what we want,
		 * in particular in the case of mmap'd dmabufs)
		 */
		vma->vm_pgoff = 0;
		vma_set_file(vma, obj->filp);

		vma->vm_page_prot = vm_get_page_prot(vma->vm_flags);
	}

	return 0;
}

int msm_gem_mmap(struct file *filp, struct vm_area_struct *vma)
{
	int ret;

	ret = drm_gem_mmap(filp, vma);
	if (ret) {
		DBG("mmap failed: %d", ret);
		return ret;
	}

	return msm_gem_mmap_obj(vma->vm_private_data, vma);
}

static vm_fault_t msm_gem_fault(struct vm_fault *vmf)
{
	struct vm_area_struct *vma = vmf->vma;
	struct drm_gem_object *obj = vma->vm_private_data;
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct page **pages;
	unsigned long pfn;
	pgoff_t pgoff;
	int err;
	vm_fault_t ret;

	/*
	 * vm_ops.open/drm_gem_mmap_obj and close get and put
	 * a reference on obj. So, we don't need to hold one here.
	 */
	err = msm_gem_lock_interruptible(obj);
	if (err) {
		ret = VM_FAULT_NOPAGE;
		goto out;
	}

	if (GEM_WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED)) {
		msm_gem_unlock(obj);
		return VM_FAULT_SIGBUS;
	}

	/* make sure we have pages attached now */
	pages = get_pages(obj);
	if (IS_ERR(pages)) {
		ret = vmf_error(PTR_ERR(pages));
		goto out_unlock;
	}

	/* We don't use vmf->pgoff since that has the fake offset: */
	pgoff = (vmf->address - vma->vm_start) >> PAGE_SHIFT;

	pfn = page_to_pfn(pages[pgoff]);

	VERB("Inserting %p pfn %lx, pa %lx", (void *)vmf->address,
			pfn, pfn << PAGE_SHIFT);

	ret = vmf_insert_mixed(vma, vmf->address, __pfn_to_pfn_t(pfn, PFN_DEV));
out_unlock:
	msm_gem_unlock(obj);
out:
	return ret;
}

/** get mmap offset */
static uint64_t mmap_offset(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	int ret;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	/* Make it mmapable */
	ret = drm_gem_create_mmap_offset(obj);

	if (ret) {
		DRM_DEV_ERROR(dev->dev, "could not allocate mmap offset\n");
		return 0;
	}

	return drm_vma_node_offset_addr(&obj->vma_node);
}

uint64_t msm_gem_mmap_offset(struct drm_gem_object *obj)
{
	uint64_t offset;

	msm_gem_lock(obj);
	offset = mmap_offset(obj);
	msm_gem_unlock(obj);
	return offset;
}

static struct msm_gem_vma *add_vma(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_gem_vma *vma;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	vma = kzalloc(sizeof(*vma), GFP_KERNEL);
	if (!vma)
		return ERR_PTR(-ENOMEM);

	vma->aspace = aspace;

	list_add_tail(&vma->list, &msm_obj->vmas);

	return vma;
}

static struct msm_gem_vma *lookup_vma(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_gem_vma *vma;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	list_for_each_entry(vma, &msm_obj->vmas, list) {
		if (vma->aspace == aspace)
			return vma;
	}

	return NULL;
}

static void del_vma(struct msm_gem_vma *vma)
{
	if (!vma)
		return;

	list_del(&vma->list);
	kfree(vma);
}

/*
 * If close is true, this also closes the VMA (releasing the allocated
 * iova range) in addition to removing the iommu mapping. In the eviction
 * case (!close), we keep the iova allocated, but only remove the iommu
 * mapping.
 */
static void
put_iova_spaces(struct drm_gem_object *obj, bool close)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_gem_vma *vma;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	list_for_each_entry(vma, &msm_obj->vmas, list) {
		if (vma->aspace) {
			msm_gem_purge_vma(vma->aspace, vma);
			if (close)
				msm_gem_close_vma(vma->aspace, vma);
		}
	}
}

/* Called with msm_obj locked */
static void
put_iova_vmas(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_gem_vma *vma, *tmp;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	list_for_each_entry_safe(vma, tmp, &msm_obj->vmas, list) {
		del_vma(vma);
	}
}

static int get_iova_locked(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace, uint64_t *iova,
		u64 range_start, u64 range_end)
{
	struct msm_gem_vma *vma;
	int ret = 0;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	vma = lookup_vma(obj, aspace);

	if (!vma) {
		vma = add_vma(obj, aspace);
		if (IS_ERR(vma))
			return PTR_ERR(vma);

		ret = msm_gem_init_vma(aspace, vma, obj->size >> PAGE_SHIFT,
			range_start, range_end);
		if (ret) {
			del_vma(vma);
			return ret;
		}
	}

	*iova = vma->iova;
	return 0;
}

static int msm_gem_pin_iova(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_gem_vma *vma;
	struct page **pages;
	int ret, prot = IOMMU_READ;

	if (!(msm_obj->flags & MSM_BO_GPU_READONLY))
		prot |= IOMMU_WRITE;

	if (msm_obj->flags & MSM_BO_MAP_PRIV)
		prot |= IOMMU_PRIV;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	if (GEM_WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED))
		return -EBUSY;

	vma = lookup_vma(obj, aspace);
	if (GEM_WARN_ON(!vma))
		return -EINVAL;

	pages = get_pages(obj);
	if (IS_ERR(pages))
		return PTR_ERR(pages);

	ret = msm_gem_map_vma(aspace, vma, prot,
			msm_obj->sgt, obj->size >> PAGE_SHIFT);

	if (!ret)
		msm_obj->pin_count++;

	return ret;
}

static int get_and_pin_iova_range_locked(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace, uint64_t *iova,
		u64 range_start, u64 range_end)
{
	u64 local;
	int ret;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	ret = get_iova_locked(obj, aspace, &local,
		range_start, range_end);

	if (!ret)
		ret = msm_gem_pin_iova(obj, aspace);

	if (!ret)
		*iova = local;

	return ret;
}

/*
 * get iova and pin it. Should have a matching put
 * limits iova to specified range (in pages)
 */
int msm_gem_get_and_pin_iova_range(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace, uint64_t *iova,
		u64 range_start, u64 range_end)
{
	int ret;

	msm_gem_lock(obj);
	ret = get_and_pin_iova_range_locked(obj, aspace, iova, range_start, range_end);
	msm_gem_unlock(obj);

	return ret;
}

int msm_gem_get_and_pin_iova_locked(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace, uint64_t *iova)
{
	return get_and_pin_iova_range_locked(obj, aspace, iova, 0, U64_MAX);
}

/* get iova and pin it. Should have a matching put */
int msm_gem_get_and_pin_iova(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace, uint64_t *iova)
{
	return msm_gem_get_and_pin_iova_range(obj, aspace, iova, 0, U64_MAX);
}
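
/*
 * Illustrative sketch (not a caller in this driver): the pin side above is
 * expected to pair with msm_gem_unpin_iova() below. Assuming a caller that
 * already holds a buffer "obj" and an address space "aspace", typical usage
 * would look roughly like:
 *
 *	uint64_t iova;
 *	int ret = msm_gem_get_and_pin_iova(obj, aspace, &iova);
 *	if (ret)
 *		return ret;
 *	... hand iova to the hardware ...
 *	msm_gem_unpin_iova(obj, aspace);
 */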

/*
 * Get an iova but don't pin it. Doesn't need a put because iovas are currently
 * valid for the life of the object
 */
int msm_gem_get_iova(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace, uint64_t *iova)
{
	int ret;

	msm_gem_lock(obj);
	ret = get_iova_locked(obj, aspace, iova, 0, U64_MAX);
	msm_gem_unlock(obj);

	return ret;
}

/* get iova without taking a reference, used in places where you have
 * already done a 'msm_gem_get_and_pin_iova' or 'msm_gem_get_iova'
 */
uint64_t msm_gem_iova(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace)
{
	struct msm_gem_vma *vma;

	msm_gem_lock(obj);
	vma = lookup_vma(obj, aspace);
	msm_gem_unlock(obj);
	GEM_WARN_ON(!vma);

	return vma ? vma->iova : 0;
}

/*
 * Locked variant of msm_gem_unpin_iova()
 */
void msm_gem_unpin_iova_locked(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_gem_vma *vma;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	vma = lookup_vma(obj, aspace);

	if (!GEM_WARN_ON(!vma)) {
		msm_gem_unmap_vma(aspace, vma);

		msm_obj->pin_count--;
		GEM_WARN_ON(msm_obj->pin_count < 0);

		update_inactive(msm_obj);
	}
}

/*
 * Unpin an iova by updating the reference counts. The memory isn't actually
 * purged until something else (shrinker, mm_notifier, destroy, etc) decides
 * to get rid of it
 */
void msm_gem_unpin_iova(struct drm_gem_object *obj,
		struct msm_gem_address_space *aspace)
{
	msm_gem_lock(obj);
	msm_gem_unpin_iova_locked(obj, aspace);
	msm_gem_unlock(obj);
}

int msm_gem_dumb_create(struct drm_file *file, struct drm_device *dev,
		struct drm_mode_create_dumb *args)
{
	args->pitch = align_pitch(args->width, args->bpp);
	args->size = PAGE_ALIGN(args->pitch * args->height);
	return msm_gem_new_handle(dev, file, args->size,
			MSM_BO_SCANOUT | MSM_BO_WC, &args->handle, "dumb");
}

int msm_gem_dumb_map_offset(struct drm_file *file, struct drm_device *dev,
		uint32_t handle, uint64_t *offset)
{
	struct drm_gem_object *obj;
	int ret = 0;

	/* GEM does all our handle to object mapping */
	obj = drm_gem_object_lookup(file, handle);
	if (obj == NULL) {
		ret = -ENOENT;
		goto fail;
	}

	*offset = msm_gem_mmap_offset(obj);

	drm_gem_object_put(obj);

fail:
	return ret;
}

static void *get_vaddr(struct drm_gem_object *obj, unsigned madv)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	int ret = 0;

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	if (obj->import_attach)
		return ERR_PTR(-ENODEV);

	if (GEM_WARN_ON(msm_obj->madv > madv)) {
		DRM_DEV_ERROR(obj->dev->dev, "Invalid madv state: %u vs %u\n",
			msm_obj->madv, madv);
		return ERR_PTR(-EBUSY);
	}

	/* increment vmap_count *before* vmap() call, so shrinker can
	 * check vmap_count (is_vunmapable()) outside of msm_obj lock.
	 * This guarantees that we won't try to msm_gem_vunmap() this
	 * same object from within the vmap() call (while we already
	 * hold msm_obj lock)
	 */
	msm_obj->vmap_count++;

	if (!msm_obj->vaddr) {
		struct page **pages = get_pages(obj);
		if (IS_ERR(pages)) {
			ret = PTR_ERR(pages);
			goto fail;
		}
		msm_obj->vaddr = vmap(pages, obj->size >> PAGE_SHIFT,
				VM_MAP, pgprot_writecombine(PAGE_KERNEL));
		if (msm_obj->vaddr == NULL) {
			ret = -ENOMEM;
			goto fail;
		}
	}

	return msm_obj->vaddr;

fail:
	msm_obj->vmap_count--;
	return ERR_PTR(ret);
}

void *msm_gem_get_vaddr_locked(struct drm_gem_object *obj)
{
	return get_vaddr(obj, MSM_MADV_WILLNEED);
}

void *msm_gem_get_vaddr(struct drm_gem_object *obj)
{
	void *ret;

	msm_gem_lock(obj);
	ret = msm_gem_get_vaddr_locked(obj);
	msm_gem_unlock(obj);

	return ret;
}

/*
 * Don't use this! It is for the very special case of dumping
 * submits from GPU hangs or faults, where the bo may already
 * be MSM_MADV_DONTNEED, but we know the buffer is still on the
 * active list.
 */
void *msm_gem_get_vaddr_active(struct drm_gem_object *obj)
{
	return get_vaddr(obj, __MSM_MADV_PURGED);
}

void msm_gem_put_vaddr_locked(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	GEM_WARN_ON(!msm_gem_is_locked(obj));
	GEM_WARN_ON(msm_obj->vmap_count < 1);

	msm_obj->vmap_count--;
}

void msm_gem_put_vaddr(struct drm_gem_object *obj)
{
	msm_gem_lock(obj);
	msm_gem_put_vaddr_locked(obj);
	msm_gem_unlock(obj);
}
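
/*
 * Illustrative sketch (not a caller in this driver): CPU access through the
 * kernel mapping is expected to be bracketed by the get/put pair above.
 * Assuming a caller that already holds a reference to "obj":
 *
 *	void *ptr = msm_gem_get_vaddr(obj);
 *	if (IS_ERR(ptr))
 *		return PTR_ERR(ptr);
 *	... read or write the buffer through ptr ...
 *	msm_gem_put_vaddr(obj);
 */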

/* Update madvise status, returns true if not purged, else
 * false or -errno.
 */
int msm_gem_madvise(struct drm_gem_object *obj, unsigned madv)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	msm_gem_lock(obj);

	if (msm_obj->madv != __MSM_MADV_PURGED)
		msm_obj->madv = madv;

	madv = msm_obj->madv;

	/* If the obj is inactive, we might need to move it
	 * between inactive lists
	 */
	if (msm_obj->active_count == 0)
		update_inactive(msm_obj);

	msm_gem_unlock(obj);

	return (madv != __MSM_MADV_PURGED);
}

void msm_gem_purge(struct drm_gem_object *obj)
{
	struct drm_device *dev = obj->dev;
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	GEM_WARN_ON(!msm_gem_is_locked(obj));
	GEM_WARN_ON(!is_purgeable(msm_obj));

	/* Get rid of any iommu mapping(s): */
	put_iova_spaces(obj, true);

	msm_gem_vunmap(obj);

	drm_vma_node_unmap(&obj->vma_node, dev->anon_inode->i_mapping);

	put_pages(obj);

	put_iova_vmas(obj);

	msm_obj->madv = __MSM_MADV_PURGED;
	update_inactive(msm_obj);

	drm_gem_free_mmap_offset(obj);

	/* Our goal here is to return as much of the memory as
	 * is possible back to the system as we are called from OOM.
	 * To do this we must instruct the shmfs to drop all of its
	 * backing pages, *now*.
	 */
	shmem_truncate_range(file_inode(obj->filp), 0, (loff_t)-1);

	invalidate_mapping_pages(file_inode(obj->filp)->i_mapping,
			0, (loff_t)-1);
}

void msm_gem_vunmap(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	GEM_WARN_ON(!msm_gem_is_locked(obj));

	if (!msm_obj->vaddr || GEM_WARN_ON(!is_vunmapable(msm_obj)))
		return;

	vunmap(msm_obj->vaddr);
	msm_obj->vaddr = NULL;
}

/* must be called before _move_to_active().. */
int msm_gem_sync_object(struct drm_gem_object *obj,
		struct msm_fence_context *fctx, bool exclusive)
{
	struct dma_resv_list *fobj;
	struct dma_fence *fence;
	int i, ret;

	fobj = dma_resv_get_list(obj->resv);
	if (!fobj || (fobj->shared_count == 0)) {
		fence = dma_resv_get_excl(obj->resv);
		/* don't need to wait on our own fences, since ring is fifo */
		if (fence && (fence->context != fctx->context)) {
			ret = dma_fence_wait(fence, true);
			if (ret)
				return ret;
		}
	}

	if (!exclusive || !fobj)
		return 0;

	for (i = 0; i < fobj->shared_count; i++) {
		fence = rcu_dereference_protected(fobj->shared[i],
						dma_resv_held(obj->resv));
		if (fence->context != fctx->context) {
			ret = dma_fence_wait(fence, true);
			if (ret)
				return ret;
		}
	}

	return 0;
}

void msm_gem_active_get(struct drm_gem_object *obj, struct msm_gpu *gpu)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct msm_drm_private *priv = obj->dev->dev_private;

	might_sleep();
	GEM_WARN_ON(!msm_gem_is_locked(obj));
	GEM_WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED);
	GEM_WARN_ON(msm_obj->dontneed);
	GEM_WARN_ON(!msm_obj->sgt);

	if (msm_obj->active_count++ == 0) {
		mutex_lock(&priv->mm_lock);
		if (msm_obj->evictable)
			mark_unevictable(msm_obj);
		list_del(&msm_obj->mm_list);
		list_add_tail(&msm_obj->mm_list, &gpu->active_list);
		mutex_unlock(&priv->mm_lock);
	}
}

void msm_gem_active_put(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);

	might_sleep();
	GEM_WARN_ON(!msm_gem_is_locked(obj));

	if (--msm_obj->active_count == 0) {
		update_inactive(msm_obj);
	}
}

static void update_inactive(struct msm_gem_object *msm_obj)
{
	struct msm_drm_private *priv = msm_obj->base.dev->dev_private;

	GEM_WARN_ON(!msm_gem_is_locked(&msm_obj->base));

	if (msm_obj->active_count != 0)
		return;

	mutex_lock(&priv->mm_lock);

	if (msm_obj->dontneed)
		mark_unpurgeable(msm_obj);
	if (msm_obj->evictable)
		mark_unevictable(msm_obj);

	list_del(&msm_obj->mm_list);
	if ((msm_obj->madv == MSM_MADV_WILLNEED) && msm_obj->sgt) {
		list_add_tail(&msm_obj->mm_list, &priv->inactive_willneed);
		mark_evictable(msm_obj);
	} else if (msm_obj->madv == MSM_MADV_DONTNEED) {
		list_add_tail(&msm_obj->mm_list, &priv->inactive_dontneed);
		mark_purgeable(msm_obj);
	} else {
		GEM_WARN_ON((msm_obj->madv != __MSM_MADV_PURGED) && msm_obj->sgt);
		list_add_tail(&msm_obj->mm_list, &priv->inactive_unpinned);
	}

	mutex_unlock(&priv->mm_lock);
}

int msm_gem_cpu_prep(struct drm_gem_object *obj, uint32_t op, ktime_t *timeout)
{
	bool write = !!(op & MSM_PREP_WRITE);
	unsigned long remain =
		op & MSM_PREP_NOSYNC ? 0 : timeout_to_jiffies(timeout);
	long ret;

	ret = dma_resv_wait_timeout_rcu(obj->resv, write,
			true, remain);
	if (ret == 0)
		return remain == 0 ? -EBUSY : -ETIMEDOUT;
	else if (ret < 0)
		return ret;

	/* TODO cache maintenance */

	return 0;
}

int msm_gem_cpu_fini(struct drm_gem_object *obj)
{
	/* TODO cache maintenance */
	return 0;
}

#ifdef CONFIG_DEBUG_FS
static void describe_fence(struct dma_fence *fence, const char *type,
		struct seq_file *m)
{
	if (!dma_fence_is_signaled(fence))
		seq_printf(m, "\t%9s: %s %s seq %llu\n", type,
				fence->ops->get_driver_name(fence),
				fence->ops->get_timeline_name(fence),
				fence->seqno);
}

void msm_gem_describe(struct drm_gem_object *obj, struct seq_file *m,
		struct msm_gem_stats *stats)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct dma_resv *robj = obj->resv;
	struct dma_resv_list *fobj;
	struct dma_fence *fence;
	struct msm_gem_vma *vma;
	uint64_t off = drm_vma_node_start(&obj->vma_node);
	const char *madv;

	msm_gem_lock(obj);

	stats->all.count++;
	stats->all.size += obj->size;

	if (is_active(msm_obj)) {
		stats->active.count++;
		stats->active.size += obj->size;
	}

	if (msm_obj->pages) {
		stats->resident.count++;
		stats->resident.size += obj->size;
	}

	switch (msm_obj->madv) {
	case __MSM_MADV_PURGED:
		stats->purged.count++;
		stats->purged.size += obj->size;
		madv = " purged";
		break;
	case MSM_MADV_DONTNEED:
		stats->purgeable.count++;
		stats->purgeable.size += obj->size;
		madv = " purgeable";
		break;
	case MSM_MADV_WILLNEED:
	default:
		madv = "";
		break;
	}

	seq_printf(m, "%08x: %c %2d (%2d) %08llx %p",
			msm_obj->flags, is_active(msm_obj) ? 'A' : 'I',
			obj->name, kref_read(&obj->refcount),
			off, msm_obj->vaddr);

	seq_printf(m, " %08zu %9s %-32s\n", obj->size, madv, msm_obj->name);

	if (!list_empty(&msm_obj->vmas)) {

		seq_puts(m, " vmas:");

		list_for_each_entry(vma, &msm_obj->vmas, list) {
			const char *name, *comm;
			if (vma->aspace) {
				struct msm_gem_address_space *aspace = vma->aspace;
				struct task_struct *task =
					get_pid_task(aspace->pid, PIDTYPE_PID);
				if (task) {
					comm = kstrdup(task->comm, GFP_KERNEL);
				} else {
					comm = NULL;
				}
				name = aspace->name;
			} else {
				name = comm = NULL;
			}
			seq_printf(m, " [%s%s%s: aspace=%p, %08llx,%s,inuse=%d]",
				name, comm ? ":" : "", comm ? comm : "",
				vma->aspace, vma->iova,
				vma->mapped ? "mapped" : "unmapped",
				vma->inuse);
			kfree(comm);
		}

		seq_puts(m, "\n");
	}

	rcu_read_lock();
	fobj = rcu_dereference(robj->fence);
	if (fobj) {
		unsigned int i, shared_count = fobj->shared_count;

		for (i = 0; i < shared_count; i++) {
			fence = rcu_dereference(fobj->shared[i]);
			describe_fence(fence, "Shared", m);
		}
	}

	fence = rcu_dereference(robj->fence_excl);
	if (fence)
		describe_fence(fence, "Exclusive", m);
	rcu_read_unlock();

	msm_gem_unlock(obj);
}

void msm_gem_describe_objects(struct list_head *list, struct seq_file *m)
{
	struct msm_gem_stats stats = {};
	struct msm_gem_object *msm_obj;

	seq_puts(m, " flags id ref offset kaddr size madv name\n");
	list_for_each_entry(msm_obj, list, node) {
		struct drm_gem_object *obj = &msm_obj->base;
		seq_puts(m, " ");
		msm_gem_describe(obj, m, &stats);
	}

	seq_printf(m, "Total: %4d objects, %9zu bytes\n",
			stats.all.count, stats.all.size);
	seq_printf(m, "Active: %4d objects, %9zu bytes\n",
			stats.active.count, stats.active.size);
	seq_printf(m, "Resident: %4d objects, %9zu bytes\n",
			stats.resident.count, stats.resident.size);
	seq_printf(m, "Purgeable: %4d objects, %9zu bytes\n",
			stats.purgeable.count, stats.purgeable.size);
	seq_printf(m, "Purged: %4d objects, %9zu bytes\n",
			stats.purged.count, stats.purged.size);
}
#endif

/* don't call directly! Use drm_gem_object_put_locked() and friends */
void msm_gem_free_object(struct drm_gem_object *obj)
{
	struct msm_gem_object *msm_obj = to_msm_bo(obj);
	struct drm_device *dev = obj->dev;
	struct msm_drm_private *priv = dev->dev_private;

	mutex_lock(&priv->obj_lock);
	list_del(&msm_obj->node);
	mutex_unlock(&priv->obj_lock);

	mutex_lock(&priv->mm_lock);
	if (msm_obj->dontneed)
		mark_unpurgeable(msm_obj);
	list_del(&msm_obj->mm_list);
	mutex_unlock(&priv->mm_lock);

	msm_gem_lock(obj);

	/* object should not be on active list: */
	GEM_WARN_ON(is_active(msm_obj));

	put_iova_spaces(obj, true);

	if (obj->import_attach) {
		GEM_WARN_ON(msm_obj->vaddr);

		/* Don't drop the pages for imported dmabuf, as they are not
		 * ours, just free the array we allocated:
		 */
		kvfree(msm_obj->pages);

		put_iova_vmas(obj);

		/* dma_buf_detach() grabs resv lock, so we need to unlock
		 * prior to drm_prime_gem_destroy
		 */
		msm_gem_unlock(obj);

		drm_prime_gem_destroy(obj, msm_obj->sgt);
	} else {
		msm_gem_vunmap(obj);
		put_pages(obj);
		put_iova_vmas(obj);
		msm_gem_unlock(obj);
	}

	drm_gem_object_release(obj);

	kfree(msm_obj);
}

/* convenience method to construct a GEM buffer object, and userspace handle */
int msm_gem_new_handle(struct drm_device *dev, struct drm_file *file,
		uint32_t size, uint32_t flags, uint32_t *handle,
		char *name)
{
	struct drm_gem_object *obj;
	int ret;

	obj = msm_gem_new(dev, size, flags);

	if (IS_ERR(obj))
		return PTR_ERR(obj);

	if (name)
		msm_gem_object_set_name(obj, "%s", name);

	ret = drm_gem_handle_create(file, obj, handle);

	/* drop reference from allocate - handle holds it now */
	drm_gem_object_put(obj);

	return ret;
}

static const struct vm_operations_struct vm_ops = {
	.fault = msm_gem_fault,
	.open = drm_gem_vm_open,
	.close = drm_gem_vm_close,
};

static const struct drm_gem_object_funcs msm_gem_object_funcs = {
	.free = msm_gem_free_object,
	.pin = msm_gem_prime_pin,
	.unpin = msm_gem_prime_unpin,
	.get_sg_table = msm_gem_prime_get_sg_table,
	.vmap = msm_gem_prime_vmap,
	.vunmap = msm_gem_prime_vunmap,
	.vm_ops = &vm_ops,
};

static int msm_gem_new_impl(struct drm_device *dev,
		uint32_t size, uint32_t flags,
		struct drm_gem_object **obj)
{
	struct msm_gem_object *msm_obj;

	switch (flags & MSM_BO_CACHE_MASK) {
	case MSM_BO_UNCACHED:
	case MSM_BO_CACHED:
	case MSM_BO_WC:
		break;
	default:
		DRM_DEV_ERROR(dev->dev, "invalid cache flag: %x\n",
				(flags & MSM_BO_CACHE_MASK));
		return -EINVAL;
	}

	msm_obj = kzalloc(sizeof(*msm_obj), GFP_KERNEL);
	if (!msm_obj)
		return -ENOMEM;

	msm_obj->flags = flags;
	msm_obj->madv = MSM_MADV_WILLNEED;

	INIT_LIST_HEAD(&msm_obj->submit_entry);
	INIT_LIST_HEAD(&msm_obj->vmas);

	*obj = &msm_obj->base;
	(*obj)->funcs = &msm_gem_object_funcs;

	return 0;
}

static struct drm_gem_object *_msm_gem_new(struct drm_device *dev,
		uint32_t size, uint32_t flags, bool struct_mutex_locked)
{
	struct msm_drm_private *priv = dev->dev_private;
	struct msm_gem_object *msm_obj;
	struct drm_gem_object *obj = NULL;
	bool use_vram = false;
	int ret;

	size = PAGE_ALIGN(size);

	if (!msm_use_mmu(dev))
		use_vram = true;
	else if ((flags & (MSM_BO_STOLEN | MSM_BO_SCANOUT)) && priv->vram.size)
		use_vram = true;

	if (GEM_WARN_ON(use_vram && !priv->vram.size))
		return ERR_PTR(-EINVAL);

	/* Disallow zero sized objects as they make the underlying
	 * infrastructure grumpy
	 */
	if (size == 0)
		return ERR_PTR(-EINVAL);

	ret = msm_gem_new_impl(dev, size, flags, &obj);
	if (ret)
		goto fail;

	msm_obj = to_msm_bo(obj);

	if (use_vram) {
		struct msm_gem_vma *vma;
		struct page **pages;

		drm_gem_private_object_init(dev, obj, size);

		msm_gem_lock(obj);

		vma = add_vma(obj, NULL);
		msm_gem_unlock(obj);
		if (IS_ERR(vma)) {
			ret = PTR_ERR(vma);
			goto fail;
		}

		to_msm_bo(obj)->vram_node = &vma->node;

		msm_gem_lock(obj);
		pages = get_pages(obj);
		msm_gem_unlock(obj);
		if (IS_ERR(pages)) {
			ret = PTR_ERR(pages);
			goto fail;
		}

		vma->iova = physaddr(obj);
	} else {
		ret = drm_gem_object_init(dev, obj, size);
		if (ret)
			goto fail;
		/*
		 * Our buffers are kept pinned, so allocating them from the
		 * MOVABLE zone is a really bad idea, and conflicts with CMA.
		 * See comments above new_inode() why this is required _and_
		 * expected if you're going to pin these pages.
		 */
		mapping_set_gfp_mask(obj->filp->f_mapping, GFP_HIGHUSER);
	}

	mutex_lock(&priv->mm_lock);
	list_add_tail(&msm_obj->mm_list, &priv->inactive_unpinned);
	mutex_unlock(&priv->mm_lock);

	mutex_lock(&priv->obj_lock);
	list_add_tail(&msm_obj->node, &priv->objects);
	mutex_unlock(&priv->obj_lock);

	return obj;

fail:
	if (struct_mutex_locked) {
		drm_gem_object_put_locked(obj);
	} else {
		drm_gem_object_put(obj);
	}
	return ERR_PTR(ret);
}

struct drm_gem_object *msm_gem_new_locked(struct drm_device *dev,
		uint32_t size, uint32_t flags)
{
	return _msm_gem_new(dev, size, flags, true);
}

struct drm_gem_object *msm_gem_new(struct drm_device *dev,
		uint32_t size, uint32_t flags)
{
	return _msm_gem_new(dev, size, flags, false);
}

struct drm_gem_object *msm_gem_import(struct drm_device *dev,
		struct dma_buf *dmabuf, struct sg_table *sgt)
{
	struct msm_drm_private *priv = dev->dev_private;
	struct msm_gem_object *msm_obj;
	struct drm_gem_object *obj;
	uint32_t size;
	int ret, npages;

	/* if we don't have IOMMU, don't bother pretending we can import: */
	if (!msm_use_mmu(dev)) {
		DRM_DEV_ERROR(dev->dev, "cannot import without IOMMU\n");
		return ERR_PTR(-EINVAL);
	}

	size = PAGE_ALIGN(dmabuf->size);

	ret = msm_gem_new_impl(dev, size, MSM_BO_WC, &obj);
	if (ret)
		goto fail;

	drm_gem_private_object_init(dev, obj, size);

	npages = size / PAGE_SIZE;

	msm_obj = to_msm_bo(obj);
	msm_gem_lock(obj);
	msm_obj->sgt = sgt;
	msm_obj->pages = kvmalloc_array(npages, sizeof(struct page *), GFP_KERNEL);
	if (!msm_obj->pages) {
		msm_gem_unlock(obj);
		ret = -ENOMEM;
		goto fail;
	}

	ret = drm_prime_sg_to_page_array(sgt, msm_obj->pages, npages);
	if (ret) {
		msm_gem_unlock(obj);
		goto fail;
	}

	msm_gem_unlock(obj);

	mutex_lock(&priv->mm_lock);
	list_add_tail(&msm_obj->mm_list, &priv->inactive_unpinned);
	mutex_unlock(&priv->mm_lock);

	mutex_lock(&priv->obj_lock);
	list_add_tail(&msm_obj->node, &priv->objects);
	mutex_unlock(&priv->obj_lock);

	return obj;

fail:
	drm_gem_object_put(obj);
	return ERR_PTR(ret);
}

static void *_msm_gem_kernel_new(struct drm_device *dev, uint32_t size,
		uint32_t flags, struct msm_gem_address_space *aspace,
		struct drm_gem_object **bo, uint64_t *iova, bool locked)
{
	void *vaddr;
	struct drm_gem_object *obj = _msm_gem_new(dev, size, flags, locked);
	int ret;

	if (IS_ERR(obj))
		return ERR_CAST(obj);

	if (iova) {
		ret = msm_gem_get_and_pin_iova(obj, aspace, iova);
		if (ret)
			goto err;
	}

	vaddr = msm_gem_get_vaddr(obj);
	if (IS_ERR(vaddr)) {
		msm_gem_unpin_iova(obj, aspace);
		ret = PTR_ERR(vaddr);
		goto err;
	}

	if (bo)
		*bo = obj;

	return vaddr;
err:
	if (locked)
		drm_gem_object_put_locked(obj);
	else
		drm_gem_object_put(obj);

	return ERR_PTR(ret);
}

void *msm_gem_kernel_new(struct drm_device *dev, uint32_t size,
		uint32_t flags, struct msm_gem_address_space *aspace,
		struct drm_gem_object **bo, uint64_t *iova)
{
	return _msm_gem_kernel_new(dev, size, flags, aspace, bo, iova, false);
}
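
/*
 * Illustrative sketch (not a caller in this driver): msm_gem_kernel_new()
 * pairs with msm_gem_kernel_put() further below, which drops the vmap, the
 * iova pin and the object reference in one go. Assuming a caller with a
 * suitable "aspace":
 *
 *	struct drm_gem_object *bo;
 *	uint64_t iova;
 *	void *vaddr = msm_gem_kernel_new(dev, size, MSM_BO_WC, aspace, &bo, &iova);
 *	if (IS_ERR(vaddr))
 *		return PTR_ERR(vaddr);
 *	... use vaddr and iova ...
 *	msm_gem_kernel_put(bo, aspace, false);
 */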

void *msm_gem_kernel_new_locked(struct drm_device *dev, uint32_t size,
		uint32_t flags, struct msm_gem_address_space *aspace,
		struct drm_gem_object **bo, uint64_t *iova)
{
	return _msm_gem_kernel_new(dev, size, flags, aspace, bo, iova, true);
}

void msm_gem_kernel_put(struct drm_gem_object *bo,
		struct msm_gem_address_space *aspace, bool locked)
{
	if (IS_ERR_OR_NULL(bo))
		return;

	msm_gem_put_vaddr(bo);
	msm_gem_unpin_iova(bo, aspace);

	if (locked)
		drm_gem_object_put_locked(bo);
	else
		drm_gem_object_put(bo);
}

void msm_gem_object_set_name(struct drm_gem_object *bo, const char *fmt, ...)
{
	struct msm_gem_object *msm_obj = to_msm_bo(bo);
	va_list ap;

	if (!fmt)
		return;

	va_start(ap, fmt);
	vsnprintf(msm_obj->name, sizeof(msm_obj->name), fmt, ap);
	va_end(ap);
}