1 // SPDX-License-Identifier: GPL-2.0-only 2 /* 3 * Copyright (C) 2013 Red Hat 4 * Author: Rob Clark <robdclark@gmail.com> 5 */ 6 7 #include <linux/dma-map-ops.h> 8 #include <linux/spinlock.h> 9 #include <linux/shmem_fs.h> 10 #include <linux/dma-buf.h> 11 #include <linux/pfn_t.h> 12 13 #include <drm/drm_prime.h> 14 15 #include "msm_drv.h" 16 #include "msm_fence.h" 17 #include "msm_gem.h" 18 #include "msm_gpu.h" 19 #include "msm_mmu.h" 20 21 static void update_inactive(struct msm_gem_object *msm_obj); 22 23 static dma_addr_t physaddr(struct drm_gem_object *obj) 24 { 25 struct msm_gem_object *msm_obj = to_msm_bo(obj); 26 struct msm_drm_private *priv = obj->dev->dev_private; 27 return (((dma_addr_t)msm_obj->vram_node->start) << PAGE_SHIFT) + 28 priv->vram.paddr; 29 } 30 31 static bool use_pages(struct drm_gem_object *obj) 32 { 33 struct msm_gem_object *msm_obj = to_msm_bo(obj); 34 return !msm_obj->vram_node; 35 } 36 37 /* 38 * Cache sync.. this is a bit over-complicated, to fit dma-mapping 39 * API. Really GPU cache is out of scope here (handled on cmdstream) 40 * and all we need to do is invalidate newly allocated pages before 41 * mapping to CPU as uncached/writecombine. 42 * 43 * On top of this, we have the added headache, that depending on 44 * display generation, the display's iommu may be wired up to either 45 * the toplevel drm device (mdss), or to the mdp sub-node, meaning 46 * that here we either have dma-direct or iommu ops. 47 * 48 * Let this be a cautionary tail of abstraction gone wrong. 49 */ 50 51 static void sync_for_device(struct msm_gem_object *msm_obj) 52 { 53 struct device *dev = msm_obj->base.dev->dev; 54 55 dma_map_sgtable(dev, msm_obj->sgt, DMA_BIDIRECTIONAL, 0); 56 } 57 58 static void sync_for_cpu(struct msm_gem_object *msm_obj) 59 { 60 struct device *dev = msm_obj->base.dev->dev; 61 62 dma_unmap_sgtable(dev, msm_obj->sgt, DMA_BIDIRECTIONAL, 0); 63 } 64 65 /* allocate pages from VRAM carveout, used when no IOMMU: */ 66 static struct page **get_pages_vram(struct drm_gem_object *obj, int npages) 67 { 68 struct msm_gem_object *msm_obj = to_msm_bo(obj); 69 struct msm_drm_private *priv = obj->dev->dev_private; 70 dma_addr_t paddr; 71 struct page **p; 72 int ret, i; 73 74 p = kvmalloc_array(npages, sizeof(struct page *), GFP_KERNEL); 75 if (!p) 76 return ERR_PTR(-ENOMEM); 77 78 spin_lock(&priv->vram.lock); 79 ret = drm_mm_insert_node(&priv->vram.mm, msm_obj->vram_node, npages); 80 spin_unlock(&priv->vram.lock); 81 if (ret) { 82 kvfree(p); 83 return ERR_PTR(ret); 84 } 85 86 paddr = physaddr(obj); 87 for (i = 0; i < npages; i++) { 88 p[i] = phys_to_page(paddr); 89 paddr += PAGE_SIZE; 90 } 91 92 return p; 93 } 94 95 static struct page **get_pages(struct drm_gem_object *obj) 96 { 97 struct msm_gem_object *msm_obj = to_msm_bo(obj); 98 99 WARN_ON(!msm_gem_is_locked(obj)); 100 101 if (!msm_obj->pages) { 102 struct drm_device *dev = obj->dev; 103 struct page **p; 104 int npages = obj->size >> PAGE_SHIFT; 105 106 if (use_pages(obj)) 107 p = drm_gem_get_pages(obj); 108 else 109 p = get_pages_vram(obj, npages); 110 111 if (IS_ERR(p)) { 112 DRM_DEV_ERROR(dev->dev, "could not get pages: %ld\n", 113 PTR_ERR(p)); 114 return p; 115 } 116 117 msm_obj->pages = p; 118 119 msm_obj->sgt = drm_prime_pages_to_sg(obj->dev, p, npages); 120 if (IS_ERR(msm_obj->sgt)) { 121 void *ptr = ERR_CAST(msm_obj->sgt); 122 123 DRM_DEV_ERROR(dev->dev, "failed to allocate sgt\n"); 124 msm_obj->sgt = NULL; 125 return ptr; 126 } 127 128 /* For non-cached buffers, ensure the new pages are clean 129 * because display controller, GPU, etc. are not coherent: 130 */ 131 if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED)) 132 sync_for_device(msm_obj); 133 } 134 135 return msm_obj->pages; 136 } 137 138 static void put_pages_vram(struct drm_gem_object *obj) 139 { 140 struct msm_gem_object *msm_obj = to_msm_bo(obj); 141 struct msm_drm_private *priv = obj->dev->dev_private; 142 143 spin_lock(&priv->vram.lock); 144 drm_mm_remove_node(msm_obj->vram_node); 145 spin_unlock(&priv->vram.lock); 146 147 kvfree(msm_obj->pages); 148 } 149 150 static void put_pages(struct drm_gem_object *obj) 151 { 152 struct msm_gem_object *msm_obj = to_msm_bo(obj); 153 154 if (msm_obj->pages) { 155 if (msm_obj->sgt) { 156 /* For non-cached buffers, ensure the new 157 * pages are clean because display controller, 158 * GPU, etc. are not coherent: 159 */ 160 if (msm_obj->flags & (MSM_BO_WC|MSM_BO_UNCACHED)) 161 sync_for_cpu(msm_obj); 162 163 sg_free_table(msm_obj->sgt); 164 kfree(msm_obj->sgt); 165 } 166 167 if (use_pages(obj)) 168 drm_gem_put_pages(obj, msm_obj->pages, true, false); 169 else 170 put_pages_vram(obj); 171 172 msm_obj->pages = NULL; 173 } 174 } 175 176 struct page **msm_gem_get_pages(struct drm_gem_object *obj) 177 { 178 struct msm_gem_object *msm_obj = to_msm_bo(obj); 179 struct page **p; 180 181 msm_gem_lock(obj); 182 183 if (WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED)) { 184 msm_gem_unlock(obj); 185 return ERR_PTR(-EBUSY); 186 } 187 188 p = get_pages(obj); 189 msm_gem_unlock(obj); 190 return p; 191 } 192 193 void msm_gem_put_pages(struct drm_gem_object *obj) 194 { 195 /* when we start tracking the pin count, then do something here */ 196 } 197 198 int msm_gem_mmap_obj(struct drm_gem_object *obj, 199 struct vm_area_struct *vma) 200 { 201 struct msm_gem_object *msm_obj = to_msm_bo(obj); 202 203 vma->vm_flags &= ~VM_PFNMAP; 204 vma->vm_flags |= VM_MIXEDMAP; 205 206 if (msm_obj->flags & MSM_BO_WC) { 207 vma->vm_page_prot = pgprot_writecombine(vm_get_page_prot(vma->vm_flags)); 208 } else if (msm_obj->flags & MSM_BO_UNCACHED) { 209 vma->vm_page_prot = pgprot_noncached(vm_get_page_prot(vma->vm_flags)); 210 } else { 211 /* 212 * Shunt off cached objs to shmem file so they have their own 213 * address_space (so unmap_mapping_range does what we want, 214 * in particular in the case of mmap'd dmabufs) 215 */ 216 vma->vm_pgoff = 0; 217 vma_set_file(vma, obj->filp); 218 219 vma->vm_page_prot = vm_get_page_prot(vma->vm_flags); 220 } 221 222 return 0; 223 } 224 225 int msm_gem_mmap(struct file *filp, struct vm_area_struct *vma) 226 { 227 int ret; 228 229 ret = drm_gem_mmap(filp, vma); 230 if (ret) { 231 DBG("mmap failed: %d", ret); 232 return ret; 233 } 234 235 return msm_gem_mmap_obj(vma->vm_private_data, vma); 236 } 237 238 static vm_fault_t msm_gem_fault(struct vm_fault *vmf) 239 { 240 struct vm_area_struct *vma = vmf->vma; 241 struct drm_gem_object *obj = vma->vm_private_data; 242 struct msm_gem_object *msm_obj = to_msm_bo(obj); 243 struct page **pages; 244 unsigned long pfn; 245 pgoff_t pgoff; 246 int err; 247 vm_fault_t ret; 248 249 /* 250 * vm_ops.open/drm_gem_mmap_obj and close get and put 251 * a reference on obj. So, we dont need to hold one here. 252 */ 253 err = msm_gem_lock_interruptible(obj); 254 if (err) { 255 ret = VM_FAULT_NOPAGE; 256 goto out; 257 } 258 259 if (WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED)) { 260 msm_gem_unlock(obj); 261 return VM_FAULT_SIGBUS; 262 } 263 264 /* make sure we have pages attached now */ 265 pages = get_pages(obj); 266 if (IS_ERR(pages)) { 267 ret = vmf_error(PTR_ERR(pages)); 268 goto out_unlock; 269 } 270 271 /* We don't use vmf->pgoff since that has the fake offset: */ 272 pgoff = (vmf->address - vma->vm_start) >> PAGE_SHIFT; 273 274 pfn = page_to_pfn(pages[pgoff]); 275 276 VERB("Inserting %p pfn %lx, pa %lx", (void *)vmf->address, 277 pfn, pfn << PAGE_SHIFT); 278 279 ret = vmf_insert_mixed(vma, vmf->address, __pfn_to_pfn_t(pfn, PFN_DEV)); 280 out_unlock: 281 msm_gem_unlock(obj); 282 out: 283 return ret; 284 } 285 286 /** get mmap offset */ 287 static uint64_t mmap_offset(struct drm_gem_object *obj) 288 { 289 struct drm_device *dev = obj->dev; 290 int ret; 291 292 WARN_ON(!msm_gem_is_locked(obj)); 293 294 /* Make it mmapable */ 295 ret = drm_gem_create_mmap_offset(obj); 296 297 if (ret) { 298 DRM_DEV_ERROR(dev->dev, "could not allocate mmap offset\n"); 299 return 0; 300 } 301 302 return drm_vma_node_offset_addr(&obj->vma_node); 303 } 304 305 uint64_t msm_gem_mmap_offset(struct drm_gem_object *obj) 306 { 307 uint64_t offset; 308 309 msm_gem_lock(obj); 310 offset = mmap_offset(obj); 311 msm_gem_unlock(obj); 312 return offset; 313 } 314 315 static struct msm_gem_vma *add_vma(struct drm_gem_object *obj, 316 struct msm_gem_address_space *aspace) 317 { 318 struct msm_gem_object *msm_obj = to_msm_bo(obj); 319 struct msm_gem_vma *vma; 320 321 WARN_ON(!msm_gem_is_locked(obj)); 322 323 vma = kzalloc(sizeof(*vma), GFP_KERNEL); 324 if (!vma) 325 return ERR_PTR(-ENOMEM); 326 327 vma->aspace = aspace; 328 329 list_add_tail(&vma->list, &msm_obj->vmas); 330 331 return vma; 332 } 333 334 static struct msm_gem_vma *lookup_vma(struct drm_gem_object *obj, 335 struct msm_gem_address_space *aspace) 336 { 337 struct msm_gem_object *msm_obj = to_msm_bo(obj); 338 struct msm_gem_vma *vma; 339 340 WARN_ON(!msm_gem_is_locked(obj)); 341 342 list_for_each_entry(vma, &msm_obj->vmas, list) { 343 if (vma->aspace == aspace) 344 return vma; 345 } 346 347 return NULL; 348 } 349 350 static void del_vma(struct msm_gem_vma *vma) 351 { 352 if (!vma) 353 return; 354 355 list_del(&vma->list); 356 kfree(vma); 357 } 358 359 /* Called with msm_obj locked */ 360 static void 361 put_iova_spaces(struct drm_gem_object *obj) 362 { 363 struct msm_gem_object *msm_obj = to_msm_bo(obj); 364 struct msm_gem_vma *vma; 365 366 WARN_ON(!msm_gem_is_locked(obj)); 367 368 list_for_each_entry(vma, &msm_obj->vmas, list) { 369 if (vma->aspace) { 370 msm_gem_purge_vma(vma->aspace, vma); 371 msm_gem_close_vma(vma->aspace, vma); 372 } 373 } 374 } 375 376 /* Called with msm_obj locked */ 377 static void 378 put_iova_vmas(struct drm_gem_object *obj) 379 { 380 struct msm_gem_object *msm_obj = to_msm_bo(obj); 381 struct msm_gem_vma *vma, *tmp; 382 383 WARN_ON(!msm_gem_is_locked(obj)); 384 385 list_for_each_entry_safe(vma, tmp, &msm_obj->vmas, list) { 386 del_vma(vma); 387 } 388 } 389 390 static int get_iova_locked(struct drm_gem_object *obj, 391 struct msm_gem_address_space *aspace, uint64_t *iova, 392 u64 range_start, u64 range_end) 393 { 394 struct msm_gem_vma *vma; 395 int ret = 0; 396 397 WARN_ON(!msm_gem_is_locked(obj)); 398 399 vma = lookup_vma(obj, aspace); 400 401 if (!vma) { 402 vma = add_vma(obj, aspace); 403 if (IS_ERR(vma)) 404 return PTR_ERR(vma); 405 406 ret = msm_gem_init_vma(aspace, vma, obj->size >> PAGE_SHIFT, 407 range_start, range_end); 408 if (ret) { 409 del_vma(vma); 410 return ret; 411 } 412 } 413 414 *iova = vma->iova; 415 return 0; 416 } 417 418 static int msm_gem_pin_iova(struct drm_gem_object *obj, 419 struct msm_gem_address_space *aspace) 420 { 421 struct msm_gem_object *msm_obj = to_msm_bo(obj); 422 struct msm_gem_vma *vma; 423 struct page **pages; 424 int prot = IOMMU_READ; 425 426 if (!(msm_obj->flags & MSM_BO_GPU_READONLY)) 427 prot |= IOMMU_WRITE; 428 429 if (msm_obj->flags & MSM_BO_MAP_PRIV) 430 prot |= IOMMU_PRIV; 431 432 WARN_ON(!msm_gem_is_locked(obj)); 433 434 if (WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED)) 435 return -EBUSY; 436 437 vma = lookup_vma(obj, aspace); 438 if (WARN_ON(!vma)) 439 return -EINVAL; 440 441 pages = get_pages(obj); 442 if (IS_ERR(pages)) 443 return PTR_ERR(pages); 444 445 return msm_gem_map_vma(aspace, vma, prot, 446 msm_obj->sgt, obj->size >> PAGE_SHIFT); 447 } 448 449 static int get_and_pin_iova_range_locked(struct drm_gem_object *obj, 450 struct msm_gem_address_space *aspace, uint64_t *iova, 451 u64 range_start, u64 range_end) 452 { 453 u64 local; 454 int ret; 455 456 WARN_ON(!msm_gem_is_locked(obj)); 457 458 ret = get_iova_locked(obj, aspace, &local, 459 range_start, range_end); 460 461 if (!ret) 462 ret = msm_gem_pin_iova(obj, aspace); 463 464 if (!ret) 465 *iova = local; 466 467 return ret; 468 } 469 470 /* 471 * get iova and pin it. Should have a matching put 472 * limits iova to specified range (in pages) 473 */ 474 int msm_gem_get_and_pin_iova_range(struct drm_gem_object *obj, 475 struct msm_gem_address_space *aspace, uint64_t *iova, 476 u64 range_start, u64 range_end) 477 { 478 int ret; 479 480 msm_gem_lock(obj); 481 ret = get_and_pin_iova_range_locked(obj, aspace, iova, range_start, range_end); 482 msm_gem_unlock(obj); 483 484 return ret; 485 } 486 487 int msm_gem_get_and_pin_iova_locked(struct drm_gem_object *obj, 488 struct msm_gem_address_space *aspace, uint64_t *iova) 489 { 490 return get_and_pin_iova_range_locked(obj, aspace, iova, 0, U64_MAX); 491 } 492 493 /* get iova and pin it. Should have a matching put */ 494 int msm_gem_get_and_pin_iova(struct drm_gem_object *obj, 495 struct msm_gem_address_space *aspace, uint64_t *iova) 496 { 497 return msm_gem_get_and_pin_iova_range(obj, aspace, iova, 0, U64_MAX); 498 } 499 500 /* 501 * Get an iova but don't pin it. Doesn't need a put because iovas are currently 502 * valid for the life of the object 503 */ 504 int msm_gem_get_iova(struct drm_gem_object *obj, 505 struct msm_gem_address_space *aspace, uint64_t *iova) 506 { 507 int ret; 508 509 msm_gem_lock(obj); 510 ret = get_iova_locked(obj, aspace, iova, 0, U64_MAX); 511 msm_gem_unlock(obj); 512 513 return ret; 514 } 515 516 /* get iova without taking a reference, used in places where you have 517 * already done a 'msm_gem_get_and_pin_iova' or 'msm_gem_get_iova' 518 */ 519 uint64_t msm_gem_iova(struct drm_gem_object *obj, 520 struct msm_gem_address_space *aspace) 521 { 522 struct msm_gem_vma *vma; 523 524 msm_gem_lock(obj); 525 vma = lookup_vma(obj, aspace); 526 msm_gem_unlock(obj); 527 WARN_ON(!vma); 528 529 return vma ? vma->iova : 0; 530 } 531 532 /* 533 * Locked variant of msm_gem_unpin_iova() 534 */ 535 void msm_gem_unpin_iova_locked(struct drm_gem_object *obj, 536 struct msm_gem_address_space *aspace) 537 { 538 struct msm_gem_vma *vma; 539 540 WARN_ON(!msm_gem_is_locked(obj)); 541 542 vma = lookup_vma(obj, aspace); 543 544 if (!WARN_ON(!vma)) 545 msm_gem_unmap_vma(aspace, vma); 546 } 547 548 /* 549 * Unpin a iova by updating the reference counts. The memory isn't actually 550 * purged until something else (shrinker, mm_notifier, destroy, etc) decides 551 * to get rid of it 552 */ 553 void msm_gem_unpin_iova(struct drm_gem_object *obj, 554 struct msm_gem_address_space *aspace) 555 { 556 msm_gem_lock(obj); 557 msm_gem_unpin_iova_locked(obj, aspace); 558 msm_gem_unlock(obj); 559 } 560 561 int msm_gem_dumb_create(struct drm_file *file, struct drm_device *dev, 562 struct drm_mode_create_dumb *args) 563 { 564 args->pitch = align_pitch(args->width, args->bpp); 565 args->size = PAGE_ALIGN(args->pitch * args->height); 566 return msm_gem_new_handle(dev, file, args->size, 567 MSM_BO_SCANOUT | MSM_BO_WC, &args->handle, "dumb"); 568 } 569 570 int msm_gem_dumb_map_offset(struct drm_file *file, struct drm_device *dev, 571 uint32_t handle, uint64_t *offset) 572 { 573 struct drm_gem_object *obj; 574 int ret = 0; 575 576 /* GEM does all our handle to object mapping */ 577 obj = drm_gem_object_lookup(file, handle); 578 if (obj == NULL) { 579 ret = -ENOENT; 580 goto fail; 581 } 582 583 *offset = msm_gem_mmap_offset(obj); 584 585 drm_gem_object_put(obj); 586 587 fail: 588 return ret; 589 } 590 591 static void *get_vaddr(struct drm_gem_object *obj, unsigned madv) 592 { 593 struct msm_gem_object *msm_obj = to_msm_bo(obj); 594 int ret = 0; 595 596 WARN_ON(!msm_gem_is_locked(obj)); 597 598 if (obj->import_attach) 599 return ERR_PTR(-ENODEV); 600 601 if (WARN_ON(msm_obj->madv > madv)) { 602 DRM_DEV_ERROR(obj->dev->dev, "Invalid madv state: %u vs %u\n", 603 msm_obj->madv, madv); 604 return ERR_PTR(-EBUSY); 605 } 606 607 /* increment vmap_count *before* vmap() call, so shrinker can 608 * check vmap_count (is_vunmapable()) outside of msm_obj lock. 609 * This guarantees that we won't try to msm_gem_vunmap() this 610 * same object from within the vmap() call (while we already 611 * hold msm_obj lock) 612 */ 613 msm_obj->vmap_count++; 614 615 if (!msm_obj->vaddr) { 616 struct page **pages = get_pages(obj); 617 if (IS_ERR(pages)) { 618 ret = PTR_ERR(pages); 619 goto fail; 620 } 621 msm_obj->vaddr = vmap(pages, obj->size >> PAGE_SHIFT, 622 VM_MAP, pgprot_writecombine(PAGE_KERNEL)); 623 if (msm_obj->vaddr == NULL) { 624 ret = -ENOMEM; 625 goto fail; 626 } 627 } 628 629 return msm_obj->vaddr; 630 631 fail: 632 msm_obj->vmap_count--; 633 return ERR_PTR(ret); 634 } 635 636 void *msm_gem_get_vaddr_locked(struct drm_gem_object *obj) 637 { 638 return get_vaddr(obj, MSM_MADV_WILLNEED); 639 } 640 641 void *msm_gem_get_vaddr(struct drm_gem_object *obj) 642 { 643 void *ret; 644 645 msm_gem_lock(obj); 646 ret = msm_gem_get_vaddr_locked(obj); 647 msm_gem_unlock(obj); 648 649 return ret; 650 } 651 652 /* 653 * Don't use this! It is for the very special case of dumping 654 * submits from GPU hangs or faults, were the bo may already 655 * be MSM_MADV_DONTNEED, but we know the buffer is still on the 656 * active list. 657 */ 658 void *msm_gem_get_vaddr_active(struct drm_gem_object *obj) 659 { 660 return get_vaddr(obj, __MSM_MADV_PURGED); 661 } 662 663 void msm_gem_put_vaddr_locked(struct drm_gem_object *obj) 664 { 665 struct msm_gem_object *msm_obj = to_msm_bo(obj); 666 667 WARN_ON(!msm_gem_is_locked(obj)); 668 WARN_ON(msm_obj->vmap_count < 1); 669 670 msm_obj->vmap_count--; 671 } 672 673 void msm_gem_put_vaddr(struct drm_gem_object *obj) 674 { 675 msm_gem_lock(obj); 676 msm_gem_put_vaddr_locked(obj); 677 msm_gem_unlock(obj); 678 } 679 680 /* Update madvise status, returns true if not purged, else 681 * false or -errno. 682 */ 683 int msm_gem_madvise(struct drm_gem_object *obj, unsigned madv) 684 { 685 struct msm_gem_object *msm_obj = to_msm_bo(obj); 686 687 msm_gem_lock(obj); 688 689 if (msm_obj->madv != __MSM_MADV_PURGED) 690 msm_obj->madv = madv; 691 692 madv = msm_obj->madv; 693 694 /* If the obj is inactive, we might need to move it 695 * between inactive lists 696 */ 697 if (msm_obj->active_count == 0) 698 update_inactive(msm_obj); 699 700 msm_gem_unlock(obj); 701 702 return (madv != __MSM_MADV_PURGED); 703 } 704 705 void msm_gem_purge(struct drm_gem_object *obj) 706 { 707 struct drm_device *dev = obj->dev; 708 struct msm_gem_object *msm_obj = to_msm_bo(obj); 709 710 WARN_ON(!is_purgeable(msm_obj)); 711 WARN_ON(obj->import_attach); 712 713 put_iova_spaces(obj); 714 715 msm_gem_vunmap(obj); 716 717 put_pages(obj); 718 719 put_iova_vmas(obj); 720 721 msm_obj->madv = __MSM_MADV_PURGED; 722 mark_unpurgable(msm_obj); 723 724 drm_vma_node_unmap(&obj->vma_node, dev->anon_inode->i_mapping); 725 drm_gem_free_mmap_offset(obj); 726 727 /* Our goal here is to return as much of the memory as 728 * is possible back to the system as we are called from OOM. 729 * To do this we must instruct the shmfs to drop all of its 730 * backing pages, *now*. 731 */ 732 shmem_truncate_range(file_inode(obj->filp), 0, (loff_t)-1); 733 734 invalidate_mapping_pages(file_inode(obj->filp)->i_mapping, 735 0, (loff_t)-1); 736 } 737 738 void msm_gem_vunmap(struct drm_gem_object *obj) 739 { 740 struct msm_gem_object *msm_obj = to_msm_bo(obj); 741 742 WARN_ON(!msm_gem_is_locked(obj)); 743 744 if (!msm_obj->vaddr || WARN_ON(!is_vunmapable(msm_obj))) 745 return; 746 747 vunmap(msm_obj->vaddr); 748 msm_obj->vaddr = NULL; 749 } 750 751 /* must be called before _move_to_active().. */ 752 int msm_gem_sync_object(struct drm_gem_object *obj, 753 struct msm_fence_context *fctx, bool exclusive) 754 { 755 struct dma_resv_list *fobj; 756 struct dma_fence *fence; 757 int i, ret; 758 759 fobj = dma_resv_get_list(obj->resv); 760 if (!fobj || (fobj->shared_count == 0)) { 761 fence = dma_resv_get_excl(obj->resv); 762 /* don't need to wait on our own fences, since ring is fifo */ 763 if (fence && (fence->context != fctx->context)) { 764 ret = dma_fence_wait(fence, true); 765 if (ret) 766 return ret; 767 } 768 } 769 770 if (!exclusive || !fobj) 771 return 0; 772 773 for (i = 0; i < fobj->shared_count; i++) { 774 fence = rcu_dereference_protected(fobj->shared[i], 775 dma_resv_held(obj->resv)); 776 if (fence->context != fctx->context) { 777 ret = dma_fence_wait(fence, true); 778 if (ret) 779 return ret; 780 } 781 } 782 783 return 0; 784 } 785 786 void msm_gem_active_get(struct drm_gem_object *obj, struct msm_gpu *gpu) 787 { 788 struct msm_gem_object *msm_obj = to_msm_bo(obj); 789 struct msm_drm_private *priv = obj->dev->dev_private; 790 791 might_sleep(); 792 WARN_ON(!msm_gem_is_locked(obj)); 793 WARN_ON(msm_obj->madv != MSM_MADV_WILLNEED); 794 WARN_ON(msm_obj->dontneed); 795 796 if (msm_obj->active_count++ == 0) { 797 mutex_lock(&priv->mm_lock); 798 list_del(&msm_obj->mm_list); 799 list_add_tail(&msm_obj->mm_list, &gpu->active_list); 800 mutex_unlock(&priv->mm_lock); 801 } 802 } 803 804 void msm_gem_active_put(struct drm_gem_object *obj) 805 { 806 struct msm_gem_object *msm_obj = to_msm_bo(obj); 807 808 might_sleep(); 809 WARN_ON(!msm_gem_is_locked(obj)); 810 811 if (--msm_obj->active_count == 0) { 812 update_inactive(msm_obj); 813 } 814 } 815 816 static void update_inactive(struct msm_gem_object *msm_obj) 817 { 818 struct msm_drm_private *priv = msm_obj->base.dev->dev_private; 819 820 mutex_lock(&priv->mm_lock); 821 WARN_ON(msm_obj->active_count != 0); 822 823 if (msm_obj->dontneed) 824 mark_unpurgable(msm_obj); 825 826 list_del(&msm_obj->mm_list); 827 if (msm_obj->madv == MSM_MADV_WILLNEED) { 828 list_add_tail(&msm_obj->mm_list, &priv->inactive_willneed); 829 } else if (msm_obj->madv == MSM_MADV_DONTNEED) { 830 list_add_tail(&msm_obj->mm_list, &priv->inactive_dontneed); 831 mark_purgable(msm_obj); 832 } else { 833 WARN_ON(msm_obj->madv != __MSM_MADV_PURGED); 834 list_add_tail(&msm_obj->mm_list, &priv->inactive_purged); 835 } 836 837 mutex_unlock(&priv->mm_lock); 838 } 839 840 int msm_gem_cpu_prep(struct drm_gem_object *obj, uint32_t op, ktime_t *timeout) 841 { 842 bool write = !!(op & MSM_PREP_WRITE); 843 unsigned long remain = 844 op & MSM_PREP_NOSYNC ? 0 : timeout_to_jiffies(timeout); 845 long ret; 846 847 ret = dma_resv_wait_timeout_rcu(obj->resv, write, 848 true, remain); 849 if (ret == 0) 850 return remain == 0 ? -EBUSY : -ETIMEDOUT; 851 else if (ret < 0) 852 return ret; 853 854 /* TODO cache maintenance */ 855 856 return 0; 857 } 858 859 int msm_gem_cpu_fini(struct drm_gem_object *obj) 860 { 861 /* TODO cache maintenance */ 862 return 0; 863 } 864 865 #ifdef CONFIG_DEBUG_FS 866 static void describe_fence(struct dma_fence *fence, const char *type, 867 struct seq_file *m) 868 { 869 if (!dma_fence_is_signaled(fence)) 870 seq_printf(m, "\t%9s: %s %s seq %llu\n", type, 871 fence->ops->get_driver_name(fence), 872 fence->ops->get_timeline_name(fence), 873 fence->seqno); 874 } 875 876 void msm_gem_describe(struct drm_gem_object *obj, struct seq_file *m, 877 struct msm_gem_stats *stats) 878 { 879 struct msm_gem_object *msm_obj = to_msm_bo(obj); 880 struct dma_resv *robj = obj->resv; 881 struct dma_resv_list *fobj; 882 struct dma_fence *fence; 883 struct msm_gem_vma *vma; 884 uint64_t off = drm_vma_node_start(&obj->vma_node); 885 const char *madv; 886 887 msm_gem_lock(obj); 888 889 stats->all.count++; 890 stats->all.size += obj->size; 891 892 if (is_active(msm_obj)) { 893 stats->active.count++; 894 stats->active.size += obj->size; 895 } 896 897 switch (msm_obj->madv) { 898 case __MSM_MADV_PURGED: 899 stats->purged.count++; 900 stats->purged.size += obj->size; 901 madv = " purged"; 902 break; 903 case MSM_MADV_DONTNEED: 904 stats->purgable.count++; 905 stats->purgable.size += obj->size; 906 madv = " purgeable"; 907 break; 908 case MSM_MADV_WILLNEED: 909 default: 910 madv = ""; 911 break; 912 } 913 914 seq_printf(m, "%08x: %c %2d (%2d) %08llx %p", 915 msm_obj->flags, is_active(msm_obj) ? 'A' : 'I', 916 obj->name, kref_read(&obj->refcount), 917 off, msm_obj->vaddr); 918 919 seq_printf(m, " %08zu %9s %-32s\n", obj->size, madv, msm_obj->name); 920 921 if (!list_empty(&msm_obj->vmas)) { 922 923 seq_puts(m, " vmas:"); 924 925 list_for_each_entry(vma, &msm_obj->vmas, list) { 926 const char *name, *comm; 927 if (vma->aspace) { 928 struct msm_gem_address_space *aspace = vma->aspace; 929 struct task_struct *task = 930 get_pid_task(aspace->pid, PIDTYPE_PID); 931 if (task) { 932 comm = kstrdup(task->comm, GFP_KERNEL); 933 } else { 934 comm = NULL; 935 } 936 name = aspace->name; 937 } else { 938 name = comm = NULL; 939 } 940 seq_printf(m, " [%s%s%s: aspace=%p, %08llx,%s,inuse=%d]", 941 name, comm ? ":" : "", comm ? comm : "", 942 vma->aspace, vma->iova, 943 vma->mapped ? "mapped" : "unmapped", 944 vma->inuse); 945 kfree(comm); 946 } 947 948 seq_puts(m, "\n"); 949 } 950 951 rcu_read_lock(); 952 fobj = rcu_dereference(robj->fence); 953 if (fobj) { 954 unsigned int i, shared_count = fobj->shared_count; 955 956 for (i = 0; i < shared_count; i++) { 957 fence = rcu_dereference(fobj->shared[i]); 958 describe_fence(fence, "Shared", m); 959 } 960 } 961 962 fence = rcu_dereference(robj->fence_excl); 963 if (fence) 964 describe_fence(fence, "Exclusive", m); 965 rcu_read_unlock(); 966 967 msm_gem_unlock(obj); 968 } 969 970 void msm_gem_describe_objects(struct list_head *list, struct seq_file *m) 971 { 972 struct msm_gem_stats stats = {}; 973 struct msm_gem_object *msm_obj; 974 975 seq_puts(m, " flags id ref offset kaddr size madv name\n"); 976 list_for_each_entry(msm_obj, list, node) { 977 struct drm_gem_object *obj = &msm_obj->base; 978 seq_puts(m, " "); 979 msm_gem_describe(obj, m, &stats); 980 } 981 982 seq_printf(m, "Total: %4d objects, %9zu bytes\n", 983 stats.all.count, stats.all.size); 984 seq_printf(m, "Active: %4d objects, %9zu bytes\n", 985 stats.active.count, stats.active.size); 986 seq_printf(m, "Purgable: %4d objects, %9zu bytes\n", 987 stats.purgable.count, stats.purgable.size); 988 seq_printf(m, "Purged: %4d objects, %9zu bytes\n", 989 stats.purged.count, stats.purged.size); 990 } 991 #endif 992 993 /* don't call directly! Use drm_gem_object_put_locked() and friends */ 994 void msm_gem_free_object(struct drm_gem_object *obj) 995 { 996 struct msm_gem_object *msm_obj = to_msm_bo(obj); 997 struct drm_device *dev = obj->dev; 998 struct msm_drm_private *priv = dev->dev_private; 999 1000 mutex_lock(&priv->obj_lock); 1001 list_del(&msm_obj->node); 1002 mutex_unlock(&priv->obj_lock); 1003 1004 mutex_lock(&priv->mm_lock); 1005 if (msm_obj->dontneed) 1006 mark_unpurgable(msm_obj); 1007 list_del(&msm_obj->mm_list); 1008 mutex_unlock(&priv->mm_lock); 1009 1010 msm_gem_lock(obj); 1011 1012 /* object should not be on active list: */ 1013 WARN_ON(is_active(msm_obj)); 1014 1015 put_iova_spaces(obj); 1016 1017 if (obj->import_attach) { 1018 WARN_ON(msm_obj->vaddr); 1019 1020 /* Don't drop the pages for imported dmabuf, as they are not 1021 * ours, just free the array we allocated: 1022 */ 1023 kvfree(msm_obj->pages); 1024 1025 put_iova_vmas(obj); 1026 1027 /* dma_buf_detach() grabs resv lock, so we need to unlock 1028 * prior to drm_prime_gem_destroy 1029 */ 1030 msm_gem_unlock(obj); 1031 1032 drm_prime_gem_destroy(obj, msm_obj->sgt); 1033 } else { 1034 msm_gem_vunmap(obj); 1035 put_pages(obj); 1036 put_iova_vmas(obj); 1037 msm_gem_unlock(obj); 1038 } 1039 1040 drm_gem_object_release(obj); 1041 1042 kfree(msm_obj); 1043 } 1044 1045 /* convenience method to construct a GEM buffer object, and userspace handle */ 1046 int msm_gem_new_handle(struct drm_device *dev, struct drm_file *file, 1047 uint32_t size, uint32_t flags, uint32_t *handle, 1048 char *name) 1049 { 1050 struct drm_gem_object *obj; 1051 int ret; 1052 1053 obj = msm_gem_new(dev, size, flags); 1054 1055 if (IS_ERR(obj)) 1056 return PTR_ERR(obj); 1057 1058 if (name) 1059 msm_gem_object_set_name(obj, "%s", name); 1060 1061 ret = drm_gem_handle_create(file, obj, handle); 1062 1063 /* drop reference from allocate - handle holds it now */ 1064 drm_gem_object_put(obj); 1065 1066 return ret; 1067 } 1068 1069 static const struct vm_operations_struct vm_ops = { 1070 .fault = msm_gem_fault, 1071 .open = drm_gem_vm_open, 1072 .close = drm_gem_vm_close, 1073 }; 1074 1075 static const struct drm_gem_object_funcs msm_gem_object_funcs = { 1076 .free = msm_gem_free_object, 1077 .pin = msm_gem_prime_pin, 1078 .unpin = msm_gem_prime_unpin, 1079 .get_sg_table = msm_gem_prime_get_sg_table, 1080 .vmap = msm_gem_prime_vmap, 1081 .vunmap = msm_gem_prime_vunmap, 1082 .vm_ops = &vm_ops, 1083 }; 1084 1085 static int msm_gem_new_impl(struct drm_device *dev, 1086 uint32_t size, uint32_t flags, 1087 struct drm_gem_object **obj) 1088 { 1089 struct msm_gem_object *msm_obj; 1090 1091 switch (flags & MSM_BO_CACHE_MASK) { 1092 case MSM_BO_UNCACHED: 1093 case MSM_BO_CACHED: 1094 case MSM_BO_WC: 1095 break; 1096 default: 1097 DRM_DEV_ERROR(dev->dev, "invalid cache flag: %x\n", 1098 (flags & MSM_BO_CACHE_MASK)); 1099 return -EINVAL; 1100 } 1101 1102 msm_obj = kzalloc(sizeof(*msm_obj), GFP_KERNEL); 1103 if (!msm_obj) 1104 return -ENOMEM; 1105 1106 msm_obj->flags = flags; 1107 msm_obj->madv = MSM_MADV_WILLNEED; 1108 1109 INIT_LIST_HEAD(&msm_obj->submit_entry); 1110 INIT_LIST_HEAD(&msm_obj->vmas); 1111 1112 *obj = &msm_obj->base; 1113 (*obj)->funcs = &msm_gem_object_funcs; 1114 1115 return 0; 1116 } 1117 1118 static struct drm_gem_object *_msm_gem_new(struct drm_device *dev, 1119 uint32_t size, uint32_t flags, bool struct_mutex_locked) 1120 { 1121 struct msm_drm_private *priv = dev->dev_private; 1122 struct msm_gem_object *msm_obj; 1123 struct drm_gem_object *obj = NULL; 1124 bool use_vram = false; 1125 int ret; 1126 1127 size = PAGE_ALIGN(size); 1128 1129 if (!msm_use_mmu(dev)) 1130 use_vram = true; 1131 else if ((flags & (MSM_BO_STOLEN | MSM_BO_SCANOUT)) && priv->vram.size) 1132 use_vram = true; 1133 1134 if (WARN_ON(use_vram && !priv->vram.size)) 1135 return ERR_PTR(-EINVAL); 1136 1137 /* Disallow zero sized objects as they make the underlying 1138 * infrastructure grumpy 1139 */ 1140 if (size == 0) 1141 return ERR_PTR(-EINVAL); 1142 1143 ret = msm_gem_new_impl(dev, size, flags, &obj); 1144 if (ret) 1145 goto fail; 1146 1147 msm_obj = to_msm_bo(obj); 1148 1149 if (use_vram) { 1150 struct msm_gem_vma *vma; 1151 struct page **pages; 1152 1153 drm_gem_private_object_init(dev, obj, size); 1154 1155 msm_gem_lock(obj); 1156 1157 vma = add_vma(obj, NULL); 1158 msm_gem_unlock(obj); 1159 if (IS_ERR(vma)) { 1160 ret = PTR_ERR(vma); 1161 goto fail; 1162 } 1163 1164 to_msm_bo(obj)->vram_node = &vma->node; 1165 1166 msm_gem_lock(obj); 1167 pages = get_pages(obj); 1168 msm_gem_unlock(obj); 1169 if (IS_ERR(pages)) { 1170 ret = PTR_ERR(pages); 1171 goto fail; 1172 } 1173 1174 vma->iova = physaddr(obj); 1175 } else { 1176 ret = drm_gem_object_init(dev, obj, size); 1177 if (ret) 1178 goto fail; 1179 /* 1180 * Our buffers are kept pinned, so allocating them from the 1181 * MOVABLE zone is a really bad idea, and conflicts with CMA. 1182 * See comments above new_inode() why this is required _and_ 1183 * expected if you're going to pin these pages. 1184 */ 1185 mapping_set_gfp_mask(obj->filp->f_mapping, GFP_HIGHUSER); 1186 } 1187 1188 mutex_lock(&priv->mm_lock); 1189 /* Initially obj is idle, obj->madv == WILLNEED: */ 1190 list_add_tail(&msm_obj->mm_list, &priv->inactive_willneed); 1191 mutex_unlock(&priv->mm_lock); 1192 1193 mutex_lock(&priv->obj_lock); 1194 list_add_tail(&msm_obj->node, &priv->objects); 1195 mutex_unlock(&priv->obj_lock); 1196 1197 return obj; 1198 1199 fail: 1200 if (struct_mutex_locked) { 1201 drm_gem_object_put_locked(obj); 1202 } else { 1203 drm_gem_object_put(obj); 1204 } 1205 return ERR_PTR(ret); 1206 } 1207 1208 struct drm_gem_object *msm_gem_new_locked(struct drm_device *dev, 1209 uint32_t size, uint32_t flags) 1210 { 1211 return _msm_gem_new(dev, size, flags, true); 1212 } 1213 1214 struct drm_gem_object *msm_gem_new(struct drm_device *dev, 1215 uint32_t size, uint32_t flags) 1216 { 1217 return _msm_gem_new(dev, size, flags, false); 1218 } 1219 1220 struct drm_gem_object *msm_gem_import(struct drm_device *dev, 1221 struct dma_buf *dmabuf, struct sg_table *sgt) 1222 { 1223 struct msm_drm_private *priv = dev->dev_private; 1224 struct msm_gem_object *msm_obj; 1225 struct drm_gem_object *obj; 1226 uint32_t size; 1227 int ret, npages; 1228 1229 /* if we don't have IOMMU, don't bother pretending we can import: */ 1230 if (!msm_use_mmu(dev)) { 1231 DRM_DEV_ERROR(dev->dev, "cannot import without IOMMU\n"); 1232 return ERR_PTR(-EINVAL); 1233 } 1234 1235 size = PAGE_ALIGN(dmabuf->size); 1236 1237 ret = msm_gem_new_impl(dev, size, MSM_BO_WC, &obj); 1238 if (ret) 1239 goto fail; 1240 1241 drm_gem_private_object_init(dev, obj, size); 1242 1243 npages = size / PAGE_SIZE; 1244 1245 msm_obj = to_msm_bo(obj); 1246 msm_gem_lock(obj); 1247 msm_obj->sgt = sgt; 1248 msm_obj->pages = kvmalloc_array(npages, sizeof(struct page *), GFP_KERNEL); 1249 if (!msm_obj->pages) { 1250 msm_gem_unlock(obj); 1251 ret = -ENOMEM; 1252 goto fail; 1253 } 1254 1255 ret = drm_prime_sg_to_page_array(sgt, msm_obj->pages, npages); 1256 if (ret) { 1257 msm_gem_unlock(obj); 1258 goto fail; 1259 } 1260 1261 msm_gem_unlock(obj); 1262 1263 mutex_lock(&priv->mm_lock); 1264 list_add_tail(&msm_obj->mm_list, &priv->inactive_willneed); 1265 mutex_unlock(&priv->mm_lock); 1266 1267 mutex_lock(&priv->obj_lock); 1268 list_add_tail(&msm_obj->node, &priv->objects); 1269 mutex_unlock(&priv->obj_lock); 1270 1271 return obj; 1272 1273 fail: 1274 drm_gem_object_put(obj); 1275 return ERR_PTR(ret); 1276 } 1277 1278 static void *_msm_gem_kernel_new(struct drm_device *dev, uint32_t size, 1279 uint32_t flags, struct msm_gem_address_space *aspace, 1280 struct drm_gem_object **bo, uint64_t *iova, bool locked) 1281 { 1282 void *vaddr; 1283 struct drm_gem_object *obj = _msm_gem_new(dev, size, flags, locked); 1284 int ret; 1285 1286 if (IS_ERR(obj)) 1287 return ERR_CAST(obj); 1288 1289 if (iova) { 1290 ret = msm_gem_get_and_pin_iova(obj, aspace, iova); 1291 if (ret) 1292 goto err; 1293 } 1294 1295 vaddr = msm_gem_get_vaddr(obj); 1296 if (IS_ERR(vaddr)) { 1297 msm_gem_unpin_iova(obj, aspace); 1298 ret = PTR_ERR(vaddr); 1299 goto err; 1300 } 1301 1302 if (bo) 1303 *bo = obj; 1304 1305 return vaddr; 1306 err: 1307 if (locked) 1308 drm_gem_object_put_locked(obj); 1309 else 1310 drm_gem_object_put(obj); 1311 1312 return ERR_PTR(ret); 1313 1314 } 1315 1316 void *msm_gem_kernel_new(struct drm_device *dev, uint32_t size, 1317 uint32_t flags, struct msm_gem_address_space *aspace, 1318 struct drm_gem_object **bo, uint64_t *iova) 1319 { 1320 return _msm_gem_kernel_new(dev, size, flags, aspace, bo, iova, false); 1321 } 1322 1323 void *msm_gem_kernel_new_locked(struct drm_device *dev, uint32_t size, 1324 uint32_t flags, struct msm_gem_address_space *aspace, 1325 struct drm_gem_object **bo, uint64_t *iova) 1326 { 1327 return _msm_gem_kernel_new(dev, size, flags, aspace, bo, iova, true); 1328 } 1329 1330 void msm_gem_kernel_put(struct drm_gem_object *bo, 1331 struct msm_gem_address_space *aspace, bool locked) 1332 { 1333 if (IS_ERR_OR_NULL(bo)) 1334 return; 1335 1336 msm_gem_put_vaddr(bo); 1337 msm_gem_unpin_iova(bo, aspace); 1338 1339 if (locked) 1340 drm_gem_object_put_locked(bo); 1341 else 1342 drm_gem_object_put(bo); 1343 } 1344 1345 void msm_gem_object_set_name(struct drm_gem_object *bo, const char *fmt, ...) 1346 { 1347 struct msm_gem_object *msm_obj = to_msm_bo(bo); 1348 va_list ap; 1349 1350 if (!fmt) 1351 return; 1352 1353 va_start(ap, fmt); 1354 vsnprintf(msm_obj->name, sizeof(msm_obj->name), fmt, ap); 1355 va_end(ap); 1356 } 1357