1 // SPDX-License-Identifier: GPL-2.0 OR MIT
2 /**************************************************************************
3  *
4  * Copyright 2009-2023 VMware, Inc., Palo Alto, CA., USA
5  *
6  * Permission is hereby granted, free of charge, to any person obtaining a
7  * copy of this software and associated documentation files (the
8  * "Software"), to deal in the Software without restriction, including
9  * without limitation the rights to use, copy, modify, merge, publish,
10  * distribute, sub license, and/or sell copies of the Software, and to
11  * permit persons to whom the Software is furnished to do so, subject to
12  * the following conditions:
13  *
14  * The above copyright notice and this permission notice (including the
15  * next paragraph) shall be included in all copies or substantial portions
16  * of the Software.
17  *
18  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
21  * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
22  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
23  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
24  * USE OR OTHER DEALINGS IN THE SOFTWARE.
25  *
26  **************************************************************************/
27 
28 #include "vmwgfx_bo.h"
29 #include "vmwgfx_drv.h"
30 #include <drm/ttm/ttm_placement.h>
31 
32 static const struct ttm_place vram_placement_flags = {
33 	.fpfn = 0,
34 	.lpfn = 0,
35 	.mem_type = TTM_PL_VRAM,
36 	.flags = 0
37 };
38 
39 static const struct ttm_place sys_placement_flags = {
40 	.fpfn = 0,
41 	.lpfn = 0,
42 	.mem_type = TTM_PL_SYSTEM,
43 	.flags = 0
44 };
45 
46 static const struct ttm_place gmr_placement_flags = {
47 	.fpfn = 0,
48 	.lpfn = 0,
49 	.mem_type = VMW_PL_GMR,
50 	.flags = 0
51 };
52 
53 struct ttm_placement vmw_vram_placement = {
54 	.num_placement = 1,
55 	.placement = &vram_placement_flags,
56 	.num_busy_placement = 1,
57 	.busy_placement = &vram_placement_flags
58 };
59 
60 static const struct ttm_place vram_gmr_placement_flags[] = {
61 	{
62 		.fpfn = 0,
63 		.lpfn = 0,
64 		.mem_type = TTM_PL_VRAM,
65 		.flags = 0
66 	}, {
67 		.fpfn = 0,
68 		.lpfn = 0,
69 		.mem_type = VMW_PL_GMR,
70 		.flags = 0
71 	}
72 };
73 
74 struct ttm_placement vmw_vram_gmr_placement = {
75 	.num_placement = 2,
76 	.placement = vram_gmr_placement_flags,
77 	.num_busy_placement = 1,
78 	.busy_placement = &gmr_placement_flags
79 };
80 
81 struct ttm_placement vmw_sys_placement = {
82 	.num_placement = 1,
83 	.placement = &sys_placement_flags,
84 	.num_busy_placement = 1,
85 	.busy_placement = &sys_placement_flags
86 };
87 
88 const size_t vmw_tt_size = sizeof(struct vmw_ttm_tt);
89 
90 /**
91  * __vmw_piter_non_sg_next: Helper functions to advance
92  * a struct vmw_piter iterator.
93  *
94  * @viter: Pointer to the iterator.
95  *
96  * These functions return false if past the end of the list,
97  * true otherwise. Functions are selected depending on the current
98  * DMA mapping mode.
99  */
100 static bool __vmw_piter_non_sg_next(struct vmw_piter *viter)
101 {
102 	return ++(viter->i) < viter->num_pages;
103 }
104 
105 static bool __vmw_piter_sg_next(struct vmw_piter *viter)
106 {
107 	bool ret = __vmw_piter_non_sg_next(viter);
108 
109 	return __sg_page_iter_dma_next(&viter->iter) && ret;
110 }
111 
112 
113 static dma_addr_t __vmw_piter_dma_addr(struct vmw_piter *viter)
114 {
115 	return viter->addrs[viter->i];
116 }
117 
118 static dma_addr_t __vmw_piter_sg_addr(struct vmw_piter *viter)
119 {
120 	return sg_page_iter_dma_address(&viter->iter);
121 }
122 
123 
124 /**
125  * vmw_piter_start - Initialize a struct vmw_piter.
126  *
127  * @viter: Pointer to the iterator to initialize
128  * @vsgt: Pointer to a struct vmw_sg_table to initialize from
129  * @p_offset: Pointer offset used to update current array position
130  *
131  * Note that we're following the convention of __sg_page_iter_start, so that
132  * the iterator doesn't point to a valid page after initialization; it has
133  * to be advanced one step first.
134  */
135 void vmw_piter_start(struct vmw_piter *viter, const struct vmw_sg_table *vsgt,
136 		     unsigned long p_offset)
137 {
138 	viter->i = p_offset - 1;
139 	viter->num_pages = vsgt->num_pages;
140 	viter->pages = vsgt->pages;
141 	switch (vsgt->mode) {
142 	case vmw_dma_alloc_coherent:
143 		viter->next = &__vmw_piter_non_sg_next;
144 		viter->dma_address = &__vmw_piter_dma_addr;
145 		viter->addrs = vsgt->addrs;
146 		break;
147 	case vmw_dma_map_populate:
148 	case vmw_dma_map_bind:
149 		viter->next = &__vmw_piter_sg_next;
150 		viter->dma_address = &__vmw_piter_sg_addr;
151 		__sg_page_iter_start(&viter->iter.base, vsgt->sgt->sgl,
152 				     vsgt->sgt->orig_nents, p_offset);
153 		break;
154 	default:
155 		BUG();
156 	}
157 }
158 
159 /**
160  * vmw_ttm_unmap_from_dma - unmap  device addresses previsouly mapped for
161  * TTM pages
162  *
163  * @vmw_tt: Pointer to a struct vmw_ttm_backend
164  *
165  * Used to free dma mappings previously mapped by vmw_ttm_map_for_dma.
166  */
167 static void vmw_ttm_unmap_from_dma(struct vmw_ttm_tt *vmw_tt)
168 {
169 	struct device *dev = vmw_tt->dev_priv->drm.dev;
170 
171 	dma_unmap_sgtable(dev, &vmw_tt->sgt, DMA_BIDIRECTIONAL, 0);
172 	vmw_tt->sgt.nents = vmw_tt->sgt.orig_nents;
173 }
174 
175 /**
176  * vmw_ttm_map_for_dma - map TTM pages to get device addresses
177  *
178  * @vmw_tt: Pointer to a struct vmw_ttm_backend
179  *
180  * This function is used to get device addresses from the kernel DMA layer.
181  * However, it's violating the DMA API in that when this operation has been
182  * performed, it's illegal for the CPU to write to the pages without first
183  * unmapping the DMA mappings, or calling dma_sync_sg_for_cpu(). It is
184  * therefore only legal to call this function if we know that the function
185  * dma_sync_sg_for_cpu() is a NOP, and dma_sync_sg_for_device() is at most
186  * a CPU write buffer flush.
187  */
188 static int vmw_ttm_map_for_dma(struct vmw_ttm_tt *vmw_tt)
189 {
190 	struct device *dev = vmw_tt->dev_priv->drm.dev;
191 
192 	return dma_map_sgtable(dev, &vmw_tt->sgt, DMA_BIDIRECTIONAL, 0);
193 }
194 
195 /**
196  * vmw_ttm_map_dma - Make sure TTM pages are visible to the device
197  *
198  * @vmw_tt: Pointer to a struct vmw_ttm_tt
199  *
200  * Select the correct function for and make sure the TTM pages are
201  * visible to the device. Allocate storage for the device mappings.
202  * If a mapping has already been performed, indicated by the storage
203  * pointer being non NULL, the function returns success.
204  */
205 static int vmw_ttm_map_dma(struct vmw_ttm_tt *vmw_tt)
206 {
207 	struct vmw_private *dev_priv = vmw_tt->dev_priv;
208 	struct vmw_sg_table *vsgt = &vmw_tt->vsgt;
209 	int ret = 0;
210 
211 	if (vmw_tt->mapped)
212 		return 0;
213 
214 	vsgt->mode = dev_priv->map_mode;
215 	vsgt->pages = vmw_tt->dma_ttm.pages;
216 	vsgt->num_pages = vmw_tt->dma_ttm.num_pages;
217 	vsgt->addrs = vmw_tt->dma_ttm.dma_address;
218 	vsgt->sgt = NULL;
219 
220 	switch (dev_priv->map_mode) {
221 	case vmw_dma_map_bind:
222 	case vmw_dma_map_populate:
223 		vsgt->sgt = &vmw_tt->sgt;
224 		ret = sg_alloc_table_from_pages_segment(
225 			&vmw_tt->sgt, vsgt->pages, vsgt->num_pages, 0,
226 			(unsigned long)vsgt->num_pages << PAGE_SHIFT,
227 			dma_get_max_seg_size(dev_priv->drm.dev), GFP_KERNEL);
228 		if (ret)
229 			goto out_sg_alloc_fail;
230 
231 		ret = vmw_ttm_map_for_dma(vmw_tt);
232 		if (unlikely(ret != 0))
233 			goto out_map_fail;
234 
235 		break;
236 	default:
237 		break;
238 	}
239 
240 	vmw_tt->mapped = true;
241 	return 0;
242 
243 out_map_fail:
244 	sg_free_table(vmw_tt->vsgt.sgt);
245 	vmw_tt->vsgt.sgt = NULL;
246 out_sg_alloc_fail:
247 	return ret;
248 }
249 
250 /**
251  * vmw_ttm_unmap_dma - Tear down any TTM page device mappings
252  *
253  * @vmw_tt: Pointer to a struct vmw_ttm_tt
254  *
255  * Tear down any previously set up device DMA mappings and free
256  * any storage space allocated for them. If there are no mappings set up,
257  * this function is a NOP.
258  */
259 static void vmw_ttm_unmap_dma(struct vmw_ttm_tt *vmw_tt)
260 {
261 	struct vmw_private *dev_priv = vmw_tt->dev_priv;
262 
263 	if (!vmw_tt->vsgt.sgt)
264 		return;
265 
266 	switch (dev_priv->map_mode) {
267 	case vmw_dma_map_bind:
268 	case vmw_dma_map_populate:
269 		vmw_ttm_unmap_from_dma(vmw_tt);
270 		sg_free_table(vmw_tt->vsgt.sgt);
271 		vmw_tt->vsgt.sgt = NULL;
272 		break;
273 	default:
274 		break;
275 	}
276 	vmw_tt->mapped = false;
277 }
278 
279 /**
280  * vmw_bo_sg_table - Return a struct vmw_sg_table object for a
281  * TTM buffer object
282  *
283  * @bo: Pointer to a struct ttm_buffer_object
284  *
285  * Returns a pointer to a struct vmw_sg_table object. The object should
286  * not be freed after use.
287  * Note that for the device addresses to be valid, the buffer object must
288  * either be reserved or pinned.
289  */
290 const struct vmw_sg_table *vmw_bo_sg_table(struct ttm_buffer_object *bo)
291 {
292 	struct vmw_ttm_tt *vmw_tt =
293 		container_of(bo->ttm, struct vmw_ttm_tt, dma_ttm);
294 
295 	return &vmw_tt->vsgt;
296 }
297 
298 
299 static int vmw_ttm_bind(struct ttm_device *bdev,
300 			struct ttm_tt *ttm, struct ttm_resource *bo_mem)
301 {
302 	struct vmw_ttm_tt *vmw_be =
303 		container_of(ttm, struct vmw_ttm_tt, dma_ttm);
304 	int ret = 0;
305 
306 	if (!bo_mem)
307 		return -EINVAL;
308 
309 	if (vmw_be->bound)
310 		return 0;
311 
312 	ret = vmw_ttm_map_dma(vmw_be);
313 	if (unlikely(ret != 0))
314 		return ret;
315 
316 	vmw_be->gmr_id = bo_mem->start;
317 	vmw_be->mem_type = bo_mem->mem_type;
318 
319 	switch (bo_mem->mem_type) {
320 	case VMW_PL_GMR:
321 		ret = vmw_gmr_bind(vmw_be->dev_priv, &vmw_be->vsgt,
322 				    ttm->num_pages, vmw_be->gmr_id);
323 		break;
324 	case VMW_PL_MOB:
325 		if (unlikely(vmw_be->mob == NULL)) {
326 			vmw_be->mob =
327 				vmw_mob_create(ttm->num_pages);
328 			if (unlikely(vmw_be->mob == NULL))
329 				return -ENOMEM;
330 		}
331 
332 		ret = vmw_mob_bind(vmw_be->dev_priv, vmw_be->mob,
333 				    &vmw_be->vsgt, ttm->num_pages,
334 				    vmw_be->gmr_id);
335 		break;
336 	case VMW_PL_SYSTEM:
337 		/* Nothing to be done for a system bind */
338 		break;
339 	default:
340 		BUG();
341 	}
342 	vmw_be->bound = true;
343 	return ret;
344 }
345 
346 static void vmw_ttm_unbind(struct ttm_device *bdev,
347 			   struct ttm_tt *ttm)
348 {
349 	struct vmw_ttm_tt *vmw_be =
350 		container_of(ttm, struct vmw_ttm_tt, dma_ttm);
351 
352 	if (!vmw_be->bound)
353 		return;
354 
355 	switch (vmw_be->mem_type) {
356 	case VMW_PL_GMR:
357 		vmw_gmr_unbind(vmw_be->dev_priv, vmw_be->gmr_id);
358 		break;
359 	case VMW_PL_MOB:
360 		vmw_mob_unbind(vmw_be->dev_priv, vmw_be->mob);
361 		break;
362 	case VMW_PL_SYSTEM:
363 		break;
364 	default:
365 		BUG();
366 	}
367 
368 	if (vmw_be->dev_priv->map_mode == vmw_dma_map_bind)
369 		vmw_ttm_unmap_dma(vmw_be);
370 	vmw_be->bound = false;
371 }
372 
373 
374 static void vmw_ttm_destroy(struct ttm_device *bdev, struct ttm_tt *ttm)
375 {
376 	struct vmw_ttm_tt *vmw_be =
377 		container_of(ttm, struct vmw_ttm_tt, dma_ttm);
378 
379 	vmw_ttm_unmap_dma(vmw_be);
380 	ttm_tt_fini(ttm);
381 	if (vmw_be->mob)
382 		vmw_mob_destroy(vmw_be->mob);
383 
384 	kfree(vmw_be);
385 }
386 
387 
388 static int vmw_ttm_populate(struct ttm_device *bdev,
389 			    struct ttm_tt *ttm, struct ttm_operation_ctx *ctx)
390 {
391 	int ret;
392 
393 	/* TODO: maybe completely drop this ? */
394 	if (ttm_tt_is_populated(ttm))
395 		return 0;
396 
397 	ret = ttm_pool_alloc(&bdev->pool, ttm, ctx);
398 
399 	return ret;
400 }
401 
402 static void vmw_ttm_unpopulate(struct ttm_device *bdev,
403 			       struct ttm_tt *ttm)
404 {
405 	struct vmw_ttm_tt *vmw_tt = container_of(ttm, struct vmw_ttm_tt,
406 						 dma_ttm);
407 
408 	vmw_ttm_unbind(bdev, ttm);
409 
410 	if (vmw_tt->mob) {
411 		vmw_mob_destroy(vmw_tt->mob);
412 		vmw_tt->mob = NULL;
413 	}
414 
415 	vmw_ttm_unmap_dma(vmw_tt);
416 
417 	ttm_pool_free(&bdev->pool, ttm);
418 }
419 
420 static struct ttm_tt *vmw_ttm_tt_create(struct ttm_buffer_object *bo,
421 					uint32_t page_flags)
422 {
423 	struct vmw_ttm_tt *vmw_be;
424 	int ret;
425 
426 	vmw_be = kzalloc(sizeof(*vmw_be), GFP_KERNEL);
427 	if (!vmw_be)
428 		return NULL;
429 
430 	vmw_be->dev_priv = vmw_priv_from_ttm(bo->bdev);
431 	vmw_be->mob = NULL;
432 
433 	if (vmw_be->dev_priv->map_mode == vmw_dma_alloc_coherent)
434 		ret = ttm_sg_tt_init(&vmw_be->dma_ttm, bo, page_flags,
435 				     ttm_cached);
436 	else
437 		ret = ttm_tt_init(&vmw_be->dma_ttm, bo, page_flags,
438 				  ttm_cached, 0);
439 	if (unlikely(ret != 0))
440 		goto out_no_init;
441 
442 	return &vmw_be->dma_ttm;
443 out_no_init:
444 	kfree(vmw_be);
445 	return NULL;
446 }
447 
448 static void vmw_evict_flags(struct ttm_buffer_object *bo,
449 		     struct ttm_placement *placement)
450 {
451 	*placement = vmw_sys_placement;
452 }
453 
454 static int vmw_ttm_io_mem_reserve(struct ttm_device *bdev, struct ttm_resource *mem)
455 {
456 	struct vmw_private *dev_priv = vmw_priv_from_ttm(bdev);
457 
458 	switch (mem->mem_type) {
459 	case TTM_PL_SYSTEM:
460 	case VMW_PL_SYSTEM:
461 	case VMW_PL_GMR:
462 	case VMW_PL_MOB:
463 		return 0;
464 	case TTM_PL_VRAM:
465 		mem->bus.offset = (mem->start << PAGE_SHIFT) +
466 			dev_priv->vram_start;
467 		mem->bus.is_iomem = true;
468 		mem->bus.caching = ttm_cached;
469 		break;
470 	default:
471 		return -EINVAL;
472 	}
473 	return 0;
474 }
475 
476 /**
477  * vmw_move_notify - TTM move_notify_callback
478  *
479  * @bo: The TTM buffer object about to move.
480  * @old_mem: The old memory where we move from
481  * @new_mem: The struct ttm_resource indicating to what memory
482  *       region the move is taking place.
483  *
484  * Calls move_notify for all subsystems needing it.
485  * (currently only resources).
486  */
487 static void vmw_move_notify(struct ttm_buffer_object *bo,
488 			    struct ttm_resource *old_mem,
489 			    struct ttm_resource *new_mem)
490 {
491 	vmw_bo_move_notify(bo, new_mem);
492 	vmw_query_move_notify(bo, old_mem, new_mem);
493 }
494 
495 
496 /**
497  * vmw_swap_notify - TTM move_notify_callback
498  *
499  * @bo: The TTM buffer object about to be swapped out.
500  */
501 static void vmw_swap_notify(struct ttm_buffer_object *bo)
502 {
503 	vmw_bo_swap_notify(bo);
504 	(void) ttm_bo_wait(bo, false, false);
505 }
506 
507 static bool vmw_memtype_is_system(uint32_t mem_type)
508 {
509 	return mem_type == TTM_PL_SYSTEM || mem_type == VMW_PL_SYSTEM;
510 }
511 
512 static int vmw_move(struct ttm_buffer_object *bo,
513 		    bool evict,
514 		    struct ttm_operation_ctx *ctx,
515 		    struct ttm_resource *new_mem,
516 		    struct ttm_place *hop)
517 {
518 	struct ttm_resource_manager *new_man;
519 	struct ttm_resource_manager *old_man = NULL;
520 	int ret = 0;
521 
522 	new_man = ttm_manager_type(bo->bdev, new_mem->mem_type);
523 	if (bo->resource)
524 		old_man = ttm_manager_type(bo->bdev, bo->resource->mem_type);
525 
526 	if (new_man->use_tt && !vmw_memtype_is_system(new_mem->mem_type)) {
527 		ret = vmw_ttm_bind(bo->bdev, bo->ttm, new_mem);
528 		if (ret)
529 			return ret;
530 	}
531 
532 	if (!bo->resource || (bo->resource->mem_type == TTM_PL_SYSTEM &&
533 			      bo->ttm == NULL)) {
534 		ttm_bo_move_null(bo, new_mem);
535 		return 0;
536 	}
537 
538 	vmw_move_notify(bo, bo->resource, new_mem);
539 
540 	if (old_man && old_man->use_tt && new_man->use_tt) {
541 		if (vmw_memtype_is_system(bo->resource->mem_type)) {
542 			ttm_bo_move_null(bo, new_mem);
543 			return 0;
544 		}
545 		ret = ttm_bo_wait_ctx(bo, ctx);
546 		if (ret)
547 			goto fail;
548 
549 		vmw_ttm_unbind(bo->bdev, bo->ttm);
550 		ttm_resource_free(bo, &bo->resource);
551 		ttm_bo_assign_mem(bo, new_mem);
552 		return 0;
553 	} else {
554 		ret = ttm_bo_move_memcpy(bo, ctx, new_mem);
555 		if (ret)
556 			goto fail;
557 	}
558 	return 0;
559 fail:
560 	vmw_move_notify(bo, new_mem, bo->resource);
561 	return ret;
562 }
563 
564 struct ttm_device_funcs vmw_bo_driver = {
565 	.ttm_tt_create = &vmw_ttm_tt_create,
566 	.ttm_tt_populate = &vmw_ttm_populate,
567 	.ttm_tt_unpopulate = &vmw_ttm_unpopulate,
568 	.ttm_tt_destroy = &vmw_ttm_destroy,
569 	.eviction_valuable = ttm_bo_eviction_valuable,
570 	.evict_flags = vmw_evict_flags,
571 	.move = vmw_move,
572 	.swap_notify = vmw_swap_notify,
573 	.io_mem_reserve = &vmw_ttm_io_mem_reserve,
574 };
575 
576 int vmw_bo_create_and_populate(struct vmw_private *dev_priv,
577 			       size_t bo_size, u32 domain,
578 			       struct vmw_bo **bo_p)
579 {
580 	struct ttm_operation_ctx ctx = {
581 		.interruptible = false,
582 		.no_wait_gpu = false
583 	};
584 	struct vmw_bo *vbo;
585 	int ret;
586 	struct vmw_bo_params bo_params = {
587 		.domain = domain,
588 		.busy_domain = domain,
589 		.bo_type = ttm_bo_type_kernel,
590 		.size = bo_size,
591 		.pin = true
592 	};
593 
594 	ret = vmw_bo_create(dev_priv, &bo_params, &vbo);
595 	if (unlikely(ret != 0))
596 		return ret;
597 
598 	ret = ttm_bo_reserve(&vbo->tbo, false, true, NULL);
599 	BUG_ON(ret != 0);
600 	ret = vmw_ttm_populate(vbo->tbo.bdev, vbo->tbo.ttm, &ctx);
601 	if (likely(ret == 0)) {
602 		struct vmw_ttm_tt *vmw_tt =
603 			container_of(vbo->tbo.ttm, struct vmw_ttm_tt, dma_ttm);
604 		ret = vmw_ttm_map_dma(vmw_tt);
605 	}
606 
607 	ttm_bo_unreserve(&vbo->tbo);
608 
609 	if (likely(ret == 0))
610 		*bo_p = vbo;
611 	return ret;
612 }
613