xref: /openbmc/linux/drivers/gpu/drm/lima/lima_gem.c (revision 5e2421ce)
1 // SPDX-License-Identifier: GPL-2.0 OR MIT
2 /* Copyright 2017-2019 Qiang Yu <yuq825@gmail.com> */
3 
4 #include <linux/mm.h>
5 #include <linux/sync_file.h>
6 #include <linux/pagemap.h>
7 #include <linux/shmem_fs.h>
8 #include <linux/dma-mapping.h>
9 
10 #include <drm/drm_file.h>
11 #include <drm/drm_syncobj.h>
12 #include <drm/drm_utils.h>
13 
14 #include <drm/lima_drm.h>
15 
16 #include "lima_drv.h"
17 #include "lima_gem.h"
18 #include "lima_vm.h"
19 
20 int lima_heap_alloc(struct lima_bo *bo, struct lima_vm *vm)
21 {
22 	struct page **pages;
23 	struct address_space *mapping = bo->base.base.filp->f_mapping;
24 	struct device *dev = bo->base.base.dev->dev;
25 	size_t old_size = bo->heap_size;
26 	size_t new_size = bo->heap_size ? bo->heap_size * 2 :
27 		(lima_heap_init_nr_pages << PAGE_SHIFT);
28 	struct sg_table sgt;
29 	int i, ret;
30 
31 	if (bo->heap_size >= bo->base.base.size)
32 		return -ENOSPC;
33 
34 	new_size = min(new_size, bo->base.base.size);
35 
36 	mutex_lock(&bo->base.pages_lock);
37 
38 	if (bo->base.pages) {
39 		pages = bo->base.pages;
40 	} else {
41 		pages = kvmalloc_array(bo->base.base.size >> PAGE_SHIFT,
42 				       sizeof(*pages), GFP_KERNEL | __GFP_ZERO);
43 		if (!pages) {
44 			mutex_unlock(&bo->base.pages_lock);
45 			return -ENOMEM;
46 		}
47 
48 		bo->base.pages = pages;
49 		bo->base.pages_use_count = 1;
50 
51 		mapping_set_unevictable(mapping);
52 	}
53 
54 	for (i = old_size >> PAGE_SHIFT; i < new_size >> PAGE_SHIFT; i++) {
55 		struct page *page = shmem_read_mapping_page(mapping, i);
56 
57 		if (IS_ERR(page)) {
58 			mutex_unlock(&bo->base.pages_lock);
59 			return PTR_ERR(page);
60 		}
61 		pages[i] = page;
62 	}
63 
64 	mutex_unlock(&bo->base.pages_lock);
65 
66 	ret = sg_alloc_table_from_pages(&sgt, pages, i, 0,
67 					new_size, GFP_KERNEL);
68 	if (ret)
69 		return ret;
70 
71 	if (bo->base.sgt) {
72 		dma_unmap_sgtable(dev, bo->base.sgt, DMA_BIDIRECTIONAL, 0);
73 		sg_free_table(bo->base.sgt);
74 	} else {
75 		bo->base.sgt = kmalloc(sizeof(*bo->base.sgt), GFP_KERNEL);
76 		if (!bo->base.sgt) {
77 			sg_free_table(&sgt);
78 			return -ENOMEM;
79 		}
80 	}
81 
82 	ret = dma_map_sgtable(dev, &sgt, DMA_BIDIRECTIONAL, 0);
83 	if (ret) {
84 		sg_free_table(&sgt);
85 		kfree(bo->base.sgt);
86 		bo->base.sgt = NULL;
87 		return ret;
88 	}
89 
90 	*bo->base.sgt = sgt;
91 
92 	if (vm) {
93 		ret = lima_vm_map_bo(vm, bo, old_size >> PAGE_SHIFT);
94 		if (ret)
95 			return ret;
96 	}
97 
98 	bo->heap_size = new_size;
99 	return 0;
100 }
101 
102 int lima_gem_create_handle(struct drm_device *dev, struct drm_file *file,
103 			   u32 size, u32 flags, u32 *handle)
104 {
105 	int err;
106 	gfp_t mask;
107 	struct drm_gem_shmem_object *shmem;
108 	struct drm_gem_object *obj;
109 	struct lima_bo *bo;
110 	bool is_heap = flags & LIMA_BO_FLAG_HEAP;
111 
112 	shmem = drm_gem_shmem_create(dev, size);
113 	if (IS_ERR(shmem))
114 		return PTR_ERR(shmem);
115 
116 	obj = &shmem->base;
117 
118 	/* Mali Utgard GPU can only support 32bit address space */
119 	mask = mapping_gfp_mask(obj->filp->f_mapping);
120 	mask &= ~__GFP_HIGHMEM;
121 	mask |= __GFP_DMA32;
122 	mapping_set_gfp_mask(obj->filp->f_mapping, mask);
123 
124 	if (is_heap) {
125 		bo = to_lima_bo(obj);
126 		err = lima_heap_alloc(bo, NULL);
127 		if (err)
128 			goto out;
129 	} else {
130 		struct sg_table *sgt = drm_gem_shmem_get_pages_sgt(shmem);
131 
132 		if (IS_ERR(sgt)) {
133 			err = PTR_ERR(sgt);
134 			goto out;
135 		}
136 	}
137 
138 	err = drm_gem_handle_create(file, obj, handle);
139 
140 out:
141 	/* drop reference from allocate - handle holds it now */
142 	drm_gem_object_put(obj);
143 
144 	return err;
145 }
146 
147 static void lima_gem_free_object(struct drm_gem_object *obj)
148 {
149 	struct lima_bo *bo = to_lima_bo(obj);
150 
151 	if (!list_empty(&bo->va))
152 		dev_err(obj->dev->dev, "lima gem free bo still has va\n");
153 
154 	drm_gem_shmem_free(&bo->base);
155 }
156 
157 static int lima_gem_object_open(struct drm_gem_object *obj, struct drm_file *file)
158 {
159 	struct lima_bo *bo = to_lima_bo(obj);
160 	struct lima_drm_priv *priv = to_lima_drm_priv(file);
161 	struct lima_vm *vm = priv->vm;
162 
163 	return lima_vm_bo_add(vm, bo, true);
164 }
165 
166 static void lima_gem_object_close(struct drm_gem_object *obj, struct drm_file *file)
167 {
168 	struct lima_bo *bo = to_lima_bo(obj);
169 	struct lima_drm_priv *priv = to_lima_drm_priv(file);
170 	struct lima_vm *vm = priv->vm;
171 
172 	lima_vm_bo_del(vm, bo);
173 }
174 
175 static int lima_gem_pin(struct drm_gem_object *obj)
176 {
177 	struct lima_bo *bo = to_lima_bo(obj);
178 
179 	if (bo->heap_size)
180 		return -EINVAL;
181 
182 	return drm_gem_shmem_pin(&bo->base);
183 }
184 
185 static int lima_gem_vmap(struct drm_gem_object *obj, struct dma_buf_map *map)
186 {
187 	struct lima_bo *bo = to_lima_bo(obj);
188 
189 	if (bo->heap_size)
190 		return -EINVAL;
191 
192 	return drm_gem_shmem_vmap(&bo->base, map);
193 }
194 
195 static int lima_gem_mmap(struct drm_gem_object *obj, struct vm_area_struct *vma)
196 {
197 	struct lima_bo *bo = to_lima_bo(obj);
198 
199 	if (bo->heap_size)
200 		return -EINVAL;
201 
202 	return drm_gem_shmem_mmap(&bo->base, vma);
203 }
204 
205 static const struct drm_gem_object_funcs lima_gem_funcs = {
206 	.free = lima_gem_free_object,
207 	.open = lima_gem_object_open,
208 	.close = lima_gem_object_close,
209 	.print_info = drm_gem_shmem_object_print_info,
210 	.pin = lima_gem_pin,
211 	.unpin = drm_gem_shmem_object_unpin,
212 	.get_sg_table = drm_gem_shmem_object_get_sg_table,
213 	.vmap = lima_gem_vmap,
214 	.vunmap = drm_gem_shmem_object_vunmap,
215 	.mmap = lima_gem_mmap,
216 	.vm_ops = &drm_gem_shmem_vm_ops,
217 };
218 
219 struct drm_gem_object *lima_gem_create_object(struct drm_device *dev, size_t size)
220 {
221 	struct lima_bo *bo;
222 
223 	bo = kzalloc(sizeof(*bo), GFP_KERNEL);
224 	if (!bo)
225 		return ERR_PTR(-ENOMEM);
226 
227 	mutex_init(&bo->lock);
228 	INIT_LIST_HEAD(&bo->va);
229 	bo->base.map_wc = true;
230 	bo->base.base.funcs = &lima_gem_funcs;
231 
232 	return &bo->base.base;
233 }
234 
235 int lima_gem_get_info(struct drm_file *file, u32 handle, u32 *va, u64 *offset)
236 {
237 	struct drm_gem_object *obj;
238 	struct lima_bo *bo;
239 	struct lima_drm_priv *priv = to_lima_drm_priv(file);
240 	struct lima_vm *vm = priv->vm;
241 
242 	obj = drm_gem_object_lookup(file, handle);
243 	if (!obj)
244 		return -ENOENT;
245 
246 	bo = to_lima_bo(obj);
247 
248 	*va = lima_vm_get_va(vm, bo);
249 
250 	*offset = drm_vma_node_offset_addr(&obj->vma_node);
251 
252 	drm_gem_object_put(obj);
253 	return 0;
254 }
255 
256 static int lima_gem_sync_bo(struct lima_sched_task *task, struct lima_bo *bo,
257 			    bool write, bool explicit)
258 {
259 	int err = 0;
260 
261 	if (!write) {
262 		err = dma_resv_reserve_shared(lima_bo_resv(bo), 1);
263 		if (err)
264 			return err;
265 	}
266 
267 	/* explicit sync use user passed dep fence */
268 	if (explicit)
269 		return 0;
270 
271 	return drm_sched_job_add_implicit_dependencies(&task->base,
272 						       &bo->base.base,
273 						       write);
274 }
275 
276 static int lima_gem_add_deps(struct drm_file *file, struct lima_submit *submit)
277 {
278 	int i, err;
279 
280 	for (i = 0; i < ARRAY_SIZE(submit->in_sync); i++) {
281 		struct dma_fence *fence = NULL;
282 
283 		if (!submit->in_sync[i])
284 			continue;
285 
286 		err = drm_syncobj_find_fence(file, submit->in_sync[i],
287 					     0, 0, &fence);
288 		if (err)
289 			return err;
290 
291 		err = drm_sched_job_add_dependency(&submit->task->base, fence);
292 		if (err) {
293 			dma_fence_put(fence);
294 			return err;
295 		}
296 	}
297 
298 	return 0;
299 }
300 
301 int lima_gem_submit(struct drm_file *file, struct lima_submit *submit)
302 {
303 	int i, err = 0;
304 	struct ww_acquire_ctx ctx;
305 	struct lima_drm_priv *priv = to_lima_drm_priv(file);
306 	struct lima_vm *vm = priv->vm;
307 	struct drm_syncobj *out_sync = NULL;
308 	struct dma_fence *fence;
309 	struct lima_bo **bos = submit->lbos;
310 
311 	if (submit->out_sync) {
312 		out_sync = drm_syncobj_find(file, submit->out_sync);
313 		if (!out_sync)
314 			return -ENOENT;
315 	}
316 
317 	for (i = 0; i < submit->nr_bos; i++) {
318 		struct drm_gem_object *obj;
319 		struct lima_bo *bo;
320 
321 		obj = drm_gem_object_lookup(file, submit->bos[i].handle);
322 		if (!obj) {
323 			err = -ENOENT;
324 			goto err_out0;
325 		}
326 
327 		bo = to_lima_bo(obj);
328 
329 		/* increase refcnt of gpu va map to prevent unmapped when executing,
330 		 * will be decreased when task done
331 		 */
332 		err = lima_vm_bo_add(vm, bo, false);
333 		if (err) {
334 			drm_gem_object_put(obj);
335 			goto err_out0;
336 		}
337 
338 		bos[i] = bo;
339 	}
340 
341 	err = drm_gem_lock_reservations((struct drm_gem_object **)bos,
342 					submit->nr_bos, &ctx);
343 	if (err)
344 		goto err_out0;
345 
346 	err = lima_sched_task_init(
347 		submit->task, submit->ctx->context + submit->pipe,
348 		bos, submit->nr_bos, vm);
349 	if (err)
350 		goto err_out1;
351 
352 	err = lima_gem_add_deps(file, submit);
353 	if (err)
354 		goto err_out2;
355 
356 	for (i = 0; i < submit->nr_bos; i++) {
357 		err = lima_gem_sync_bo(
358 			submit->task, bos[i],
359 			submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE,
360 			submit->flags & LIMA_SUBMIT_FLAG_EXPLICIT_FENCE);
361 		if (err)
362 			goto err_out2;
363 	}
364 
365 	fence = lima_sched_context_queue_task(submit->task);
366 
367 	for (i = 0; i < submit->nr_bos; i++) {
368 		if (submit->bos[i].flags & LIMA_SUBMIT_BO_WRITE)
369 			dma_resv_add_excl_fence(lima_bo_resv(bos[i]), fence);
370 		else
371 			dma_resv_add_shared_fence(lima_bo_resv(bos[i]), fence);
372 	}
373 
374 	drm_gem_unlock_reservations((struct drm_gem_object **)bos,
375 				    submit->nr_bos, &ctx);
376 
377 	for (i = 0; i < submit->nr_bos; i++)
378 		drm_gem_object_put(&bos[i]->base.base);
379 
380 	if (out_sync) {
381 		drm_syncobj_replace_fence(out_sync, fence);
382 		drm_syncobj_put(out_sync);
383 	}
384 
385 	dma_fence_put(fence);
386 
387 	return 0;
388 
389 err_out2:
390 	lima_sched_task_fini(submit->task);
391 err_out1:
392 	drm_gem_unlock_reservations((struct drm_gem_object **)bos,
393 				    submit->nr_bos, &ctx);
394 err_out0:
395 	for (i = 0; i < submit->nr_bos; i++) {
396 		if (!bos[i])
397 			break;
398 		lima_vm_bo_del(vm, bos[i]);
399 		drm_gem_object_put(&bos[i]->base.base);
400 	}
401 	if (out_sync)
402 		drm_syncobj_put(out_sync);
403 	return err;
404 }
405 
406 int lima_gem_wait(struct drm_file *file, u32 handle, u32 op, s64 timeout_ns)
407 {
408 	bool write = op & LIMA_GEM_WAIT_WRITE;
409 	long ret, timeout;
410 
411 	if (!op)
412 		return 0;
413 
414 	timeout = drm_timeout_abs_to_jiffies(timeout_ns);
415 
416 	ret = drm_gem_dma_resv_wait(file, handle, write, timeout);
417 	if (ret == -ETIME)
418 		ret = timeout ? -ETIMEDOUT : -EBUSY;
419 
420 	return ret;
421 }
422