xref: /openbmc/linux/drivers/dma-buf/dma-resv.c (revision 20e2fc42)
1 /*
2  * Copyright (C) 2012-2014 Canonical Ltd (Maarten Lankhorst)
3  *
4  * Based on bo.c which bears the following copyright notice,
5  * but is dual licensed:
6  *
7  * Copyright (c) 2006-2009 VMware, Inc., Palo Alto, CA., USA
8  * All Rights Reserved.
9  *
10  * Permission is hereby granted, free of charge, to any person obtaining a
11  * copy of this software and associated documentation files (the
12  * "Software"), to deal in the Software without restriction, including
13  * without limitation the rights to use, copy, modify, merge, publish,
14  * distribute, sub license, and/or sell copies of the Software, and to
15  * permit persons to whom the Software is furnished to do so, subject to
16  * the following conditions:
17  *
18  * The above copyright notice and this permission notice (including the
19  * next paragraph) shall be included in all copies or substantial portions
20  * of the Software.
21  *
22  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
23  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
24  * FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL
25  * THE COPYRIGHT HOLDERS, AUTHORS AND/OR ITS SUPPLIERS BE LIABLE FOR ANY CLAIM,
26  * DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
27  * OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
28  * USE OR OTHER DEALINGS IN THE SOFTWARE.
29  *
30  **************************************************************************/
31 /*
32  * Authors: Thomas Hellstrom <thellstrom-at-vmware-dot-com>
33  */
34 
35 #include <linux/dma-resv.h>
36 #include <linux/export.h>
37 
38 /**
39  * DOC: Reservation Object Overview
40  *
41  * The reservation object provides a mechanism to manage shared and
42  * exclusive fences associated with a buffer.  A reservation object
43  * can have attached one exclusive fence (normally associated with
44  * write operations) or N shared fences (read operations).  The RCU
45  * mechanism is used to protect read access to fences from locked
46  * write-side updates.
47  */
48 
49 DEFINE_WD_CLASS(reservation_ww_class);
50 EXPORT_SYMBOL(reservation_ww_class);
51 
52 struct lock_class_key reservation_seqcount_class;
53 EXPORT_SYMBOL(reservation_seqcount_class);
54 
55 const char reservation_seqcount_string[] = "reservation_seqcount";
56 EXPORT_SYMBOL(reservation_seqcount_string);
57 
58 /**
59  * dma_resv_list_alloc - allocate fence list
60  * @shared_max: number of fences we need space for
61  *
62  * Allocate a new dma_resv_list and make sure to correctly initialize
63  * shared_max.
64  */
65 static struct dma_resv_list *dma_resv_list_alloc(unsigned int shared_max)
66 {
67 	struct dma_resv_list *list;
68 
69 	list = kmalloc(offsetof(typeof(*list), shared[shared_max]), GFP_KERNEL);
70 	if (!list)
71 		return NULL;
72 
73 	list->shared_max = (ksize(list) - offsetof(typeof(*list), shared)) /
74 		sizeof(*list->shared);
75 
76 	return list;
77 }
78 
79 /**
80  * dma_resv_list_free - free fence list
81  * @list: list to free
82  *
83  * Free a dma_resv_list and make sure to drop all references.
84  */
85 static void dma_resv_list_free(struct dma_resv_list *list)
86 {
87 	unsigned int i;
88 
89 	if (!list)
90 		return;
91 
92 	for (i = 0; i < list->shared_count; ++i)
93 		dma_fence_put(rcu_dereference_protected(list->shared[i], true));
94 
95 	kfree_rcu(list, rcu);
96 }
97 
98 /**
99  * dma_resv_init - initialize a reservation object
100  * @obj: the reservation object
101  */
102 void dma_resv_init(struct dma_resv *obj)
103 {
104 	ww_mutex_init(&obj->lock, &reservation_ww_class);
105 
106 	__seqcount_init(&obj->seq, reservation_seqcount_string,
107 			&reservation_seqcount_class);
108 	RCU_INIT_POINTER(obj->fence, NULL);
109 	RCU_INIT_POINTER(obj->fence_excl, NULL);
110 }
111 EXPORT_SYMBOL(dma_resv_init);
112 
113 /**
114  * dma_resv_fini - destroys a reservation object
115  * @obj: the reservation object
116  */
117 void dma_resv_fini(struct dma_resv *obj)
118 {
119 	struct dma_resv_list *fobj;
120 	struct dma_fence *excl;
121 
122 	/*
123 	 * This object should be dead and all references must have
124 	 * been released to it, so no need to be protected with rcu.
125 	 */
126 	excl = rcu_dereference_protected(obj->fence_excl, 1);
127 	if (excl)
128 		dma_fence_put(excl);
129 
130 	fobj = rcu_dereference_protected(obj->fence, 1);
131 	dma_resv_list_free(fobj);
132 	ww_mutex_destroy(&obj->lock);
133 }
134 EXPORT_SYMBOL(dma_resv_fini);
135 
136 /**
137  * dma_resv_reserve_shared - Reserve space to add shared fences to
138  * a dma_resv.
139  * @obj: reservation object
140  * @num_fences: number of fences we want to add
141  *
142  * Should be called before dma_resv_add_shared_fence().  Must
143  * be called with obj->lock held.
144  *
145  * RETURNS
146  * Zero for success, or -errno
147  */
148 int dma_resv_reserve_shared(struct dma_resv *obj, unsigned int num_fences)
149 {
150 	struct dma_resv_list *old, *new;
151 	unsigned int i, j, k, max;
152 
153 	dma_resv_assert_held(obj);
154 
155 	old = dma_resv_get_list(obj);
156 
157 	if (old && old->shared_max) {
158 		if ((old->shared_count + num_fences) <= old->shared_max)
159 			return 0;
160 		else
161 			max = max(old->shared_count + num_fences,
162 				  old->shared_max * 2);
163 	} else {
164 		max = 4;
165 	}
166 
167 	new = dma_resv_list_alloc(max);
168 	if (!new)
169 		return -ENOMEM;
170 
171 	/*
172 	 * no need to bump fence refcounts, rcu_read access
173 	 * requires the use of kref_get_unless_zero, and the
174 	 * references from the old struct are carried over to
175 	 * the new.
176 	 */
177 	for (i = 0, j = 0, k = max; i < (old ? old->shared_count : 0); ++i) {
178 		struct dma_fence *fence;
179 
180 		fence = rcu_dereference_protected(old->shared[i],
181 						  dma_resv_held(obj));
182 		if (dma_fence_is_signaled(fence))
183 			RCU_INIT_POINTER(new->shared[--k], fence);
184 		else
185 			RCU_INIT_POINTER(new->shared[j++], fence);
186 	}
187 	new->shared_count = j;
188 
189 	/*
190 	 * We are not changing the effective set of fences here so can
191 	 * merely update the pointer to the new array; both existing
192 	 * readers and new readers will see exactly the same set of
193 	 * active (unsignaled) shared fences. Individual fences and the
194 	 * old array are protected by RCU and so will not vanish under
195 	 * the gaze of the rcu_read_lock() readers.
196 	 */
197 	rcu_assign_pointer(obj->fence, new);
198 
199 	if (!old)
200 		return 0;
201 
202 	/* Drop the references to the signaled fences */
203 	for (i = k; i < max; ++i) {
204 		struct dma_fence *fence;
205 
206 		fence = rcu_dereference_protected(new->shared[i],
207 						  dma_resv_held(obj));
208 		dma_fence_put(fence);
209 	}
210 	kfree_rcu(old, rcu);
211 
212 	return 0;
213 }
214 EXPORT_SYMBOL(dma_resv_reserve_shared);
215 
216 /**
217  * dma_resv_add_shared_fence - Add a fence to a shared slot
218  * @obj: the reservation object
219  * @fence: the shared fence to add
220  *
221  * Add a fence to a shared slot, obj->lock must be held, and
222  * dma_resv_reserve_shared() has been called.
223  */
224 void dma_resv_add_shared_fence(struct dma_resv *obj, struct dma_fence *fence)
225 {
226 	struct dma_resv_list *fobj;
227 	struct dma_fence *old;
228 	unsigned int i, count;
229 
230 	dma_fence_get(fence);
231 
232 	dma_resv_assert_held(obj);
233 
234 	fobj = dma_resv_get_list(obj);
235 	count = fobj->shared_count;
236 
237 	preempt_disable();
238 	write_seqcount_begin(&obj->seq);
239 
240 	for (i = 0; i < count; ++i) {
241 
242 		old = rcu_dereference_protected(fobj->shared[i],
243 						dma_resv_held(obj));
244 		if (old->context == fence->context ||
245 		    dma_fence_is_signaled(old))
246 			goto replace;
247 	}
248 
249 	BUG_ON(fobj->shared_count >= fobj->shared_max);
250 	old = NULL;
251 	count++;
252 
253 replace:
254 	RCU_INIT_POINTER(fobj->shared[i], fence);
255 	/* pointer update must be visible before we extend the shared_count */
256 	smp_store_mb(fobj->shared_count, count);
257 
258 	write_seqcount_end(&obj->seq);
259 	preempt_enable();
260 	dma_fence_put(old);
261 }
262 EXPORT_SYMBOL(dma_resv_add_shared_fence);
263 
264 /**
265  * dma_resv_add_excl_fence - Add an exclusive fence.
266  * @obj: the reservation object
267  * @fence: the shared fence to add
268  *
269  * Add a fence to the exclusive slot.  The obj->lock must be held.
270  */
271 void dma_resv_add_excl_fence(struct dma_resv *obj, struct dma_fence *fence)
272 {
273 	struct dma_fence *old_fence = dma_resv_get_excl(obj);
274 	struct dma_resv_list *old;
275 	u32 i = 0;
276 
277 	dma_resv_assert_held(obj);
278 
279 	old = dma_resv_get_list(obj);
280 	if (old)
281 		i = old->shared_count;
282 
283 	if (fence)
284 		dma_fence_get(fence);
285 
286 	preempt_disable();
287 	write_seqcount_begin(&obj->seq);
288 	/* write_seqcount_begin provides the necessary memory barrier */
289 	RCU_INIT_POINTER(obj->fence_excl, fence);
290 	if (old)
291 		old->shared_count = 0;
292 	write_seqcount_end(&obj->seq);
293 	preempt_enable();
294 
295 	/* inplace update, no shared fences */
296 	while (i--)
297 		dma_fence_put(rcu_dereference_protected(old->shared[i],
298 						dma_resv_held(obj)));
299 
300 	dma_fence_put(old_fence);
301 }
302 EXPORT_SYMBOL(dma_resv_add_excl_fence);
303 
304 /**
305 * dma_resv_copy_fences - Copy all fences from src to dst.
306 * @dst: the destination reservation object
307 * @src: the source reservation object
308 *
309 * Copy all fences from src to dst. dst-lock must be held.
310 */
311 int dma_resv_copy_fences(struct dma_resv *dst, struct dma_resv *src)
312 {
313 	struct dma_resv_list *src_list, *dst_list;
314 	struct dma_fence *old, *new;
315 	unsigned i;
316 
317 	dma_resv_assert_held(dst);
318 
319 	rcu_read_lock();
320 	src_list = rcu_dereference(src->fence);
321 
322 retry:
323 	if (src_list) {
324 		unsigned shared_count = src_list->shared_count;
325 
326 		rcu_read_unlock();
327 
328 		dst_list = dma_resv_list_alloc(shared_count);
329 		if (!dst_list)
330 			return -ENOMEM;
331 
332 		rcu_read_lock();
333 		src_list = rcu_dereference(src->fence);
334 		if (!src_list || src_list->shared_count > shared_count) {
335 			kfree(dst_list);
336 			goto retry;
337 		}
338 
339 		dst_list->shared_count = 0;
340 		for (i = 0; i < src_list->shared_count; ++i) {
341 			struct dma_fence *fence;
342 
343 			fence = rcu_dereference(src_list->shared[i]);
344 			if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT,
345 				     &fence->flags))
346 				continue;
347 
348 			if (!dma_fence_get_rcu(fence)) {
349 				dma_resv_list_free(dst_list);
350 				src_list = rcu_dereference(src->fence);
351 				goto retry;
352 			}
353 
354 			if (dma_fence_is_signaled(fence)) {
355 				dma_fence_put(fence);
356 				continue;
357 			}
358 
359 			rcu_assign_pointer(dst_list->shared[dst_list->shared_count++], fence);
360 		}
361 	} else {
362 		dst_list = NULL;
363 	}
364 
365 	new = dma_fence_get_rcu_safe(&src->fence_excl);
366 	rcu_read_unlock();
367 
368 	src_list = dma_resv_get_list(dst);
369 	old = dma_resv_get_excl(dst);
370 
371 	preempt_disable();
372 	write_seqcount_begin(&dst->seq);
373 	/* write_seqcount_begin provides the necessary memory barrier */
374 	RCU_INIT_POINTER(dst->fence_excl, new);
375 	RCU_INIT_POINTER(dst->fence, dst_list);
376 	write_seqcount_end(&dst->seq);
377 	preempt_enable();
378 
379 	dma_resv_list_free(src_list);
380 	dma_fence_put(old);
381 
382 	return 0;
383 }
384 EXPORT_SYMBOL(dma_resv_copy_fences);
385 
386 /**
387  * dma_resv_get_fences_rcu - Get an object's shared and exclusive
388  * fences without update side lock held
389  * @obj: the reservation object
390  * @pfence_excl: the returned exclusive fence (or NULL)
391  * @pshared_count: the number of shared fences returned
392  * @pshared: the array of shared fence ptrs returned (array is krealloc'd to
393  * the required size, and must be freed by caller)
394  *
395  * Retrieve all fences from the reservation object. If the pointer for the
396  * exclusive fence is not specified the fence is put into the array of the
397  * shared fences as well. Returns either zero or -ENOMEM.
398  */
399 int dma_resv_get_fences_rcu(struct dma_resv *obj,
400 			    struct dma_fence **pfence_excl,
401 			    unsigned *pshared_count,
402 			    struct dma_fence ***pshared)
403 {
404 	struct dma_fence **shared = NULL;
405 	struct dma_fence *fence_excl;
406 	unsigned int shared_count;
407 	int ret = 1;
408 
409 	do {
410 		struct dma_resv_list *fobj;
411 		unsigned int i, seq;
412 		size_t sz = 0;
413 
414 		shared_count = i = 0;
415 
416 		rcu_read_lock();
417 		seq = read_seqcount_begin(&obj->seq);
418 
419 		fence_excl = rcu_dereference(obj->fence_excl);
420 		if (fence_excl && !dma_fence_get_rcu(fence_excl))
421 			goto unlock;
422 
423 		fobj = rcu_dereference(obj->fence);
424 		if (fobj)
425 			sz += sizeof(*shared) * fobj->shared_max;
426 
427 		if (!pfence_excl && fence_excl)
428 			sz += sizeof(*shared);
429 
430 		if (sz) {
431 			struct dma_fence **nshared;
432 
433 			nshared = krealloc(shared, sz,
434 					   GFP_NOWAIT | __GFP_NOWARN);
435 			if (!nshared) {
436 				rcu_read_unlock();
437 
438 				dma_fence_put(fence_excl);
439 				fence_excl = NULL;
440 
441 				nshared = krealloc(shared, sz, GFP_KERNEL);
442 				if (nshared) {
443 					shared = nshared;
444 					continue;
445 				}
446 
447 				ret = -ENOMEM;
448 				break;
449 			}
450 			shared = nshared;
451 			shared_count = fobj ? fobj->shared_count : 0;
452 			for (i = 0; i < shared_count; ++i) {
453 				shared[i] = rcu_dereference(fobj->shared[i]);
454 				if (!dma_fence_get_rcu(shared[i]))
455 					break;
456 			}
457 		}
458 
459 		if (i != shared_count || read_seqcount_retry(&obj->seq, seq)) {
460 			while (i--)
461 				dma_fence_put(shared[i]);
462 			dma_fence_put(fence_excl);
463 			goto unlock;
464 		}
465 
466 		ret = 0;
467 unlock:
468 		rcu_read_unlock();
469 	} while (ret);
470 
471 	if (pfence_excl)
472 		*pfence_excl = fence_excl;
473 	else if (fence_excl)
474 		shared[shared_count++] = fence_excl;
475 
476 	if (!shared_count) {
477 		kfree(shared);
478 		shared = NULL;
479 	}
480 
481 	*pshared_count = shared_count;
482 	*pshared = shared;
483 	return ret;
484 }
485 EXPORT_SYMBOL_GPL(dma_resv_get_fences_rcu);
486 
487 /**
488  * dma_resv_wait_timeout_rcu - Wait on reservation's objects
489  * shared and/or exclusive fences.
490  * @obj: the reservation object
491  * @wait_all: if true, wait on all fences, else wait on just exclusive fence
492  * @intr: if true, do interruptible wait
493  * @timeout: timeout value in jiffies or zero to return immediately
494  *
495  * RETURNS
496  * Returns -ERESTARTSYS if interrupted, 0 if the wait timed out, or
497  * greater than zer on success.
498  */
499 long dma_resv_wait_timeout_rcu(struct dma_resv *obj,
500 			       bool wait_all, bool intr,
501 			       unsigned long timeout)
502 {
503 	struct dma_fence *fence;
504 	unsigned seq, shared_count;
505 	long ret = timeout ? timeout : 1;
506 	int i;
507 
508 retry:
509 	shared_count = 0;
510 	seq = read_seqcount_begin(&obj->seq);
511 	rcu_read_lock();
512 	i = -1;
513 
514 	fence = rcu_dereference(obj->fence_excl);
515 	if (fence && !test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &fence->flags)) {
516 		if (!dma_fence_get_rcu(fence))
517 			goto unlock_retry;
518 
519 		if (dma_fence_is_signaled(fence)) {
520 			dma_fence_put(fence);
521 			fence = NULL;
522 		}
523 
524 	} else {
525 		fence = NULL;
526 	}
527 
528 	if (wait_all) {
529 		struct dma_resv_list *fobj = rcu_dereference(obj->fence);
530 
531 		if (fobj)
532 			shared_count = fobj->shared_count;
533 
534 		for (i = 0; !fence && i < shared_count; ++i) {
535 			struct dma_fence *lfence = rcu_dereference(fobj->shared[i]);
536 
537 			if (test_bit(DMA_FENCE_FLAG_SIGNALED_BIT,
538 				     &lfence->flags))
539 				continue;
540 
541 			if (!dma_fence_get_rcu(lfence))
542 				goto unlock_retry;
543 
544 			if (dma_fence_is_signaled(lfence)) {
545 				dma_fence_put(lfence);
546 				continue;
547 			}
548 
549 			fence = lfence;
550 			break;
551 		}
552 	}
553 
554 	rcu_read_unlock();
555 	if (fence) {
556 		if (read_seqcount_retry(&obj->seq, seq)) {
557 			dma_fence_put(fence);
558 			goto retry;
559 		}
560 
561 		ret = dma_fence_wait_timeout(fence, intr, ret);
562 		dma_fence_put(fence);
563 		if (ret > 0 && wait_all && (i + 1 < shared_count))
564 			goto retry;
565 	}
566 	return ret;
567 
568 unlock_retry:
569 	rcu_read_unlock();
570 	goto retry;
571 }
572 EXPORT_SYMBOL_GPL(dma_resv_wait_timeout_rcu);
573 
574 
575 static inline int dma_resv_test_signaled_single(struct dma_fence *passed_fence)
576 {
577 	struct dma_fence *fence, *lfence = passed_fence;
578 	int ret = 1;
579 
580 	if (!test_bit(DMA_FENCE_FLAG_SIGNALED_BIT, &lfence->flags)) {
581 		fence = dma_fence_get_rcu(lfence);
582 		if (!fence)
583 			return -1;
584 
585 		ret = !!dma_fence_is_signaled(fence);
586 		dma_fence_put(fence);
587 	}
588 	return ret;
589 }
590 
591 /**
592  * dma_resv_test_signaled_rcu - Test if a reservation object's
593  * fences have been signaled.
594  * @obj: the reservation object
595  * @test_all: if true, test all fences, otherwise only test the exclusive
596  * fence
597  *
598  * RETURNS
599  * true if all fences signaled, else false
600  */
601 bool dma_resv_test_signaled_rcu(struct dma_resv *obj, bool test_all)
602 {
603 	unsigned seq, shared_count;
604 	int ret;
605 
606 	rcu_read_lock();
607 retry:
608 	ret = true;
609 	shared_count = 0;
610 	seq = read_seqcount_begin(&obj->seq);
611 
612 	if (test_all) {
613 		unsigned i;
614 
615 		struct dma_resv_list *fobj = rcu_dereference(obj->fence);
616 
617 		if (fobj)
618 			shared_count = fobj->shared_count;
619 
620 		for (i = 0; i < shared_count; ++i) {
621 			struct dma_fence *fence = rcu_dereference(fobj->shared[i]);
622 
623 			ret = dma_resv_test_signaled_single(fence);
624 			if (ret < 0)
625 				goto retry;
626 			else if (!ret)
627 				break;
628 		}
629 
630 		if (read_seqcount_retry(&obj->seq, seq))
631 			goto retry;
632 	}
633 
634 	if (!shared_count) {
635 		struct dma_fence *fence_excl = rcu_dereference(obj->fence_excl);
636 
637 		if (fence_excl) {
638 			ret = dma_resv_test_signaled_single(fence_excl);
639 			if (ret < 0)
640 				goto retry;
641 
642 			if (read_seqcount_retry(&obj->seq, seq))
643 				goto retry;
644 		}
645 	}
646 
647 	rcu_read_unlock();
648 	return ret;
649 }
650 EXPORT_SYMBOL_GPL(dma_resv_test_signaled_rcu);
651