xref: /linux/drivers/dma-buf/dma-fence-array.c (revision 2622649ad6cdbb3e77bfafc8c0fe686090b77f70)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * dma-fence-array: aggregate fences to be waited together
4  *
5  * Copyright (C) 2016 Collabora Ltd
6  * Copyright (C) 2016 Advanced Micro Devices, Inc.
7  * Authors:
8  *	Gustavo Padovan <gustavo@padovan.org>
9  *	Christian König <christian.koenig@amd.com>
10  */
11 
12 #include <linux/export.h>
13 #include <linux/slab.h>
14 #include <linux/dma-fence-array.h>
15 
16 #define PENDING_ERROR 1
17 
18 static const char *dma_fence_array_get_driver_name(struct dma_fence *fence)
19 {
20 	return "dma_fence_array";
21 }
22 
23 static const char *dma_fence_array_get_timeline_name(struct dma_fence *fence)
24 {
25 	return "unbound";
26 }
27 
28 static void dma_fence_array_set_pending_error(struct dma_fence_array *array,
29 					      int error)
30 {
31 	/*
32 	 * Propagate the first error reported by any of our fences, but only
33 	 * before we ourselves are signaled.
34 	 */
35 	if (error)
36 		cmpxchg(&array->base.error, PENDING_ERROR, error);
37 }
38 
39 static void dma_fence_array_clear_pending_error(struct dma_fence_array *array)
40 {
41 	/* Clear the error flag if not actually set. */
42 	cmpxchg(&array->base.error, PENDING_ERROR, 0);
43 }
44 
45 static void irq_dma_fence_array_work(struct irq_work *wrk)
46 {
47 	struct dma_fence_array *array = container_of(wrk, typeof(*array), work);
48 
49 	dma_fence_array_clear_pending_error(array);
50 
51 	dma_fence_signal(&array->base);
52 	dma_fence_put(&array->base);
53 }
54 
55 static void dma_fence_array_cb_func(struct dma_fence *f,
56 				    struct dma_fence_cb *cb)
57 {
58 	struct dma_fence_array_cb *array_cb =
59 		container_of(cb, struct dma_fence_array_cb, cb);
60 	struct dma_fence_array *array = array_cb->array;
61 
62 	dma_fence_array_set_pending_error(array, f->error);
63 
64 	if (atomic_dec_and_test(&array->num_pending))
65 		irq_work_queue(&array->work);
66 	else
67 		dma_fence_put(&array->base);
68 }
69 
70 static bool dma_fence_array_enable_signaling(struct dma_fence *fence)
71 {
72 	struct dma_fence_array *array = to_dma_fence_array(fence);
73 	struct dma_fence_array_cb *cb = array->callbacks;
74 	unsigned i;
75 
76 	for (i = 0; i < array->num_fences; ++i) {
77 		cb[i].array = array;
78 		/*
79 		 * As we may report that the fence is signaled before all
80 		 * callbacks are complete, we need to take an additional
81 		 * reference count on the array so that we do not free it too
82 		 * early. The core fence handling will only hold the reference
83 		 * until we signal the array as complete (but that is now
84 		 * insufficient).
85 		 */
86 		dma_fence_get(&array->base);
87 		if (dma_fence_add_callback(array->fences[i], &cb[i].cb,
88 					   dma_fence_array_cb_func)) {
89 			int error = array->fences[i]->error;
90 
91 			dma_fence_array_set_pending_error(array, error);
92 			dma_fence_put(&array->base);
93 			if (atomic_dec_and_test(&array->num_pending)) {
94 				dma_fence_array_clear_pending_error(array);
95 				return false;
96 			}
97 		}
98 	}
99 
100 	return true;
101 }
102 
103 static bool dma_fence_array_signaled(struct dma_fence *fence)
104 {
105 	struct dma_fence_array *array = to_dma_fence_array(fence);
106 	int num_pending;
107 	unsigned int i;
108 
109 	/*
110 	 * We need to read num_pending before checking the enable_signal bit
111 	 * to avoid racing with the enable_signaling() implementation, which
112 	 * might decrement the counter, and cause a partial check.
113 	 * atomic_read_acquire() pairs with atomic_dec_and_test() in
114 	 * dma_fence_array_enable_signaling()
115 	 *
116 	 * The !--num_pending check is here to account for the any_signaled case
117 	 * if we race with enable_signaling(), that means the !num_pending check
118 	 * in the is_signalling_enabled branch might be outdated (num_pending
119 	 * might have been decremented), but that's fine. The user will get the
120 	 * right value when testing again later.
121 	 */
122 	num_pending = atomic_read_acquire(&array->num_pending);
123 	if (test_bit(DMA_FENCE_FLAG_ENABLE_SIGNAL_BIT, &array->base.flags)) {
124 		if (num_pending <= 0)
125 			goto signal;
126 		return false;
127 	}
128 
129 	for (i = 0; i < array->num_fences; ++i) {
130 		if (dma_fence_is_signaled(array->fences[i]) && !--num_pending)
131 			goto signal;
132 	}
133 	return false;
134 
135 signal:
136 	dma_fence_array_clear_pending_error(array);
137 	return true;
138 }
139 
140 static void dma_fence_array_release(struct dma_fence *fence)
141 {
142 	struct dma_fence_array *array = to_dma_fence_array(fence);
143 	unsigned i;
144 
145 	for (i = 0; i < array->num_fences; ++i)
146 		dma_fence_put(array->fences[i]);
147 
148 	kfree(array->fences);
149 	dma_fence_free(fence);
150 }
151 
152 static void dma_fence_array_set_deadline(struct dma_fence *fence,
153 					 ktime_t deadline)
154 {
155 	struct dma_fence_array *array = to_dma_fence_array(fence);
156 	unsigned i;
157 
158 	for (i = 0; i < array->num_fences; ++i)
159 		dma_fence_set_deadline(array->fences[i], deadline);
160 }
161 
162 const struct dma_fence_ops dma_fence_array_ops = {
163 	.get_driver_name = dma_fence_array_get_driver_name,
164 	.get_timeline_name = dma_fence_array_get_timeline_name,
165 	.enable_signaling = dma_fence_array_enable_signaling,
166 	.signaled = dma_fence_array_signaled,
167 	.release = dma_fence_array_release,
168 	.set_deadline = dma_fence_array_set_deadline,
169 };
170 EXPORT_SYMBOL(dma_fence_array_ops);
171 
172 /**
173  * dma_fence_array_alloc - Allocate a custom fence array
174  * @num_fences:		[in]	number of fences to add in the array
175  *
176  * Return dma fence array on success, NULL on failure
177  */
178 struct dma_fence_array *dma_fence_array_alloc(int num_fences)
179 {
180 	struct dma_fence_array *array;
181 
182 	return kzalloc_flex(*array, callbacks, num_fences);
183 }
184 EXPORT_SYMBOL(dma_fence_array_alloc);
185 
186 /**
187  * dma_fence_array_init - Init a custom fence array
188  * @array:		[in]	dma fence array to arm
189  * @num_fences:		[in]	number of fences to add in the array
190  * @fences:		[in]	array containing the fences
191  * @context:		[in]	fence context to use
192  * @seqno:		[in]	sequence number to use
193  * @signal_on_any:	[in]	signal on any fence in the array
194  *
195  * Implementation of @dma_fence_array_create without allocation. Useful to init
196  * a preallocated dma fence array in the path of reclaim or dma fence signaling.
197  */
198 void dma_fence_array_init(struct dma_fence_array *array,
199 			  int num_fences, struct dma_fence **fences,
200 			  u64 context, unsigned seqno,
201 			  bool signal_on_any)
202 {
203 	static struct lock_class_key dma_fence_array_lock_key;
204 
205 	WARN_ON(!num_fences || !fences);
206 
207 	array->num_fences = num_fences;
208 
209 	dma_fence_init(&array->base, &dma_fence_array_ops, NULL, context,
210 		       seqno);
211 	init_irq_work(&array->work, irq_dma_fence_array_work);
212 
213 	/*
214 	 * dma_fence_array_enable_signaling() is invoked while holding
215 	 * array->base.inline_lock and may call dma_fence_add_callback()
216 	 * on the underlying fences, which takes their inline_lock.
217 	 *
218 	 * Since both locks share the same lockdep class, this legitimate
219 	 * nesting confuses lockdep and triggers a recursive locking
220 	 * warning. Assign a separate lockdep class to the array lock
221 	 * to model this hierarchy correctly.
222 	 */
223 	lockdep_set_class(&array->base.inline_lock, &dma_fence_array_lock_key);
224 
225 	atomic_set(&array->num_pending, signal_on_any ? 1 : num_fences);
226 	array->fences = fences;
227 
228 	array->base.error = PENDING_ERROR;
229 
230 	/*
231 	 * dma_fence_array objects should never contain any other fence
232 	 * containers or otherwise we run into recursion and potential kernel
233 	 * stack overflow on operations on the dma_fence_array.
234 	 *
235 	 * The correct way of handling this is to flatten out the array by the
236 	 * caller instead.
237 	 *
238 	 * Enforce this here by checking that we don't create a dma_fence_array
239 	 * with any container inside.
240 	 */
241 	while (num_fences--)
242 		WARN_ON(dma_fence_is_container(fences[num_fences]));
243 }
244 EXPORT_SYMBOL(dma_fence_array_init);
245 
246 /**
247  * dma_fence_array_create - Create a custom fence array
248  * @num_fences:		[in]	number of fences to add in the array
249  * @fences:		[in]	array containing the fences
250  * @context:		[in]	fence context to use
251  * @seqno:		[in]	sequence number to use
252  * @signal_on_any:	[in]	signal on any fence in the array
253  *
254  * Allocate a dma_fence_array object and initialize the base fence with
255  * dma_fence_init().
256  * In case of error it returns NULL.
257  *
258  * The caller should allocate the fences array with num_fences size
259  * and fill it with the fences it wants to add to the object. Ownership of this
260  * array is taken and dma_fence_put() is used on each fence on release.
261  *
262  * If @signal_on_any is true the fence array signals if any fence in the array
263  * signals, otherwise it signals when all fences in the array signal.
264  */
265 struct dma_fence_array *dma_fence_array_create(int num_fences,
266 					       struct dma_fence **fences,
267 					       u64 context, unsigned seqno,
268 					       bool signal_on_any)
269 {
270 	struct dma_fence_array *array;
271 
272 	array = dma_fence_array_alloc(num_fences);
273 	if (!array)
274 		return NULL;
275 
276 	dma_fence_array_init(array, num_fences, fences,
277 			     context, seqno, signal_on_any);
278 
279 	return array;
280 }
281 EXPORT_SYMBOL(dma_fence_array_create);
282 
283 /**
284  * dma_fence_match_context - Check if all fences are from the given context
285  * @fence:		[in]	fence or fence array
286  * @context:		[in]	fence context to check all fences against
287  *
288  * Checks the provided fence or, for a fence array, all fences in the array
289  * against the given context. Returns false if any fence is from a different
290  * context.
291  */
292 bool dma_fence_match_context(struct dma_fence *fence, u64 context)
293 {
294 	struct dma_fence_array *array = to_dma_fence_array(fence);
295 	unsigned i;
296 
297 	if (!dma_fence_is_array(fence))
298 		return fence->context == context;
299 
300 	for (i = 0; i < array->num_fences; i++) {
301 		if (array->fences[i]->context != context)
302 			return false;
303 	}
304 
305 	return true;
306 }
307 EXPORT_SYMBOL(dma_fence_match_context);
308 
309 struct dma_fence *dma_fence_array_first(struct dma_fence *head)
310 {
311 	struct dma_fence_array *array;
312 
313 	if (!head)
314 		return NULL;
315 
316 	array = to_dma_fence_array(head);
317 	if (!array)
318 		return head;
319 
320 	if (!array->num_fences)
321 		return NULL;
322 
323 	return array->fences[0];
324 }
325 EXPORT_SYMBOL(dma_fence_array_first);
326 
327 struct dma_fence *dma_fence_array_next(struct dma_fence *head,
328 				       unsigned int index)
329 {
330 	struct dma_fence_array *array = to_dma_fence_array(head);
331 
332 	if (!array || index >= array->num_fences)
333 		return NULL;
334 
335 	return array->fences[index];
336 }
337 EXPORT_SYMBOL(dma_fence_array_next);
338