xref: /OK3568_Linux_fs/kernel/drivers/dma-buf/st-dma-fence-chain.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: MIT
2*4882a593Smuzhiyun 
3*4882a593Smuzhiyun /*
4*4882a593Smuzhiyun  * Copyright © 2019 Intel Corporation
5*4882a593Smuzhiyun  */
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun #include <linux/delay.h>
8*4882a593Smuzhiyun #include <linux/dma-fence.h>
9*4882a593Smuzhiyun #include <linux/dma-fence-chain.h>
10*4882a593Smuzhiyun #include <linux/kernel.h>
11*4882a593Smuzhiyun #include <linux/kthread.h>
12*4882a593Smuzhiyun #include <linux/mm.h>
13*4882a593Smuzhiyun #include <linux/sched/signal.h>
14*4882a593Smuzhiyun #include <linux/slab.h>
15*4882a593Smuzhiyun #include <linux/spinlock.h>
16*4882a593Smuzhiyun #include <linux/random.h>
17*4882a593Smuzhiyun 
18*4882a593Smuzhiyun #include "selftest.h"
19*4882a593Smuzhiyun 
20*4882a593Smuzhiyun #define CHAIN_SZ (4 << 10)
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun static struct kmem_cache *slab_fences;
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun static inline struct mock_fence {
25*4882a593Smuzhiyun 	struct dma_fence base;
26*4882a593Smuzhiyun 	spinlock_t lock;
to_mock_fence(struct dma_fence * f)27*4882a593Smuzhiyun } *to_mock_fence(struct dma_fence *f) {
28*4882a593Smuzhiyun 	return container_of(f, struct mock_fence, base);
29*4882a593Smuzhiyun }
30*4882a593Smuzhiyun 
/*
 * Name callback used for both .get_driver_name and .get_timeline_name of
 * mock_ops; @f is ignored and the same fixed label is always returned.
 */
static const char *mock_name(struct dma_fence *f)
{
	static const char name[] = "mock";

	return name;
}
35*4882a593Smuzhiyun 
mock_fence_release(struct dma_fence * f)36*4882a593Smuzhiyun static void mock_fence_release(struct dma_fence *f)
37*4882a593Smuzhiyun {
38*4882a593Smuzhiyun 	kmem_cache_free(slab_fences, to_mock_fence(f));
39*4882a593Smuzhiyun }
40*4882a593Smuzhiyun 
41*4882a593Smuzhiyun static const struct dma_fence_ops mock_ops = {
42*4882a593Smuzhiyun 	.get_driver_name = mock_name,
43*4882a593Smuzhiyun 	.get_timeline_name = mock_name,
44*4882a593Smuzhiyun 	.release = mock_fence_release,
45*4882a593Smuzhiyun };
46*4882a593Smuzhiyun 
mock_fence(void)47*4882a593Smuzhiyun static struct dma_fence *mock_fence(void)
48*4882a593Smuzhiyun {
49*4882a593Smuzhiyun 	struct mock_fence *f;
50*4882a593Smuzhiyun 
51*4882a593Smuzhiyun 	f = kmem_cache_alloc(slab_fences, GFP_KERNEL);
52*4882a593Smuzhiyun 	if (!f)
53*4882a593Smuzhiyun 		return NULL;
54*4882a593Smuzhiyun 
55*4882a593Smuzhiyun 	spin_lock_init(&f->lock);
56*4882a593Smuzhiyun 	dma_fence_init(&f->base, &mock_ops, &f->lock, 0, 0);
57*4882a593Smuzhiyun 
58*4882a593Smuzhiyun 	return &f->base;
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun 
61*4882a593Smuzhiyun static inline struct mock_chain {
62*4882a593Smuzhiyun 	struct dma_fence_chain base;
to_mock_chain(struct dma_fence * f)63*4882a593Smuzhiyun } *to_mock_chain(struct dma_fence *f) {
64*4882a593Smuzhiyun 	return container_of(f, struct mock_chain, base.base);
65*4882a593Smuzhiyun }
66*4882a593Smuzhiyun 
/*
 * Allocate a chain node that links @fence after @prev with sequence number
 * @seqno.
 *
 * An extra reference is taken on both @prev and @fence and passed to
 * dma_fence_chain_init(); the caller's own references are untouched.
 *
 * Returns the node's dma_fence, or NULL if the allocation failed (in which
 * case no references are taken).
 */
static struct dma_fence *mock_chain(struct dma_fence *prev,
				    struct dma_fence *fence,
				    u64 seqno)
{
	struct mock_chain *link = kmalloc(sizeof(*link), GFP_KERNEL);

	if (!link)
		return NULL;

	dma_fence_chain_init(&link->base,
			     dma_fence_get(prev),
			     dma_fence_get(fence),
			     seqno);

	return &link->base.base;
}
84*4882a593Smuzhiyun 
sanitycheck(void * arg)85*4882a593Smuzhiyun static int sanitycheck(void *arg)
86*4882a593Smuzhiyun {
87*4882a593Smuzhiyun 	struct dma_fence *f, *chain;
88*4882a593Smuzhiyun 	int err = 0;
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun 	f = mock_fence();
91*4882a593Smuzhiyun 	if (!f)
92*4882a593Smuzhiyun 		return -ENOMEM;
93*4882a593Smuzhiyun 
94*4882a593Smuzhiyun 	chain = mock_chain(NULL, f, 1);
95*4882a593Smuzhiyun 	if (!chain)
96*4882a593Smuzhiyun 		err = -ENOMEM;
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun 	dma_fence_signal(f);
99*4882a593Smuzhiyun 	dma_fence_put(f);
100*4882a593Smuzhiyun 
101*4882a593Smuzhiyun 	dma_fence_put(chain);
102*4882a593Smuzhiyun 
103*4882a593Smuzhiyun 	return err;
104*4882a593Smuzhiyun }
105*4882a593Smuzhiyun 
/*
 * A chain under test, as built by fence_chains_init() and torn down by
 * fence_chains_fini().
 */
struct fence_chains {
	/* Number of links built; set once fence_chains_init() succeeds. */
	unsigned int chain_length;
	/* fences[i] is the mock fence wrapped by chains[i]. */
	struct dma_fence **fences;
	/* chains[i] is the chain node created for fences[i]. */
	struct dma_fence **chains;

	/* Most recently added chain node, i.e. chains[chain_length - 1]. */
	struct dma_fence *tail;
};
113*4882a593Smuzhiyun 
/*
 * Sequence-number generator for a dense chain: link @i gets seqno @i + 1.
 *
 * The addition is done in 64 bits so the result cannot wrap to 0 for
 * @i == UINT_MAX, matching the uint64_t return type.
 */
static uint64_t seqno_inc(unsigned int i)
{
	return (uint64_t)i + 1;
}
118*4882a593Smuzhiyun 
/*
 * Build a chain of @count links in @fc.
 *
 * For each index a mock fence is created and wrapped in a chain node whose
 * predecessor is the previous tail; the node's seqno comes from @seqno_fn.
 *
 * Returns 0 on success, with fc->chain_length set to the number of links.
 * Returns -ENOMEM on any allocation failure, after dropping whatever was
 * created and freeing both arrays; @fc must not be passed to
 * fence_chains_fini() in that case.
 */
static int fence_chains_init(struct fence_chains *fc, unsigned int count,
			     uint64_t (*seqno_fn)(unsigned int))
{
	/* Every failure in this function is an allocation failure. */
	int ret = -ENOMEM;
	unsigned int n;

	fc->chains = kvmalloc_array(count, sizeof(*fc->chains),
				    GFP_KERNEL | __GFP_ZERO);
	if (!fc->chains)
		return ret;

	fc->fences = kvmalloc_array(count, sizeof(*fc->fences),
				    GFP_KERNEL | __GFP_ZERO);
	if (!fc->fences)
		goto free_chains;

	fc->tail = NULL;
	for (n = 0; n < count; n++) {
		fc->fences[n] = mock_fence();
		if (!fc->fences[n])
			goto release_all;

		fc->chains[n] = mock_chain(fc->tail,
					   fc->fences[n],
					   seqno_fn(n));
		if (!fc->chains[n])
			goto release_all;

		fc->tail = fc->chains[n];
	}

	fc->chain_length = n;
	return 0;

release_all:
	/*
	 * Both arrays were zero-filled, so slots that were never populated
	 * are simply passed to dma_fence_put() as NULL.
	 */
	for (n = 0; n < count; n++) {
		dma_fence_put(fc->fences[n]);
		dma_fence_put(fc->chains[n]);
	}
	kvfree(fc->fences);
free_chains:
	kvfree(fc->chains);
	return ret;
}
169*4882a593Smuzhiyun 
fence_chains_fini(struct fence_chains * fc)170*4882a593Smuzhiyun static void fence_chains_fini(struct fence_chains *fc)
171*4882a593Smuzhiyun {
172*4882a593Smuzhiyun 	unsigned int i;
173*4882a593Smuzhiyun 
174*4882a593Smuzhiyun 	for (i = 0; i < fc->chain_length; i++) {
175*4882a593Smuzhiyun 		dma_fence_signal(fc->fences[i]);
176*4882a593Smuzhiyun 		dma_fence_put(fc->fences[i]);
177*4882a593Smuzhiyun 	}
178*4882a593Smuzhiyun 	kvfree(fc->fences);
179*4882a593Smuzhiyun 
180*4882a593Smuzhiyun 	for (i = 0; i < fc->chain_length; i++)
181*4882a593Smuzhiyun 		dma_fence_put(fc->chains[i]);
182*4882a593Smuzhiyun 	kvfree(fc->chains);
183*4882a593Smuzhiyun }
184*4882a593Smuzhiyun 
find_seqno(void * arg)185*4882a593Smuzhiyun static int find_seqno(void *arg)
186*4882a593Smuzhiyun {
187*4882a593Smuzhiyun 	struct fence_chains fc;
188*4882a593Smuzhiyun 	struct dma_fence *fence;
189*4882a593Smuzhiyun 	int err;
190*4882a593Smuzhiyun 	int i;
191*4882a593Smuzhiyun 
192*4882a593Smuzhiyun 	err = fence_chains_init(&fc, 64, seqno_inc);
193*4882a593Smuzhiyun 	if (err)
194*4882a593Smuzhiyun 		return err;
195*4882a593Smuzhiyun 
196*4882a593Smuzhiyun 	fence = dma_fence_get(fc.tail);
197*4882a593Smuzhiyun 	err = dma_fence_chain_find_seqno(&fence, 0);
198*4882a593Smuzhiyun 	dma_fence_put(fence);
199*4882a593Smuzhiyun 	if (err) {
200*4882a593Smuzhiyun 		pr_err("Reported %d for find_seqno(0)!\n", err);
201*4882a593Smuzhiyun 		goto err;
202*4882a593Smuzhiyun 	}
203*4882a593Smuzhiyun 
204*4882a593Smuzhiyun 	for (i = 0; i < fc.chain_length; i++) {
205*4882a593Smuzhiyun 		fence = dma_fence_get(fc.tail);
206*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, i + 1);
207*4882a593Smuzhiyun 		dma_fence_put(fence);
208*4882a593Smuzhiyun 		if (err) {
209*4882a593Smuzhiyun 			pr_err("Reported %d for find_seqno(%d:%d)!\n",
210*4882a593Smuzhiyun 			       err, fc.chain_length + 1, i + 1);
211*4882a593Smuzhiyun 			goto err;
212*4882a593Smuzhiyun 		}
213*4882a593Smuzhiyun 		if (fence != fc.chains[i]) {
214*4882a593Smuzhiyun 			pr_err("Incorrect fence reported by find_seqno(%d:%d)\n",
215*4882a593Smuzhiyun 			       fc.chain_length + 1, i + 1);
216*4882a593Smuzhiyun 			err = -EINVAL;
217*4882a593Smuzhiyun 			goto err;
218*4882a593Smuzhiyun 		}
219*4882a593Smuzhiyun 
220*4882a593Smuzhiyun 		dma_fence_get(fence);
221*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, i + 1);
222*4882a593Smuzhiyun 		dma_fence_put(fence);
223*4882a593Smuzhiyun 		if (err) {
224*4882a593Smuzhiyun 			pr_err("Error reported for finding self\n");
225*4882a593Smuzhiyun 			goto err;
226*4882a593Smuzhiyun 		}
227*4882a593Smuzhiyun 		if (fence != fc.chains[i]) {
228*4882a593Smuzhiyun 			pr_err("Incorrect fence reported by find self\n");
229*4882a593Smuzhiyun 			err = -EINVAL;
230*4882a593Smuzhiyun 			goto err;
231*4882a593Smuzhiyun 		}
232*4882a593Smuzhiyun 
233*4882a593Smuzhiyun 		dma_fence_get(fence);
234*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, i + 2);
235*4882a593Smuzhiyun 		dma_fence_put(fence);
236*4882a593Smuzhiyun 		if (!err) {
237*4882a593Smuzhiyun 			pr_err("Error not reported for future fence: find_seqno(%d:%d)!\n",
238*4882a593Smuzhiyun 			       i + 1, i + 2);
239*4882a593Smuzhiyun 			err = -EINVAL;
240*4882a593Smuzhiyun 			goto err;
241*4882a593Smuzhiyun 		}
242*4882a593Smuzhiyun 
243*4882a593Smuzhiyun 		dma_fence_get(fence);
244*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, i);
245*4882a593Smuzhiyun 		dma_fence_put(fence);
246*4882a593Smuzhiyun 		if (err) {
247*4882a593Smuzhiyun 			pr_err("Error reported for previous fence!\n");
248*4882a593Smuzhiyun 			goto err;
249*4882a593Smuzhiyun 		}
250*4882a593Smuzhiyun 		if (i > 0 && fence != fc.chains[i - 1]) {
251*4882a593Smuzhiyun 			pr_err("Incorrect fence reported by find_seqno(%d:%d)\n",
252*4882a593Smuzhiyun 			       i + 1, i);
253*4882a593Smuzhiyun 			err = -EINVAL;
254*4882a593Smuzhiyun 			goto err;
255*4882a593Smuzhiyun 		}
256*4882a593Smuzhiyun 	}
257*4882a593Smuzhiyun 
258*4882a593Smuzhiyun err:
259*4882a593Smuzhiyun 	fence_chains_fini(&fc);
260*4882a593Smuzhiyun 	return err;
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun 
find_signaled(void * arg)263*4882a593Smuzhiyun static int find_signaled(void *arg)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun 	struct fence_chains fc;
266*4882a593Smuzhiyun 	struct dma_fence *fence;
267*4882a593Smuzhiyun 	int err;
268*4882a593Smuzhiyun 
269*4882a593Smuzhiyun 	err = fence_chains_init(&fc, 2, seqno_inc);
270*4882a593Smuzhiyun 	if (err)
271*4882a593Smuzhiyun 		return err;
272*4882a593Smuzhiyun 
273*4882a593Smuzhiyun 	dma_fence_signal(fc.fences[0]);
274*4882a593Smuzhiyun 
275*4882a593Smuzhiyun 	fence = dma_fence_get(fc.tail);
276*4882a593Smuzhiyun 	err = dma_fence_chain_find_seqno(&fence, 1);
277*4882a593Smuzhiyun 	dma_fence_put(fence);
278*4882a593Smuzhiyun 	if (err) {
279*4882a593Smuzhiyun 		pr_err("Reported %d for find_seqno()!\n", err);
280*4882a593Smuzhiyun 		goto err;
281*4882a593Smuzhiyun 	}
282*4882a593Smuzhiyun 
283*4882a593Smuzhiyun 	if (fence && fence != fc.chains[0]) {
284*4882a593Smuzhiyun 		pr_err("Incorrect chain-fence.seqno:%lld reported for completed seqno:1\n",
285*4882a593Smuzhiyun 		       fence->seqno);
286*4882a593Smuzhiyun 
287*4882a593Smuzhiyun 		dma_fence_get(fence);
288*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, 1);
289*4882a593Smuzhiyun 		dma_fence_put(fence);
290*4882a593Smuzhiyun 		if (err)
291*4882a593Smuzhiyun 			pr_err("Reported %d for finding self!\n", err);
292*4882a593Smuzhiyun 
293*4882a593Smuzhiyun 		err = -EINVAL;
294*4882a593Smuzhiyun 	}
295*4882a593Smuzhiyun 
296*4882a593Smuzhiyun err:
297*4882a593Smuzhiyun 	fence_chains_fini(&fc);
298*4882a593Smuzhiyun 	return err;
299*4882a593Smuzhiyun }
300*4882a593Smuzhiyun 
find_out_of_order(void * arg)301*4882a593Smuzhiyun static int find_out_of_order(void *arg)
302*4882a593Smuzhiyun {
303*4882a593Smuzhiyun 	struct fence_chains fc;
304*4882a593Smuzhiyun 	struct dma_fence *fence;
305*4882a593Smuzhiyun 	int err;
306*4882a593Smuzhiyun 
307*4882a593Smuzhiyun 	err = fence_chains_init(&fc, 3, seqno_inc);
308*4882a593Smuzhiyun 	if (err)
309*4882a593Smuzhiyun 		return err;
310*4882a593Smuzhiyun 
311*4882a593Smuzhiyun 	dma_fence_signal(fc.fences[1]);
312*4882a593Smuzhiyun 
313*4882a593Smuzhiyun 	fence = dma_fence_get(fc.tail);
314*4882a593Smuzhiyun 	err = dma_fence_chain_find_seqno(&fence, 2);
315*4882a593Smuzhiyun 	dma_fence_put(fence);
316*4882a593Smuzhiyun 	if (err) {
317*4882a593Smuzhiyun 		pr_err("Reported %d for find_seqno()!\n", err);
318*4882a593Smuzhiyun 		goto err;
319*4882a593Smuzhiyun 	}
320*4882a593Smuzhiyun 
321*4882a593Smuzhiyun 	/*
322*4882a593Smuzhiyun 	 * We signaled the middle fence (2) of the 1-2-3 chain. The behavior
323*4882a593Smuzhiyun 	 * of the dma-fence-chain is to make us wait for all the fences up to
324*4882a593Smuzhiyun 	 * the point we want. Since fence 1 is still not signaled, this what
325*4882a593Smuzhiyun 	 * we should get as fence to wait upon (fence 2 being garbage
326*4882a593Smuzhiyun 	 * collected during the traversal of the chain).
327*4882a593Smuzhiyun 	 */
328*4882a593Smuzhiyun 	if (fence != fc.chains[0]) {
329*4882a593Smuzhiyun 		pr_err("Incorrect chain-fence.seqno:%lld reported for completed seqno:2\n",
330*4882a593Smuzhiyun 		       fence ? fence->seqno : 0);
331*4882a593Smuzhiyun 
332*4882a593Smuzhiyun 		err = -EINVAL;
333*4882a593Smuzhiyun 	}
334*4882a593Smuzhiyun 
335*4882a593Smuzhiyun err:
336*4882a593Smuzhiyun 	fence_chains_fini(&fc);
337*4882a593Smuzhiyun 	return err;
338*4882a593Smuzhiyun }
339*4882a593Smuzhiyun 
/*
 * Sequence-number generator for a chain with gaps: link @i gets seqno
 * 2 * @i + 2, so only even seqnos exist.
 *
 * The arithmetic is done in 64 bits so large @i cannot wrap in unsigned int
 * before being widened to the uint64_t return type.
 */
static uint64_t seqno_inc2(unsigned int i)
{
	return 2 * (uint64_t)i + 2;
}
344*4882a593Smuzhiyun 
find_gap(void * arg)345*4882a593Smuzhiyun static int find_gap(void *arg)
346*4882a593Smuzhiyun {
347*4882a593Smuzhiyun 	struct fence_chains fc;
348*4882a593Smuzhiyun 	struct dma_fence *fence;
349*4882a593Smuzhiyun 	int err;
350*4882a593Smuzhiyun 	int i;
351*4882a593Smuzhiyun 
352*4882a593Smuzhiyun 	err = fence_chains_init(&fc, 64, seqno_inc2);
353*4882a593Smuzhiyun 	if (err)
354*4882a593Smuzhiyun 		return err;
355*4882a593Smuzhiyun 
356*4882a593Smuzhiyun 	for (i = 0; i < fc.chain_length; i++) {
357*4882a593Smuzhiyun 		fence = dma_fence_get(fc.tail);
358*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, 2 * i + 1);
359*4882a593Smuzhiyun 		dma_fence_put(fence);
360*4882a593Smuzhiyun 		if (err) {
361*4882a593Smuzhiyun 			pr_err("Reported %d for find_seqno(%d:%d)!\n",
362*4882a593Smuzhiyun 			       err, fc.chain_length + 1, 2 * i + 1);
363*4882a593Smuzhiyun 			goto err;
364*4882a593Smuzhiyun 		}
365*4882a593Smuzhiyun 		if (fence != fc.chains[i]) {
366*4882a593Smuzhiyun 			pr_err("Incorrect fence.seqno:%lld reported by find_seqno(%d:%d)\n",
367*4882a593Smuzhiyun 			       fence->seqno,
368*4882a593Smuzhiyun 			       fc.chain_length + 1,
369*4882a593Smuzhiyun 			       2 * i + 1);
370*4882a593Smuzhiyun 			err = -EINVAL;
371*4882a593Smuzhiyun 			goto err;
372*4882a593Smuzhiyun 		}
373*4882a593Smuzhiyun 
374*4882a593Smuzhiyun 		dma_fence_get(fence);
375*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, 2 * i + 2);
376*4882a593Smuzhiyun 		dma_fence_put(fence);
377*4882a593Smuzhiyun 		if (err) {
378*4882a593Smuzhiyun 			pr_err("Error reported for finding self\n");
379*4882a593Smuzhiyun 			goto err;
380*4882a593Smuzhiyun 		}
381*4882a593Smuzhiyun 		if (fence != fc.chains[i]) {
382*4882a593Smuzhiyun 			pr_err("Incorrect fence reported by find self\n");
383*4882a593Smuzhiyun 			err = -EINVAL;
384*4882a593Smuzhiyun 			goto err;
385*4882a593Smuzhiyun 		}
386*4882a593Smuzhiyun 	}
387*4882a593Smuzhiyun 
388*4882a593Smuzhiyun err:
389*4882a593Smuzhiyun 	fence_chains_fini(&fc);
390*4882a593Smuzhiyun 	return err;
391*4882a593Smuzhiyun }
392*4882a593Smuzhiyun 
393*4882a593Smuzhiyun struct find_race {
394*4882a593Smuzhiyun 	struct fence_chains fc;
395*4882a593Smuzhiyun 	atomic_t children;
396*4882a593Smuzhiyun };
397*4882a593Smuzhiyun 
__find_race(void * arg)398*4882a593Smuzhiyun static int __find_race(void *arg)
399*4882a593Smuzhiyun {
400*4882a593Smuzhiyun 	struct find_race *data = arg;
401*4882a593Smuzhiyun 	int err = 0;
402*4882a593Smuzhiyun 
403*4882a593Smuzhiyun 	while (!kthread_should_stop()) {
404*4882a593Smuzhiyun 		struct dma_fence *fence = dma_fence_get(data->fc.tail);
405*4882a593Smuzhiyun 		int seqno;
406*4882a593Smuzhiyun 
407*4882a593Smuzhiyun 		seqno = prandom_u32_max(data->fc.chain_length) + 1;
408*4882a593Smuzhiyun 
409*4882a593Smuzhiyun 		err = dma_fence_chain_find_seqno(&fence, seqno);
410*4882a593Smuzhiyun 		if (err) {
411*4882a593Smuzhiyun 			pr_err("Failed to find fence seqno:%d\n",
412*4882a593Smuzhiyun 			       seqno);
413*4882a593Smuzhiyun 			dma_fence_put(fence);
414*4882a593Smuzhiyun 			break;
415*4882a593Smuzhiyun 		}
416*4882a593Smuzhiyun 		if (!fence)
417*4882a593Smuzhiyun 			goto signal;
418*4882a593Smuzhiyun 
419*4882a593Smuzhiyun 		/*
420*4882a593Smuzhiyun 		 * We can only find ourselves if we are on fence we were
421*4882a593Smuzhiyun 		 * looking for.
422*4882a593Smuzhiyun 		 */
423*4882a593Smuzhiyun 		if (fence->seqno == seqno) {
424*4882a593Smuzhiyun 			err = dma_fence_chain_find_seqno(&fence, seqno);
425*4882a593Smuzhiyun 			if (err) {
426*4882a593Smuzhiyun 				pr_err("Reported an invalid fence for find-self:%d\n",
427*4882a593Smuzhiyun 				       seqno);
428*4882a593Smuzhiyun 				dma_fence_put(fence);
429*4882a593Smuzhiyun 				break;
430*4882a593Smuzhiyun 			}
431*4882a593Smuzhiyun 		}
432*4882a593Smuzhiyun 
433*4882a593Smuzhiyun 		dma_fence_put(fence);
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun signal:
436*4882a593Smuzhiyun 		seqno = prandom_u32_max(data->fc.chain_length - 1);
437*4882a593Smuzhiyun 		dma_fence_signal(data->fc.fences[seqno]);
438*4882a593Smuzhiyun 		cond_resched();
439*4882a593Smuzhiyun 	}
440*4882a593Smuzhiyun 
441*4882a593Smuzhiyun 	if (atomic_dec_and_test(&data->children))
442*4882a593Smuzhiyun 		wake_up_var(&data->children);
443*4882a593Smuzhiyun 	return err;
444*4882a593Smuzhiyun }
445*4882a593Smuzhiyun 
find_race(void * arg)446*4882a593Smuzhiyun static int find_race(void *arg)
447*4882a593Smuzhiyun {
448*4882a593Smuzhiyun 	struct find_race data;
449*4882a593Smuzhiyun 	int ncpus = num_online_cpus();
450*4882a593Smuzhiyun 	struct task_struct **threads;
451*4882a593Smuzhiyun 	unsigned long count;
452*4882a593Smuzhiyun 	int err;
453*4882a593Smuzhiyun 	int i;
454*4882a593Smuzhiyun 
455*4882a593Smuzhiyun 	err = fence_chains_init(&data.fc, CHAIN_SZ, seqno_inc);
456*4882a593Smuzhiyun 	if (err)
457*4882a593Smuzhiyun 		return err;
458*4882a593Smuzhiyun 
459*4882a593Smuzhiyun 	threads = kmalloc_array(ncpus, sizeof(*threads), GFP_KERNEL);
460*4882a593Smuzhiyun 	if (!threads) {
461*4882a593Smuzhiyun 		err = -ENOMEM;
462*4882a593Smuzhiyun 		goto err;
463*4882a593Smuzhiyun 	}
464*4882a593Smuzhiyun 
465*4882a593Smuzhiyun 	atomic_set(&data.children, 0);
466*4882a593Smuzhiyun 	for (i = 0; i < ncpus; i++) {
467*4882a593Smuzhiyun 		threads[i] = kthread_run(__find_race, &data, "dmabuf/%d", i);
468*4882a593Smuzhiyun 		if (IS_ERR(threads[i])) {
469*4882a593Smuzhiyun 			ncpus = i;
470*4882a593Smuzhiyun 			break;
471*4882a593Smuzhiyun 		}
472*4882a593Smuzhiyun 		atomic_inc(&data.children);
473*4882a593Smuzhiyun 		get_task_struct(threads[i]);
474*4882a593Smuzhiyun 	}
475*4882a593Smuzhiyun 
476*4882a593Smuzhiyun 	wait_var_event_timeout(&data.children,
477*4882a593Smuzhiyun 			       !atomic_read(&data.children),
478*4882a593Smuzhiyun 			       5 * HZ);
479*4882a593Smuzhiyun 
480*4882a593Smuzhiyun 	for (i = 0; i < ncpus; i++) {
481*4882a593Smuzhiyun 		int ret;
482*4882a593Smuzhiyun 
483*4882a593Smuzhiyun 		ret = kthread_stop(threads[i]);
484*4882a593Smuzhiyun 		if (ret && !err)
485*4882a593Smuzhiyun 			err = ret;
486*4882a593Smuzhiyun 		put_task_struct(threads[i]);
487*4882a593Smuzhiyun 	}
488*4882a593Smuzhiyun 	kfree(threads);
489*4882a593Smuzhiyun 
490*4882a593Smuzhiyun 	count = 0;
491*4882a593Smuzhiyun 	for (i = 0; i < data.fc.chain_length; i++)
492*4882a593Smuzhiyun 		if (dma_fence_is_signaled(data.fc.fences[i]))
493*4882a593Smuzhiyun 			count++;
494*4882a593Smuzhiyun 	pr_info("Completed %lu cycles\n", count);
495*4882a593Smuzhiyun 
496*4882a593Smuzhiyun err:
497*4882a593Smuzhiyun 	fence_chains_fini(&data.fc);
498*4882a593Smuzhiyun 	return err;
499*4882a593Smuzhiyun }
500*4882a593Smuzhiyun 
signal_forward(void * arg)501*4882a593Smuzhiyun static int signal_forward(void *arg)
502*4882a593Smuzhiyun {
503*4882a593Smuzhiyun 	struct fence_chains fc;
504*4882a593Smuzhiyun 	int err;
505*4882a593Smuzhiyun 	int i;
506*4882a593Smuzhiyun 
507*4882a593Smuzhiyun 	err = fence_chains_init(&fc, 64, seqno_inc);
508*4882a593Smuzhiyun 	if (err)
509*4882a593Smuzhiyun 		return err;
510*4882a593Smuzhiyun 
511*4882a593Smuzhiyun 	for (i = 0; i < fc.chain_length; i++) {
512*4882a593Smuzhiyun 		dma_fence_signal(fc.fences[i]);
513*4882a593Smuzhiyun 
514*4882a593Smuzhiyun 		if (!dma_fence_is_signaled(fc.chains[i])) {
515*4882a593Smuzhiyun 			pr_err("chain[%d] not signaled!\n", i);
516*4882a593Smuzhiyun 			err = -EINVAL;
517*4882a593Smuzhiyun 			goto err;
518*4882a593Smuzhiyun 		}
519*4882a593Smuzhiyun 
520*4882a593Smuzhiyun 		if (i + 1 < fc.chain_length &&
521*4882a593Smuzhiyun 		    dma_fence_is_signaled(fc.chains[i + 1])) {
522*4882a593Smuzhiyun 			pr_err("chain[%d] is signaled!\n", i);
523*4882a593Smuzhiyun 			err = -EINVAL;
524*4882a593Smuzhiyun 			goto err;
525*4882a593Smuzhiyun 		}
526*4882a593Smuzhiyun 	}
527*4882a593Smuzhiyun 
528*4882a593Smuzhiyun err:
529*4882a593Smuzhiyun 	fence_chains_fini(&fc);
530*4882a593Smuzhiyun 	return err;
531*4882a593Smuzhiyun }
532*4882a593Smuzhiyun 
signal_backward(void * arg)533*4882a593Smuzhiyun static int signal_backward(void *arg)
534*4882a593Smuzhiyun {
535*4882a593Smuzhiyun 	struct fence_chains fc;
536*4882a593Smuzhiyun 	int err;
537*4882a593Smuzhiyun 	int i;
538*4882a593Smuzhiyun 
539*4882a593Smuzhiyun 	err = fence_chains_init(&fc, 64, seqno_inc);
540*4882a593Smuzhiyun 	if (err)
541*4882a593Smuzhiyun 		return err;
542*4882a593Smuzhiyun 
543*4882a593Smuzhiyun 	for (i = fc.chain_length; i--; ) {
544*4882a593Smuzhiyun 		dma_fence_signal(fc.fences[i]);
545*4882a593Smuzhiyun 
546*4882a593Smuzhiyun 		if (i > 0 && dma_fence_is_signaled(fc.chains[i])) {
547*4882a593Smuzhiyun 			pr_err("chain[%d] is signaled!\n", i);
548*4882a593Smuzhiyun 			err = -EINVAL;
549*4882a593Smuzhiyun 			goto err;
550*4882a593Smuzhiyun 		}
551*4882a593Smuzhiyun 	}
552*4882a593Smuzhiyun 
553*4882a593Smuzhiyun 	for (i = 0; i < fc.chain_length; i++) {
554*4882a593Smuzhiyun 		if (!dma_fence_is_signaled(fc.chains[i])) {
555*4882a593Smuzhiyun 			pr_err("chain[%d] was not signaled!\n", i);
556*4882a593Smuzhiyun 			err = -EINVAL;
557*4882a593Smuzhiyun 			goto err;
558*4882a593Smuzhiyun 		}
559*4882a593Smuzhiyun 	}
560*4882a593Smuzhiyun 
561*4882a593Smuzhiyun err:
562*4882a593Smuzhiyun 	fence_chains_fini(&fc);
563*4882a593Smuzhiyun 	return err;
564*4882a593Smuzhiyun }
565*4882a593Smuzhiyun 
__wait_fence_chains(void * arg)566*4882a593Smuzhiyun static int __wait_fence_chains(void *arg)
567*4882a593Smuzhiyun {
568*4882a593Smuzhiyun 	struct fence_chains *fc = arg;
569*4882a593Smuzhiyun 
570*4882a593Smuzhiyun 	if (dma_fence_wait(fc->tail, false))
571*4882a593Smuzhiyun 		return -EIO;
572*4882a593Smuzhiyun 
573*4882a593Smuzhiyun 	return 0;
574*4882a593Smuzhiyun }
575*4882a593Smuzhiyun 
wait_forward(void * arg)576*4882a593Smuzhiyun static int wait_forward(void *arg)
577*4882a593Smuzhiyun {
578*4882a593Smuzhiyun 	struct fence_chains fc;
579*4882a593Smuzhiyun 	struct task_struct *tsk;
580*4882a593Smuzhiyun 	int err;
581*4882a593Smuzhiyun 	int i;
582*4882a593Smuzhiyun 
583*4882a593Smuzhiyun 	err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
584*4882a593Smuzhiyun 	if (err)
585*4882a593Smuzhiyun 		return err;
586*4882a593Smuzhiyun 
587*4882a593Smuzhiyun 	tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
588*4882a593Smuzhiyun 	if (IS_ERR(tsk)) {
589*4882a593Smuzhiyun 		err = PTR_ERR(tsk);
590*4882a593Smuzhiyun 		goto err;
591*4882a593Smuzhiyun 	}
592*4882a593Smuzhiyun 	get_task_struct(tsk);
593*4882a593Smuzhiyun 	yield_to(tsk, true);
594*4882a593Smuzhiyun 
595*4882a593Smuzhiyun 	for (i = 0; i < fc.chain_length; i++)
596*4882a593Smuzhiyun 		dma_fence_signal(fc.fences[i]);
597*4882a593Smuzhiyun 
598*4882a593Smuzhiyun 	err = kthread_stop(tsk);
599*4882a593Smuzhiyun 	put_task_struct(tsk);
600*4882a593Smuzhiyun 
601*4882a593Smuzhiyun err:
602*4882a593Smuzhiyun 	fence_chains_fini(&fc);
603*4882a593Smuzhiyun 	return err;
604*4882a593Smuzhiyun }
605*4882a593Smuzhiyun 
wait_backward(void * arg)606*4882a593Smuzhiyun static int wait_backward(void *arg)
607*4882a593Smuzhiyun {
608*4882a593Smuzhiyun 	struct fence_chains fc;
609*4882a593Smuzhiyun 	struct task_struct *tsk;
610*4882a593Smuzhiyun 	int err;
611*4882a593Smuzhiyun 	int i;
612*4882a593Smuzhiyun 
613*4882a593Smuzhiyun 	err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
614*4882a593Smuzhiyun 	if (err)
615*4882a593Smuzhiyun 		return err;
616*4882a593Smuzhiyun 
617*4882a593Smuzhiyun 	tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
618*4882a593Smuzhiyun 	if (IS_ERR(tsk)) {
619*4882a593Smuzhiyun 		err = PTR_ERR(tsk);
620*4882a593Smuzhiyun 		goto err;
621*4882a593Smuzhiyun 	}
622*4882a593Smuzhiyun 	get_task_struct(tsk);
623*4882a593Smuzhiyun 	yield_to(tsk, true);
624*4882a593Smuzhiyun 
625*4882a593Smuzhiyun 	for (i = fc.chain_length; i--; )
626*4882a593Smuzhiyun 		dma_fence_signal(fc.fences[i]);
627*4882a593Smuzhiyun 
628*4882a593Smuzhiyun 	err = kthread_stop(tsk);
629*4882a593Smuzhiyun 	put_task_struct(tsk);
630*4882a593Smuzhiyun 
631*4882a593Smuzhiyun err:
632*4882a593Smuzhiyun 	fence_chains_fini(&fc);
633*4882a593Smuzhiyun 	return err;
634*4882a593Smuzhiyun }
635*4882a593Smuzhiyun 
randomise_fences(struct fence_chains * fc)636*4882a593Smuzhiyun static void randomise_fences(struct fence_chains *fc)
637*4882a593Smuzhiyun {
638*4882a593Smuzhiyun 	unsigned int count = fc->chain_length;
639*4882a593Smuzhiyun 
640*4882a593Smuzhiyun 	/* Fisher-Yates shuffle courtesy of Knuth */
641*4882a593Smuzhiyun 	while (--count) {
642*4882a593Smuzhiyun 		unsigned int swp;
643*4882a593Smuzhiyun 
644*4882a593Smuzhiyun 		swp = prandom_u32_max(count + 1);
645*4882a593Smuzhiyun 		if (swp == count)
646*4882a593Smuzhiyun 			continue;
647*4882a593Smuzhiyun 
648*4882a593Smuzhiyun 		swap(fc->fences[count], fc->fences[swp]);
649*4882a593Smuzhiyun 	}
650*4882a593Smuzhiyun }
651*4882a593Smuzhiyun 
wait_random(void * arg)652*4882a593Smuzhiyun static int wait_random(void *arg)
653*4882a593Smuzhiyun {
654*4882a593Smuzhiyun 	struct fence_chains fc;
655*4882a593Smuzhiyun 	struct task_struct *tsk;
656*4882a593Smuzhiyun 	int err;
657*4882a593Smuzhiyun 	int i;
658*4882a593Smuzhiyun 
659*4882a593Smuzhiyun 	err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
660*4882a593Smuzhiyun 	if (err)
661*4882a593Smuzhiyun 		return err;
662*4882a593Smuzhiyun 
663*4882a593Smuzhiyun 	randomise_fences(&fc);
664*4882a593Smuzhiyun 
665*4882a593Smuzhiyun 	tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
666*4882a593Smuzhiyun 	if (IS_ERR(tsk)) {
667*4882a593Smuzhiyun 		err = PTR_ERR(tsk);
668*4882a593Smuzhiyun 		goto err;
669*4882a593Smuzhiyun 	}
670*4882a593Smuzhiyun 	get_task_struct(tsk);
671*4882a593Smuzhiyun 	yield_to(tsk, true);
672*4882a593Smuzhiyun 
673*4882a593Smuzhiyun 	for (i = 0; i < fc.chain_length; i++)
674*4882a593Smuzhiyun 		dma_fence_signal(fc.fences[i]);
675*4882a593Smuzhiyun 
676*4882a593Smuzhiyun 	err = kthread_stop(tsk);
677*4882a593Smuzhiyun 	put_task_struct(tsk);
678*4882a593Smuzhiyun 
679*4882a593Smuzhiyun err:
680*4882a593Smuzhiyun 	fence_chains_fini(&fc);
681*4882a593Smuzhiyun 	return err;
682*4882a593Smuzhiyun }
683*4882a593Smuzhiyun 
dma_fence_chain(void)684*4882a593Smuzhiyun int dma_fence_chain(void)
685*4882a593Smuzhiyun {
686*4882a593Smuzhiyun 	static const struct subtest tests[] = {
687*4882a593Smuzhiyun 		SUBTEST(sanitycheck),
688*4882a593Smuzhiyun 		SUBTEST(find_seqno),
689*4882a593Smuzhiyun 		SUBTEST(find_signaled),
690*4882a593Smuzhiyun 		SUBTEST(find_out_of_order),
691*4882a593Smuzhiyun 		SUBTEST(find_gap),
692*4882a593Smuzhiyun 		SUBTEST(find_race),
693*4882a593Smuzhiyun 		SUBTEST(signal_forward),
694*4882a593Smuzhiyun 		SUBTEST(signal_backward),
695*4882a593Smuzhiyun 		SUBTEST(wait_forward),
696*4882a593Smuzhiyun 		SUBTEST(wait_backward),
697*4882a593Smuzhiyun 		SUBTEST(wait_random),
698*4882a593Smuzhiyun 	};
699*4882a593Smuzhiyun 	int ret;
700*4882a593Smuzhiyun 
701*4882a593Smuzhiyun 	pr_info("sizeof(dma_fence_chain)=%zu\n",
702*4882a593Smuzhiyun 		sizeof(struct dma_fence_chain));
703*4882a593Smuzhiyun 
704*4882a593Smuzhiyun 	slab_fences = KMEM_CACHE(mock_fence,
705*4882a593Smuzhiyun 				 SLAB_TYPESAFE_BY_RCU |
706*4882a593Smuzhiyun 				 SLAB_HWCACHE_ALIGN);
707*4882a593Smuzhiyun 	if (!slab_fences)
708*4882a593Smuzhiyun 		return -ENOMEM;
709*4882a593Smuzhiyun 
710*4882a593Smuzhiyun 	ret = subtests(tests, NULL);
711*4882a593Smuzhiyun 
712*4882a593Smuzhiyun 	kmem_cache_destroy(slab_fences);
713*4882a593Smuzhiyun 	return ret;
714*4882a593Smuzhiyun }
715