1*4882a593Smuzhiyun // SPDX-License-Identifier: MIT
2*4882a593Smuzhiyun
3*4882a593Smuzhiyun /*
4*4882a593Smuzhiyun * Copyright © 2019 Intel Corporation
5*4882a593Smuzhiyun */
6*4882a593Smuzhiyun
7*4882a593Smuzhiyun #include <linux/delay.h>
8*4882a593Smuzhiyun #include <linux/dma-fence.h>
9*4882a593Smuzhiyun #include <linux/dma-fence-chain.h>
10*4882a593Smuzhiyun #include <linux/kernel.h>
11*4882a593Smuzhiyun #include <linux/kthread.h>
12*4882a593Smuzhiyun #include <linux/mm.h>
13*4882a593Smuzhiyun #include <linux/sched/signal.h>
14*4882a593Smuzhiyun #include <linux/slab.h>
15*4882a593Smuzhiyun #include <linux/spinlock.h>
16*4882a593Smuzhiyun #include <linux/random.h>
17*4882a593Smuzhiyun
18*4882a593Smuzhiyun #include "selftest.h"
19*4882a593Smuzhiyun
/* Number of links in the chains built by the race and wait subtests. */
#define CHAIN_SZ (4 * 1024)

/*
 * Slab cache backing every struct mock_fence; created and destroyed by
 * dma_fence_chain() around the subtest run.
 */
static struct kmem_cache *slab_fences;
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun static inline struct mock_fence {
25*4882a593Smuzhiyun struct dma_fence base;
26*4882a593Smuzhiyun spinlock_t lock;
to_mock_fence(struct dma_fence * f)27*4882a593Smuzhiyun } *to_mock_fence(struct dma_fence *f) {
28*4882a593Smuzhiyun return container_of(f, struct mock_fence, base);
29*4882a593Smuzhiyun }
30*4882a593Smuzhiyun
/*
 * Name callback shared by .get_driver_name and .get_timeline_name in
 * mock_ops; the fence argument is not consulted.
 */
static const char *mock_name(struct dma_fence *f)
{
	static const char name[] = "mock";

	return name;
}
35*4882a593Smuzhiyun
mock_fence_release(struct dma_fence * f)36*4882a593Smuzhiyun static void mock_fence_release(struct dma_fence *f)
37*4882a593Smuzhiyun {
38*4882a593Smuzhiyun kmem_cache_free(slab_fences, to_mock_fence(f));
39*4882a593Smuzhiyun }
40*4882a593Smuzhiyun
41*4882a593Smuzhiyun static const struct dma_fence_ops mock_ops = {
42*4882a593Smuzhiyun .get_driver_name = mock_name,
43*4882a593Smuzhiyun .get_timeline_name = mock_name,
44*4882a593Smuzhiyun .release = mock_fence_release,
45*4882a593Smuzhiyun };
46*4882a593Smuzhiyun
mock_fence(void)47*4882a593Smuzhiyun static struct dma_fence *mock_fence(void)
48*4882a593Smuzhiyun {
49*4882a593Smuzhiyun struct mock_fence *f;
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun f = kmem_cache_alloc(slab_fences, GFP_KERNEL);
52*4882a593Smuzhiyun if (!f)
53*4882a593Smuzhiyun return NULL;
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun spin_lock_init(&f->lock);
56*4882a593Smuzhiyun dma_fence_init(&f->base, &mock_ops, &f->lock, 0, 0);
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun return &f->base;
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun static inline struct mock_chain {
62*4882a593Smuzhiyun struct dma_fence_chain base;
to_mock_chain(struct dma_fence * f)63*4882a593Smuzhiyun } *to_mock_chain(struct dma_fence *f) {
64*4882a593Smuzhiyun return container_of(f, struct mock_chain, base.base);
65*4882a593Smuzhiyun }
66*4882a593Smuzhiyun
/*
 * Allocate a chain link with kmalloc() and initialise it on top of @prev.
 *
 * @prev:  previous link of the chain (callers in this file pass NULL for
 *         the first link)
 * @fence: fence this link wraps
 * @seqno: sequence number given to the link
 *
 * An extra reference is taken on both @prev and @fence and those references
 * are passed to dma_fence_chain_init(); the caller keeps its own.
 *
 * Returns the link's dma_fence, or NULL if the allocation failed.
 */
static struct dma_fence *mock_chain(struct dma_fence *prev,
				    struct dma_fence *fence,
				    u64 seqno)
{
	struct mock_chain *link = kmalloc(sizeof(*link), GFP_KERNEL);

	if (!link)
		return NULL;

	dma_fence_chain_init(&link->base, dma_fence_get(prev),
			     dma_fence_get(fence), seqno);

	return &link->base.base;
}
84*4882a593Smuzhiyun
sanitycheck(void * arg)85*4882a593Smuzhiyun static int sanitycheck(void *arg)
86*4882a593Smuzhiyun {
87*4882a593Smuzhiyun struct dma_fence *f, *chain;
88*4882a593Smuzhiyun int err = 0;
89*4882a593Smuzhiyun
90*4882a593Smuzhiyun f = mock_fence();
91*4882a593Smuzhiyun if (!f)
92*4882a593Smuzhiyun return -ENOMEM;
93*4882a593Smuzhiyun
94*4882a593Smuzhiyun chain = mock_chain(NULL, f, 1);
95*4882a593Smuzhiyun if (!chain)
96*4882a593Smuzhiyun err = -ENOMEM;
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun dma_fence_signal(f);
99*4882a593Smuzhiyun dma_fence_put(f);
100*4882a593Smuzhiyun
101*4882a593Smuzhiyun dma_fence_put(chain);
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun return err;
104*4882a593Smuzhiyun }
105*4882a593Smuzhiyun
/*
 * A chain under test, as built by fence_chains_init() and torn down by
 * fence_chains_fini().
 */
struct fence_chains {
	/* number of links; set by fence_chains_init() on success */
	unsigned int chain_length;
	/* fences[i] is the mock fence wrapped by chains[i] at creation time */
	struct dma_fence **fences;
	/* chains[i] is the i-th chain link, created on top of chains[i - 1] */
	struct dma_fence **chains;

	/* most recently created link, i.e. the last entry of chains[] */
	struct dma_fence *tail;
};
113*4882a593Smuzhiyun
/*
 * Sequence-number generator for densely numbered chains: link @i gets
 * seqno @i + 1, so the first link is 1.
 *
 * The addition is done in 64 bits so that the result cannot wrap back to 0
 * in unsigned int arithmetic for the largest @i.
 */
static uint64_t seqno_inc(unsigned int i)
{
	return (uint64_t)i + 1;
}
118*4882a593Smuzhiyun
/*
 * Build a chain of @count links, each wrapping a freshly allocated mock
 * fence.
 *
 * @fc:       descriptor to fill in
 * @count:    number of links to create
 * @seqno_fn: maps a link index to the sequence number for that link
 *
 * Link n is created on top of the previous tail and then becomes the new
 * tail. On success fc->chain_length is set and 0 is returned. On any
 * allocation failure everything created so far is released and -ENOMEM is
 * returned.
 */
static int fence_chains_init(struct fence_chains *fc, unsigned int count,
			     uint64_t (*seqno_fn)(unsigned int))
{
	unsigned int n;

	fc->chains = kvmalloc_array(count, sizeof(*fc->chains),
				    GFP_KERNEL | __GFP_ZERO);
	if (!fc->chains)
		return -ENOMEM;

	fc->fences = kvmalloc_array(count, sizeof(*fc->fences),
				    GFP_KERNEL | __GFP_ZERO);
	if (!fc->fences)
		goto free_chains;

	fc->tail = NULL;
	for (n = 0; n < count; n++) {
		struct dma_fence *fence, *link;

		fence = mock_fence();
		fc->fences[n] = fence;
		if (!fence)
			goto release;

		link = mock_chain(fc->tail, fence, seqno_fn(n));
		fc->chains[n] = link;
		if (!link)
			goto release;

		fc->tail = link;
	}

	fc->chain_length = n;
	return 0;

release:
	/* Both arrays were zero-filled, so slots never reached hold NULL. */
	for (n = 0; n < count; n++) {
		dma_fence_put(fc->fences[n]);
		dma_fence_put(fc->chains[n]);
	}
	kvfree(fc->fences);
free_chains:
	kvfree(fc->chains);
	return -ENOMEM;
}
169*4882a593Smuzhiyun
fence_chains_fini(struct fence_chains * fc)170*4882a593Smuzhiyun static void fence_chains_fini(struct fence_chains *fc)
171*4882a593Smuzhiyun {
172*4882a593Smuzhiyun unsigned int i;
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun for (i = 0; i < fc->chain_length; i++) {
175*4882a593Smuzhiyun dma_fence_signal(fc->fences[i]);
176*4882a593Smuzhiyun dma_fence_put(fc->fences[i]);
177*4882a593Smuzhiyun }
178*4882a593Smuzhiyun kvfree(fc->fences);
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun for (i = 0; i < fc->chain_length; i++)
181*4882a593Smuzhiyun dma_fence_put(fc->chains[i]);
182*4882a593Smuzhiyun kvfree(fc->chains);
183*4882a593Smuzhiyun }
184*4882a593Smuzhiyun
find_seqno(void * arg)185*4882a593Smuzhiyun static int find_seqno(void *arg)
186*4882a593Smuzhiyun {
187*4882a593Smuzhiyun struct fence_chains fc;
188*4882a593Smuzhiyun struct dma_fence *fence;
189*4882a593Smuzhiyun int err;
190*4882a593Smuzhiyun int i;
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun err = fence_chains_init(&fc, 64, seqno_inc);
193*4882a593Smuzhiyun if (err)
194*4882a593Smuzhiyun return err;
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun fence = dma_fence_get(fc.tail);
197*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, 0);
198*4882a593Smuzhiyun dma_fence_put(fence);
199*4882a593Smuzhiyun if (err) {
200*4882a593Smuzhiyun pr_err("Reported %d for find_seqno(0)!\n", err);
201*4882a593Smuzhiyun goto err;
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun for (i = 0; i < fc.chain_length; i++) {
205*4882a593Smuzhiyun fence = dma_fence_get(fc.tail);
206*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, i + 1);
207*4882a593Smuzhiyun dma_fence_put(fence);
208*4882a593Smuzhiyun if (err) {
209*4882a593Smuzhiyun pr_err("Reported %d for find_seqno(%d:%d)!\n",
210*4882a593Smuzhiyun err, fc.chain_length + 1, i + 1);
211*4882a593Smuzhiyun goto err;
212*4882a593Smuzhiyun }
213*4882a593Smuzhiyun if (fence != fc.chains[i]) {
214*4882a593Smuzhiyun pr_err("Incorrect fence reported by find_seqno(%d:%d)\n",
215*4882a593Smuzhiyun fc.chain_length + 1, i + 1);
216*4882a593Smuzhiyun err = -EINVAL;
217*4882a593Smuzhiyun goto err;
218*4882a593Smuzhiyun }
219*4882a593Smuzhiyun
220*4882a593Smuzhiyun dma_fence_get(fence);
221*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, i + 1);
222*4882a593Smuzhiyun dma_fence_put(fence);
223*4882a593Smuzhiyun if (err) {
224*4882a593Smuzhiyun pr_err("Error reported for finding self\n");
225*4882a593Smuzhiyun goto err;
226*4882a593Smuzhiyun }
227*4882a593Smuzhiyun if (fence != fc.chains[i]) {
228*4882a593Smuzhiyun pr_err("Incorrect fence reported by find self\n");
229*4882a593Smuzhiyun err = -EINVAL;
230*4882a593Smuzhiyun goto err;
231*4882a593Smuzhiyun }
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun dma_fence_get(fence);
234*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, i + 2);
235*4882a593Smuzhiyun dma_fence_put(fence);
236*4882a593Smuzhiyun if (!err) {
237*4882a593Smuzhiyun pr_err("Error not reported for future fence: find_seqno(%d:%d)!\n",
238*4882a593Smuzhiyun i + 1, i + 2);
239*4882a593Smuzhiyun err = -EINVAL;
240*4882a593Smuzhiyun goto err;
241*4882a593Smuzhiyun }
242*4882a593Smuzhiyun
243*4882a593Smuzhiyun dma_fence_get(fence);
244*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, i);
245*4882a593Smuzhiyun dma_fence_put(fence);
246*4882a593Smuzhiyun if (err) {
247*4882a593Smuzhiyun pr_err("Error reported for previous fence!\n");
248*4882a593Smuzhiyun goto err;
249*4882a593Smuzhiyun }
250*4882a593Smuzhiyun if (i > 0 && fence != fc.chains[i - 1]) {
251*4882a593Smuzhiyun pr_err("Incorrect fence reported by find_seqno(%d:%d)\n",
252*4882a593Smuzhiyun i + 1, i);
253*4882a593Smuzhiyun err = -EINVAL;
254*4882a593Smuzhiyun goto err;
255*4882a593Smuzhiyun }
256*4882a593Smuzhiyun }
257*4882a593Smuzhiyun
258*4882a593Smuzhiyun err:
259*4882a593Smuzhiyun fence_chains_fini(&fc);
260*4882a593Smuzhiyun return err;
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun
find_signaled(void * arg)263*4882a593Smuzhiyun static int find_signaled(void *arg)
264*4882a593Smuzhiyun {
265*4882a593Smuzhiyun struct fence_chains fc;
266*4882a593Smuzhiyun struct dma_fence *fence;
267*4882a593Smuzhiyun int err;
268*4882a593Smuzhiyun
269*4882a593Smuzhiyun err = fence_chains_init(&fc, 2, seqno_inc);
270*4882a593Smuzhiyun if (err)
271*4882a593Smuzhiyun return err;
272*4882a593Smuzhiyun
273*4882a593Smuzhiyun dma_fence_signal(fc.fences[0]);
274*4882a593Smuzhiyun
275*4882a593Smuzhiyun fence = dma_fence_get(fc.tail);
276*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, 1);
277*4882a593Smuzhiyun dma_fence_put(fence);
278*4882a593Smuzhiyun if (err) {
279*4882a593Smuzhiyun pr_err("Reported %d for find_seqno()!\n", err);
280*4882a593Smuzhiyun goto err;
281*4882a593Smuzhiyun }
282*4882a593Smuzhiyun
283*4882a593Smuzhiyun if (fence && fence != fc.chains[0]) {
284*4882a593Smuzhiyun pr_err("Incorrect chain-fence.seqno:%lld reported for completed seqno:1\n",
285*4882a593Smuzhiyun fence->seqno);
286*4882a593Smuzhiyun
287*4882a593Smuzhiyun dma_fence_get(fence);
288*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, 1);
289*4882a593Smuzhiyun dma_fence_put(fence);
290*4882a593Smuzhiyun if (err)
291*4882a593Smuzhiyun pr_err("Reported %d for finding self!\n", err);
292*4882a593Smuzhiyun
293*4882a593Smuzhiyun err = -EINVAL;
294*4882a593Smuzhiyun }
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun err:
297*4882a593Smuzhiyun fence_chains_fini(&fc);
298*4882a593Smuzhiyun return err;
299*4882a593Smuzhiyun }
300*4882a593Smuzhiyun
find_out_of_order(void * arg)301*4882a593Smuzhiyun static int find_out_of_order(void *arg)
302*4882a593Smuzhiyun {
303*4882a593Smuzhiyun struct fence_chains fc;
304*4882a593Smuzhiyun struct dma_fence *fence;
305*4882a593Smuzhiyun int err;
306*4882a593Smuzhiyun
307*4882a593Smuzhiyun err = fence_chains_init(&fc, 3, seqno_inc);
308*4882a593Smuzhiyun if (err)
309*4882a593Smuzhiyun return err;
310*4882a593Smuzhiyun
311*4882a593Smuzhiyun dma_fence_signal(fc.fences[1]);
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun fence = dma_fence_get(fc.tail);
314*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, 2);
315*4882a593Smuzhiyun dma_fence_put(fence);
316*4882a593Smuzhiyun if (err) {
317*4882a593Smuzhiyun pr_err("Reported %d for find_seqno()!\n", err);
318*4882a593Smuzhiyun goto err;
319*4882a593Smuzhiyun }
320*4882a593Smuzhiyun
321*4882a593Smuzhiyun /*
322*4882a593Smuzhiyun * We signaled the middle fence (2) of the 1-2-3 chain. The behavior
323*4882a593Smuzhiyun * of the dma-fence-chain is to make us wait for all the fences up to
324*4882a593Smuzhiyun * the point we want. Since fence 1 is still not signaled, this what
325*4882a593Smuzhiyun * we should get as fence to wait upon (fence 2 being garbage
326*4882a593Smuzhiyun * collected during the traversal of the chain).
327*4882a593Smuzhiyun */
328*4882a593Smuzhiyun if (fence != fc.chains[0]) {
329*4882a593Smuzhiyun pr_err("Incorrect chain-fence.seqno:%lld reported for completed seqno:2\n",
330*4882a593Smuzhiyun fence ? fence->seqno : 0);
331*4882a593Smuzhiyun
332*4882a593Smuzhiyun err = -EINVAL;
333*4882a593Smuzhiyun }
334*4882a593Smuzhiyun
335*4882a593Smuzhiyun err:
336*4882a593Smuzhiyun fence_chains_fini(&fc);
337*4882a593Smuzhiyun return err;
338*4882a593Smuzhiyun }
339*4882a593Smuzhiyun
/*
 * Sequence-number generator that leaves a gap between links: link @i gets
 * seqno 2 * @i + 2, i.e. 2, 4, 6, ...
 *
 * The arithmetic is done in 64 bits so that large @i cannot wrap around in
 * unsigned int before the result is widened.
 */
static uint64_t seqno_inc2(unsigned int i)
{
	return 2 * (uint64_t)i + 2;
}
344*4882a593Smuzhiyun
find_gap(void * arg)345*4882a593Smuzhiyun static int find_gap(void *arg)
346*4882a593Smuzhiyun {
347*4882a593Smuzhiyun struct fence_chains fc;
348*4882a593Smuzhiyun struct dma_fence *fence;
349*4882a593Smuzhiyun int err;
350*4882a593Smuzhiyun int i;
351*4882a593Smuzhiyun
352*4882a593Smuzhiyun err = fence_chains_init(&fc, 64, seqno_inc2);
353*4882a593Smuzhiyun if (err)
354*4882a593Smuzhiyun return err;
355*4882a593Smuzhiyun
356*4882a593Smuzhiyun for (i = 0; i < fc.chain_length; i++) {
357*4882a593Smuzhiyun fence = dma_fence_get(fc.tail);
358*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, 2 * i + 1);
359*4882a593Smuzhiyun dma_fence_put(fence);
360*4882a593Smuzhiyun if (err) {
361*4882a593Smuzhiyun pr_err("Reported %d for find_seqno(%d:%d)!\n",
362*4882a593Smuzhiyun err, fc.chain_length + 1, 2 * i + 1);
363*4882a593Smuzhiyun goto err;
364*4882a593Smuzhiyun }
365*4882a593Smuzhiyun if (fence != fc.chains[i]) {
366*4882a593Smuzhiyun pr_err("Incorrect fence.seqno:%lld reported by find_seqno(%d:%d)\n",
367*4882a593Smuzhiyun fence->seqno,
368*4882a593Smuzhiyun fc.chain_length + 1,
369*4882a593Smuzhiyun 2 * i + 1);
370*4882a593Smuzhiyun err = -EINVAL;
371*4882a593Smuzhiyun goto err;
372*4882a593Smuzhiyun }
373*4882a593Smuzhiyun
374*4882a593Smuzhiyun dma_fence_get(fence);
375*4882a593Smuzhiyun err = dma_fence_chain_find_seqno(&fence, 2 * i + 2);
376*4882a593Smuzhiyun dma_fence_put(fence);
377*4882a593Smuzhiyun if (err) {
378*4882a593Smuzhiyun pr_err("Error reported for finding self\n");
379*4882a593Smuzhiyun goto err;
380*4882a593Smuzhiyun }
381*4882a593Smuzhiyun if (fence != fc.chains[i]) {
382*4882a593Smuzhiyun pr_err("Incorrect fence reported by find self\n");
383*4882a593Smuzhiyun err = -EINVAL;
384*4882a593Smuzhiyun goto err;
385*4882a593Smuzhiyun }
386*4882a593Smuzhiyun }
387*4882a593Smuzhiyun
388*4882a593Smuzhiyun err:
389*4882a593Smuzhiyun fence_chains_fini(&fc);
390*4882a593Smuzhiyun return err;
391*4882a593Smuzhiyun }
392*4882a593Smuzhiyun
/* State shared between find_race() and its __find_race() worker threads. */
struct find_race {
	/* the chain every worker searches and signals */
	struct fence_chains fc;
	/* count of started workers; each worker decrements it on exit */
	atomic_t children;
};
397*4882a593Smuzhiyun
/*
 * Worker thread for find_race(); @arg is the shared struct find_race.
 *
 * Until asked to stop, repeatedly look up a randomly chosen seqno starting
 * from the chain tail, optionally re-run the lookup on the result, and then
 * signal a randomly chosen fence. The loop ends early on the first lookup
 * error.
 *
 * Returns 0, or the error reported by the failing lookup.
 */
static int __find_race(void *arg)
{
	struct find_race *data = arg;
	int err = 0;

	while (!kthread_should_stop()) {
		struct dma_fence *fence = dma_fence_get(data->fc.tail);
		int seqno;

		/* NOTE(review): presumably yields 1..chain_length - confirm prandom_u32_max() range */
		seqno = prandom_u32_max(data->fc.chain_length) + 1;

		err = dma_fence_chain_find_seqno(&fence, seqno);
		if (err) {
			pr_err("Failed to find fence seqno:%d\n",
			       seqno);
			dma_fence_put(fence);
			break;
		}
		/* No fence came back, so there is nothing to check or release. */
		if (!fence)
			goto signal;

		/*
		 * We can only find ourselves if we are on the fence we were
		 * looking for.
		 */
		if (fence->seqno == seqno) {
			err = dma_fence_chain_find_seqno(&fence, seqno);
			if (err) {
				pr_err("Reported an invalid fence for find-self:%d\n",
				       seqno);
				dma_fence_put(fence);
				break;
			}
		}

		dma_fence_put(fence);

signal:
		/* The bound is chain_length - 1, one less than the lookup above. */
		seqno = prandom_u32_max(data->fc.chain_length - 1);
		dma_fence_signal(data->fc.fences[seqno]);
		cond_resched();
	}

	/* The last worker to leave wakes whoever is waiting on the counter. */
	if (atomic_dec_and_test(&data->children))
		wake_up_var(&data->children);
	return err;
}
445*4882a593Smuzhiyun
/*
 * Run concurrent lookups and signaling on one CHAIN_SZ-link chain, using
 * one __find_race() thread per online CPU.
 *
 * Returns 0 on success, -ENOMEM on allocation failure, or the first
 * non-zero exit code collected from a worker.
 */
static int find_race(void *arg)
{
	struct find_race data;
	int ncpus = num_online_cpus();
	struct task_struct **threads;
	unsigned long count;
	int err;
	int i;

	err = fence_chains_init(&data.fc, CHAIN_SZ, seqno_inc);
	if (err)
		return err;

	threads = kmalloc_array(ncpus, sizeof(*threads), GFP_KERNEL);
	if (!threads) {
		err = -ENOMEM;
		goto err;
	}

	atomic_set(&data.children, 0);
	for (i = 0; i < ncpus; i++) {
		threads[i] = kthread_run(__find_race, &data, "dmabuf/%d", i);
		if (IS_ERR(threads[i])) {
			/* Carry on with only the threads started so far. */
			ncpus = i;
			break;
		}
		atomic_inc(&data.children);
		/* Hold a task reference until the kthread_stop() below. */
		get_task_struct(threads[i]);
	}

	/*
	 * Wait until the worker count drops to zero or the 5 * HZ timeout
	 * expires; the result of the wait is not checked.
	 */
	wait_var_event_timeout(&data.children,
			       !atomic_read(&data.children),
			       5 * HZ);

	/* Stop every worker and keep the first non-zero exit code. */
	for (i = 0; i < ncpus; i++) {
		int ret;

		ret = kthread_stop(threads[i]);
		if (ret && !err)
			err = ret;
		put_task_struct(threads[i]);
	}
	kfree(threads);

	/* The reported "cycles" figure is the number of fences left signaled. */
	count = 0;
	for (i = 0; i < data.fc.chain_length; i++)
		if (dma_fence_is_signaled(data.fc.fences[i]))
			count++;
	pr_info("Completed %lu cycles\n", count);

err:
	fence_chains_fini(&data.fc);
	return err;
}
500*4882a593Smuzhiyun
signal_forward(void * arg)501*4882a593Smuzhiyun static int signal_forward(void *arg)
502*4882a593Smuzhiyun {
503*4882a593Smuzhiyun struct fence_chains fc;
504*4882a593Smuzhiyun int err;
505*4882a593Smuzhiyun int i;
506*4882a593Smuzhiyun
507*4882a593Smuzhiyun err = fence_chains_init(&fc, 64, seqno_inc);
508*4882a593Smuzhiyun if (err)
509*4882a593Smuzhiyun return err;
510*4882a593Smuzhiyun
511*4882a593Smuzhiyun for (i = 0; i < fc.chain_length; i++) {
512*4882a593Smuzhiyun dma_fence_signal(fc.fences[i]);
513*4882a593Smuzhiyun
514*4882a593Smuzhiyun if (!dma_fence_is_signaled(fc.chains[i])) {
515*4882a593Smuzhiyun pr_err("chain[%d] not signaled!\n", i);
516*4882a593Smuzhiyun err = -EINVAL;
517*4882a593Smuzhiyun goto err;
518*4882a593Smuzhiyun }
519*4882a593Smuzhiyun
520*4882a593Smuzhiyun if (i + 1 < fc.chain_length &&
521*4882a593Smuzhiyun dma_fence_is_signaled(fc.chains[i + 1])) {
522*4882a593Smuzhiyun pr_err("chain[%d] is signaled!\n", i);
523*4882a593Smuzhiyun err = -EINVAL;
524*4882a593Smuzhiyun goto err;
525*4882a593Smuzhiyun }
526*4882a593Smuzhiyun }
527*4882a593Smuzhiyun
528*4882a593Smuzhiyun err:
529*4882a593Smuzhiyun fence_chains_fini(&fc);
530*4882a593Smuzhiyun return err;
531*4882a593Smuzhiyun }
532*4882a593Smuzhiyun
signal_backward(void * arg)533*4882a593Smuzhiyun static int signal_backward(void *arg)
534*4882a593Smuzhiyun {
535*4882a593Smuzhiyun struct fence_chains fc;
536*4882a593Smuzhiyun int err;
537*4882a593Smuzhiyun int i;
538*4882a593Smuzhiyun
539*4882a593Smuzhiyun err = fence_chains_init(&fc, 64, seqno_inc);
540*4882a593Smuzhiyun if (err)
541*4882a593Smuzhiyun return err;
542*4882a593Smuzhiyun
543*4882a593Smuzhiyun for (i = fc.chain_length; i--; ) {
544*4882a593Smuzhiyun dma_fence_signal(fc.fences[i]);
545*4882a593Smuzhiyun
546*4882a593Smuzhiyun if (i > 0 && dma_fence_is_signaled(fc.chains[i])) {
547*4882a593Smuzhiyun pr_err("chain[%d] is signaled!\n", i);
548*4882a593Smuzhiyun err = -EINVAL;
549*4882a593Smuzhiyun goto err;
550*4882a593Smuzhiyun }
551*4882a593Smuzhiyun }
552*4882a593Smuzhiyun
553*4882a593Smuzhiyun for (i = 0; i < fc.chain_length; i++) {
554*4882a593Smuzhiyun if (!dma_fence_is_signaled(fc.chains[i])) {
555*4882a593Smuzhiyun pr_err("chain[%d] was not signaled!\n", i);
556*4882a593Smuzhiyun err = -EINVAL;
557*4882a593Smuzhiyun goto err;
558*4882a593Smuzhiyun }
559*4882a593Smuzhiyun }
560*4882a593Smuzhiyun
561*4882a593Smuzhiyun err:
562*4882a593Smuzhiyun fence_chains_fini(&fc);
563*4882a593Smuzhiyun return err;
564*4882a593Smuzhiyun }
565*4882a593Smuzhiyun
__wait_fence_chains(void * arg)566*4882a593Smuzhiyun static int __wait_fence_chains(void *arg)
567*4882a593Smuzhiyun {
568*4882a593Smuzhiyun struct fence_chains *fc = arg;
569*4882a593Smuzhiyun
570*4882a593Smuzhiyun if (dma_fence_wait(fc->tail, false))
571*4882a593Smuzhiyun return -EIO;
572*4882a593Smuzhiyun
573*4882a593Smuzhiyun return 0;
574*4882a593Smuzhiyun }
575*4882a593Smuzhiyun
wait_forward(void * arg)576*4882a593Smuzhiyun static int wait_forward(void *arg)
577*4882a593Smuzhiyun {
578*4882a593Smuzhiyun struct fence_chains fc;
579*4882a593Smuzhiyun struct task_struct *tsk;
580*4882a593Smuzhiyun int err;
581*4882a593Smuzhiyun int i;
582*4882a593Smuzhiyun
583*4882a593Smuzhiyun err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
584*4882a593Smuzhiyun if (err)
585*4882a593Smuzhiyun return err;
586*4882a593Smuzhiyun
587*4882a593Smuzhiyun tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
588*4882a593Smuzhiyun if (IS_ERR(tsk)) {
589*4882a593Smuzhiyun err = PTR_ERR(tsk);
590*4882a593Smuzhiyun goto err;
591*4882a593Smuzhiyun }
592*4882a593Smuzhiyun get_task_struct(tsk);
593*4882a593Smuzhiyun yield_to(tsk, true);
594*4882a593Smuzhiyun
595*4882a593Smuzhiyun for (i = 0; i < fc.chain_length; i++)
596*4882a593Smuzhiyun dma_fence_signal(fc.fences[i]);
597*4882a593Smuzhiyun
598*4882a593Smuzhiyun err = kthread_stop(tsk);
599*4882a593Smuzhiyun put_task_struct(tsk);
600*4882a593Smuzhiyun
601*4882a593Smuzhiyun err:
602*4882a593Smuzhiyun fence_chains_fini(&fc);
603*4882a593Smuzhiyun return err;
604*4882a593Smuzhiyun }
605*4882a593Smuzhiyun
wait_backward(void * arg)606*4882a593Smuzhiyun static int wait_backward(void *arg)
607*4882a593Smuzhiyun {
608*4882a593Smuzhiyun struct fence_chains fc;
609*4882a593Smuzhiyun struct task_struct *tsk;
610*4882a593Smuzhiyun int err;
611*4882a593Smuzhiyun int i;
612*4882a593Smuzhiyun
613*4882a593Smuzhiyun err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
614*4882a593Smuzhiyun if (err)
615*4882a593Smuzhiyun return err;
616*4882a593Smuzhiyun
617*4882a593Smuzhiyun tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
618*4882a593Smuzhiyun if (IS_ERR(tsk)) {
619*4882a593Smuzhiyun err = PTR_ERR(tsk);
620*4882a593Smuzhiyun goto err;
621*4882a593Smuzhiyun }
622*4882a593Smuzhiyun get_task_struct(tsk);
623*4882a593Smuzhiyun yield_to(tsk, true);
624*4882a593Smuzhiyun
625*4882a593Smuzhiyun for (i = fc.chain_length; i--; )
626*4882a593Smuzhiyun dma_fence_signal(fc.fences[i]);
627*4882a593Smuzhiyun
628*4882a593Smuzhiyun err = kthread_stop(tsk);
629*4882a593Smuzhiyun put_task_struct(tsk);
630*4882a593Smuzhiyun
631*4882a593Smuzhiyun err:
632*4882a593Smuzhiyun fence_chains_fini(&fc);
633*4882a593Smuzhiyun return err;
634*4882a593Smuzhiyun }
635*4882a593Smuzhiyun
randomise_fences(struct fence_chains * fc)636*4882a593Smuzhiyun static void randomise_fences(struct fence_chains *fc)
637*4882a593Smuzhiyun {
638*4882a593Smuzhiyun unsigned int count = fc->chain_length;
639*4882a593Smuzhiyun
640*4882a593Smuzhiyun /* Fisher-Yates shuffle courtesy of Knuth */
641*4882a593Smuzhiyun while (--count) {
642*4882a593Smuzhiyun unsigned int swp;
643*4882a593Smuzhiyun
644*4882a593Smuzhiyun swp = prandom_u32_max(count + 1);
645*4882a593Smuzhiyun if (swp == count)
646*4882a593Smuzhiyun continue;
647*4882a593Smuzhiyun
648*4882a593Smuzhiyun swap(fc->fences[count], fc->fences[swp]);
649*4882a593Smuzhiyun }
650*4882a593Smuzhiyun }
651*4882a593Smuzhiyun
wait_random(void * arg)652*4882a593Smuzhiyun static int wait_random(void *arg)
653*4882a593Smuzhiyun {
654*4882a593Smuzhiyun struct fence_chains fc;
655*4882a593Smuzhiyun struct task_struct *tsk;
656*4882a593Smuzhiyun int err;
657*4882a593Smuzhiyun int i;
658*4882a593Smuzhiyun
659*4882a593Smuzhiyun err = fence_chains_init(&fc, CHAIN_SZ, seqno_inc);
660*4882a593Smuzhiyun if (err)
661*4882a593Smuzhiyun return err;
662*4882a593Smuzhiyun
663*4882a593Smuzhiyun randomise_fences(&fc);
664*4882a593Smuzhiyun
665*4882a593Smuzhiyun tsk = kthread_run(__wait_fence_chains, &fc, "dmabuf/wait");
666*4882a593Smuzhiyun if (IS_ERR(tsk)) {
667*4882a593Smuzhiyun err = PTR_ERR(tsk);
668*4882a593Smuzhiyun goto err;
669*4882a593Smuzhiyun }
670*4882a593Smuzhiyun get_task_struct(tsk);
671*4882a593Smuzhiyun yield_to(tsk, true);
672*4882a593Smuzhiyun
673*4882a593Smuzhiyun for (i = 0; i < fc.chain_length; i++)
674*4882a593Smuzhiyun dma_fence_signal(fc.fences[i]);
675*4882a593Smuzhiyun
676*4882a593Smuzhiyun err = kthread_stop(tsk);
677*4882a593Smuzhiyun put_task_struct(tsk);
678*4882a593Smuzhiyun
679*4882a593Smuzhiyun err:
680*4882a593Smuzhiyun fence_chains_fini(&fc);
681*4882a593Smuzhiyun return err;
682*4882a593Smuzhiyun }
683*4882a593Smuzhiyun
dma_fence_chain(void)684*4882a593Smuzhiyun int dma_fence_chain(void)
685*4882a593Smuzhiyun {
686*4882a593Smuzhiyun static const struct subtest tests[] = {
687*4882a593Smuzhiyun SUBTEST(sanitycheck),
688*4882a593Smuzhiyun SUBTEST(find_seqno),
689*4882a593Smuzhiyun SUBTEST(find_signaled),
690*4882a593Smuzhiyun SUBTEST(find_out_of_order),
691*4882a593Smuzhiyun SUBTEST(find_gap),
692*4882a593Smuzhiyun SUBTEST(find_race),
693*4882a593Smuzhiyun SUBTEST(signal_forward),
694*4882a593Smuzhiyun SUBTEST(signal_backward),
695*4882a593Smuzhiyun SUBTEST(wait_forward),
696*4882a593Smuzhiyun SUBTEST(wait_backward),
697*4882a593Smuzhiyun SUBTEST(wait_random),
698*4882a593Smuzhiyun };
699*4882a593Smuzhiyun int ret;
700*4882a593Smuzhiyun
701*4882a593Smuzhiyun pr_info("sizeof(dma_fence_chain)=%zu\n",
702*4882a593Smuzhiyun sizeof(struct dma_fence_chain));
703*4882a593Smuzhiyun
704*4882a593Smuzhiyun slab_fences = KMEM_CACHE(mock_fence,
705*4882a593Smuzhiyun SLAB_TYPESAFE_BY_RCU |
706*4882a593Smuzhiyun SLAB_HWCACHE_ALIGN);
707*4882a593Smuzhiyun if (!slab_fences)
708*4882a593Smuzhiyun return -ENOMEM;
709*4882a593Smuzhiyun
710*4882a593Smuzhiyun ret = subtests(tests, NULL);
711*4882a593Smuzhiyun
712*4882a593Smuzhiyun kmem_cache_destroy(slab_fences);
713*4882a593Smuzhiyun return ret;
714*4882a593Smuzhiyun }
715