1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-or-later
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright 2015, Cyril Bur, IBM Corp.
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * This test attempts to see if the VSX registers change across preemption.
6*4882a593Smuzhiyun * There is no way to be sure preemption happened so this test just
7*4882a593Smuzhiyun * uses many threads and a long wait. As such, a successful test
8*4882a593Smuzhiyun * doesn't mean much but a failure is bad.
9*4882a593Smuzhiyun */
10*4882a593Smuzhiyun
11*4882a593Smuzhiyun #include <stdio.h>
12*4882a593Smuzhiyun #include <string.h>
13*4882a593Smuzhiyun #include <unistd.h>
14*4882a593Smuzhiyun #include <sys/syscall.h>
15*4882a593Smuzhiyun #include <sys/time.h>
16*4882a593Smuzhiyun #include <sys/types.h>
17*4882a593Smuzhiyun #include <sys/wait.h>
18*4882a593Smuzhiyun #include <stdlib.h>
19*4882a593Smuzhiyun #include <pthread.h>
20*4882a593Smuzhiyun
21*4882a593Smuzhiyun #include "utils.h"
22*4882a593Smuzhiyun
/* How long (in seconds) the workers are left running so they can be preempted */
#define PREEMPT_TIME 20

/* Number of worker threads created per online CPU */
#define THREAD_FACTOR 8
30*4882a593Smuzhiyun
/*
 * Ensure there is twice the number of non-volatile VSX regs!
 * The register-checking code behind preempt_vsx() is going to use the
 * other half as space to put the live registers before calling
 * vsx_memcmp()
 */
36*4882a593Smuzhiyun __thread vector int varray[24] = {
37*4882a593Smuzhiyun {1, 2, 3, 4 }, {5, 6, 7, 8 }, {9, 10,11,12},
38*4882a593Smuzhiyun {13,14,15,16}, {17,18,19,20}, {21,22,23,24},
39*4882a593Smuzhiyun {25,26,27,28}, {29,30,31,32}, {33,34,35,36},
40*4882a593Smuzhiyun {37,38,39,40}, {41,42,43,44}, {45,46,47,48}
41*4882a593Smuzhiyun };
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun int threads_starting;
44*4882a593Smuzhiyun int running;
45*4882a593Smuzhiyun
46*4882a593Smuzhiyun extern long preempt_vsx(vector int *varray, int *threads_starting, int *running);
47*4882a593Smuzhiyun
/*
 * Compare the expected values in a[0..11] with the register snapshot stored
 * in a[12..23].
 *
 * @a: must be the calling thread's varray; any other pointer trips
 *     FAIL_IF() (from utils.h, not visible here -- presumably reports the
 *     failure and returns a non-zero code).
 *
 * Returns 0 when both halves are identical, 1 when they differ (every pair
 * is dumped to stderr) and 2 when one of the snapshot slots is all zeroes.
 */
long vsx_memcmp(vector int *a)
{
	vector int zero = {0, 0, 0, 0};
	int i;

	FAIL_IF(a != varray);

	/* An all-zero snapshot slot is reported separately from a mismatch */
	for (i = 0; i < 12; i++) {
		if (memcmp(&a[i + 12], &zero, sizeof(vector int)) == 0) {
			fprintf(stderr, "Detected zero from the VSX reg %d\n", i + 12);
			return 2;
		}
	}

	if (memcmp(a, &a[12], 12 * sizeof(vector int))) {
		fprintf(stderr, "VSX mismatch\n");
		for (i = 0; i < 12; i++) {
			unsigned long long want[2], got[2];

			/*
			 * Copy each 16-byte vector out instead of casting to
			 * long *: this does not depend on sizeof(long) and
			 * avoids type-punning the vector.
			 */
			memcpy(want, &a[i], sizeof(want));
			memcpy(got, &a[i + 12], sizeof(got));

			/*
			 * Pad every 64-bit half to 16 hex digits so the two
			 * concatenated halves of a register stay unambiguous.
			 */
			fprintf(stderr, "%d: 0x%016llx%016llx | 0x%016llx%016llx\n",
				i + 20, want[0], want[1], got[0], got[1]);
		}
		return 1;
	}
	return 0;
}
71*4882a593Smuzhiyun
preempt_vsx_c(void * p)72*4882a593Smuzhiyun void *preempt_vsx_c(void *p)
73*4882a593Smuzhiyun {
74*4882a593Smuzhiyun int i, j;
75*4882a593Smuzhiyun long rc;
76*4882a593Smuzhiyun srand(pthread_self());
77*4882a593Smuzhiyun for (i = 0; i < 12; i++)
78*4882a593Smuzhiyun for (j = 0; j < 4; j++) {
79*4882a593Smuzhiyun varray[i][j] = rand();
80*4882a593Smuzhiyun /* Don't want zero because it hides kernel problems */
81*4882a593Smuzhiyun if (varray[i][j] == 0)
82*4882a593Smuzhiyun j--;
83*4882a593Smuzhiyun }
84*4882a593Smuzhiyun rc = preempt_vsx(varray, &threads_starting, &running);
85*4882a593Smuzhiyun if (rc == 2)
86*4882a593Smuzhiyun fprintf(stderr, "Caught zeros in VSX compares\n");
87*4882a593Smuzhiyun return (void *)rc;
88*4882a593Smuzhiyun }
89*4882a593Smuzhiyun
test_preempt_vsx(void)90*4882a593Smuzhiyun int test_preempt_vsx(void)
91*4882a593Smuzhiyun {
92*4882a593Smuzhiyun int i, rc, threads;
93*4882a593Smuzhiyun pthread_t *tids;
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun SKIP_IF(!have_hwcap(PPC_FEATURE_HAS_VSX));
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun threads = sysconf(_SC_NPROCESSORS_ONLN) * THREAD_FACTOR;
98*4882a593Smuzhiyun tids = malloc(threads * sizeof(pthread_t));
99*4882a593Smuzhiyun FAIL_IF(!tids);
100*4882a593Smuzhiyun
101*4882a593Smuzhiyun running = true;
102*4882a593Smuzhiyun threads_starting = threads;
103*4882a593Smuzhiyun for (i = 0; i < threads; i++) {
104*4882a593Smuzhiyun rc = pthread_create(&tids[i], NULL, preempt_vsx_c, NULL);
105*4882a593Smuzhiyun FAIL_IF(rc);
106*4882a593Smuzhiyun }
107*4882a593Smuzhiyun
108*4882a593Smuzhiyun setbuf(stdout, NULL);
109*4882a593Smuzhiyun /* Not really nessesary but nice to wait for every thread to start */
110*4882a593Smuzhiyun printf("\tWaiting for %d workers to start...", threads_starting);
111*4882a593Smuzhiyun while(threads_starting)
112*4882a593Smuzhiyun asm volatile("": : :"memory");
113*4882a593Smuzhiyun printf("done\n");
114*4882a593Smuzhiyun
115*4882a593Smuzhiyun printf("\tWaiting for %d seconds to let some workers get preempted...", PREEMPT_TIME);
116*4882a593Smuzhiyun sleep(PREEMPT_TIME);
117*4882a593Smuzhiyun printf("done\n");
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun printf("\tStopping workers...");
120*4882a593Smuzhiyun /*
121*4882a593Smuzhiyun * Working are checking this value every loop. In preempt_vsx 'cmpwi r5,0; bne 2b'.
122*4882a593Smuzhiyun * r5 will have loaded the value of running.
123*4882a593Smuzhiyun */
124*4882a593Smuzhiyun running = 0;
125*4882a593Smuzhiyun for (i = 0; i < threads; i++) {
126*4882a593Smuzhiyun void *rc_p;
127*4882a593Smuzhiyun pthread_join(tids[i], &rc_p);
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /*
130*4882a593Smuzhiyun * Harness will say the fail was here, look at why preempt_vsx
131*4882a593Smuzhiyun * returned
132*4882a593Smuzhiyun */
133*4882a593Smuzhiyun if ((long) rc_p)
134*4882a593Smuzhiyun printf("oops\n");
135*4882a593Smuzhiyun FAIL_IF((long) rc_p);
136*4882a593Smuzhiyun }
137*4882a593Smuzhiyun printf("done\n");
138*4882a593Smuzhiyun
139*4882a593Smuzhiyun return 0;
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun
main(int argc,char * argv[])142*4882a593Smuzhiyun int main(int argc, char *argv[])
143*4882a593Smuzhiyun {
144*4882a593Smuzhiyun return test_harness(test_preempt_vsx, "vsx_preempt");
145*4882a593Smuzhiyun }
146