// SPDX-License-Identifier: GPL-2.0
/*
 * Smp timebase synchronization for ppc.
 *
 * Copyright (C) 2003 Samuel Rydh (samuel@ibrium.se)
 *
 */
8*4882a593Smuzhiyun
9*4882a593Smuzhiyun #include <linux/kernel.h>
10*4882a593Smuzhiyun #include <linux/sched.h>
11*4882a593Smuzhiyun #include <linux/smp.h>
12*4882a593Smuzhiyun #include <linux/unistd.h>
13*4882a593Smuzhiyun #include <linux/slab.h>
14*4882a593Smuzhiyun #include <linux/atomic.h>
15*4882a593Smuzhiyun #include <asm/smp.h>
16*4882a593Smuzhiyun #include <asm/time.h>
17*4882a593Smuzhiyun
/*
 * Number of contest rounds requested per measurement.  Passed as the
 * round count to start_contest() by smp_generic_give_timebase(), which
 * also uses NUM_ITER / 10 for its shorter re-set passes.
 */
#define NUM_ITER		300
19*4882a593Smuzhiyun
/*
 * Commands published in tbsync->cmd by the CPU giving the timebase and
 * read by the CPU taking it.
 */
enum {
	kExit = 0,	/* taker leaves its loop and restores interrupts */
	kSetAndTest,	/* taker calls set_tb() with the published value, then races */
	kTest		/* taker only races; its timebase is left untouched */
};
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun static struct {
25*4882a593Smuzhiyun volatile u64 tb;
26*4882a593Smuzhiyun volatile u64 mark;
27*4882a593Smuzhiyun volatile int cmd;
28*4882a593Smuzhiyun volatile int handshake;
29*4882a593Smuzhiyun int filler[2];
30*4882a593Smuzhiyun
31*4882a593Smuzhiyun volatile int ack;
32*4882a593Smuzhiyun int filler2[7];
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun volatile int race_result;
35*4882a593Smuzhiyun } *tbsync;
36*4882a593Smuzhiyun
/*
 * Set to 1 by smp_generic_give_timebase() once tbsync has been allocated
 * and cleared again when it is done; smp_generic_take_timebase() spins
 * until it becomes non-zero before touching tbsync.
 */
static volatile int		running;
38*4882a593Smuzhiyun
/*
 * Run one side of a race towards the timebase value @mark.
 *
 * As long as the local timebase reads below @mark, keep storing @add in
 * tbsync->race_result.  Both CPUs call this for the same @mark (the
 * giver with +1, the taker with -1), so the value left behind comes from
 * whichever CPU stored last, i.e. the one that was still reading a
 * timebase below @mark.
 */
static void enter_contest(u64 mark, long add)
{
	while (get_tb() < mark)
		tbsync->race_result = add;
}
44*4882a593Smuzhiyun
smp_generic_take_timebase(void)45*4882a593Smuzhiyun void smp_generic_take_timebase(void)
46*4882a593Smuzhiyun {
47*4882a593Smuzhiyun int cmd;
48*4882a593Smuzhiyun u64 tb;
49*4882a593Smuzhiyun unsigned long flags;
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun local_irq_save(flags);
52*4882a593Smuzhiyun while (!running)
53*4882a593Smuzhiyun barrier();
54*4882a593Smuzhiyun rmb();
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun for (;;) {
57*4882a593Smuzhiyun tbsync->ack = 1;
58*4882a593Smuzhiyun while (!tbsync->handshake)
59*4882a593Smuzhiyun barrier();
60*4882a593Smuzhiyun rmb();
61*4882a593Smuzhiyun
62*4882a593Smuzhiyun cmd = tbsync->cmd;
63*4882a593Smuzhiyun tb = tbsync->tb;
64*4882a593Smuzhiyun mb();
65*4882a593Smuzhiyun tbsync->ack = 0;
66*4882a593Smuzhiyun if (cmd == kExit)
67*4882a593Smuzhiyun break;
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun while (tbsync->handshake)
70*4882a593Smuzhiyun barrier();
71*4882a593Smuzhiyun if (cmd == kSetAndTest)
72*4882a593Smuzhiyun set_tb(tb >> 32, tb & 0xfffffffful);
73*4882a593Smuzhiyun enter_contest(tbsync->mark, -1);
74*4882a593Smuzhiyun }
75*4882a593Smuzhiyun local_irq_restore(flags);
76*4882a593Smuzhiyun }
77*4882a593Smuzhiyun
start_contest(int cmd,long offset,int num)78*4882a593Smuzhiyun static int start_contest(int cmd, long offset, int num)
79*4882a593Smuzhiyun {
80*4882a593Smuzhiyun int i, score=0;
81*4882a593Smuzhiyun u64 tb;
82*4882a593Smuzhiyun u64 mark;
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun tbsync->cmd = cmd;
85*4882a593Smuzhiyun
86*4882a593Smuzhiyun local_irq_disable();
87*4882a593Smuzhiyun for (i = -3; i < num; ) {
88*4882a593Smuzhiyun tb = get_tb() + 400;
89*4882a593Smuzhiyun tbsync->tb = tb + offset;
90*4882a593Smuzhiyun tbsync->mark = mark = tb + 400;
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun wmb();
93*4882a593Smuzhiyun
94*4882a593Smuzhiyun tbsync->handshake = 1;
95*4882a593Smuzhiyun while (tbsync->ack)
96*4882a593Smuzhiyun barrier();
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun while (get_tb() <= tb)
99*4882a593Smuzhiyun barrier();
100*4882a593Smuzhiyun tbsync->handshake = 0;
101*4882a593Smuzhiyun enter_contest(mark, 1);
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun while (!tbsync->ack)
104*4882a593Smuzhiyun barrier();
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun if (i++ > 0)
107*4882a593Smuzhiyun score += tbsync->race_result;
108*4882a593Smuzhiyun }
109*4882a593Smuzhiyun local_irq_enable();
110*4882a593Smuzhiyun return score;
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun
smp_generic_give_timebase(void)113*4882a593Smuzhiyun void smp_generic_give_timebase(void)
114*4882a593Smuzhiyun {
115*4882a593Smuzhiyun int i, score, score2, old, min=0, max=5000, offset=1000;
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun pr_debug("Software timebase sync\n");
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun /* if this fails then this kernel won't work anyway... */
120*4882a593Smuzhiyun tbsync = kzalloc( sizeof(*tbsync), GFP_KERNEL );
121*4882a593Smuzhiyun mb();
122*4882a593Smuzhiyun running = 1;
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun while (!tbsync->ack)
125*4882a593Smuzhiyun barrier();
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun pr_debug("Got ack\n");
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /* binary search */
130*4882a593Smuzhiyun for (old = -1; old != offset ; offset = (min+max) / 2) {
131*4882a593Smuzhiyun score = start_contest(kSetAndTest, offset, NUM_ITER);
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun pr_debug("score %d, offset %d\n", score, offset );
134*4882a593Smuzhiyun
135*4882a593Smuzhiyun if( score > 0 )
136*4882a593Smuzhiyun max = offset;
137*4882a593Smuzhiyun else
138*4882a593Smuzhiyun min = offset;
139*4882a593Smuzhiyun old = offset;
140*4882a593Smuzhiyun }
141*4882a593Smuzhiyun score = start_contest(kSetAndTest, min, NUM_ITER);
142*4882a593Smuzhiyun score2 = start_contest(kSetAndTest, max, NUM_ITER);
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun pr_debug("Min %d (score %d), Max %d (score %d)\n",
145*4882a593Smuzhiyun min, score, max, score2);
146*4882a593Smuzhiyun score = abs(score);
147*4882a593Smuzhiyun score2 = abs(score2);
148*4882a593Smuzhiyun offset = (score < score2) ? min : max;
149*4882a593Smuzhiyun
150*4882a593Smuzhiyun /* guard against inaccurate mttb */
151*4882a593Smuzhiyun for (i = 0; i < 10; i++) {
152*4882a593Smuzhiyun start_contest(kSetAndTest, offset, NUM_ITER/10);
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun if ((score2 = start_contest(kTest, offset, NUM_ITER)) < 0)
155*4882a593Smuzhiyun score2 = -score2;
156*4882a593Smuzhiyun if (score2 <= score || score2 < 20)
157*4882a593Smuzhiyun break;
158*4882a593Smuzhiyun }
159*4882a593Smuzhiyun pr_debug("Final offset: %d (%d/%d)\n", offset, score2, NUM_ITER );
160*4882a593Smuzhiyun
161*4882a593Smuzhiyun /* exiting */
162*4882a593Smuzhiyun tbsync->cmd = kExit;
163*4882a593Smuzhiyun wmb();
164*4882a593Smuzhiyun tbsync->handshake = 1;
165*4882a593Smuzhiyun while (tbsync->ack)
166*4882a593Smuzhiyun barrier();
167*4882a593Smuzhiyun tbsync->handshake = 0;
168*4882a593Smuzhiyun kfree(tbsync);
169*4882a593Smuzhiyun tbsync = NULL;
170*4882a593Smuzhiyun running = 0;
171*4882a593Smuzhiyun }
172