xref: /OK3568_Linux_fs/kernel/arch/arc/include/asm/atomic.h (revision 4882a59341e53eb6f0b4789bf948001014eff981)
/* SPDX-License-Identifier: GPL-2.0-only */
/*
 * Copyright (C) 2004, 2007-2010, 2011-2012 Synopsys, Inc. (www.synopsys.com)
 */

#ifndef _ASM_ARC_ATOMIC_H
#define _ASM_ARC_ATOMIC_H

#ifndef __ASSEMBLY__

#include <linux/types.h>
#include <linux/compiler.h>
#include <asm/cmpxchg.h>
#include <asm/barrier.h>
#include <asm/smp.h>

#define atomic_read(v)  READ_ONCE((v)->counter)

#ifdef CONFIG_ARC_HAS_LLSC

#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i))

#define ATOMIC_OP(op, c_op, asm_op)					\
static inline void atomic_##op(int i, atomic_t *v)			\
{									\
	unsigned int val;						\
									\
	__asm__ __volatile__(						\
	"1:	llock   %[val], [%[ctr]]		\n"		\
	"	" #asm_op " %[val], %[val], %[i]	\n"		\
	"	scond   %[val], [%[ctr]]		\n"		\
	"	bnz     1b				\n"		\
	: [val]	"=&r"	(val) /* Early clobber to prevent reg reuse */	\
	: [ctr]	"r"	(&v->counter), /* Not "m": llock only supports reg direct addr mode */	\
	  [i]	"ir"	(i)						\
	: "cc");							\
}									\

#define ATOMIC_OP_RETURN(op, c_op, asm_op)				\
static inline int atomic_##op##_return(int i, atomic_t *v)		\
{									\
	unsigned int val;						\
									\
	/*								\
	 * Explicit full memory barrier needed before/after as		\
	 * LLOCK/SCOND themselves don't provide any such semantics	\
	 */								\
	smp_mb();							\
									\
	__asm__ __volatile__(						\
	"1:	llock   %[val], [%[ctr]]		\n"		\
	"	" #asm_op " %[val], %[val], %[i]	\n"		\
	"	scond   %[val], [%[ctr]]		\n"		\
	"	bnz     1b				\n"		\
	: [val]	"=&r"	(val)						\
	: [ctr]	"r"	(&v->counter),					\
	  [i]	"ir"	(i)						\
	: "cc");							\
									\
	smp_mb();							\
									\
	return val;							\
}

#define ATOMIC_FETCH_OP(op, c_op, asm_op)				\
static inline int atomic_fetch_##op(int i, atomic_t *v)		\
{									\
	unsigned int val, orig;						\
									\
	/*								\
	 * Explicit full memory barrier needed before/after as		\
	 * LLOCK/SCOND themselves don't provide any such semantics	\
	 */								\
	smp_mb();							\
									\
	__asm__ __volatile__(						\
	"1:	llock   %[orig], [%[ctr]]		\n"		\
	"	" #asm_op " %[val], %[orig], %[i]	\n"		\
	"	scond   %[val], [%[ctr]]		\n"		\
	"	bnz     1b				\n"		\
	: [val]	"=&r"	(val),						\
	  [orig] "=&r" (orig)						\
	: [ctr]	"r"	(&v->counter),					\
	  [i]	"ir"	(i)						\
	: "cc");							\
									\
	smp_mb();							\
									\
	return orig;							\
}
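
/*
 * Example (illustrative, hypothetical caller): the LLOCK/SCOND loop above
 * simply retries until the conditional store succeeds. Only the *_return and
 * fetch_* variants are fully ordered (via the smp_mb() pairs); the plain ops
 * imply no ordering:
 *
 *	atomic_t refs = ATOMIC_INIT(0);
 *	int old;
 *
 *	atomic_add(1, &refs);			// RMW only, no barrier implied
 *	old = atomic_fetch_add(1, &refs);	// RMW with full ordering, returns prior value
 */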

#else	/* !CONFIG_ARC_HAS_LLSC */

#ifndef CONFIG_SMP

 /* violating atomic_xxx API locking protocol in UP for optimization's sake */
#define atomic_set(v, i) WRITE_ONCE(((v)->counter), (i))

#else

static inline void atomic_set(atomic_t *v, int i)
{
	/*
	 * Independent of hardware support, all of the atomic_xxx() APIs need
	 * to follow the same locking rules to make sure that a "hardware"
	 * atomic insn (e.g. LD) doesn't clobber an "emulated" atomic insn
	 * sequence
	 *
	 * Thus atomic_set() despite being 1 insn (and seemingly atomic)
	 * requires the locking.
	 */
	unsigned long flags;

	atomic_ops_lock(flags);
	WRITE_ONCE(v->counter, i);
	atomic_ops_unlock(flags);
}
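
/*
 * Example (illustrative, hypothetical interleaving) of the hazard the lock
 * prevents: without it, atomic_set()'s plain store could land in the middle
 * of another CPU's lock-emulated read-modify-write and be silently lost:
 *
 *	CPU0: atomic_add(1, &v)			CPU1: atomic_set(&v, 5)
 *	lock(); tmp = v->counter;
 *						v->counter = 5;
 *	v->counter = tmp + 1; unlock();		// the store of 5 is overwritten
 */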

#define atomic_set_release(v, i)	atomic_set((v), (i))

#endif

/*
 * Non-hardware-assisted atomic R-M-W
 * Locking would change to irq-disabling only (UP) and spinlocks (SMP)
 */
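
/*
 * A rough sketch of the locking primitives used below (assumed here for
 * illustration; the real definitions live in <asm/smp.h>):
 *
 *	// UP: disabling interrupts around the RMW is sufficient
 *	#define atomic_ops_lock(flags)		local_irq_save(flags)
 *	#define atomic_ops_unlock(flags)	local_irq_restore(flags)
 *
 *	// SMP: additionally serialize against other CPUs with a global
 *	// arch spinlock, roughly:
 *	//	local_irq_save(flags); arch_spin_lock(&smp_atomic_ops_lock);
 */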

#define ATOMIC_OP(op, c_op, asm_op)					\
static inline void atomic_##op(int i, atomic_t *v)			\
{									\
	unsigned long flags;						\
									\
	atomic_ops_lock(flags);						\
	v->counter c_op i;						\
	atomic_ops_unlock(flags);					\
}

#define ATOMIC_OP_RETURN(op, c_op, asm_op)				\
static inline int atomic_##op##_return(int i, atomic_t *v)		\
{									\
	unsigned long flags;						\
	unsigned long temp;						\
									\
	/*								\
	 * spin lock/unlock provides the needed smp_mb() before/after	\
	 */								\
	atomic_ops_lock(flags);						\
	temp = v->counter;						\
	temp c_op i;							\
	v->counter = temp;						\
	atomic_ops_unlock(flags);					\
									\
	return temp;							\
}

#define ATOMIC_FETCH_OP(op, c_op, asm_op)				\
static inline int atomic_fetch_##op(int i, atomic_t *v)		\
{									\
	unsigned long flags;						\
	unsigned long orig;						\
									\
	/*								\
	 * spin lock/unlock provides the needed smp_mb() before/after	\
	 */								\
	atomic_ops_lock(flags);						\
	orig = v->counter;						\
	v->counter c_op i;						\
	atomic_ops_unlock(flags);					\
									\
	return orig;							\
}

#endif /* !CONFIG_ARC_HAS_LLSC */

#define ATOMIC_OPS(op, c_op, asm_op)					\
	ATOMIC_OP(op, c_op, asm_op)					\
	ATOMIC_OP_RETURN(op, c_op, asm_op)				\
	ATOMIC_FETCH_OP(op, c_op, asm_op)

ATOMIC_OPS(add, +=, add)
ATOMIC_OPS(sub, -=, sub)

#define atomic_andnot		atomic_andnot
#define atomic_fetch_andnot	atomic_fetch_andnot

#undef ATOMIC_OPS
#define ATOMIC_OPS(op, c_op, asm_op)					\
	ATOMIC_OP(op, c_op, asm_op)					\
	ATOMIC_FETCH_OP(op, c_op, asm_op)

ATOMIC_OPS(and, &=, and)
ATOMIC_OPS(andnot, &= ~, bic)
ATOMIC_OPS(or, |=, or)
ATOMIC_OPS(xor, ^=, xor)
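
/*
 * Illustrative expansion: the first ATOMIC_OPS() group above instantiates
 * atomic_add(), atomic_add_return() and atomic_fetch_add() (likewise for sub),
 * while the bitwise group only gets the void and fetch_ forms, e.g.
 * ATOMIC_OPS(and, &=, and) yields:
 *
 *	static inline void atomic_and(int i, atomic_t *v);
 *	static inline int atomic_fetch_and(int i, atomic_t *v);
 */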

#undef ATOMIC_OPS
#undef ATOMIC_FETCH_OP
#undef ATOMIC_OP_RETURN
#undef ATOMIC_OP

#ifdef CONFIG_GENERIC_ATOMIC64

#include <asm-generic/atomic64.h>

#else	/* Kconfig ensures this is only enabled with needed h/w assist */

/*
 * ARCv2 supports 64-bit exclusive load (LLOCKD) / store (SCONDD)
 *  - The address HAS to be 64-bit aligned
 *  - There are 2 semantics involved here:
 *    = exclusive implies no interim update between load/store to same addr
 *    = both words are observed/updated together: this is guaranteed even
 *      for regular 64-bit load (LDD) / store (STD). Thus atomic64_set()
 *      is NOT required to use LLOCKD+SCONDD, STD suffices
 */

typedef struct {
	s64 __aligned(8) counter;
} atomic64_t;

#define ATOMIC64_INIT(a) { (a) }

static inline s64 atomic64_read(const atomic64_t *v)
{
	s64 val;

	__asm__ __volatile__(
	"	ldd   %0, [%1]	\n"
	: "=r"(val)
	: "r"(&v->counter));

	return val;
}

static inline void atomic64_set(atomic64_t *v, s64 a)
{
	/*
	 * This could have been a simple assignment in "C" but would need
	 * explicit volatile. Otherwise gcc optimizers could elide the store,
	 * which borked the atomic64 self-test.
	 * In the inline asm version, a memory clobber is needed for the exact
	 * same reason: to tell gcc about the store.
	 *
	 * This however is not needed for sibling atomic64_add() etc since both
	 * load/store are explicitly done in inline asm. As long as the API is
	 * used for each access, gcc has no way to optimize away any load/store.
	 */
	__asm__ __volatile__(
	"	std   %0, [%1]	\n"
	:
	: "r"(a), "r"(&v->counter)
	: "memory");
}
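
/*
 * Example (illustrative, hypothetical counter): the __aligned(8) in atomic64_t
 * provides the 64-bit alignment that LLOCKD/SCONDD (and single-copy-atomic
 * LDD/STD) require:
 *
 *	static atomic64_t bytes_done = ATOMIC64_INIT(0);
 *	s64 total;
 *
 *	atomic64_set(&bytes_done, 0);		// plain STD, still atomic
 *	atomic64_add(4096, &bytes_done);	// LLOCKD/SCONDD retry loop
 *	total = atomic64_read(&bytes_done);	// plain LDD
 */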

#define ATOMIC64_OP(op, op1, op2)					\
static inline void atomic64_##op(s64 a, atomic64_t *v)			\
{									\
	s64 val;							\
									\
	__asm__ __volatile__(						\
	"1:				\n"				\
	"	llockd  %0, [%1]	\n"				\
	"	" #op1 " %L0, %L0, %L2	\n"				\
	"	" #op2 " %H0, %H0, %H2	\n"				\
	"	scondd   %0, [%1]	\n"				\
	"	bnz     1b		\n"				\
	: "=&r"(val)							\
	: "r"(&v->counter), "ir"(a)					\
	: "cc");							\
}									\

#define ATOMIC64_OP_RETURN(op, op1, op2)				\
static inline s64 atomic64_##op##_return(s64 a, atomic64_t *v)		\
{									\
	s64 val;							\
									\
	smp_mb();							\
									\
	__asm__ __volatile__(						\
	"1:				\n"				\
	"	llockd   %0, [%1]	\n"				\
	"	" #op1 " %L0, %L0, %L2	\n"				\
	"	" #op2 " %H0, %H0, %H2	\n"				\
	"	scondd   %0, [%1]	\n"				\
	"	bnz     1b		\n"				\
	: [val] "=&r"(val)						\
	: "r"(&v->counter), "ir"(a)					\
	: "cc");	/* memory clobber comes from smp_mb() */	\
									\
	smp_mb();							\
									\
	return val;							\
}

#define ATOMIC64_FETCH_OP(op, op1, op2)					\
static inline s64 atomic64_fetch_##op(s64 a, atomic64_t *v)		\
{									\
	s64 val, orig;							\
									\
	smp_mb();							\
									\
	__asm__ __volatile__(						\
	"1:				\n"				\
	"	llockd   %0, [%2]	\n"				\
	"	" #op1 " %L1, %L0, %L3	\n"				\
	"	" #op2 " %H1, %H0, %H3	\n"				\
	"	scondd   %1, [%2]	\n"				\
	"	bnz     1b		\n"				\
	: "=&r"(orig), "=&r"(val)					\
	: "r"(&v->counter), "ir"(a)					\
	: "cc");	/* memory clobber comes from smp_mb() */	\
									\
	smp_mb();							\
									\
	return orig;							\
}

#define ATOMIC64_OPS(op, op1, op2)					\
	ATOMIC64_OP(op, op1, op2)					\
	ATOMIC64_OP_RETURN(op, op1, op2)				\
	ATOMIC64_FETCH_OP(op, op1, op2)

#define atomic64_andnot		atomic64_andnot
#define atomic64_fetch_andnot	atomic64_fetch_andnot

ATOMIC64_OPS(add, add.f, adc)
ATOMIC64_OPS(sub, sub.f, sbc)
ATOMIC64_OPS(and, and, and)
ATOMIC64_OPS(andnot, bic, bic)
ATOMIC64_OPS(or, or, or)
ATOMIC64_OPS(xor, xor, xor)

#undef ATOMIC64_OPS
#undef ATOMIC64_FETCH_OP
#undef ATOMIC64_OP_RETURN
#undef ATOMIC64_OP

static inline s64
atomic64_cmpxchg(atomic64_t *ptr, s64 expected, s64 new)
{
	s64 prev;

	smp_mb();

	__asm__ __volatile__(
	"1:	llockd  %0, [%1]	\n"
	"	brne    %L0, %L2, 2f	\n"
	"	brne    %H0, %H2, 2f	\n"
	"	scondd  %3, [%1]	\n"
	"	bnz     1b		\n"
	"2:				\n"
	: "=&r"(prev)
	: "r"(ptr), "ir"(expected), "r"(new)
	: "cc");	/* memory clobber comes from smp_mb() */

	smp_mb();

	return prev;
}

static inline s64 atomic64_xchg(atomic64_t *ptr, s64 new)
{
	s64 prev;

	smp_mb();

	__asm__ __volatile__(
	"1:	llockd  %0, [%1]	\n"
	"	scondd  %2, [%1]	\n"
	"	bnz     1b		\n"
	"2:				\n"
	: "=&r"(prev)
	: "r"(ptr), "r"(new)
	: "cc");	/* memory clobber comes from smp_mb() */

	smp_mb();

	return prev;
}
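
/*
 * Example (illustrative, hypothetical helper) of the usual cmpxchg retry
 * pattern built on atomic64_cmpxchg(), here a saturating 64-bit add:
 *
 *	static inline void example_atomic64_add_sat(atomic64_t *v, s64 a, s64 lim)
 *	{
 *		s64 old = atomic64_read(v);
 *
 *		for (;;) {
 *			s64 new = (old + a > lim) ? lim : old + a;
 *			s64 prev = atomic64_cmpxchg(v, old, new);
 *
 *			if (prev == old)
 *				break;		// exchange succeeded
 *			old = prev;		// raced, retry with the fresh value
 *		}
 *	}
 */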

/**
 * atomic64_dec_if_positive - decrement by 1 if old value positive
 * @v: pointer of type atomic64_t
 *
 * The function returns the old value of *v minus 1, even if
 * the atomic variable, v, was not decremented.
 */

static inline s64 atomic64_dec_if_positive(atomic64_t *v)
{
	s64 val;

	smp_mb();

	__asm__ __volatile__(
	"1:	llockd  %0, [%1]	\n"
	"	sub.f   %L0, %L0, 1	# w0 - 1, set C on borrow\n"
	"	sub.c   %H0, %H0, 1	# if C set, w1 - 1\n"
	"	brlt    %H0, 0, 2f	\n"
	"	scondd  %0, [%1]	\n"
	"	bnz     1b		\n"
	"2:				\n"
	: "=&r"(val)
	: "r"(&v->counter)
	: "cc");	/* memory clobber comes from smp_mb() */

	smp_mb();

	return val;
}
#define atomic64_dec_if_positive atomic64_dec_if_positive
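
/*
 * Example (illustrative, hypothetical field): drain a resource count without
 * letting it go negative. A negative return value means the counter was
 * already <= 0 and was left untouched:
 *
 *	if (atomic64_dec_if_positive(&pool->available) < 0)
 *		return -EBUSY;
 */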

/**
 * atomic64_fetch_add_unless - add unless the number is a given value
 * @v: pointer of type atomic64_t
 * @a: the amount to add to v...
 * @u: ...unless v is equal to u.
 *
 * Atomically adds @a to @v, if it was not @u.
 * Returns the old value of @v
 */
static inline s64 atomic64_fetch_add_unless(atomic64_t *v, s64 a, s64 u)
{
	s64 old, temp;

	smp_mb();

	__asm__ __volatile__(
	"1:	llockd  %0, [%2]	\n"
	"	brne	%L0, %L4, 2f	# continue to add since v != u \n"
	"	breq.d	%H0, %H4, 3f	# return since v == u \n"
	"2:				\n"
	"	add.f   %L1, %L0, %L3	\n"
	"	adc     %H1, %H0, %H3	\n"
	"	scondd  %1, [%2]	\n"
	"	bnz     1b		\n"
	"3:				\n"
	: "=&r"(old), "=&r" (temp)
	: "r"(&v->counter), "r"(a), "r"(u)
	: "cc");	/* memory clobber comes from smp_mb() */

	smp_mb();

	return old;
}
#define atomic64_fetch_add_unless atomic64_fetch_add_unless
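
/*
 * Example (illustrative, hypothetical refcount): take a reference only if the
 * object is still live, i.e. the 64-bit flavour of "inc_not_zero":
 *
 *	if (atomic64_fetch_add_unless(&obj->refcnt, 1, 0) == 0)
 *		return NULL;	// refcount already hit zero, do not resurrect
 */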

#endif	/* !CONFIG_GENERIC_ATOMIC64 */

#endif	/* !__ASSEMBLY__ */

#endif